diff --git "a/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" "b/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.4503, "train/learning_rate": 9.920000000000002e-06, "train/epoch": 0.42, "train/global_step": 500, "_runtime": 2848, "_timestamp": 1646068877, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 145.0, 645.0, 209.0, 10.0, 1.0, 0.0, 1.0], "bins": [-380.4229736328125, -373.9246826171875, -367.4263916015625, -360.9281005859375, -354.4298095703125, -347.9315185546875, -341.4332275390625, -334.9349365234375, -328.4366455078125, -321.9383544921875, -315.4400634765625, -308.9417724609375, -302.4434814453125, -295.9451904296875, -289.4468994140625, -282.9486083984375, -276.4503173828125, -269.9520263671875, -263.4537353515625, -256.9554443359375, -250.4571533203125, -243.9588623046875, -237.4605712890625, -230.9622802734375, -224.4639892578125, -217.9656982421875, -211.4674072265625, -204.9691162109375, -198.4708251953125, -191.9725341796875, -185.4742431640625, -178.9759521484375, -172.47767639160156, -165.97938537597656, -159.48109436035156, -152.98280334472656, -146.48451232910156, -139.98622131347656, -133.48793029785156, -126.98963928222656, -120.49134826660156, -113.99305725097656, -107.49476623535156, -100.99647521972656, -94.49818420410156, -87.99989318847656, -81.50160217285156, -75.00331115722656, -68.50502014160156, -62.00672912597656, -55.50843811035156, -49.01014709472656, -42.51185607910156, -36.01356506347656, -29.515274047851562, -23.016983032226562, -16.518688201904297, -10.020397186279297, -3.522106170654297, 2.976184844970703, 9.474475860595703, 15.972766876220703, 22.471057891845703, 28.969348907470703, 35.4676399230957]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 15.0, 10.0, 11.0, 17.0, 25.0, 16.0, 20.0, 28.0, 28.0, 34.0, 24.0, 27.0, 34.0, 43.0, 39.0, 53.0, 38.0, 51.0, 41.0, 51.0, 40.0, 35.0, 41.0, 35.0, 28.0, 24.0, 26.0, 24.0, 20.0, 19.0, 14.0, 12.0, 12.0, 8.0, 7.0, 11.0, 7.0, 2.0, 5.0, 0.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.255489349365234, -48.58753967285156, -46.919586181640625, -45.25163650512695, -43.58368682861328, -41.915733337402344, -40.24778366088867, -38.579833984375, -36.91188049316406, -35.24393081665039, -33.57597732543945, -31.90802764892578, -30.24007797241211, -28.572126388549805, -26.9041748046875, -25.236225128173828, -23.568275451660156, -21.90032386779785, -20.23237419128418, -18.564422607421875, -16.896472930908203, -15.228521347045898, -13.560569763183594, -11.892619132995605, -10.224668502807617, -8.556717872619629, -6.888766765594482, -5.220815658569336, -3.5528650283813477, -1.8849143981933594, -0.2169628143310547, 1.4509878158569336, 3.1189346313476562, 4.7868852615356445, 6.454836368560791, 8.122787475585938, 9.790738105773926, 11.458688735961914, 13.126640319824219, 14.794590950012207, 16.462541580200195, 18.1304931640625, 19.798442840576172, 21.466394424438477, 23.13434600830078, 24.802295684814453, 26.470247268676758, 28.138198852539062, 29.806148529052734, 31.47410011291504, 33.142051696777344, 34.810001373291016, 36.47795104980469, 38.145904541015625, 39.8138542175293, 41.48180389404297, 43.149757385253906, 44.81770706176758, 46.485660552978516, 48.15361022949219, 49.82155990600586, 51.48950958251953, 53.15746307373047, 54.82541275024414, 56.49336242675781]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 7.0, 11.0, 13.0, 10.0, 18.0, 23.0, 21.0, 23.0, 28.0, 16.0, 28.0, 36.0, 36.0, 26.0, 36.0, 39.0, 36.0, 40.0, 47.0, 54.0, 31.0, 38.0, 45.0, 33.0, 37.0, 29.0, 28.0, 22.0, 23.0, 18.0, 20.0, 20.0, 14.0, 21.0, 14.0, 9.0, 4.0, 6.0, 5.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.7109375, -3.593231201171875, -3.47552490234375, -3.357818603515625, -3.2401123046875, -3.122406005859375, -3.00469970703125, -2.886993408203125, -2.769287109375, -2.651580810546875, -2.53387451171875, -2.416168212890625, -2.2984619140625, -2.180755615234375, -2.06304931640625, -1.945343017578125, -1.82763671875, -1.709930419921875, -1.59222412109375, -1.474517822265625, -1.3568115234375, -1.239105224609375, -1.12139892578125, -1.003692626953125, -0.885986328125, -0.768280029296875, -0.65057373046875, -0.532867431640625, -0.4151611328125, -0.297454833984375, -0.17974853515625, -0.062042236328125, 0.0556640625, 0.173370361328125, 0.29107666015625, 0.408782958984375, 0.5264892578125, 0.644195556640625, 0.76190185546875, 0.879608154296875, 0.997314453125, 1.115020751953125, 1.23272705078125, 1.350433349609375, 1.4681396484375, 1.585845947265625, 1.70355224609375, 1.821258544921875, 1.93896484375, 2.056671142578125, 2.17437744140625, 2.292083740234375, 2.4097900390625, 2.527496337890625, 2.64520263671875, 2.762908935546875, 2.880615234375, 2.998321533203125, 3.11602783203125, 3.233734130859375, 3.3514404296875, 3.469146728515625, 3.58685302734375, 3.704559326171875, 3.822265625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 7.0, 12.0, 15.0, 10.0, 12.0, 23.0, 17.0, 27.0, 40.0, 59.0, 62.0, 94.0, 117.0, 147.0, 221.0, 275.0, 372.0, 544.0, 748.0, 1194.0, 1940.0, 3334.0, 6528.0, 15690.0, 56124.0, 430348.0, 2258171.0, 1227786.0, 139698.0, 27880.0, 10223.0, 4880.0, 2546.0, 1563.0, 1021.0, 713.0, 465.0, 316.0, 240.0, 209.0, 150.0, 116.0, 92.0, 59.0, 51.0, 38.0, 28.0, 27.0, 16.0, 8.0, 9.0, 9.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0], "bins": [-9.8359375, -9.51611328125, -9.1962890625, -8.87646484375, -8.556640625, -8.23681640625, -7.9169921875, -7.59716796875, -7.27734375, -6.95751953125, -6.6376953125, -6.31787109375, -5.998046875, -5.67822265625, -5.3583984375, -5.03857421875, -4.71875, -4.39892578125, -4.0791015625, -3.75927734375, -3.439453125, -3.11962890625, -2.7998046875, -2.47998046875, -2.16015625, -1.84033203125, -1.5205078125, -1.20068359375, -0.880859375, -0.56103515625, -0.2412109375, 0.07861328125, 0.3984375, 0.71826171875, 1.0380859375, 1.35791015625, 1.677734375, 1.99755859375, 2.3173828125, 2.63720703125, 2.95703125, 3.27685546875, 3.5966796875, 3.91650390625, 4.236328125, 4.55615234375, 4.8759765625, 5.19580078125, 5.515625, 5.83544921875, 6.1552734375, 6.47509765625, 6.794921875, 7.11474609375, 7.4345703125, 7.75439453125, 8.07421875, 8.39404296875, 8.7138671875, 9.03369140625, 9.353515625, 9.67333984375, 9.9931640625, 10.31298828125, 10.6328125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 14.0, 18.0, 43.0, 58.0, 102.0, 267.0, 498.0, 1059.0, 1090.0, 479.0, 228.0, 107.0, 53.0, 23.0, 18.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.84130859375, -37.8701171875, -36.89892578125, -35.927734375, -34.95654296875, -33.9853515625, -33.01416015625, -32.04296875, -31.07177734375, -30.1005859375, -29.12939453125, -28.158203125, -27.18701171875, -26.2158203125, -25.24462890625, -24.2734375, -23.30224609375, -22.3310546875, -21.35986328125, -20.388671875, -19.41748046875, -18.4462890625, -17.47509765625, -16.50390625, -15.53271484375, -14.5615234375, -13.59033203125, -12.619140625, -11.64794921875, -10.6767578125, -9.70556640625, -8.734375, -7.76318359375, -6.7919921875, -5.82080078125, -4.849609375, -3.87841796875, -2.9072265625, -1.93603515625, -0.96484375, 0.00634765625, 0.9775390625, 1.94873046875, 2.919921875, 3.89111328125, 4.8623046875, 5.83349609375, 6.8046875, 7.77587890625, 8.7470703125, 9.71826171875, 10.689453125, 11.66064453125, 12.6318359375, 13.60302734375, 14.57421875, 15.54541015625, 16.5166015625, 17.48779296875, 18.458984375, 19.43017578125, 20.4013671875, 21.37255859375, 22.34375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 12.0, 23.0, 44.0, 108.0, 253.0, 656.0, 2195.0, 273034.0, 3913385.0, 3248.0, 774.0, 294.0, 121.0, 65.0, 23.0, 19.0, 9.0, 6.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.25, -116.505859375, -112.76171875, -109.017578125, -105.2734375, -101.529296875, -97.78515625, -94.041015625, -90.296875, -86.552734375, -82.80859375, -79.064453125, -75.3203125, -71.576171875, -67.83203125, -64.087890625, -60.34375, -56.599609375, -52.85546875, -49.111328125, -45.3671875, -41.623046875, -37.87890625, -34.134765625, -30.390625, -26.646484375, -22.90234375, -19.158203125, -15.4140625, -11.669921875, -7.92578125, -4.181640625, -0.4375, 3.306640625, 7.05078125, 10.794921875, 14.5390625, 18.283203125, 22.02734375, 25.771484375, 29.515625, 33.259765625, 37.00390625, 40.748046875, 44.4921875, 48.236328125, 51.98046875, 55.724609375, 59.46875, 63.212890625, 66.95703125, 70.701171875, 74.4453125, 78.189453125, 81.93359375, 85.677734375, 89.421875, 93.166015625, 96.91015625, 100.654296875, 104.3984375, 108.142578125, 111.88671875, 115.630859375, 119.375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 7.0, 32.0, 179.0, 451.0, 279.0, 56.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.024173736572266, -23.016115188598633, -19.008056640625, -14.999998092651367, -10.991939544677734, -6.983880996704102, -2.9758224487304688, 1.032236099243164, 5.040294647216797, 9.04835319519043, 13.056411743164062, 17.064470291137695, 21.072528839111328, 25.08058738708496, 29.088645935058594, 33.096702575683594, 37.10476303100586, 41.112823486328125, 45.120880126953125, 49.128936767578125, 53.13699722290039, 57.145057678222656, 61.153114318847656, 65.16117095947266, 69.16923522949219, 73.17729187011719, 77.18534851074219, 81.19341278076172, 85.20146942138672, 89.20952606201172, 93.21759033203125, 97.22564697265625, 101.23368835449219, 105.24174499511719, 109.24980163574219, 113.25786590576172, 117.26592254638672, 121.27397918701172, 125.28204345703125, 129.29010009765625, 133.29815673828125, 137.30621337890625, 141.31427001953125, 145.32232666015625, 149.33038330078125, 153.3384552001953, 157.3465118408203, 161.3545684814453, 165.3626251220703, 169.3706817626953, 173.3787384033203, 177.3867950439453, 181.39486694335938, 185.40292358398438, 189.41098022460938, 193.41903686523438, 197.42709350585938, 201.43515014648438, 205.44320678710938, 209.45126342773438, 213.45932006835938, 217.46739196777344, 221.47544860839844, 225.48350524902344, 229.49156188964844]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 8.0, 7.0, 11.0, 8.0, 16.0, 14.0, 16.0, 32.0, 23.0, 36.0, 30.0, 26.0, 34.0, 48.0, 36.0, 50.0, 37.0, 48.0, 43.0, 28.0, 39.0, 32.0, 37.0, 40.0, 46.0, 32.0, 20.0, 30.0, 21.0, 32.0, 19.0, 15.0, 17.0, 14.0, 11.0, 17.0, 5.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.370094299316406, -49.85137176513672, -48.33264923095703, -46.813926696777344, -45.29520034790039, -43.7764778137207, -42.257755279541016, -40.73903274536133, -39.220306396484375, -37.70158386230469, -36.182861328125, -34.66413879394531, -33.14541244506836, -31.626689910888672, -30.107967376708984, -28.589244842529297, -27.07052230834961, -25.551799774169922, -24.0330753326416, -22.514352798461914, -20.995628356933594, -19.476905822753906, -17.95818328857422, -16.43946075439453, -14.920736312866211, -13.402012825012207, -11.883289337158203, -10.364566802978516, -8.845843315124512, -7.327119827270508, -5.80839729309082, -4.289673805236816, -2.7709503173828125, -1.2522270679473877, 0.2664961814880371, 1.7852191925048828, 3.3039426803588867, 4.822666168212891, 6.341388702392578, 7.860112190246582, 9.378835678100586, 10.89755916595459, 12.416282653808594, 13.935005187988281, 15.453728675842285, 16.97245216369629, 18.491174697875977, 20.009899139404297, 21.528621673583984, 23.047344207763672, 24.566068649291992, 26.08479118347168, 27.603515625, 29.122238159179688, 30.640960693359375, 32.15968322753906, 33.67840576171875, 35.19712829589844, 36.715850830078125, 38.23457336425781, 39.753299713134766, 41.27202224731445, 42.79074478149414, 44.30946731567383, 45.82819366455078]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 8.0, 13.0, 14.0, 16.0, 17.0, 20.0, 20.0, 36.0, 31.0, 38.0, 23.0, 29.0, 42.0, 47.0, 41.0, 54.0, 55.0, 51.0, 52.0, 41.0, 42.0, 40.0, 37.0, 31.0, 31.0, 26.0, 28.0, 28.0, 20.0, 13.0, 9.0, 11.0, 7.0, 10.0, 6.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.6671142578125, -4.513916015625, -4.3607177734375, -4.20751953125, -4.0543212890625, -3.901123046875, -3.7479248046875, -3.5947265625, -3.4415283203125, -3.288330078125, -3.1351318359375, -2.98193359375, -2.8287353515625, -2.675537109375, -2.5223388671875, -2.369140625, -2.2159423828125, -2.062744140625, -1.9095458984375, -1.75634765625, -1.6031494140625, -1.449951171875, -1.2967529296875, -1.1435546875, -0.9903564453125, -0.837158203125, -0.6839599609375, -0.53076171875, -0.3775634765625, -0.224365234375, -0.0711669921875, 0.08203125, 0.2352294921875, 0.388427734375, 0.5416259765625, 0.69482421875, 0.8480224609375, 1.001220703125, 1.1544189453125, 1.3076171875, 1.4608154296875, 1.614013671875, 1.7672119140625, 1.92041015625, 2.0736083984375, 2.226806640625, 2.3800048828125, 2.533203125, 2.6864013671875, 2.839599609375, 2.9927978515625, 3.14599609375, 3.2991943359375, 3.452392578125, 3.6055908203125, 3.7587890625, 3.9119873046875, 4.065185546875, 4.2183837890625, 4.37158203125, 4.5247802734375, 4.677978515625, 4.8311767578125, 4.984375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 13.0, 21.0, 47.0, 46.0, 54.0, 73.0, 122.0, 187.0, 233.0, 362.0, 521.0, 759.0, 1179.0, 1729.0, 2494.0, 3912.0, 6015.0, 9328.0, 14500.0, 23182.0, 36697.0, 60992.0, 111132.0, 298998.0, 230525.0, 97474.0, 55122.0, 33656.0, 20910.0, 13296.0, 8549.0, 5474.0, 3639.0, 2388.0, 1608.0, 993.0, 734.0, 476.0, 343.0, 238.0, 166.0, 92.0, 73.0, 54.0, 40.0, 17.0, 24.0, 18.0, 11.0, 10.0, 8.0, 4.0, 2.0, 3.0, 4.0], "bins": [-0.90869140625, -0.881072998046875, -0.85345458984375, -0.825836181640625, -0.7982177734375, -0.770599365234375, -0.74298095703125, -0.715362548828125, -0.687744140625, -0.660125732421875, -0.63250732421875, -0.604888916015625, -0.5772705078125, -0.549652099609375, -0.52203369140625, -0.494415283203125, -0.466796875, -0.439178466796875, -0.41156005859375, -0.383941650390625, -0.3563232421875, -0.328704833984375, -0.30108642578125, -0.273468017578125, -0.245849609375, -0.218231201171875, -0.19061279296875, -0.162994384765625, -0.1353759765625, -0.107757568359375, -0.08013916015625, -0.052520751953125, -0.02490234375, 0.002716064453125, 0.03033447265625, 0.057952880859375, 0.0855712890625, 0.113189697265625, 0.14080810546875, 0.168426513671875, 0.196044921875, 0.223663330078125, 0.25128173828125, 0.278900146484375, 0.3065185546875, 0.334136962890625, 0.36175537109375, 0.389373779296875, 0.4169921875, 0.444610595703125, 0.47222900390625, 0.499847412109375, 0.5274658203125, 0.555084228515625, 0.58270263671875, 0.610321044921875, 0.637939453125, 0.665557861328125, 0.69317626953125, 0.720794677734375, 0.7484130859375, 0.776031494140625, 0.80364990234375, 0.831268310546875, 0.85888671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 10.0, 6.0, 2.0, 18.0, 20.0, 20.0, 24.0, 26.0, 42.0, 50.0, 41.0, 53.0, 51.0, 58.0, 71.0, 1090.0, 50.0, 58.0, 47.0, 50.0, 57.0, 34.0, 44.0, 22.0, 21.0, 10.0, 15.0, 8.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87890625, -4.753814697265625, -4.62872314453125, -4.503631591796875, -4.3785400390625, -4.253448486328125, -4.12835693359375, -4.003265380859375, -3.878173828125, -3.753082275390625, -3.62799072265625, -3.502899169921875, -3.3778076171875, -3.252716064453125, -3.12762451171875, -3.002532958984375, -2.87744140625, -2.752349853515625, -2.62725830078125, -2.502166748046875, -2.3770751953125, -2.251983642578125, -2.12689208984375, -2.001800537109375, -1.876708984375, -1.751617431640625, -1.62652587890625, -1.501434326171875, -1.3763427734375, -1.251251220703125, -1.12615966796875, -1.001068115234375, -0.8759765625, -0.750885009765625, -0.62579345703125, -0.500701904296875, -0.3756103515625, -0.250518798828125, -0.12542724609375, -0.000335693359375, 0.124755859375, 0.249847412109375, 0.37493896484375, 0.500030517578125, 0.6251220703125, 0.750213623046875, 0.87530517578125, 1.000396728515625, 1.12548828125, 1.250579833984375, 1.37567138671875, 1.500762939453125, 1.6258544921875, 1.750946044921875, 1.87603759765625, 2.001129150390625, 2.126220703125, 2.251312255859375, 2.37640380859375, 2.501495361328125, 2.6265869140625, 2.751678466796875, 2.87677001953125, 3.001861572265625, 3.126953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 11.0, 13.0, 7.0, 24.0, 26.0, 41.0, 62.0, 81.0, 160.0, 273.0, 502.0, 865.0, 1790.0, 3426.0, 6977.0, 14292.0, 31750.0, 75410.0, 226208.0, 1529533.0, 118211.0, 47338.0, 20547.0, 9653.0, 4706.0, 2417.0, 1283.0, 628.0, 367.0, 207.0, 109.0, 73.0, 58.0, 30.0, 15.0, 13.0, 10.0, 3.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.298980712890625, -1.25128173828125, -1.203582763671875, -1.1558837890625, -1.108184814453125, -1.06048583984375, -1.012786865234375, -0.965087890625, -0.917388916015625, -0.86968994140625, -0.821990966796875, -0.7742919921875, -0.726593017578125, -0.67889404296875, -0.631195068359375, -0.58349609375, -0.535797119140625, -0.48809814453125, -0.440399169921875, -0.3927001953125, -0.345001220703125, -0.29730224609375, -0.249603271484375, -0.201904296875, -0.154205322265625, -0.10650634765625, -0.058807373046875, -0.0111083984375, 0.036590576171875, 0.08428955078125, 0.131988525390625, 0.1796875, 0.227386474609375, 0.27508544921875, 0.322784423828125, 0.3704833984375, 0.418182373046875, 0.46588134765625, 0.513580322265625, 0.561279296875, 0.608978271484375, 0.65667724609375, 0.704376220703125, 0.7520751953125, 0.799774169921875, 0.84747314453125, 0.895172119140625, 0.94287109375, 0.990570068359375, 1.03826904296875, 1.085968017578125, 1.1336669921875, 1.181365966796875, 1.22906494140625, 1.276763916015625, 1.324462890625, 1.372161865234375, 1.41986083984375, 1.467559814453125, 1.5152587890625, 1.562957763671875, 1.61065673828125, 1.658355712890625, 1.7060546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 9.0, 12.0, 13.0, 13.0, 16.0, 20.0, 26.0, 26.0, 49.0, 68.0, 56.0, 61.0, 67.0, 55.0, 88.0, 59.0, 59.0, 53.0, 52.0, 34.0, 35.0, 28.0, 17.0, 10.0, 7.0, 8.0, 11.0, 6.0, 5.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0006055831909179688, -0.0005895309150218964, -0.000573478639125824, -0.0005574263632297516, -0.0005413740873336792, -0.0005253218114376068, -0.0005092695355415344, -0.000493217259645462, -0.00047716498374938965, -0.00046111270785331726, -0.0004450604319572449, -0.0004290081560611725, -0.0004129558801651001, -0.0003969036042690277, -0.0003808513283729553, -0.00036479905247688293, -0.00034874677658081055, -0.00033269450068473816, -0.00031664222478866577, -0.0003005899488925934, -0.000284537672996521, -0.0002684853971004486, -0.0002524331212043762, -0.00023638084530830383, -0.00022032856941223145, -0.00020427629351615906, -0.00018822401762008667, -0.00017217174172401428, -0.0001561194658279419, -0.0001400671899318695, -0.00012401491403579712, -0.00010796263813972473, -9.191036224365234e-05, -7.585808634757996e-05, -5.980581045150757e-05, -4.375353455543518e-05, -2.7701258659362793e-05, -1.1648982763290405e-05, 4.403293132781982e-06, 2.045556902885437e-05, 3.650784492492676e-05, 5.2560120820999146e-05, 6.861239671707153e-05, 8.466467261314392e-05, 0.00010071694850921631, 0.0001167692244052887, 0.00013282150030136108, 0.00014887377619743347, 0.00016492605209350586, 0.00018097832798957825, 0.00019703060388565063, 0.00021308287978172302, 0.0002291351556777954, 0.0002451874315738678, 0.0002612397074699402, 0.0002772919833660126, 0.00029334425926208496, 0.00030939653515815735, 0.00032544881105422974, 0.0003415010869503021, 0.0003575533628463745, 0.0003736056387424469, 0.0003896579146385193, 0.0004057101905345917, 0.00042176246643066406]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 15.0, 13.0, 20.0, 26.0, 36.0, 52.0, 54.0, 89.0, 110.0, 166.0, 217.0, 364.0, 528.0, 1114.0, 1033693.0, 9894.0, 751.0, 445.0, 275.0, 185.0, 119.0, 100.0, 57.0, 49.0, 33.0, 29.0, 32.0, 15.0, 16.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00904083251953125, -0.008714914321899414, -0.008388996124267578, -0.008063077926635742, -0.007737159729003906, -0.00741124153137207, -0.007085323333740234, -0.0067594051361083984, -0.0064334869384765625, -0.0061075687408447266, -0.005781650543212891, -0.005455732345581055, -0.005129814147949219, -0.004803895950317383, -0.004477977752685547, -0.004152059555053711, -0.003826141357421875, -0.003500223159790039, -0.003174304962158203, -0.002848386764526367, -0.0025224685668945312, -0.0021965503692626953, -0.0018706321716308594, -0.0015447139739990234, -0.0012187957763671875, -0.0008928775787353516, -0.0005669593811035156, -0.0002410411834716797, 8.487701416015625e-05, 0.0004107952117919922, 0.0007367134094238281, 0.001062631607055664, 0.0013885498046875, 0.001714468002319336, 0.002040386199951172, 0.002366304397583008, 0.0026922225952148438, 0.0030181407928466797, 0.0033440589904785156, 0.0036699771881103516, 0.0039958953857421875, 0.0043218135833740234, 0.004647731781005859, 0.004973649978637695, 0.005299568176269531, 0.005625486373901367, 0.005951404571533203, 0.006277322769165039, 0.006603240966796875, 0.006929159164428711, 0.007255077362060547, 0.007580995559692383, 0.007906913757324219, 0.008232831954956055, 0.00855875015258789, 0.008884668350219727, 0.009210586547851562, 0.009536504745483398, 0.009862422943115234, 0.01018834114074707, 0.010514259338378906, 0.010840177536010742, 0.011166095733642578, 0.011492013931274414, 0.01181793212890625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 39.0, 629.0, 329.0, 16.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003586577659007162, -0.0003222472150810063, -0.00028583669336512685, -0.00024942614254541695, -0.00021301560627762228, -0.00017660507000982761, -0.00014019451919011772, -0.00010378399747423828, -6.737344665452838e-05, -3.0962906748754904e-05, 5.447633157018572e-06, 4.1858176700770855e-05, 7.826871296856552e-05, 0.00011467924923636019, 0.0001510898000560701, 0.00018750032177194953, 0.00022391087259165943, 0.0002603214234113693, 0.00029673194512724876, 0.00033314249594695866, 0.00036955304676666856, 0.000405963568482548, 0.0004423741193022579, 0.00047878464101813734, 0.0005151951918378472, 0.0005516057135537267, 0.000588016293477267, 0.0006244268151931465, 0.0006608373369090259, 0.0006972479168325663, 0.0007336584385484457, 0.0007700689602643251, 0.0008064795983955264, 0.0008428901201114058, 0.0008793007000349462, 0.0009157112217508256, 0.0009521217434667051, 0.0009885323233902454, 0.0010249428451061249, 0.0010613533668220043, 0.0010977638885378838, 0.0011341744102537632, 0.0011705849319696426, 0.001206995453685522, 0.0012434060918167233, 0.0012798166135326028, 0.0013162271352484822, 0.0013526376569643617, 0.001389048295095563, 0.0014254588168114424, 0.0014618693385273218, 0.0014982798602432013, 0.0015346904983744025, 0.001571101020090282, 0.0016075115418061614, 0.0016439220635220408, 0.0016803325852379203, 0.0017167431069537997, 0.0017531536286696792, 0.0017895642668008804, 0.0018259747885167599, 0.0018623853102326393, 0.0018987958319485188, 0.0019352063536643982, 0.0019716168753802776]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 9.0, 15.0, 14.0, 9.0, 14.0, 14.0, 22.0, 19.0, 20.0, 26.0, 28.0, 31.0, 31.0, 30.0, 37.0, 56.0, 43.0, 43.0, 32.0, 38.0, 38.0, 36.0, 33.0, 28.0, 27.0, 38.0, 37.0, 37.0, 20.0, 25.0, 20.0, 26.0, 18.0, 18.0, 10.0, 12.0, 6.0, 8.0, 8.0, 10.0, 1.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002365708351135254, -0.00022920966148376465, -0.0002218484878540039, -0.00021448731422424316, -0.00020712614059448242, -0.00019976496696472168, -0.00019240379333496094, -0.0001850426197052002, -0.00017768144607543945, -0.0001703202724456787, -0.00016295909881591797, -0.00015559792518615723, -0.00014823675155639648, -0.00014087557792663574, -0.000133514404296875, -0.00012615323066711426, -0.00011879205703735352, -0.00011143088340759277, -0.00010406970977783203, -9.670853614807129e-05, -8.934736251831055e-05, -8.19861888885498e-05, -7.462501525878906e-05, -6.726384162902832e-05, -5.990266799926758e-05, -5.2541494369506836e-05, -4.5180320739746094e-05, -3.781914710998535e-05, -3.045797348022461e-05, -2.3096799850463867e-05, -1.5735626220703125e-05, -8.374452590942383e-06, -1.0132789611816406e-06, 6.3478946685791016e-06, 1.3709068298339844e-05, 2.1070241928100586e-05, 2.8431415557861328e-05, 3.579258918762207e-05, 4.315376281738281e-05, 5.0514936447143555e-05, 5.78761100769043e-05, 6.523728370666504e-05, 7.259845733642578e-05, 7.995963096618652e-05, 8.732080459594727e-05, 9.468197822570801e-05, 0.00010204315185546875, 0.00010940432548522949, 0.00011676549911499023, 0.00012412667274475098, 0.00013148784637451172, 0.00013884902000427246, 0.0001462101936340332, 0.00015357136726379395, 0.0001609325408935547, 0.00016829371452331543, 0.00017565488815307617, 0.00018301606178283691, 0.00019037723541259766, 0.0001977384090423584, 0.00020509958267211914, 0.00021246075630187988, 0.00021982192993164062, 0.00022718310356140137, 0.0002345442771911621]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 8.0, 13.0, 14.0, 16.0, 17.0, 20.0, 20.0, 36.0, 31.0, 38.0, 23.0, 29.0, 42.0, 47.0, 41.0, 54.0, 55.0, 51.0, 52.0, 41.0, 42.0, 40.0, 37.0, 31.0, 31.0, 26.0, 28.0, 28.0, 20.0, 13.0, 9.0, 11.0, 7.0, 10.0, 6.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.6671142578125, -4.513916015625, -4.3607177734375, -4.20751953125, -4.0543212890625, -3.901123046875, -3.7479248046875, -3.5947265625, -3.4415283203125, -3.288330078125, -3.1351318359375, -2.98193359375, -2.8287353515625, -2.675537109375, -2.5223388671875, -2.369140625, -2.2159423828125, -2.062744140625, -1.9095458984375, -1.75634765625, -1.6031494140625, -1.449951171875, -1.2967529296875, -1.1435546875, -0.9903564453125, -0.837158203125, -0.6839599609375, -0.53076171875, -0.3775634765625, -0.224365234375, -0.0711669921875, 0.08203125, 0.2352294921875, 0.388427734375, 0.5416259765625, 0.69482421875, 0.8480224609375, 1.001220703125, 1.1544189453125, 1.3076171875, 1.4608154296875, 1.614013671875, 1.7672119140625, 1.92041015625, 2.0736083984375, 2.226806640625, 2.3800048828125, 2.533203125, 2.6864013671875, 2.839599609375, 2.9927978515625, 3.14599609375, 3.2991943359375, 3.452392578125, 3.6055908203125, 3.7587890625, 3.9119873046875, 4.065185546875, 4.2183837890625, 4.37158203125, 4.5247802734375, 4.677978515625, 4.8311767578125, 4.984375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 13.0, 18.0, 26.0, 16.0, 42.0, 50.0, 75.0, 87.0, 127.0, 220.0, 254.0, 393.0, 498.0, 765.0, 1102.0, 1563.0, 2376.0, 3729.0, 6575.0, 14595.0, 81940.0, 869993.0, 37759.0, 10831.0, 5452.0, 3287.0, 2033.0, 1440.0, 975.0, 683.0, 448.0, 324.0, 231.0, 190.0, 124.0, 84.0, 63.0, 47.0, 33.0, 23.0, 21.0, 23.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.40380859375, -31.3701171875, -30.33642578125, -29.302734375, -28.26904296875, -27.2353515625, -26.20166015625, -25.16796875, -24.13427734375, -23.1005859375, -22.06689453125, -21.033203125, -19.99951171875, -18.9658203125, -17.93212890625, -16.8984375, -15.86474609375, -14.8310546875, -13.79736328125, -12.763671875, -11.72998046875, -10.6962890625, -9.66259765625, -8.62890625, -7.59521484375, -6.5615234375, -5.52783203125, -4.494140625, -3.46044921875, -2.4267578125, -1.39306640625, -0.359375, 0.67431640625, 1.7080078125, 2.74169921875, 3.775390625, 4.80908203125, 5.8427734375, 6.87646484375, 7.91015625, 8.94384765625, 9.9775390625, 11.01123046875, 12.044921875, 13.07861328125, 14.1123046875, 15.14599609375, 16.1796875, 17.21337890625, 18.2470703125, 19.28076171875, 20.314453125, 21.34814453125, 22.3818359375, 23.41552734375, 24.44921875, 25.48291015625, 26.5166015625, 27.55029296875, 28.583984375, 29.61767578125, 30.6513671875, 31.68505859375, 32.71875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 9.0, 15.0, 13.0, 20.0, 19.0, 29.0, 35.0, 31.0, 43.0, 38.0, 50.0, 53.0, 75.0, 218.0, 1676.0, 233.0, 86.0, 33.0, 42.0, 41.0, 45.0, 48.0, 26.0, 32.0, 18.0, 22.0, 14.0, 16.0, 9.0, 12.0, 9.0, 6.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.296875, -15.824462890625, -15.35205078125, -14.879638671875, -14.4072265625, -13.934814453125, -13.46240234375, -12.989990234375, -12.517578125, -12.045166015625, -11.57275390625, -11.100341796875, -10.6279296875, -10.155517578125, -9.68310546875, -9.210693359375, -8.73828125, -8.265869140625, -7.79345703125, -7.321044921875, -6.8486328125, -6.376220703125, -5.90380859375, -5.431396484375, -4.958984375, -4.486572265625, -4.01416015625, -3.541748046875, -3.0693359375, -2.596923828125, -2.12451171875, -1.652099609375, -1.1796875, -0.707275390625, -0.23486328125, 0.237548828125, 0.7099609375, 1.182373046875, 1.65478515625, 2.127197265625, 2.599609375, 3.072021484375, 3.54443359375, 4.016845703125, 4.4892578125, 4.961669921875, 5.43408203125, 5.906494140625, 6.37890625, 6.851318359375, 7.32373046875, 7.796142578125, 8.2685546875, 8.740966796875, 9.21337890625, 9.685791015625, 10.158203125, 10.630615234375, 11.10302734375, 11.575439453125, 12.0478515625, 12.520263671875, 12.99267578125, 13.465087890625, 13.9375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 12.0, 14.0, 18.0, 17.0, 23.0, 26.0, 26.0, 35.0, 70.0, 45.0, 67.0, 208.0, 665.0, 11242.0, 3129852.0, 2477.0, 384.0, 154.0, 71.0, 45.0, 49.0, 31.0, 25.0, 19.0, 28.0, 18.0, 15.0, 10.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.34375, -61.18603515625, -59.0283203125, -56.87060546875, -54.712890625, -52.55517578125, -50.3974609375, -48.23974609375, -46.08203125, -43.92431640625, -41.7666015625, -39.60888671875, -37.451171875, -35.29345703125, -33.1357421875, -30.97802734375, -28.8203125, -26.66259765625, -24.5048828125, -22.34716796875, -20.189453125, -18.03173828125, -15.8740234375, -13.71630859375, -11.55859375, -9.40087890625, -7.2431640625, -5.08544921875, -2.927734375, -0.77001953125, 1.3876953125, 3.54541015625, 5.703125, 7.86083984375, 10.0185546875, 12.17626953125, 14.333984375, 16.49169921875, 18.6494140625, 20.80712890625, 22.96484375, 25.12255859375, 27.2802734375, 29.43798828125, 31.595703125, 33.75341796875, 35.9111328125, 38.06884765625, 40.2265625, 42.38427734375, 44.5419921875, 46.69970703125, 48.857421875, 51.01513671875, 53.1728515625, 55.33056640625, 57.48828125, 59.64599609375, 61.8037109375, 63.96142578125, 66.119140625, 68.27685546875, 70.4345703125, 72.59228515625, 74.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [3.0, 373.0, 638.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.880212783813477, -4.562034606933594, -0.24385643005371094, 4.074321746826172, 8.392499923706055, 12.710678100585938, 17.02885627746582, 21.347034454345703, 25.665212631225586, 29.98339080810547, 34.30156707763672, 38.619747161865234, 42.93792724609375, 47.256103515625, 51.57427978515625, 55.892459869384766, 60.21063995361328, 64.52881622314453, 68.84700012207031, 73.16517639160156, 77.48335266113281, 81.80152893066406, 86.11970520019531, 90.4378890991211, 94.75606536865234, 99.0742416381836, 103.39242553710938, 107.71060180664062, 112.02877807617188, 116.34695434570312, 120.66513061523438, 124.98331451416016, 129.30148315429688, 133.61965942382812, 137.93783569335938, 142.25601196289062, 146.57418823242188, 150.8923797607422, 155.21055603027344, 159.5287322998047, 163.84690856933594, 168.1650848388672, 172.48326110839844, 176.8014373779297, 181.11962890625, 185.43780517578125, 189.7559814453125, 194.07415771484375, 198.392333984375, 202.71051025390625, 207.0286865234375, 211.34686279296875, 215.6650390625, 219.9832305908203, 224.30140686035156, 228.6195831298828, 232.93775939941406, 237.2559356689453, 241.57411193847656, 245.8922882080078, 250.21047973632812, 254.52865600585938, 258.8468322753906, 263.1650085449219, 267.4831848144531]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 11.0, 6.0, 13.0, 11.0, 12.0, 11.0, 16.0, 15.0, 16.0, 29.0, 17.0, 32.0, 19.0, 37.0, 42.0, 43.0, 51.0, 35.0, 33.0, 34.0, 50.0, 41.0, 47.0, 43.0, 38.0, 36.0, 29.0, 31.0, 33.0, 25.0, 24.0, 8.0, 19.0, 17.0, 13.0, 11.0, 5.0, 8.0, 5.0, 9.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-38.19447708129883, -36.93724822998047, -35.680023193359375, -34.422794342041016, -33.16556930541992, -31.908340454101562, -30.651113510131836, -29.39388656616211, -28.136659622192383, -26.879432678222656, -25.62220573425293, -24.364978790283203, -23.107749938964844, -21.85052490234375, -20.59329605102539, -19.336069107055664, -18.078842163085938, -16.82161521911621, -15.564388275146484, -14.307160377502441, -13.049933433532715, -11.792706489562988, -10.535478591918945, -9.278251647949219, -8.021024703979492, -6.763797760009766, -5.506570339202881, -4.249342918395996, -2.9921159744262695, -1.734889030456543, -0.4776616096496582, 0.7795658111572266, 2.036792755126953, 3.294019937515259, 4.5512471199035645, 5.808474540710449, 7.065701484680176, 8.322928428649902, 9.580156326293945, 10.837383270263672, 12.094610214233398, 13.351837158203125, 14.609064102172852, 15.866291999816895, 17.123519897460938, 18.38074493408203, 19.63797378540039, 20.895200729370117, 22.152427673339844, 23.40965461730957, 24.666881561279297, 25.924108505249023, 27.18133544921875, 28.43856430053711, 29.695791244506836, 30.953018188476562, 32.210243225097656, 33.467472076416016, 34.72469711303711, 35.98192596435547, 37.23915100097656, 38.49637985229492, 39.753604888916016, 41.010833740234375, 42.268062591552734]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 13.0, 16.0, 14.0, 20.0, 16.0, 22.0, 27.0, 27.0, 31.0, 28.0, 31.0, 30.0, 38.0, 52.0, 49.0, 49.0, 47.0, 47.0, 50.0, 46.0, 39.0, 49.0, 33.0, 28.0, 30.0, 26.0, 20.0, 29.0, 21.0, 12.0, 11.0, 10.0, 10.0, 9.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.912841796875, -4.75537109375, -4.597900390625, -4.4404296875, -4.282958984375, -4.12548828125, -3.968017578125, -3.810546875, -3.653076171875, -3.49560546875, -3.338134765625, -3.1806640625, -3.023193359375, -2.86572265625, -2.708251953125, -2.55078125, -2.393310546875, -2.23583984375, -2.078369140625, -1.9208984375, -1.763427734375, -1.60595703125, -1.448486328125, -1.291015625, -1.133544921875, -0.97607421875, -0.818603515625, -0.6611328125, -0.503662109375, -0.34619140625, -0.188720703125, -0.03125, 0.126220703125, 0.28369140625, 0.441162109375, 0.5986328125, 0.756103515625, 0.91357421875, 1.071044921875, 1.228515625, 1.385986328125, 1.54345703125, 1.700927734375, 1.8583984375, 2.015869140625, 2.17333984375, 2.330810546875, 2.48828125, 2.645751953125, 2.80322265625, 2.960693359375, 3.1181640625, 3.275634765625, 3.43310546875, 3.590576171875, 3.748046875, 3.905517578125, 4.06298828125, 4.220458984375, 4.3779296875, 4.535400390625, 4.69287109375, 4.850341796875, 5.0078125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 4.0, 7.0, 7.0, 12.0, 10.0, 16.0, 31.0, 42.0, 52.0, 69.0, 121.0, 168.0, 324.0, 530.0, 989.0, 1956.0, 4100.0, 9431.0, 25377.0, 130955.0, 3583564.0, 377191.0, 36775.0, 12194.0, 5151.0, 2397.0, 1208.0, 606.0, 350.0, 214.0, 123.0, 101.0, 55.0, 45.0, 22.0, 15.0, 12.0, 14.0, 16.0, 5.0, 4.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.171875, -28.219970703125, -27.26806640625, -26.316162109375, -25.3642578125, -24.412353515625, -23.46044921875, -22.508544921875, -21.556640625, -20.604736328125, -19.65283203125, -18.700927734375, -17.7490234375, -16.797119140625, -15.84521484375, -14.893310546875, -13.94140625, -12.989501953125, -12.03759765625, -11.085693359375, -10.1337890625, -9.181884765625, -8.22998046875, -7.278076171875, -6.326171875, -5.374267578125, -4.42236328125, -3.470458984375, -2.5185546875, -1.566650390625, -0.61474609375, 0.337158203125, 1.2890625, 2.240966796875, 3.19287109375, 4.144775390625, 5.0966796875, 6.048583984375, 7.00048828125, 7.952392578125, 8.904296875, 9.856201171875, 10.80810546875, 11.760009765625, 12.7119140625, 13.663818359375, 14.61572265625, 15.567626953125, 16.51953125, 17.471435546875, 18.42333984375, 19.375244140625, 20.3271484375, 21.279052734375, 22.23095703125, 23.182861328125, 24.134765625, 25.086669921875, 26.03857421875, 26.990478515625, 27.9423828125, 28.894287109375, 29.84619140625, 30.798095703125, 31.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 7.0, 17.0, 16.0, 24.0, 39.0, 42.0, 63.0, 104.0, 160.0, 281.0, 481.0, 821.0, 769.0, 460.0, 280.0, 168.0, 107.0, 76.0, 41.0, 34.0, 28.0, 16.0, 13.0, 6.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.484375, -24.539306640625, -23.59423828125, -22.649169921875, -21.7041015625, -20.759033203125, -19.81396484375, -18.868896484375, -17.923828125, -16.978759765625, -16.03369140625, -15.088623046875, -14.1435546875, -13.198486328125, -12.25341796875, -11.308349609375, -10.36328125, -9.418212890625, -8.47314453125, -7.528076171875, -6.5830078125, -5.637939453125, -4.69287109375, -3.747802734375, -2.802734375, -1.857666015625, -0.91259765625, 0.032470703125, 0.9775390625, 1.922607421875, 2.86767578125, 3.812744140625, 4.7578125, 5.702880859375, 6.64794921875, 7.593017578125, 8.5380859375, 9.483154296875, 10.42822265625, 11.373291015625, 12.318359375, 13.263427734375, 14.20849609375, 15.153564453125, 16.0986328125, 17.043701171875, 17.98876953125, 18.933837890625, 19.87890625, 20.823974609375, 21.76904296875, 22.714111328125, 23.6591796875, 24.604248046875, 25.54931640625, 26.494384765625, 27.439453125, 28.384521484375, 29.32958984375, 30.274658203125, 31.2197265625, 32.164794921875, 33.10986328125, 34.054931640625, 35.0]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 11.0, 12.0, 16.0, 14.0, 33.0, 54.0, 88.0, 121.0, 183.0, 351.0, 805.0, 430359.0, 3760436.0, 911.0, 368.0, 194.0, 109.0, 78.0, 42.0, 32.0, 16.0, 25.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.375, -186.34765625, -181.3203125, -176.29296875, -171.265625, -166.23828125, -161.2109375, -156.18359375, -151.15625, -146.12890625, -141.1015625, -136.07421875, -131.046875, -126.01953125, -120.9921875, -115.96484375, -110.9375, -105.91015625, -100.8828125, -95.85546875, -90.828125, -85.80078125, -80.7734375, -75.74609375, -70.71875, -65.69140625, -60.6640625, -55.63671875, -50.609375, -45.58203125, -40.5546875, -35.52734375, -30.5, -25.47265625, -20.4453125, -15.41796875, -10.390625, -5.36328125, -0.3359375, 4.69140625, 9.71875, 14.74609375, 19.7734375, 24.80078125, 29.828125, 34.85546875, 39.8828125, 44.91015625, 49.9375, 54.96484375, 59.9921875, 65.01953125, 70.046875, 75.07421875, 80.1015625, 85.12890625, 90.15625, 95.18359375, 100.2109375, 105.23828125, 110.265625, 115.29296875, 120.3203125, 125.34765625, 130.375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 12.0, 17.0, 70.0, 126.0, 183.0, 197.0, 187.0, 120.0, 58.0, 23.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-88.92253112792969, -87.16098022460938, -85.39942169189453, -83.63787078857422, -81.87631225585938, -80.11476135253906, -78.35321044921875, -76.5916519165039, -74.8301010131836, -73.06855010986328, -71.30699157714844, -69.54544067382812, -67.78388977050781, -66.02233123779297, -64.26078033447266, -62.49922561645508, -60.7376708984375, -58.97611618041992, -57.214561462402344, -55.45301055908203, -53.69145584106445, -51.929901123046875, -50.16835021972656, -48.406795501708984, -46.645240783691406, -44.88368606567383, -43.12213134765625, -41.36058044433594, -39.59902572631836, -37.83747100830078, -36.07592010498047, -34.31436538696289, -32.55281448364258, -30.791259765625, -29.029706954956055, -27.26815414428711, -25.50659942626953, -23.745044708251953, -21.983491897583008, -20.221939086914062, -18.460384368896484, -16.698829650878906, -14.937276840209961, -13.1757230758667, -11.414169311523438, -9.652615547180176, -7.891061782836914, -6.129508018493652, -4.367954254150391, -2.606400489807129, -0.8448467254638672, 0.9167070388793945, 2.6782608032226562, 4.439814567565918, 6.20136833190918, 7.962922096252441, 9.724475860595703, 11.486029624938965, 13.247583389282227, 15.009137153625488, 16.77069091796875, 18.532245635986328, 20.293798446655273, 22.05535125732422, 23.816905975341797]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 3.0, 5.0, 7.0, 6.0, 11.0, 7.0, 14.0, 13.0, 26.0, 17.0, 21.0, 16.0, 18.0, 34.0, 38.0, 34.0, 40.0, 41.0, 31.0, 31.0, 41.0, 50.0, 42.0, 42.0, 45.0, 32.0, 39.0, 22.0, 33.0, 30.0, 30.0, 24.0, 27.0, 13.0, 20.0, 14.0, 11.0, 11.0, 12.0, 12.0, 8.0, 3.0, 1.0, 5.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.28947067260742, -60.07530975341797, -57.86115264892578, -55.64699172973633, -53.43283462524414, -51.21867370605469, -49.0045166015625, -46.79035568237305, -44.576194763183594, -42.36203384399414, -40.14787673950195, -37.9337158203125, -35.71955871582031, -33.50539779663086, -31.29123878479004, -29.07707977294922, -26.86292266845703, -24.64876365661621, -22.43460464477539, -20.220443725585938, -18.00628662109375, -15.792126655578613, -13.577966690063477, -11.363807678222656, -9.149648666381836, -6.935489654541016, -4.721330165863037, -2.5071706771850586, -0.2930116653442383, 1.921147346496582, 4.135307312011719, 6.349466323852539, 8.563629150390625, 10.777788162231445, 12.991947174072266, 15.206107139587402, 17.420265197753906, 19.63442611694336, 21.84858512878418, 24.062744140625, 26.27690315246582, 28.49106216430664, 30.70522117614746, 32.91938018798828, 35.133541107177734, 37.34769821166992, 39.561859130859375, 41.77601623535156, 43.990177154541016, 46.20433807373047, 48.418495178222656, 50.63265609741211, 52.8468132019043, 55.06097412109375, 57.27513122558594, 59.48929214477539, 61.703453063964844, 63.9176139831543, 66.13177490234375, 68.34593200683594, 70.56008911132812, 72.77424621582031, 74.98841094970703, 77.20256805419922, 79.4167251586914]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 16.0, 13.0, 15.0, 14.0, 18.0, 15.0, 27.0, 32.0, 33.0, 25.0, 32.0, 42.0, 29.0, 48.0, 46.0, 43.0, 54.0, 54.0, 50.0, 36.0, 43.0, 37.0, 28.0, 32.0, 26.0, 36.0, 25.0, 23.0, 15.0, 14.0, 14.0, 11.0, 4.0, 5.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4781494140625, -4.323486328125, -4.1688232421875, -4.01416015625, -3.8594970703125, -3.704833984375, -3.5501708984375, -3.3955078125, -3.2408447265625, -3.086181640625, -2.9315185546875, -2.77685546875, -2.6221923828125, -2.467529296875, -2.3128662109375, -2.158203125, -2.0035400390625, -1.848876953125, -1.6942138671875, -1.53955078125, -1.3848876953125, -1.230224609375, -1.0755615234375, -0.9208984375, -0.7662353515625, -0.611572265625, -0.4569091796875, -0.30224609375, -0.1475830078125, 0.007080078125, 0.1617431640625, 0.31640625, 0.4710693359375, 0.625732421875, 0.7803955078125, 0.93505859375, 1.0897216796875, 1.244384765625, 1.3990478515625, 1.5537109375, 1.7083740234375, 1.863037109375, 2.0177001953125, 2.17236328125, 2.3270263671875, 2.481689453125, 2.6363525390625, 2.791015625, 2.9456787109375, 3.100341796875, 3.2550048828125, 3.40966796875, 3.5643310546875, 3.718994140625, 3.8736572265625, 4.0283203125, 4.1829833984375, 4.337646484375, 4.4923095703125, 4.64697265625, 4.8016357421875, 4.956298828125, 5.1109619140625, 5.265625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 7.0, 2.0, 2.0, 9.0, 10.0, 21.0, 27.0, 52.0, 65.0, 78.0, 121.0, 188.0, 287.0, 395.0, 609.0, 902.0, 1264.0, 2040.0, 2972.0, 4534.0, 6944.0, 10692.0, 16588.0, 25903.0, 41150.0, 66786.0, 119940.0, 308699.0, 196966.0, 92131.0, 54074.0, 33825.0, 21374.0, 13703.0, 9017.0, 5747.0, 3832.0, 2466.0, 1628.0, 1115.0, 812.0, 520.0, 334.0, 210.0, 172.0, 116.0, 72.0, 52.0, 33.0, 21.0, 19.0, 20.0, 11.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.90673828125, -0.877288818359375, -0.84783935546875, -0.818389892578125, -0.7889404296875, -0.759490966796875, -0.73004150390625, -0.700592041015625, -0.671142578125, -0.641693115234375, -0.61224365234375, -0.582794189453125, -0.5533447265625, -0.523895263671875, -0.49444580078125, -0.464996337890625, -0.435546875, -0.406097412109375, -0.37664794921875, -0.347198486328125, -0.3177490234375, -0.288299560546875, -0.25885009765625, -0.229400634765625, -0.199951171875, -0.170501708984375, -0.14105224609375, -0.111602783203125, -0.0821533203125, -0.052703857421875, -0.02325439453125, 0.006195068359375, 0.03564453125, 0.065093994140625, 0.09454345703125, 0.123992919921875, 0.1534423828125, 0.182891845703125, 0.21234130859375, 0.241790771484375, 0.271240234375, 0.300689697265625, 0.33013916015625, 0.359588623046875, 0.3890380859375, 0.418487548828125, 0.44793701171875, 0.477386474609375, 0.5068359375, 0.536285400390625, 0.56573486328125, 0.595184326171875, 0.6246337890625, 0.654083251953125, 0.68353271484375, 0.712982177734375, 0.742431640625, 0.771881103515625, 0.80133056640625, 0.830780029296875, 0.8602294921875, 0.889678955078125, 0.91912841796875, 0.948577880859375, 0.97802734375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 8.0, 7.0, 3.0, 1.0, 6.0, 5.0, 7.0, 16.0, 14.0, 12.0, 11.0, 17.0, 15.0, 30.0, 22.0, 21.0, 35.0, 30.0, 34.0, 34.0, 48.0, 32.0, 40.0, 40.0, 1062.0, 34.0, 44.0, 46.0, 35.0, 40.0, 26.0, 28.0, 28.0, 29.0, 31.0, 25.0, 19.0, 15.0, 14.0, 11.0, 9.0, 12.0, 7.0, 4.0, 8.0, 7.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.52734375, -2.437896728515625, -2.34844970703125, -2.259002685546875, -2.1695556640625, -2.080108642578125, -1.99066162109375, -1.901214599609375, -1.811767578125, -1.722320556640625, -1.63287353515625, -1.543426513671875, -1.4539794921875, -1.364532470703125, -1.27508544921875, -1.185638427734375, -1.09619140625, -1.006744384765625, -0.91729736328125, -0.827850341796875, -0.7384033203125, -0.648956298828125, -0.55950927734375, -0.470062255859375, -0.380615234375, -0.291168212890625, -0.20172119140625, -0.112274169921875, -0.0228271484375, 0.066619873046875, 0.15606689453125, 0.245513916015625, 0.3349609375, 0.424407958984375, 0.51385498046875, 0.603302001953125, 0.6927490234375, 0.782196044921875, 0.87164306640625, 0.961090087890625, 1.050537109375, 1.139984130859375, 1.22943115234375, 1.318878173828125, 1.4083251953125, 1.497772216796875, 1.58721923828125, 1.676666259765625, 1.76611328125, 1.855560302734375, 1.94500732421875, 2.034454345703125, 2.1239013671875, 2.213348388671875, 2.30279541015625, 2.392242431640625, 2.481689453125, 2.571136474609375, 2.66058349609375, 2.750030517578125, 2.8394775390625, 2.928924560546875, 3.01837158203125, 3.107818603515625, 3.197265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 12.0, 22.0, 19.0, 30.0, 57.0, 96.0, 138.0, 183.0, 266.0, 412.0, 680.0, 1012.0, 1484.0, 2338.0, 3804.0, 5738.0, 8903.0, 14315.0, 23246.0, 38402.0, 68383.0, 139101.0, 1418636.0, 176242.0, 79068.0, 44006.0, 26187.0, 16161.0, 10088.0, 6329.0, 4169.0, 2717.0, 1632.0, 1089.0, 731.0, 469.0, 312.0, 188.0, 124.0, 111.0, 78.0, 50.0, 29.0, 14.0, 15.0, 13.0, 11.0, 2.0, 4.0, 3.0, 3.0], "bins": [-1.1142578125, -1.082977294921875, -1.05169677734375, -1.020416259765625, -0.9891357421875, -0.957855224609375, -0.92657470703125, -0.895294189453125, -0.864013671875, -0.832733154296875, -0.80145263671875, -0.770172119140625, -0.7388916015625, -0.707611083984375, -0.67633056640625, -0.645050048828125, -0.61376953125, -0.582489013671875, -0.55120849609375, -0.519927978515625, -0.4886474609375, -0.457366943359375, -0.42608642578125, -0.394805908203125, -0.363525390625, -0.332244873046875, -0.30096435546875, -0.269683837890625, -0.2384033203125, -0.207122802734375, -0.17584228515625, -0.144561767578125, -0.11328125, -0.082000732421875, -0.05072021484375, -0.019439697265625, 0.0118408203125, 0.043121337890625, 0.07440185546875, 0.105682373046875, 0.136962890625, 0.168243408203125, 0.19952392578125, 0.230804443359375, 0.2620849609375, 0.293365478515625, 0.32464599609375, 0.355926513671875, 0.38720703125, 0.418487548828125, 0.44976806640625, 0.481048583984375, 0.5123291015625, 0.543609619140625, 0.57489013671875, 0.606170654296875, 0.637451171875, 0.668731689453125, 0.70001220703125, 0.731292724609375, 0.7625732421875, 0.793853759765625, 0.82513427734375, 0.856414794921875, 0.8876953125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 4.0, 10.0, 13.0, 11.0, 24.0, 33.0, 38.0, 48.0, 59.0, 73.0, 67.0, 80.0, 93.0, 97.0, 66.0, 60.0, 48.0, 35.0, 30.0, 14.0, 14.0, 15.0, 12.0, 5.0, 10.0, 4.0, 2.0, 2.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007071495056152344, -0.0006811767816543579, -0.0006552040576934814, -0.000629231333732605, -0.0006032586097717285, -0.000577285885810852, -0.0005513131618499756, -0.0005253404378890991, -0.0004993677139282227, -0.0004733949899673462, -0.0004474222660064697, -0.00042144954204559326, -0.0003954768180847168, -0.00036950409412384033, -0.00034353137016296387, -0.0003175586462020874, -0.00029158592224121094, -0.00026561319828033447, -0.000239640474319458, -0.00021366775035858154, -0.00018769502639770508, -0.0001617223024368286, -0.00013574957847595215, -0.00010977685451507568, -8.380413055419922e-05, -5.7831406593322754e-05, -3.185868263244629e-05, -5.885958671569824e-06, 2.008676528930664e-05, 4.6059489250183105e-05, 7.203221321105957e-05, 9.800493717193604e-05, 0.0001239776611328125, 0.00014995038509368896, 0.00017592310905456543, 0.0002018958330154419, 0.00022786855697631836, 0.0002538412809371948, 0.0002798140048980713, 0.00030578672885894775, 0.0003317594528198242, 0.0003577321767807007, 0.00038370490074157715, 0.0004096776247024536, 0.0004356503486633301, 0.00046162307262420654, 0.000487595796585083, 0.0005135685205459595, 0.0005395412445068359, 0.0005655139684677124, 0.0005914866924285889, 0.0006174594163894653, 0.0006434321403503418, 0.0006694048643112183, 0.0006953775882720947, 0.0007213503122329712, 0.0007473230361938477, 0.0007732957601547241, 0.0007992684841156006, 0.000825241208076477, 0.0008512139320373535, 0.00087718665599823, 0.0009031593799591064, 0.0009291321039199829, 0.0009551048278808594]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 3.0, 4.0, 11.0, 12.0, 18.0, 16.0, 19.0, 47.0, 74.0, 124.0, 215.0, 430.0, 2696.0, 1043215.0, 917.0, 285.0, 158.0, 84.0, 65.0, 58.0, 24.0, 20.0, 16.0, 5.0, 6.0, 6.0, 6.0, 5.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0263671875, -0.025659561157226562, -0.024951934814453125, -0.024244308471679688, -0.02353668212890625, -0.022829055786132812, -0.022121429443359375, -0.021413803100585938, -0.0207061767578125, -0.019998550415039062, -0.019290924072265625, -0.018583297729492188, -0.01787567138671875, -0.017168045043945312, -0.016460418701171875, -0.015752792358398438, -0.015045166015625, -0.014337539672851562, -0.013629913330078125, -0.012922286987304688, -0.01221466064453125, -0.011507034301757812, -0.010799407958984375, -0.010091781616210938, -0.0093841552734375, -0.008676528930664062, -0.007968902587890625, -0.0072612762451171875, -0.00655364990234375, -0.0058460235595703125, -0.005138397216796875, -0.0044307708740234375, -0.00372314453125, -0.0030155181884765625, -0.002307891845703125, -0.0016002655029296875, -0.00089263916015625, -0.0001850128173828125, 0.000522613525390625, 0.0012302398681640625, 0.0019378662109375, 0.0026454925537109375, 0.003353118896484375, 0.0040607452392578125, 0.00476837158203125, 0.0054759979248046875, 0.006183624267578125, 0.0068912506103515625, 0.007598876953125, 0.008306503295898438, 0.009014129638671875, 0.009721755981445312, 0.01042938232421875, 0.011137008666992188, 0.011844635009765625, 0.012552261352539062, 0.0132598876953125, 0.013967514038085938, 0.014675140380859375, 0.015382766723632812, 0.01609039306640625, 0.016798019409179688, 0.017505645751953125, 0.018213272094726562, 0.0189208984375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 62.0, 898.0, 54.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0038358247838914394, -0.0037702531553804874, -0.003704681294038892, -0.00363910966552794, -0.003573537804186344, -0.003507966175675392, -0.0034423943143337965, -0.0033768226858228445, -0.003311250824481249, -0.003245679195970297, -0.003180107334628701, -0.003114535706117749, -0.0030489638447761536, -0.0029833922162652016, -0.002917820354923606, -0.002852248726412654, -0.0027866768650710583, -0.0027211052365601063, -0.0026555333752185106, -0.0025899617467075586, -0.002524389885365963, -0.002458818256855011, -0.0023932463955134153, -0.0023276747670024633, -0.0022621031384915113, -0.0021965315099805593, -0.0021309596486389637, -0.0020653880201280117, -0.001999816158786416, -0.0019342444138601422, -0.0018686726689338684, -0.0018031010404229164, -0.0017375292954966426, -0.0016719575505703688, -0.001606385805644095, -0.0015408140607178211, -0.0014752423157915473, -0.0014096705708652735, -0.0013440989423543215, -0.0012785270810127258, -0.0012129554525017738, -0.0011473837075755, -0.0010818119626492262, -0.0010162402177229524, -0.0009506684727966785, -0.0008850967278704047, -0.0008195250411517918, -0.000753953296225518, -0.0006883814930915833, -0.0006228097481653094, -0.0005572380032390356, -0.0004916662583127618, -0.0004260945424903184, -0.0003605227975640446, -0.00029495108174160123, -0.0002293793368153274, -0.00016380762099288404, -9.823588334256783e-05, -3.266414569225162e-05, 3.290758468210697e-05, 9.84793296083808e-05, 0.00016405107453465462, 0.00022962279035709798, 0.0002951945352833718, 0.00036076628020964563]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 7.0, 7.0, 8.0, 13.0, 20.0, 13.0, 27.0, 22.0, 30.0, 18.0, 22.0, 32.0, 35.0, 35.0, 32.0, 33.0, 36.0, 35.0, 39.0, 43.0, 52.0, 27.0, 33.0, 28.0, 37.0, 31.0, 32.0, 24.0, 29.0, 32.0, 23.0, 16.0, 19.0, 19.0, 16.0, 11.0, 11.0, 8.0, 9.0, 5.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003237724304199219, -0.0003135325387120247, -0.0003032926470041275, -0.0002930527552962303, -0.00028281286358833313, -0.00027257297188043594, -0.00026233308017253876, -0.00025209318846464157, -0.00024185329675674438, -0.0002316134050488472, -0.00022137351334095, -0.00021113362163305283, -0.00020089372992515564, -0.00019065383821725845, -0.00018041394650936127, -0.00017017405480146408, -0.0001599341630935669, -0.0001496942713856697, -0.00013945437967777252, -0.00012921448796987534, -0.00011897459626197815, -0.00010873470455408096, -9.849481284618378e-05, -8.825492113828659e-05, -7.80150294303894e-05, -6.777513772249222e-05, -5.753524601459503e-05, -4.7295354306697845e-05, -3.705546259880066e-05, -2.6815570890903473e-05, -1.6575679183006287e-05, -6.3357874751091e-06, 3.904104232788086e-06, 1.4143995940685272e-05, 2.438388764858246e-05, 3.4623779356479645e-05, 4.486367106437683e-05, 5.510356277227402e-05, 6.53434544801712e-05, 7.558334618806839e-05, 8.582323789596558e-05, 9.606312960386276e-05, 0.00010630302131175995, 0.00011654291301965714, 0.00012678280472755432, 0.0001370226964354515, 0.0001472625881433487, 0.00015750247985124588, 0.00016774237155914307, 0.00017798226326704025, 0.00018822215497493744, 0.00019846204668283463, 0.0002087019383907318, 0.000218941830098629, 0.00022918172180652618, 0.00023942161351442337, 0.00024966150522232056, 0.00025990139693021774, 0.00027014128863811493, 0.0002803811803460121, 0.0002906210720539093, 0.0003008609637618065, 0.0003111008554697037, 0.00032134074717760086, 0.00033158063888549805]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 16.0, 13.0, 15.0, 14.0, 18.0, 15.0, 27.0, 32.0, 33.0, 25.0, 32.0, 42.0, 29.0, 48.0, 46.0, 43.0, 54.0, 54.0, 50.0, 36.0, 43.0, 37.0, 28.0, 32.0, 26.0, 36.0, 25.0, 23.0, 15.0, 14.0, 14.0, 11.0, 4.0, 5.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4781494140625, -4.323486328125, -4.1688232421875, -4.01416015625, -3.8594970703125, -3.704833984375, -3.5501708984375, -3.3955078125, -3.2408447265625, -3.086181640625, -2.9315185546875, -2.77685546875, -2.6221923828125, -2.467529296875, -2.3128662109375, -2.158203125, -2.0035400390625, -1.848876953125, -1.6942138671875, -1.53955078125, -1.3848876953125, -1.230224609375, -1.0755615234375, -0.9208984375, -0.7662353515625, -0.611572265625, -0.4569091796875, -0.30224609375, -0.1475830078125, 0.007080078125, 0.1617431640625, 0.31640625, 0.4710693359375, 0.625732421875, 0.7803955078125, 0.93505859375, 1.0897216796875, 1.244384765625, 1.3990478515625, 1.5537109375, 1.7083740234375, 1.863037109375, 2.0177001953125, 2.17236328125, 2.3270263671875, 2.481689453125, 2.6363525390625, 2.791015625, 2.9456787109375, 3.100341796875, 3.2550048828125, 3.40966796875, 3.5643310546875, 3.718994140625, 3.8736572265625, 4.0283203125, 4.1829833984375, 4.337646484375, 4.4923095703125, 4.64697265625, 4.8016357421875, 4.956298828125, 5.1109619140625, 5.265625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 11.0, 11.0, 17.0, 19.0, 49.0, 44.0, 54.0, 83.0, 115.0, 182.0, 259.0, 396.0, 597.0, 1001.0, 2050.0, 4349.0, 10769.0, 31768.0, 116817.0, 473789.0, 300505.0, 69513.0, 21136.0, 7723.0, 3249.0, 1566.0, 900.0, 504.0, 325.0, 232.0, 144.0, 110.0, 80.0, 49.0, 32.0, 27.0, 22.0, 15.0, 11.0, 8.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.57318115234375, -4.4197998046875, -4.26641845703125, -4.113037109375, -3.95965576171875, -3.8062744140625, -3.65289306640625, -3.49951171875, -3.34613037109375, -3.1927490234375, -3.03936767578125, -2.885986328125, -2.73260498046875, -2.5792236328125, -2.42584228515625, -2.2724609375, -2.11907958984375, -1.9656982421875, -1.81231689453125, -1.658935546875, -1.50555419921875, -1.3521728515625, -1.19879150390625, -1.04541015625, -0.89202880859375, -0.7386474609375, -0.58526611328125, -0.431884765625, -0.27850341796875, -0.1251220703125, 0.02825927734375, 0.181640625, 0.33502197265625, 0.4884033203125, 0.64178466796875, 0.795166015625, 0.94854736328125, 1.1019287109375, 1.25531005859375, 1.40869140625, 1.56207275390625, 1.7154541015625, 1.86883544921875, 2.022216796875, 2.17559814453125, 2.3289794921875, 2.48236083984375, 2.6357421875, 2.78912353515625, 2.9425048828125, 3.09588623046875, 3.249267578125, 3.40264892578125, 3.5560302734375, 3.70941162109375, 3.86279296875, 4.01617431640625, 4.1695556640625, 4.32293701171875, 4.476318359375, 4.62969970703125, 4.7830810546875, 4.93646240234375, 5.08984375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 6.0, 8.0, 11.0, 16.0, 15.0, 13.0, 23.0, 24.0, 18.0, 37.0, 31.0, 47.0, 27.0, 41.0, 43.0, 51.0, 71.0, 254.0, 1705.0, 109.0, 75.0, 48.0, 40.0, 47.0, 48.0, 37.0, 33.0, 24.0, 23.0, 21.0, 15.0, 14.0, 19.0, 12.0, 7.0, 5.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40625, -12.914306640625, -12.42236328125, -11.930419921875, -11.4384765625, -10.946533203125, -10.45458984375, -9.962646484375, -9.470703125, -8.978759765625, -8.48681640625, -7.994873046875, -7.5029296875, -7.010986328125, -6.51904296875, -6.027099609375, -5.53515625, -5.043212890625, -4.55126953125, -4.059326171875, -3.5673828125, -3.075439453125, -2.58349609375, -2.091552734375, -1.599609375, -1.107666015625, -0.61572265625, -0.123779296875, 0.3681640625, 0.860107421875, 1.35205078125, 1.843994140625, 2.3359375, 2.827880859375, 3.31982421875, 3.811767578125, 4.3037109375, 4.795654296875, 5.28759765625, 5.779541015625, 6.271484375, 6.763427734375, 7.25537109375, 7.747314453125, 8.2392578125, 8.731201171875, 9.22314453125, 9.715087890625, 10.20703125, 10.698974609375, 11.19091796875, 11.682861328125, 12.1748046875, 12.666748046875, 13.15869140625, 13.650634765625, 14.142578125, 14.634521484375, 15.12646484375, 15.618408203125, 16.1103515625, 16.602294921875, 17.09423828125, 17.586181640625, 18.078125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 4.0, 9.0, 5.0, 15.0, 14.0, 18.0, 20.0, 23.0, 21.0, 32.0, 45.0, 57.0, 70.0, 104.0, 181.0, 366.0, 1230.0, 9939.0, 3081126.0, 49052.0, 2111.0, 560.0, 227.0, 98.0, 75.0, 50.0, 54.0, 38.0, 19.0, 29.0, 20.0, 11.0, 18.0, 11.0, 12.0, 10.0, 5.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.59375, -40.45947265625, -39.3251953125, -38.19091796875, -37.056640625, -35.92236328125, -34.7880859375, -33.65380859375, -32.51953125, -31.38525390625, -30.2509765625, -29.11669921875, -27.982421875, -26.84814453125, -25.7138671875, -24.57958984375, -23.4453125, -22.31103515625, -21.1767578125, -20.04248046875, -18.908203125, -17.77392578125, -16.6396484375, -15.50537109375, -14.37109375, -13.23681640625, -12.1025390625, -10.96826171875, -9.833984375, -8.69970703125, -7.5654296875, -6.43115234375, -5.296875, -4.16259765625, -3.0283203125, -1.89404296875, -0.759765625, 0.37451171875, 1.5087890625, 2.64306640625, 3.77734375, 4.91162109375, 6.0458984375, 7.18017578125, 8.314453125, 9.44873046875, 10.5830078125, 11.71728515625, 12.8515625, 13.98583984375, 15.1201171875, 16.25439453125, 17.388671875, 18.52294921875, 19.6572265625, 20.79150390625, 21.92578125, 23.06005859375, 24.1943359375, 25.32861328125, 26.462890625, 27.59716796875, 28.7314453125, 29.86572265625, 31.0]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 9.0, 32.0, 68.0, 176.0, 294.0, 253.0, 112.0, 45.0, 17.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.510897636413574, -10.615629196166992, -9.72036075592041, -8.825092315673828, -7.929824352264404, -7.034555912017822, -6.139287948608398, -5.244019508361816, -4.348751068115234, -3.4534826278686523, -2.5582144260406494, -1.6629462242126465, -0.7676777839660645, 0.12759065628051758, 1.0228586196899414, 1.9181270599365234, 2.8133955001831055, 3.7086639404296875, 4.6039323806762695, 5.499200344085693, 6.394468784332275, 7.289737224578857, 8.185005187988281, 9.080273628234863, 9.975542068481445, 10.870810508728027, 11.76607894897461, 12.661346435546875, 13.556615829467773, 14.451883316040039, 15.347151756286621, 16.242420196533203, 17.13768768310547, 18.032955169677734, 18.928224563598633, 19.8234920501709, 20.718761444091797, 21.614028930664062, 22.509296417236328, 23.404565811157227, 24.299835205078125, 25.19510269165039, 26.09037208557129, 26.985639572143555, 27.880908966064453, 28.77617645263672, 29.671443939208984, 30.566713333129883, 31.46198081970215, 32.35725021362305, 33.25251770019531, 34.14778518676758, 35.043052673339844, 35.938323974609375, 36.83359146118164, 37.728858947753906, 38.62412643432617, 39.51939392089844, 40.4146614074707, 41.309932708740234, 42.2052001953125, 43.100467681884766, 43.99573516845703, 44.89100646972656, 45.78627395629883]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 10.0, 11.0, 15.0, 16.0, 17.0, 23.0, 41.0, 32.0, 28.0, 32.0, 39.0, 47.0, 52.0, 39.0, 54.0, 57.0, 43.0, 48.0, 42.0, 33.0, 39.0, 33.0, 39.0, 28.0, 22.0, 20.0, 23.0, 19.0, 16.0, 14.0, 13.0, 10.0, 8.0, 13.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.343387603759766, -54.68840789794922, -53.03342819213867, -51.378448486328125, -49.72346878051758, -48.06848907470703, -46.413509368896484, -44.75852966308594, -43.10354995727539, -41.448570251464844, -39.7935905456543, -38.13861083984375, -36.4836311340332, -34.828651428222656, -33.17367172241211, -31.518692016601562, -29.863712310791016, -28.20873260498047, -26.553752899169922, -24.898773193359375, -23.243793487548828, -21.58881378173828, -19.933834075927734, -18.278854370117188, -16.62387466430664, -14.968894958496094, -13.313915252685547, -11.658935546875, -10.003955841064453, -8.348976135253906, -6.693996429443359, -5.0390167236328125, -3.384033203125, -1.7290534973144531, -0.07407379150390625, 1.5809059143066406, 3.2358856201171875, 4.890865325927734, 6.545845031738281, 8.200824737548828, 9.855804443359375, 11.510784149169922, 13.165763854980469, 14.820743560791016, 16.475723266601562, 18.13070297241211, 19.785682678222656, 21.440662384033203, 23.09564208984375, 24.750621795654297, 26.405601501464844, 28.06058120727539, 29.715560913085938, 31.370540618896484, 33.02552032470703, 34.68050003051758, 36.335479736328125, 37.99045944213867, 39.64543914794922, 41.300418853759766, 42.95539855957031, 44.61037826538086, 46.265357971191406, 47.92033767700195, 49.5753173828125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 9.0, 11.0, 12.0, 16.0, 9.0, 18.0, 19.0, 18.0, 28.0, 25.0, 31.0, 39.0, 24.0, 38.0, 44.0, 48.0, 46.0, 41.0, 58.0, 43.0, 46.0, 39.0, 34.0, 51.0, 26.0, 23.0, 35.0, 34.0, 25.0, 16.0, 18.0, 16.0, 10.0, 8.0, 7.0, 3.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6937255859375, -4.535888671875, -4.3780517578125, -4.22021484375, -4.0623779296875, -3.904541015625, -3.7467041015625, -3.5888671875, -3.4310302734375, -3.273193359375, -3.1153564453125, -2.95751953125, -2.7996826171875, -2.641845703125, -2.4840087890625, -2.326171875, -2.1683349609375, -2.010498046875, -1.8526611328125, -1.69482421875, -1.5369873046875, -1.379150390625, -1.2213134765625, -1.0634765625, -0.9056396484375, -0.747802734375, -0.5899658203125, -0.43212890625, -0.2742919921875, -0.116455078125, 0.0413818359375, 0.19921875, 0.3570556640625, 0.514892578125, 0.6727294921875, 0.83056640625, 0.9884033203125, 1.146240234375, 1.3040771484375, 1.4619140625, 1.6197509765625, 1.777587890625, 1.9354248046875, 2.09326171875, 2.2510986328125, 2.408935546875, 2.5667724609375, 2.724609375, 2.8824462890625, 3.040283203125, 3.1981201171875, 3.35595703125, 3.5137939453125, 3.671630859375, 3.8294677734375, 3.9873046875, 4.1451416015625, 4.302978515625, 4.4608154296875, 4.61865234375, 4.7764892578125, 4.934326171875, 5.0921630859375, 5.25]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 3.0, 14.0, 7.0, 9.0, 19.0, 16.0, 13.0, 36.0, 39.0, 63.0, 55.0, 99.0, 170.0, 273.0, 626.0, 1786.0, 9970.0, 140417.0, 2436292.0, 1520890.0, 74373.0, 6542.0, 1308.0, 534.0, 213.0, 143.0, 89.0, 60.0, 55.0, 40.0, 27.0, 23.0, 14.0, 17.0, 11.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.84375, -13.364501953125, -12.88525390625, -12.406005859375, -11.9267578125, -11.447509765625, -10.96826171875, -10.489013671875, -10.009765625, -9.530517578125, -9.05126953125, -8.572021484375, -8.0927734375, -7.613525390625, -7.13427734375, -6.655029296875, -6.17578125, -5.696533203125, -5.21728515625, -4.738037109375, -4.2587890625, -3.779541015625, -3.30029296875, -2.821044921875, -2.341796875, -1.862548828125, -1.38330078125, -0.904052734375, -0.4248046875, 0.054443359375, 0.53369140625, 1.012939453125, 1.4921875, 1.971435546875, 2.45068359375, 2.929931640625, 3.4091796875, 3.888427734375, 4.36767578125, 4.846923828125, 5.326171875, 5.805419921875, 6.28466796875, 6.763916015625, 7.2431640625, 7.722412109375, 8.20166015625, 8.680908203125, 9.16015625, 9.639404296875, 10.11865234375, 10.597900390625, 11.0771484375, 11.556396484375, 12.03564453125, 12.514892578125, 12.994140625, 13.473388671875, 13.95263671875, 14.431884765625, 14.9111328125, 15.390380859375, 15.86962890625, 16.348876953125, 16.828125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 10.0, 28.0, 44.0, 56.0, 107.0, 156.0, 290.0, 511.0, 937.0, 855.0, 463.0, 247.0, 151.0, 89.0, 55.0, 28.0, 15.0, 13.0, 11.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-43.59375, -42.599609375, -41.60546875, -40.611328125, -39.6171875, -38.623046875, -37.62890625, -36.634765625, -35.640625, -34.646484375, -33.65234375, -32.658203125, -31.6640625, -30.669921875, -29.67578125, -28.681640625, -27.6875, -26.693359375, -25.69921875, -24.705078125, -23.7109375, -22.716796875, -21.72265625, -20.728515625, -19.734375, -18.740234375, -17.74609375, -16.751953125, -15.7578125, -14.763671875, -13.76953125, -12.775390625, -11.78125, -10.787109375, -9.79296875, -8.798828125, -7.8046875, -6.810546875, -5.81640625, -4.822265625, -3.828125, -2.833984375, -1.83984375, -0.845703125, 0.1484375, 1.142578125, 2.13671875, 3.130859375, 4.125, 5.119140625, 6.11328125, 7.107421875, 8.1015625, 9.095703125, 10.08984375, 11.083984375, 12.078125, 13.072265625, 14.06640625, 15.060546875, 16.0546875, 17.048828125, 18.04296875, 19.037109375, 20.03125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 8.0, 13.0, 21.0, 44.0, 68.0, 143.0, 262.0, 526.0, 4532.0, 4183976.0, 3651.0, 521.0, 224.0, 140.0, 73.0, 28.0, 36.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4375, -84.3212890625, -80.205078125, -76.0888671875, -71.97265625, -67.8564453125, -63.740234375, -59.6240234375, -55.5078125, -51.3916015625, -47.275390625, -43.1591796875, -39.04296875, -34.9267578125, -30.810546875, -26.6943359375, -22.578125, -18.4619140625, -14.345703125, -10.2294921875, -6.11328125, -1.9970703125, 2.119140625, 6.2353515625, 10.3515625, 14.4677734375, 18.583984375, 22.7001953125, 26.81640625, 30.9326171875, 35.048828125, 39.1650390625, 43.28125, 47.3974609375, 51.513671875, 55.6298828125, 59.74609375, 63.8623046875, 67.978515625, 72.0947265625, 76.2109375, 80.3271484375, 84.443359375, 88.5595703125, 92.67578125, 96.7919921875, 100.908203125, 105.0244140625, 109.140625, 113.2568359375, 117.373046875, 121.4892578125, 125.60546875, 129.7216796875, 133.837890625, 137.9541015625, 142.0703125, 146.1865234375, 150.302734375, 154.4189453125, 158.53515625, 162.6513671875, 166.767578125, 170.8837890625, 175.0]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 16.0, 184.0, 567.0, 229.0, 18.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-252.74034118652344, -246.93943786621094, -241.13853454589844, -235.33763122558594, -229.53672790527344, -223.73582458496094, -217.93490600585938, -212.13400268554688, -206.33309936523438, -200.53219604492188, -194.73129272460938, -188.93038940429688, -183.12948608398438, -177.32858276367188, -171.52767944335938, -165.72677612304688, -159.92587280273438, -154.12496948242188, -148.32406616210938, -142.52316284179688, -136.72225952148438, -130.92135620117188, -125.12044525146484, -119.31954193115234, -113.51863861083984, -107.71773529052734, -101.91683197021484, -96.11592102050781, -90.31501770019531, -84.51411437988281, -78.71321105957031, -72.91230773925781, -67.11140441894531, -61.31050109863281, -55.50959777832031, -49.70869064331055, -43.90778732299805, -38.10688400268555, -32.30597686767578, -26.50507354736328, -20.70417022705078, -14.903265953063965, -9.102361679077148, -3.3014564514160156, 2.4994468688964844, 8.300350189208984, 14.10125732421875, 19.90216064453125, 25.70306396484375, 31.50396728515625, 37.30487060546875, 43.105777740478516, 48.906681060791016, 54.707584381103516, 60.50849151611328, 66.30939483642578, 72.11029815673828, 77.91120147705078, 83.71210479736328, 89.51301574707031, 95.31391906738281, 101.11482238769531, 106.91572570800781, 112.71662902832031, 118.51753234863281]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 5.0, 11.0, 6.0, 13.0, 21.0, 12.0, 19.0, 15.0, 19.0, 28.0, 24.0, 21.0, 30.0, 33.0, 40.0, 43.0, 45.0, 35.0, 49.0, 39.0, 46.0, 45.0, 45.0, 46.0, 32.0, 31.0, 31.0, 38.0, 30.0, 24.0, 13.0, 19.0, 19.0, 9.0, 14.0, 10.0, 8.0, 9.0, 7.0, 2.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.50434112548828, -58.59681701660156, -56.68928909301758, -54.78176498413086, -52.874237060546875, -50.966712951660156, -49.05918502807617, -47.15166091918945, -45.24413299560547, -43.33660888671875, -41.429080963134766, -39.52155685424805, -37.61402893066406, -35.706504821777344, -33.79897689819336, -31.89145278930664, -29.98392677307129, -28.076400756835938, -26.168874740600586, -24.261348724365234, -22.353822708129883, -20.44629669189453, -18.538772583007812, -16.631244659423828, -14.723719596862793, -12.816193580627441, -10.90866756439209, -9.001142501831055, -7.093616008758545, -5.186090469360352, -3.278564453125, -1.3710384368896484, 0.5364875793457031, 2.4440135955810547, 4.351539611816406, 6.2590651512146, 8.16659164428711, 10.074116706848145, 11.981642723083496, 13.889168739318848, 15.7966947555542, 17.704219818115234, 19.611745834350586, 21.519271850585938, 23.42679786682129, 25.33432388305664, 27.241849899291992, 29.149375915527344, 31.056901931762695, 32.96442794799805, 34.871952056884766, 36.77947998046875, 38.68700408935547, 40.59453201293945, 42.50205612182617, 44.409584045410156, 46.317108154296875, 48.224632263183594, 50.13216018676758, 52.0396842956543, 53.94721221923828, 55.854736328125, 57.762264251708984, 59.6697883605957, 61.57731628417969]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 7.0, 7.0, 4.0, 13.0, 14.0, 7.0, 17.0, 13.0, 19.0, 26.0, 22.0, 27.0, 25.0, 19.0, 31.0, 37.0, 23.0, 45.0, 48.0, 40.0, 45.0, 38.0, 34.0, 44.0, 45.0, 39.0, 43.0, 31.0, 29.0, 40.0, 27.0, 19.0, 23.0, 18.0, 15.0, 16.0, 13.0, 12.0, 4.0, 5.0, 6.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.6356201171875, -4.486083984375, -4.3365478515625, -4.18701171875, -4.0374755859375, -3.887939453125, -3.7384033203125, -3.5888671875, -3.4393310546875, -3.289794921875, -3.1402587890625, -2.99072265625, -2.8411865234375, -2.691650390625, -2.5421142578125, -2.392578125, -2.2430419921875, -2.093505859375, -1.9439697265625, -1.79443359375, -1.6448974609375, -1.495361328125, -1.3458251953125, -1.1962890625, -1.0467529296875, -0.897216796875, -0.7476806640625, -0.59814453125, -0.4486083984375, -0.299072265625, -0.1495361328125, 0.0, 0.1495361328125, 0.299072265625, 0.4486083984375, 0.59814453125, 0.7476806640625, 0.897216796875, 1.0467529296875, 1.1962890625, 1.3458251953125, 1.495361328125, 1.6448974609375, 1.79443359375, 1.9439697265625, 2.093505859375, 2.2430419921875, 2.392578125, 2.5421142578125, 2.691650390625, 2.8411865234375, 2.99072265625, 3.1402587890625, 3.289794921875, 3.4393310546875, 3.5888671875, 3.7384033203125, 3.887939453125, 4.0374755859375, 4.18701171875, 4.3365478515625, 4.486083984375, 4.6356201171875, 4.78515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 8.0, 9.0, 7.0, 18.0, 20.0, 47.0, 44.0, 84.0, 113.0, 178.0, 251.0, 388.0, 541.0, 804.0, 1170.0, 1820.0, 2643.0, 3986.0, 6139.0, 9385.0, 14666.0, 23172.0, 37371.0, 62690.0, 112315.0, 282149.0, 234013.0, 101973.0, 57020.0, 34453.0, 21329.0, 13647.0, 8757.0, 5836.0, 3842.0, 2462.0, 1744.0, 1087.0, 816.0, 471.0, 374.0, 251.0, 147.0, 118.0, 64.0, 52.0, 36.0, 23.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.986328125, -0.9554290771484375, -0.924530029296875, -0.8936309814453125, -0.86273193359375, -0.8318328857421875, -0.800933837890625, -0.7700347900390625, -0.7391357421875, -0.7082366943359375, -0.677337646484375, -0.6464385986328125, -0.61553955078125, -0.5846405029296875, -0.553741455078125, -0.5228424072265625, -0.491943359375, -0.4610443115234375, -0.430145263671875, -0.3992462158203125, -0.36834716796875, -0.3374481201171875, -0.306549072265625, -0.2756500244140625, -0.2447509765625, -0.2138519287109375, -0.182952880859375, -0.1520538330078125, -0.12115478515625, -0.0902557373046875, -0.059356689453125, -0.0284576416015625, 0.00244140625, 0.0333404541015625, 0.064239501953125, 0.0951385498046875, 0.12603759765625, 0.1569366455078125, 0.187835693359375, 0.2187347412109375, 0.2496337890625, 0.2805328369140625, 0.311431884765625, 0.3423309326171875, 0.37322998046875, 0.4041290283203125, 0.435028076171875, 0.4659271240234375, 0.496826171875, 0.5277252197265625, 0.558624267578125, 0.5895233154296875, 0.62042236328125, 0.6513214111328125, 0.682220458984375, 0.7131195068359375, 0.7440185546875, 0.7749176025390625, 0.805816650390625, 0.8367156982421875, 0.86761474609375, 0.8985137939453125, 0.929412841796875, 0.9603118896484375, 0.9912109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 5.0, 12.0, 4.0, 13.0, 13.0, 16.0, 17.0, 20.0, 22.0, 24.0, 24.0, 32.0, 25.0, 32.0, 27.0, 38.0, 45.0, 37.0, 45.0, 1070.0, 49.0, 49.0, 37.0, 51.0, 29.0, 36.0, 32.0, 17.0, 22.0, 23.0, 31.0, 22.0, 15.0, 16.0, 18.0, 6.0, 16.0, 12.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.927734375, -2.8360595703125, -2.744384765625, -2.6527099609375, -2.56103515625, -2.4693603515625, -2.377685546875, -2.2860107421875, -2.1943359375, -2.1026611328125, -2.010986328125, -1.9193115234375, -1.82763671875, -1.7359619140625, -1.644287109375, -1.5526123046875, -1.4609375, -1.3692626953125, -1.277587890625, -1.1859130859375, -1.09423828125, -1.0025634765625, -0.910888671875, -0.8192138671875, -0.7275390625, -0.6358642578125, -0.544189453125, -0.4525146484375, -0.36083984375, -0.2691650390625, -0.177490234375, -0.0858154296875, 0.005859375, 0.0975341796875, 0.189208984375, 0.2808837890625, 0.37255859375, 0.4642333984375, 0.555908203125, 0.6475830078125, 0.7392578125, 0.8309326171875, 0.922607421875, 1.0142822265625, 1.10595703125, 1.1976318359375, 1.289306640625, 1.3809814453125, 1.47265625, 1.5643310546875, 1.656005859375, 1.7476806640625, 1.83935546875, 1.9310302734375, 2.022705078125, 2.1143798828125, 2.2060546875, 2.2977294921875, 2.389404296875, 2.4810791015625, 2.57275390625, 2.6644287109375, 2.756103515625, 2.8477783203125, 2.939453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 10.0, 7.0, 19.0, 13.0, 22.0, 29.0, 60.0, 74.0, 123.0, 188.0, 263.0, 469.0, 704.0, 1066.0, 1703.0, 2784.0, 4381.0, 7183.0, 11736.0, 19116.0, 30986.0, 53095.0, 102412.0, 1363103.0, 273790.0, 96287.0, 50323.0, 29650.0, 18108.0, 11164.0, 6848.0, 4245.0, 2621.0, 1613.0, 1026.0, 662.0, 415.0, 286.0, 183.0, 126.0, 76.0, 58.0, 40.0, 26.0, 14.0, 10.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9942474365234375, -0.962127685546875, -0.9300079345703125, -0.89788818359375, -0.8657684326171875, -0.833648681640625, -0.8015289306640625, -0.7694091796875, -0.7372894287109375, -0.705169677734375, -0.6730499267578125, -0.64093017578125, -0.6088104248046875, -0.576690673828125, -0.5445709228515625, -0.512451171875, -0.4803314208984375, -0.448211669921875, -0.4160919189453125, -0.38397216796875, -0.3518524169921875, -0.319732666015625, -0.2876129150390625, -0.2554931640625, -0.2233734130859375, -0.191253662109375, -0.1591339111328125, -0.12701416015625, -0.0948944091796875, -0.062774658203125, -0.0306549072265625, 0.00146484375, 0.0335845947265625, 0.065704345703125, 0.0978240966796875, 0.12994384765625, 0.1620635986328125, 0.194183349609375, 0.2263031005859375, 0.2584228515625, 0.2905426025390625, 0.322662353515625, 0.3547821044921875, 0.38690185546875, 0.4190216064453125, 0.451141357421875, 0.4832611083984375, 0.515380859375, 0.5475006103515625, 0.579620361328125, 0.6117401123046875, 0.64385986328125, 0.6759796142578125, 0.708099365234375, 0.7402191162109375, 0.7723388671875, 0.8044586181640625, 0.836578369140625, 0.8686981201171875, 0.90081787109375, 0.9329376220703125, 0.965057373046875, 0.9971771240234375, 1.029296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 6.0, 7.0, 5.0, 12.0, 17.0, 15.0, 13.0, 28.0, 24.0, 29.0, 32.0, 30.0, 35.0, 37.0, 39.0, 56.0, 53.0, 47.0, 46.0, 52.0, 46.0, 54.0, 50.0, 41.0, 33.0, 18.0, 35.0, 34.0, 13.0, 11.0, 12.0, 10.0, 8.0, 9.0, 6.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0005059242248535156, -0.0004913359880447388, -0.0004767477512359619, -0.00046215951442718506, -0.0004475712776184082, -0.00043298304080963135, -0.0004183948040008545, -0.00040380656719207764, -0.0003892183303833008, -0.0003746300935745239, -0.00036004185676574707, -0.0003454536199569702, -0.00033086538314819336, -0.0003162771463394165, -0.00030168890953063965, -0.0002871006727218628, -0.00027251243591308594, -0.0002579241991043091, -0.00024333596229553223, -0.00022874772548675537, -0.00021415948867797852, -0.00019957125186920166, -0.0001849830150604248, -0.00017039477825164795, -0.0001558065414428711, -0.00014121830463409424, -0.00012663006782531738, -0.00011204183101654053, -9.745359420776367e-05, -8.286535739898682e-05, -6.827712059020996e-05, -5.3688883781433105e-05, -3.910064697265625e-05, -2.4512410163879395e-05, -9.924173355102539e-06, 4.664063453674316e-06, 1.9252300262451172e-05, 3.384053707122803e-05, 4.842877388000488e-05, 6.301701068878174e-05, 7.76052474975586e-05, 9.219348430633545e-05, 0.0001067817211151123, 0.00012136995792388916, 0.00013595819473266602, 0.00015054643154144287, 0.00016513466835021973, 0.00017972290515899658, 0.00019431114196777344, 0.0002088993787765503, 0.00022348761558532715, 0.000238075852394104, 0.00025266408920288086, 0.0002672523260116577, 0.00028184056282043457, 0.0002964287996292114, 0.0003110170364379883, 0.00032560527324676514, 0.000340193510055542, 0.00035478174686431885, 0.0003693699836730957, 0.00038395822048187256, 0.0003985464572906494, 0.00041313469409942627, 0.0004277229309082031]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 11.0, 14.0, 12.0, 21.0, 18.0, 32.0, 30.0, 35.0, 50.0, 60.0, 88.0, 130.0, 223.0, 462.0, 1658.0, 1041655.0, 2730.0, 542.0, 250.0, 121.0, 92.0, 61.0, 60.0, 34.0, 36.0, 17.0, 22.0, 18.0, 15.0, 9.0, 11.0, 5.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01290130615234375, -0.012479066848754883, -0.012056827545166016, -0.011634588241577148, -0.011212348937988281, -0.010790109634399414, -0.010367870330810547, -0.00994563102722168, -0.009523391723632812, -0.009101152420043945, -0.008678913116455078, -0.008256673812866211, -0.007834434509277344, -0.0074121952056884766, -0.006989955902099609, -0.006567716598510742, -0.006145477294921875, -0.005723237991333008, -0.005300998687744141, -0.0048787593841552734, -0.004456520080566406, -0.004034280776977539, -0.003612041473388672, -0.0031898021697998047, -0.0027675628662109375, -0.0023453235626220703, -0.0019230842590332031, -0.001500844955444336, -0.0010786056518554688, -0.0006563663482666016, -0.00023412704467773438, 0.0001881122589111328, 0.0006103515625, 0.0010325908660888672, 0.0014548301696777344, 0.0018770694732666016, 0.0022993087768554688, 0.002721548080444336, 0.003143787384033203, 0.0035660266876220703, 0.0039882659912109375, 0.004410505294799805, 0.004832744598388672, 0.005254983901977539, 0.005677223205566406, 0.0060994625091552734, 0.006521701812744141, 0.006943941116333008, 0.007366180419921875, 0.007788419723510742, 0.00821065902709961, 0.008632898330688477, 0.009055137634277344, 0.009477376937866211, 0.009899616241455078, 0.010321855545043945, 0.010744094848632812, 0.01116633415222168, 0.011588573455810547, 0.012010812759399414, 0.012433052062988281, 0.012855291366577148, 0.013277530670166016, 0.013699769973754883, 0.01412200927734375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 215.0, 673.0, 114.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002901624538935721, -0.00024495599791407585, -0.00019974951283074915, -0.00015454304229933769, -0.00010933657176792622, -6.413010123651475e-05, -1.8923630705103278e-05, 2.628285437822342e-05, 7.148931035771966e-05, 0.00011669578088913113, 0.0001619022514205426, 0.00020710872195195407, 0.00025231519248336554, 0.0002975216484628618, 0.0003427281335461885, 0.00038793461862951517, 0.0004331410746090114, 0.00047834753058850765, 0.0005235540447756648, 0.000568760500755161, 0.0006139669567346573, 0.0006591734127141535, 0.0007043798686936498, 0.0007495863828808069, 0.0007947928388603032, 0.0008399992948397994, 0.0008852058090269566, 0.0009304122650064528, 0.000975618720985949, 0.0010208252351731062, 0.0010660316329449415, 0.0011112381471320987, 0.0011564446613192558, 0.001201651175506413, 0.0012468575732782483, 0.0012920640874654055, 0.0013372704852372408, 0.001382476999424398, 0.001427683513611555, 0.0014728899113833904, 0.0015180964255705476, 0.0015633029397577047, 0.00160850933752954, 0.0016537158517166972, 0.0016989223659038544, 0.0017441287636756897, 0.0017893352778628469, 0.001834541792050004, 0.0018797481898218393, 0.0019249547040089965, 0.0019701612181961536, 0.002015367615967989, 0.0020605740137398243, 0.0021057806443423033, 0.0021509870421141386, 0.002196193439885974, 0.002241400070488453, 0.0022866064682602882, 0.0023318130988627672, 0.0023770194966346025, 0.002422225894406438, 0.002467432525008917, 0.002512638922780752, 0.0025578453205525875, 0.002603051718324423]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 7.0, 8.0, 5.0, 8.0, 13.0, 12.0, 15.0, 14.0, 14.0, 30.0, 27.0, 36.0, 28.0, 37.0, 40.0, 48.0, 50.0, 45.0, 40.0, 41.0, 46.0, 38.0, 48.0, 47.0, 40.0, 36.0, 29.0, 34.0, 25.0, 22.0, 17.0, 19.0, 14.0, 15.0, 13.0, 12.0, 7.0, 9.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002866387367248535, -0.00027763936668634415, -0.0002686399966478348, -0.0002596406266093254, -0.00025064125657081604, -0.00024164188653230667, -0.0002326425164937973, -0.00022364314645528793, -0.00021464377641677856, -0.0002056444063782692, -0.00019664503633975983, -0.00018764566630125046, -0.0001786462962627411, -0.00016964692622423172, -0.00016064755618572235, -0.00015164818614721298, -0.0001426488161087036, -0.00013364944607019424, -0.00012465007603168488, -0.0001156507059931755, -0.00010665133595466614, -9.765196591615677e-05, -8.86525958776474e-05, -7.965322583913803e-05, -7.065385580062866e-05, -6.165448576211929e-05, -5.2655115723609924e-05, -4.3655745685100555e-05, -3.4656375646591187e-05, -2.5657005608081818e-05, -1.665763556957245e-05, -7.65826553106308e-06, 1.341104507446289e-06, 1.0340474545955658e-05, 1.9339844584465027e-05, 2.8339214622974396e-05, 3.7338584661483765e-05, 4.6337954699993134e-05, 5.53373247385025e-05, 6.433669477701187e-05, 7.333606481552124e-05, 8.233543485403061e-05, 9.133480489253998e-05, 0.00010033417493104935, 0.00010933354496955872, 0.00011833291500806808, 0.00012733228504657745, 0.00013633165508508682, 0.0001453310251235962, 0.00015433039516210556, 0.00016332976520061493, 0.0001723291352391243, 0.00018132850527763367, 0.00019032787531614304, 0.0001993272453546524, 0.00020832661539316177, 0.00021732598543167114, 0.0002263253554701805, 0.00023532472550868988, 0.00024432409554719925, 0.0002533234655857086, 0.000262322835624218, 0.00027132220566272736, 0.0002803215757012367, 0.0002893209457397461]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 7.0, 7.0, 4.0, 13.0, 14.0, 7.0, 17.0, 13.0, 19.0, 26.0, 22.0, 27.0, 25.0, 19.0, 31.0, 37.0, 23.0, 45.0, 48.0, 40.0, 45.0, 38.0, 34.0, 44.0, 45.0, 39.0, 43.0, 31.0, 29.0, 40.0, 27.0, 19.0, 23.0, 18.0, 15.0, 16.0, 13.0, 12.0, 4.0, 5.0, 6.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.6356201171875, -4.486083984375, -4.3365478515625, -4.18701171875, -4.0374755859375, -3.887939453125, -3.7384033203125, -3.5888671875, -3.4393310546875, -3.289794921875, -3.1402587890625, -2.99072265625, -2.8411865234375, -2.691650390625, -2.5421142578125, -2.392578125, -2.2430419921875, -2.093505859375, -1.9439697265625, -1.79443359375, -1.6448974609375, -1.495361328125, -1.3458251953125, -1.1962890625, -1.0467529296875, -0.897216796875, -0.7476806640625, -0.59814453125, -0.4486083984375, -0.299072265625, -0.1495361328125, 0.0, 0.1495361328125, 0.299072265625, 0.4486083984375, 0.59814453125, 0.7476806640625, 0.897216796875, 1.0467529296875, 1.1962890625, 1.3458251953125, 1.495361328125, 1.6448974609375, 1.79443359375, 1.9439697265625, 2.093505859375, 2.2430419921875, 2.392578125, 2.5421142578125, 2.691650390625, 2.8411865234375, 2.99072265625, 3.1402587890625, 3.289794921875, 3.4393310546875, 3.5888671875, 3.7384033203125, 3.887939453125, 4.0374755859375, 4.18701171875, 4.3365478515625, 4.486083984375, 4.6356201171875, 4.78515625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 14.0, 8.0, 17.0, 18.0, 29.0, 43.0, 65.0, 100.0, 134.0, 165.0, 283.0, 403.0, 576.0, 924.0, 1573.0, 2919.0, 5711.0, 12399.0, 29940.0, 77039.0, 227586.0, 439785.0, 152683.0, 54507.0, 21695.0, 9324.0, 4553.0, 2311.0, 1302.0, 795.0, 531.0, 337.0, 214.0, 162.0, 116.0, 88.0, 66.0, 38.0, 37.0, 14.0, 15.0, 9.0, 12.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.112213134765625, -3.00958251953125, -2.906951904296875, -2.8043212890625, -2.701690673828125, -2.59906005859375, -2.496429443359375, -2.393798828125, -2.291168212890625, -2.18853759765625, -2.085906982421875, -1.9832763671875, -1.880645751953125, -1.77801513671875, -1.675384521484375, -1.57275390625, -1.470123291015625, -1.36749267578125, -1.264862060546875, -1.1622314453125, -1.059600830078125, -0.95697021484375, -0.854339599609375, -0.751708984375, -0.649078369140625, -0.54644775390625, -0.443817138671875, -0.3411865234375, -0.238555908203125, -0.13592529296875, -0.033294677734375, 0.0693359375, 0.171966552734375, 0.27459716796875, 0.377227783203125, 0.4798583984375, 0.582489013671875, 0.68511962890625, 0.787750244140625, 0.890380859375, 0.993011474609375, 1.09564208984375, 1.198272705078125, 1.3009033203125, 1.403533935546875, 1.50616455078125, 1.608795166015625, 1.71142578125, 1.814056396484375, 1.91668701171875, 2.019317626953125, 2.1219482421875, 2.224578857421875, 2.32720947265625, 2.429840087890625, 2.532470703125, 2.635101318359375, 2.73773193359375, 2.840362548828125, 2.9429931640625, 3.045623779296875, 3.14825439453125, 3.250885009765625, 3.353515625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 5.0, 3.0, 6.0, 13.0, 11.0, 14.0, 5.0, 22.0, 10.0, 27.0, 27.0, 22.0, 35.0, 40.0, 34.0, 29.0, 40.0, 48.0, 54.0, 123.0, 1744.0, 199.0, 71.0, 47.0, 49.0, 56.0, 36.0, 31.0, 34.0, 28.0, 30.0, 23.0, 22.0, 23.0, 16.0, 12.0, 10.0, 8.0, 9.0, 5.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.15625, -16.64697265625, -16.1376953125, -15.62841796875, -15.119140625, -14.60986328125, -14.1005859375, -13.59130859375, -13.08203125, -12.57275390625, -12.0634765625, -11.55419921875, -11.044921875, -10.53564453125, -10.0263671875, -9.51708984375, -9.0078125, -8.49853515625, -7.9892578125, -7.47998046875, -6.970703125, -6.46142578125, -5.9521484375, -5.44287109375, -4.93359375, -4.42431640625, -3.9150390625, -3.40576171875, -2.896484375, -2.38720703125, -1.8779296875, -1.36865234375, -0.859375, -0.35009765625, 0.1591796875, 0.66845703125, 1.177734375, 1.68701171875, 2.1962890625, 2.70556640625, 3.21484375, 3.72412109375, 4.2333984375, 4.74267578125, 5.251953125, 5.76123046875, 6.2705078125, 6.77978515625, 7.2890625, 7.79833984375, 8.3076171875, 8.81689453125, 9.326171875, 9.83544921875, 10.3447265625, 10.85400390625, 11.36328125, 11.87255859375, 12.3818359375, 12.89111328125, 13.400390625, 13.90966796875, 14.4189453125, 14.92822265625, 15.4375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 7.0, 3.0, 13.0, 7.0, 11.0, 16.0, 20.0, 20.0, 21.0, 28.0, 36.0, 46.0, 57.0, 79.0, 115.0, 215.0, 374.0, 815.0, 4514.0, 481611.0, 2648287.0, 7264.0, 1045.0, 366.0, 207.0, 121.0, 66.0, 72.0, 54.0, 38.0, 27.0, 32.0, 18.0, 15.0, 16.0, 8.0, 12.0, 16.0, 4.0, 4.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-26.84375, -25.980224609375, -25.11669921875, -24.253173828125, -23.3896484375, -22.526123046875, -21.66259765625, -20.799072265625, -19.935546875, -19.072021484375, -18.20849609375, -17.344970703125, -16.4814453125, -15.617919921875, -14.75439453125, -13.890869140625, -13.02734375, -12.163818359375, -11.30029296875, -10.436767578125, -9.5732421875, -8.709716796875, -7.84619140625, -6.982666015625, -6.119140625, -5.255615234375, -4.39208984375, -3.528564453125, -2.6650390625, -1.801513671875, -0.93798828125, -0.074462890625, 0.7890625, 1.652587890625, 2.51611328125, 3.379638671875, 4.2431640625, 5.106689453125, 5.97021484375, 6.833740234375, 7.697265625, 8.560791015625, 9.42431640625, 10.287841796875, 11.1513671875, 12.014892578125, 12.87841796875, 13.741943359375, 14.60546875, 15.468994140625, 16.33251953125, 17.196044921875, 18.0595703125, 18.923095703125, 19.78662109375, 20.650146484375, 21.513671875, 22.377197265625, 23.24072265625, 24.104248046875, 24.9677734375, 25.831298828125, 26.69482421875, 27.558349609375, 28.421875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 300.0, 686.0, 23.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.977336883544922, -26.33390998840332, -22.69048309326172, -19.047056198120117, -15.403629302978516, -11.760202407836914, -8.116775512695312, -4.473348617553711, -0.8299217224121094, 2.813505172729492, 6.456932067871094, 10.100358963012695, 13.743785858154297, 17.3872127532959, 21.0306396484375, 24.6740665435791, 28.317493438720703, 31.960920333862305, 35.604347229003906, 39.247772216796875, 42.89120101928711, 46.534629821777344, 50.17805480957031, 53.82147979736328, 57.464908599853516, 61.10833740234375, 64.75176239013672, 68.39518737792969, 72.03861999511719, 75.68204498291016, 79.32546997070312, 82.9688949584961, 86.61231994628906, 90.25574493408203, 93.899169921875, 97.5426025390625, 101.18602752685547, 104.82945251464844, 108.47288513183594, 112.1163101196289, 115.75973510742188, 119.40316009521484, 123.04658508300781, 126.69001770019531, 130.33343505859375, 133.97686767578125, 137.62030029296875, 141.2637176513672, 144.9071502685547, 148.5505828857422, 152.19400024414062, 155.83743286132812, 159.48086547851562, 163.12428283691406, 166.76771545410156, 170.4111328125, 174.0545654296875, 177.697998046875, 181.34141540527344, 184.98484802246094, 188.62826538085938, 192.27169799804688, 195.91513061523438, 199.5585479736328, 203.2019805908203]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 11.0, 7.0, 10.0, 13.0, 14.0, 21.0, 20.0, 20.0, 22.0, 22.0, 15.0, 28.0, 36.0, 31.0, 34.0, 32.0, 30.0, 36.0, 36.0, 44.0, 49.0, 42.0, 41.0, 35.0, 29.0, 29.0, 35.0, 38.0, 25.0, 21.0, 19.0, 20.0, 21.0, 23.0, 16.0, 12.0, 5.0, 6.0, 11.0, 9.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.56560516357422, -50.89552307128906, -49.225440979003906, -47.55535888671875, -45.88528060913086, -44.2151985168457, -42.54511642456055, -40.87503433227539, -39.2049560546875, -37.534873962402344, -35.86479187011719, -34.19470977783203, -32.52463150024414, -30.854549407958984, -29.184467315673828, -27.514385223388672, -25.844303131103516, -24.17422103881836, -22.504140853881836, -20.83405876159668, -19.163978576660156, -17.493896484375, -15.823814392089844, -14.153733253479004, -12.483652114868164, -10.813570976257324, -9.143489837646484, -7.473407745361328, -5.803326606750488, -4.133245468139648, -2.463163375854492, -0.7930822372436523, 0.8769989013671875, 2.5470802783966064, 4.217161655426025, 5.887243270874023, 7.557324409484863, 9.227405548095703, 10.89748764038086, 12.5675687789917, 14.237649917602539, 15.907731056213379, 17.57781219482422, 19.247894287109375, 20.91797637939453, 22.588056564331055, 24.25813865661621, 25.928218841552734, 27.59830093383789, 29.268383026123047, 30.93846321105957, 32.608543395996094, 34.27862548828125, 35.948707580566406, 37.61878967285156, 39.28887176513672, 40.958953857421875, 42.62903594970703, 44.29911804199219, 45.969200134277344, 47.639278411865234, 49.30936050415039, 50.97944259643555, 52.6495246887207, 54.319602966308594]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 12.0, 10.0, 16.0, 14.0, 16.0, 13.0, 26.0, 20.0, 27.0, 25.0, 20.0, 23.0, 35.0, 35.0, 32.0, 55.0, 43.0, 40.0, 31.0, 37.0, 43.0, 36.0, 44.0, 43.0, 31.0, 26.0, 40.0, 27.0, 21.0, 30.0, 21.0, 19.0, 17.0, 8.0, 12.0, 10.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.90234375, -4.7509765625, -4.599609375, -4.4482421875, -4.296875, -4.1455078125, -3.994140625, -3.8427734375, -3.69140625, -3.5400390625, -3.388671875, -3.2373046875, -3.0859375, -2.9345703125, -2.783203125, -2.6318359375, -2.48046875, -2.3291015625, -2.177734375, -2.0263671875, -1.875, -1.7236328125, -1.572265625, -1.4208984375, -1.26953125, -1.1181640625, -0.966796875, -0.8154296875, -0.6640625, -0.5126953125, -0.361328125, -0.2099609375, -0.05859375, 0.0927734375, 0.244140625, 0.3955078125, 0.546875, 0.6982421875, 0.849609375, 1.0009765625, 1.15234375, 1.3037109375, 1.455078125, 1.6064453125, 1.7578125, 1.9091796875, 2.060546875, 2.2119140625, 2.36328125, 2.5146484375, 2.666015625, 2.8173828125, 2.96875, 3.1201171875, 3.271484375, 3.4228515625, 3.57421875, 3.7255859375, 3.876953125, 4.0283203125, 4.1796875, 4.3310546875, 4.482421875, 4.6337890625, 4.78515625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 12.0, 10.0, 7.0, 11.0, 16.0, 16.0, 21.0, 12.0, 21.0, 23.0, 15.0, 39.0, 27.0, 30.0, 24.0, 56.0, 178.0, 927.0, 24435.0, 3753295.0, 411499.0, 2837.0, 344.0, 75.0, 48.0, 31.0, 27.0, 37.0, 34.0, 28.0, 27.0, 23.0, 12.0, 16.0, 11.0, 17.0, 11.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0, -30.9912109375, -29.982421875, -28.9736328125, -27.96484375, -26.9560546875, -25.947265625, -24.9384765625, -23.9296875, -22.9208984375, -21.912109375, -20.9033203125, -19.89453125, -18.8857421875, -17.876953125, -16.8681640625, -15.859375, -14.8505859375, -13.841796875, -12.8330078125, -11.82421875, -10.8154296875, -9.806640625, -8.7978515625, -7.7890625, -6.7802734375, -5.771484375, -4.7626953125, -3.75390625, -2.7451171875, -1.736328125, -0.7275390625, 0.28125, 1.2900390625, 2.298828125, 3.3076171875, 4.31640625, 5.3251953125, 6.333984375, 7.3427734375, 8.3515625, 9.3603515625, 10.369140625, 11.3779296875, 12.38671875, 13.3955078125, 14.404296875, 15.4130859375, 16.421875, 17.4306640625, 18.439453125, 19.4482421875, 20.45703125, 21.4658203125, 22.474609375, 23.4833984375, 24.4921875, 25.5009765625, 26.509765625, 27.5185546875, 28.52734375, 29.5361328125, 30.544921875, 31.5537109375, 32.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 13.0, 21.0, 38.0, 42.0, 81.0, 125.0, 235.0, 387.0, 675.0, 874.0, 663.0, 416.0, 197.0, 122.0, 60.0, 47.0, 26.0, 23.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.171875, -28.371337890625, -27.57080078125, -26.770263671875, -25.9697265625, -25.169189453125, -24.36865234375, -23.568115234375, -22.767578125, -21.967041015625, -21.16650390625, -20.365966796875, -19.5654296875, -18.764892578125, -17.96435546875, -17.163818359375, -16.36328125, -15.562744140625, -14.76220703125, -13.961669921875, -13.1611328125, -12.360595703125, -11.56005859375, -10.759521484375, -9.958984375, -9.158447265625, -8.35791015625, -7.557373046875, -6.7568359375, -5.956298828125, -5.15576171875, -4.355224609375, -3.5546875, -2.754150390625, -1.95361328125, -1.153076171875, -0.3525390625, 0.447998046875, 1.24853515625, 2.049072265625, 2.849609375, 3.650146484375, 4.45068359375, 5.251220703125, 6.0517578125, 6.852294921875, 7.65283203125, 8.453369140625, 9.25390625, 10.054443359375, 10.85498046875, 11.655517578125, 12.4560546875, 13.256591796875, 14.05712890625, 14.857666015625, 15.658203125, 16.458740234375, 17.25927734375, 18.059814453125, 18.8603515625, 19.660888671875, 20.46142578125, 21.261962890625, 22.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 15.0, 37.0, 54.0, 99.0, 155.0, 271.0, 553.0, 7318.0, 4180635.0, 3954.0, 530.0, 262.0, 143.0, 93.0, 54.0, 34.0, 20.0, 7.0, 7.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.125, -98.404296875, -94.68359375, -90.962890625, -87.2421875, -83.521484375, -79.80078125, -76.080078125, -72.359375, -68.638671875, -64.91796875, -61.197265625, -57.4765625, -53.755859375, -50.03515625, -46.314453125, -42.59375, -38.873046875, -35.15234375, -31.431640625, -27.7109375, -23.990234375, -20.26953125, -16.548828125, -12.828125, -9.107421875, -5.38671875, -1.666015625, 2.0546875, 5.775390625, 9.49609375, 13.216796875, 16.9375, 20.658203125, 24.37890625, 28.099609375, 31.8203125, 35.541015625, 39.26171875, 42.982421875, 46.703125, 50.423828125, 54.14453125, 57.865234375, 61.5859375, 65.306640625, 69.02734375, 72.748046875, 76.46875, 80.189453125, 83.91015625, 87.630859375, 91.3515625, 95.072265625, 98.79296875, 102.513671875, 106.234375, 109.955078125, 113.67578125, 117.396484375, 121.1171875, 124.837890625, 128.55859375, 132.279296875, 136.0]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [22.0, 272.0, 571.0, 142.0, 11.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.531647682189941, -8.851028442382812, -2.1704092025756836, 4.510210990905762, 11.190829277038574, 17.871448516845703, 24.55207061767578, 31.232688903808594, 37.913307189941406, 44.59392547607422, 51.27454376220703, 57.95516586303711, 64.63578796386719, 71.31640625, 77.99702453613281, 84.67764282226562, 91.35826110839844, 98.03887939453125, 104.71949768066406, 111.40011596679688, 118.08073425292969, 124.7613525390625, 131.44198608398438, 138.12258911132812, 144.80320739746094, 151.48382568359375, 158.16444396972656, 164.84506225585938, 171.5256805419922, 178.206298828125, 184.88693237304688, 191.56753540039062, 198.2481689453125, 204.9287872314453, 211.60940551757812, 218.29002380371094, 224.97064208984375, 231.65126037597656, 238.33187866210938, 245.01251220703125, 251.693115234375, 258.3737487792969, 265.0543518066406, 271.7349853515625, 278.41558837890625, 285.0962219238281, 291.7768249511719, 298.45745849609375, 305.1380615234375, 311.8186950683594, 318.4992980957031, 325.179931640625, 331.86053466796875, 338.5411682128906, 345.2217712402344, 351.90240478515625, 358.5830383300781, 365.263671875, 371.94427490234375, 378.6249084472656, 385.3055114746094, 391.98614501953125, 398.666748046875, 405.3473815917969, 412.0279846191406]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 6.0, 4.0, 7.0, 7.0, 15.0, 11.0, 14.0, 21.0, 14.0, 25.0, 28.0, 18.0, 27.0, 30.0, 25.0, 35.0, 40.0, 41.0, 43.0, 30.0, 36.0, 35.0, 45.0, 44.0, 43.0, 36.0, 47.0, 36.0, 22.0, 22.0, 22.0, 33.0, 20.0, 24.0, 24.0, 10.0, 20.0, 13.0, 9.0, 2.0, 6.0, 3.0, 1.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-53.591064453125, -51.98184585571289, -50.372623443603516, -48.763404846191406, -47.15418243408203, -45.54496383666992, -43.93574523925781, -42.32652282714844, -40.71730041503906, -39.10808181762695, -37.49885940551758, -35.88964080810547, -34.280418395996094, -32.671199798583984, -31.061979293823242, -29.4527587890625, -27.84354019165039, -26.23431968688965, -24.625099182128906, -23.015880584716797, -21.406658172607422, -19.797439575195312, -18.18821907043457, -16.578998565673828, -14.969778060913086, -13.360557556152344, -11.751337051391602, -10.142117500305176, -8.532896995544434, -6.923676490783691, -5.314456939697266, -3.7052364349365234, -2.0960159301757812, -0.48679566383361816, 1.122424602508545, 2.731644630432129, 4.340865135192871, 5.950085639953613, 7.559305191040039, 9.168525695800781, 10.777746200561523, 12.386966705322266, 13.996187210083008, 15.605406761169434, 17.21462631225586, 18.823848724365234, 20.433067321777344, 22.042287826538086, 23.651508331298828, 25.26072883605957, 26.869949340820312, 28.479167938232422, 30.088390350341797, 31.697608947753906, 33.30683135986328, 34.91604995727539, 36.5252685546875, 38.13448715209961, 39.743709564208984, 41.352928161621094, 42.96215057373047, 44.57136917114258, 46.18058776855469, 47.78981018066406, 49.39903259277344]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 8.0, 6.0, 7.0, 18.0, 8.0, 18.0, 13.0, 24.0, 16.0, 20.0, 21.0, 20.0, 28.0, 38.0, 30.0, 32.0, 33.0, 39.0, 40.0, 42.0, 48.0, 45.0, 30.0, 34.0, 43.0, 36.0, 37.0, 44.0, 31.0, 28.0, 29.0, 15.0, 23.0, 23.0, 19.0, 7.0, 8.0, 6.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.21875, -5.062744140625, -4.90673828125, -4.750732421875, -4.5947265625, -4.438720703125, -4.28271484375, -4.126708984375, -3.970703125, -3.814697265625, -3.65869140625, -3.502685546875, -3.3466796875, -3.190673828125, -3.03466796875, -2.878662109375, -2.72265625, -2.566650390625, -2.41064453125, -2.254638671875, -2.0986328125, -1.942626953125, -1.78662109375, -1.630615234375, -1.474609375, -1.318603515625, -1.16259765625, -1.006591796875, -0.8505859375, -0.694580078125, -0.53857421875, -0.382568359375, -0.2265625, -0.070556640625, 0.08544921875, 0.241455078125, 0.3974609375, 0.553466796875, 0.70947265625, 0.865478515625, 1.021484375, 1.177490234375, 1.33349609375, 1.489501953125, 1.6455078125, 1.801513671875, 1.95751953125, 2.113525390625, 2.26953125, 2.425537109375, 2.58154296875, 2.737548828125, 2.8935546875, 3.049560546875, 3.20556640625, 3.361572265625, 3.517578125, 3.673583984375, 3.82958984375, 3.985595703125, 4.1416015625, 4.297607421875, 4.45361328125, 4.609619140625, 4.765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 5.0, 13.0, 13.0, 24.0, 41.0, 46.0, 74.0, 105.0, 158.0, 205.0, 321.0, 447.0, 754.0, 1085.0, 1591.0, 2507.0, 3691.0, 5998.0, 9274.0, 14315.0, 23300.0, 38129.0, 66051.0, 119981.0, 294959.0, 217142.0, 101329.0, 56743.0, 33683.0, 20525.0, 12864.0, 8130.0, 5247.0, 3313.0, 2169.0, 1427.0, 968.0, 622.0, 413.0, 264.0, 180.0, 141.0, 100.0, 59.0, 51.0, 28.0, 17.0, 19.0, 12.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.0458984375, -1.0130767822265625, -0.980255126953125, -0.9474334716796875, -0.91461181640625, -0.8817901611328125, -0.848968505859375, -0.8161468505859375, -0.7833251953125, -0.7505035400390625, -0.717681884765625, -0.6848602294921875, -0.65203857421875, -0.6192169189453125, -0.586395263671875, -0.5535736083984375, -0.520751953125, -0.4879302978515625, -0.455108642578125, -0.4222869873046875, -0.38946533203125, -0.3566436767578125, -0.323822021484375, -0.2910003662109375, -0.2581787109375, -0.2253570556640625, -0.192535400390625, -0.1597137451171875, -0.12689208984375, -0.0940704345703125, -0.061248779296875, -0.0284271240234375, 0.00439453125, 0.0372161865234375, 0.070037841796875, 0.1028594970703125, 0.13568115234375, 0.1685028076171875, 0.201324462890625, 0.2341461181640625, 0.2669677734375, 0.2997894287109375, 0.332611083984375, 0.3654327392578125, 0.39825439453125, 0.4310760498046875, 0.463897705078125, 0.4967193603515625, 0.529541015625, 0.5623626708984375, 0.595184326171875, 0.6280059814453125, 0.66082763671875, 0.6936492919921875, 0.726470947265625, 0.7592926025390625, 0.7921142578125, 0.8249359130859375, 0.857757568359375, 0.8905792236328125, 0.92340087890625, 0.9562225341796875, 0.989044189453125, 1.0218658447265625, 1.0546875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 8.0, 14.0, 13.0, 15.0, 30.0, 18.0, 31.0, 39.0, 39.0, 39.0, 39.0, 60.0, 46.0, 41.0, 1087.0, 39.0, 42.0, 36.0, 44.0, 45.0, 54.0, 37.0, 31.0, 33.0, 23.0, 17.0, 15.0, 21.0, 15.0, 6.0, 10.0, 8.0, 6.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.75274658203125, -3.6304931640625, -3.50823974609375, -3.385986328125, -3.26373291015625, -3.1414794921875, -3.01922607421875, -2.89697265625, -2.77471923828125, -2.6524658203125, -2.53021240234375, -2.407958984375, -2.28570556640625, -2.1634521484375, -2.04119873046875, -1.9189453125, -1.79669189453125, -1.6744384765625, -1.55218505859375, -1.429931640625, -1.30767822265625, -1.1854248046875, -1.06317138671875, -0.94091796875, -0.81866455078125, -0.6964111328125, -0.57415771484375, -0.451904296875, -0.32965087890625, -0.2073974609375, -0.08514404296875, 0.037109375, 0.15936279296875, 0.2816162109375, 0.40386962890625, 0.526123046875, 0.64837646484375, 0.7706298828125, 0.89288330078125, 1.01513671875, 1.13739013671875, 1.2596435546875, 1.38189697265625, 1.504150390625, 1.62640380859375, 1.7486572265625, 1.87091064453125, 1.9931640625, 2.11541748046875, 2.2376708984375, 2.35992431640625, 2.482177734375, 2.60443115234375, 2.7266845703125, 2.84893798828125, 2.97119140625, 3.09344482421875, 3.2156982421875, 3.33795166015625, 3.460205078125, 3.58245849609375, 3.7047119140625, 3.82696533203125, 3.94921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 14.0, 5.0, 24.0, 44.0, 56.0, 82.0, 140.0, 198.0, 310.0, 500.0, 826.0, 1334.0, 2252.0, 4041.0, 6983.0, 12467.0, 22599.0, 42953.0, 86959.0, 216791.0, 1446668.0, 124925.0, 58652.0, 29979.0, 16468.0, 9123.0, 5277.0, 2999.0, 1806.0, 1029.0, 610.0, 369.0, 215.0, 155.0, 93.0, 59.0, 46.0, 27.0, 14.0, 5.0, 10.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3740234375, -1.331390380859375, -1.28875732421875, -1.246124267578125, -1.2034912109375, -1.160858154296875, -1.11822509765625, -1.075592041015625, -1.032958984375, -0.990325927734375, -0.94769287109375, -0.905059814453125, -0.8624267578125, -0.819793701171875, -0.77716064453125, -0.734527587890625, -0.69189453125, -0.649261474609375, -0.60662841796875, -0.563995361328125, -0.5213623046875, -0.478729248046875, -0.43609619140625, -0.393463134765625, -0.350830078125, -0.308197021484375, -0.26556396484375, -0.222930908203125, -0.1802978515625, -0.137664794921875, -0.09503173828125, -0.052398681640625, -0.009765625, 0.032867431640625, 0.07550048828125, 0.118133544921875, 0.1607666015625, 0.203399658203125, 0.24603271484375, 0.288665771484375, 0.331298828125, 0.373931884765625, 0.41656494140625, 0.459197998046875, 0.5018310546875, 0.544464111328125, 0.58709716796875, 0.629730224609375, 0.67236328125, 0.714996337890625, 0.75762939453125, 0.800262451171875, 0.8428955078125, 0.885528564453125, 0.92816162109375, 0.970794677734375, 1.013427734375, 1.056060791015625, 1.09869384765625, 1.141326904296875, 1.1839599609375, 1.226593017578125, 1.26922607421875, 1.311859130859375, 1.3544921875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 3.0, 6.0, 6.0, 6.0, 7.0, 4.0, 10.0, 15.0, 10.0, 24.0, 21.0, 29.0, 37.0, 36.0, 31.0, 39.0, 54.0, 58.0, 69.0, 57.0, 63.0, 72.0, 54.0, 40.0, 42.0, 34.0, 34.0, 20.0, 28.0, 18.0, 11.0, 15.0, 8.0, 7.0, 6.0, 3.0, 1.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007090568542480469, -0.0006872490048408508, -0.0006654411554336548, -0.0006436333060264587, -0.0006218254566192627, -0.0006000176072120667, -0.0005782097578048706, -0.0005564019083976746, -0.0005345940589904785, -0.0005127862095832825, -0.0004909783601760864, -0.0004691705107688904, -0.00044736266136169434, -0.0004255548119544983, -0.00040374696254730225, -0.0003819391131401062, -0.00036013126373291016, -0.0003383234143257141, -0.00031651556491851807, -0.000294707715511322, -0.000272899866104126, -0.00025109201669692993, -0.0002292841672897339, -0.00020747631788253784, -0.0001856684684753418, -0.00016386061906814575, -0.0001420527696609497, -0.00012024492025375366, -9.843707084655762e-05, -7.662922143936157e-05, -5.482137203216553e-05, -3.301352262496948e-05, -1.1205673217773438e-05, 1.0602176189422607e-05, 3.241002559661865e-05, 5.42178750038147e-05, 7.602572441101074e-05, 9.783357381820679e-05, 0.00011964142322540283, 0.00014144927263259888, 0.00016325712203979492, 0.00018506497144699097, 0.000206872820854187, 0.00022868067026138306, 0.0002504885196685791, 0.00027229636907577515, 0.0002941042184829712, 0.00031591206789016724, 0.0003377199172973633, 0.0003595277667045593, 0.00038133561611175537, 0.0004031434655189514, 0.00042495131492614746, 0.0004467591643333435, 0.00046856701374053955, 0.0004903748631477356, 0.0005121827125549316, 0.0005339905619621277, 0.0005557984113693237, 0.0005776062607765198, 0.0005994141101837158, 0.0006212219595909119, 0.0006430298089981079, 0.000664837658405304, 0.0006866455078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 10.0, 13.0, 10.0, 11.0, 18.0, 32.0, 21.0, 45.0, 69.0, 84.0, 138.0, 243.0, 451.0, 1041.0, 1035435.0, 9572.0, 565.0, 277.0, 142.0, 86.0, 63.0, 52.0, 41.0, 32.0, 12.0, 8.0, 11.0, 9.0, 10.0, 6.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017059326171875, -0.01650404930114746, -0.015948772430419922, -0.015393495559692383, -0.014838218688964844, -0.014282941818237305, -0.013727664947509766, -0.013172388076782227, -0.012617111206054688, -0.012061834335327148, -0.01150655746459961, -0.01095128059387207, -0.010396003723144531, -0.009840726852416992, -0.009285449981689453, -0.008730173110961914, -0.008174896240234375, -0.007619619369506836, -0.007064342498779297, -0.006509065628051758, -0.005953788757324219, -0.00539851188659668, -0.004843235015869141, -0.0042879581451416016, -0.0037326812744140625, -0.0031774044036865234, -0.0026221275329589844, -0.0020668506622314453, -0.0015115737915039062, -0.0009562969207763672, -0.0004010200500488281, 0.00015425682067871094, 0.00070953369140625, 0.001264810562133789, 0.0018200874328613281, 0.002375364303588867, 0.0029306411743164062, 0.0034859180450439453, 0.004041194915771484, 0.0045964717864990234, 0.0051517486572265625, 0.0057070255279541016, 0.006262302398681641, 0.00681757926940918, 0.007372856140136719, 0.007928133010864258, 0.008483409881591797, 0.009038686752319336, 0.009593963623046875, 0.010149240493774414, 0.010704517364501953, 0.011259794235229492, 0.011815071105957031, 0.01237034797668457, 0.01292562484741211, 0.013480901718139648, 0.014036178588867188, 0.014591455459594727, 0.015146732330322266, 0.015702009201049805, 0.016257286071777344, 0.016812562942504883, 0.017367839813232422, 0.01792311668395996, 0.0184783935546875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 47.0, 454.0, 456.0, 53.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013614033814519644, -0.0013109676074236631, -0.00126053171698004, -0.001210095826536417, -0.0011596600525081158, -0.0011092242784798145, -0.0010587883880361915, -0.0010083524975925684, -0.0009579167235642672, -0.000907480891328305, -0.0008570450590923429, -0.0008066092268563807, -0.0007561733946204185, -0.0007057375623844564, -0.0006553017301484942, -0.0006048658979125321, -0.0005544300656765699, -0.0005039942334406078, -0.00045355840120464563, -0.0004031225689686835, -0.00035268673673272133, -0.0003022509044967592, -0.000251815072260797, -0.00020137924002483487, -0.00015094340778887272, -0.00010050757555291057, -5.0071743316948414e-05, 3.6408891901373863e-07, 5.079992115497589e-05, 0.00010123575339093804, 0.0001516715856269002, 0.00020210741786286235, 0.00025254336651414633, 0.0003029791987501085, 0.00035341503098607063, 0.0004038508632220328, 0.00045428669545799494, 0.0005047225276939571, 0.0005551583599299192, 0.0006055941921658814, 0.0006560300244018435, 0.0007064658566378057, 0.0007569016888737679, 0.00080733752110973, 0.0008577733533456922, 0.0009082091855816543, 0.0009586450178176165, 0.0010090807918459177, 0.0010595166822895408, 0.0011099525727331638, 0.001160388346761465, 0.0012108241207897663, 0.0012612600112333894, 0.0013116959016770124, 0.0013621316757053137, 0.001412567449733615, 0.001463003340177238, 0.001513439230620861, 0.0015638750046491623, 0.0016143107786774635, 0.0016647466691210866, 0.0017151825595647097, 0.001765618333593011, 0.0018160541076213121, 0.0018664899980649352]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 5.0, 7.0, 4.0, 9.0, 19.0, 16.0, 21.0, 26.0, 18.0, 38.0, 37.0, 27.0, 39.0, 46.0, 40.0, 36.0, 35.0, 56.0, 46.0, 33.0, 45.0, 46.0, 41.0, 30.0, 34.0, 25.0, 31.0, 28.0, 21.0, 25.0, 15.0, 15.0, 14.0, 10.0, 8.0, 12.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003910064697265625, -0.00037881452590227127, -0.00036662258207798004, -0.0003544306382536888, -0.0003422386944293976, -0.00033004675060510635, -0.0003178548067808151, -0.0003056628629565239, -0.00029347091913223267, -0.00028127897530794144, -0.0002690870314836502, -0.000256895087659359, -0.00024470314383506775, -0.00023251120001077652, -0.0002203192561864853, -0.00020812731236219406, -0.00019593536853790283, -0.0001837434247136116, -0.00017155148088932037, -0.00015935953706502914, -0.00014716759324073792, -0.00013497564941644669, -0.00012278370559215546, -0.00011059176176786423, -9.8399817943573e-05, -8.620787411928177e-05, -7.401593029499054e-05, -6.182398647069931e-05, -4.963204264640808e-05, -3.744009882211685e-05, -2.5248154997825623e-05, -1.3056211173534393e-05, -8.642673492431641e-07, 1.1327676475048065e-05, 2.3519620299339294e-05, 3.5711564123630524e-05, 4.790350794792175e-05, 6.009545177221298e-05, 7.228739559650421e-05, 8.447933942079544e-05, 9.667128324508667e-05, 0.0001088632270693779, 0.00012105517089366913, 0.00013324711471796036, 0.0001454390585422516, 0.00015763100236654282, 0.00016982294619083405, 0.00018201489001512527, 0.0001942068338394165, 0.00020639877766370773, 0.00021859072148799896, 0.0002307826653122902, 0.00024297460913658142, 0.00025516655296087265, 0.0002673584967851639, 0.0002795504406094551, 0.00029174238443374634, 0.00030393432825803757, 0.0003161262720823288, 0.00032831821590662, 0.00034051015973091125, 0.0003527021035552025, 0.0003648940473794937, 0.00037708599120378494, 0.00038927793502807617]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 8.0, 6.0, 7.0, 18.0, 8.0, 18.0, 13.0, 24.0, 16.0, 20.0, 21.0, 20.0, 28.0, 38.0, 30.0, 32.0, 33.0, 39.0, 40.0, 42.0, 48.0, 45.0, 30.0, 34.0, 43.0, 36.0, 37.0, 44.0, 31.0, 28.0, 29.0, 15.0, 23.0, 23.0, 19.0, 7.0, 8.0, 6.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.21875, -5.062744140625, -4.90673828125, -4.750732421875, -4.5947265625, -4.438720703125, -4.28271484375, -4.126708984375, -3.970703125, -3.814697265625, -3.65869140625, -3.502685546875, -3.3466796875, -3.190673828125, -3.03466796875, -2.878662109375, -2.72265625, -2.566650390625, -2.41064453125, -2.254638671875, -2.0986328125, -1.942626953125, -1.78662109375, -1.630615234375, -1.474609375, -1.318603515625, -1.16259765625, -1.006591796875, -0.8505859375, -0.694580078125, -0.53857421875, -0.382568359375, -0.2265625, -0.070556640625, 0.08544921875, 0.241455078125, 0.3974609375, 0.553466796875, 0.70947265625, 0.865478515625, 1.021484375, 1.177490234375, 1.33349609375, 1.489501953125, 1.6455078125, 1.801513671875, 1.95751953125, 2.113525390625, 2.26953125, 2.425537109375, 2.58154296875, 2.737548828125, 2.8935546875, 3.049560546875, 3.20556640625, 3.361572265625, 3.517578125, 3.673583984375, 3.82958984375, 3.985595703125, 4.1416015625, 4.297607421875, 4.45361328125, 4.609619140625, 4.765625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 5.0, 12.0, 10.0, 24.0, 22.0, 31.0, 49.0, 46.0, 78.0, 99.0, 121.0, 181.0, 225.0, 315.0, 421.0, 717.0, 1122.0, 1715.0, 3138.0, 5626.0, 11692.0, 28085.0, 84247.0, 318212.0, 417127.0, 110453.0, 34714.0, 13880.0, 6747.0, 3541.0, 2105.0, 1198.0, 823.0, 500.0, 364.0, 248.0, 146.0, 128.0, 100.0, 72.0, 51.0, 37.0, 38.0, 21.0, 17.0, 11.0, 10.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.439453125, -3.33233642578125, -3.2252197265625, -3.11810302734375, -3.010986328125, -2.90386962890625, -2.7967529296875, -2.68963623046875, -2.58251953125, -2.47540283203125, -2.3682861328125, -2.26116943359375, -2.154052734375, -2.04693603515625, -1.9398193359375, -1.83270263671875, -1.7255859375, -1.61846923828125, -1.5113525390625, -1.40423583984375, -1.297119140625, -1.19000244140625, -1.0828857421875, -0.97576904296875, -0.86865234375, -0.76153564453125, -0.6544189453125, -0.54730224609375, -0.440185546875, -0.33306884765625, -0.2259521484375, -0.11883544921875, -0.01171875, 0.09539794921875, 0.2025146484375, 0.30963134765625, 0.416748046875, 0.52386474609375, 0.6309814453125, 0.73809814453125, 0.84521484375, 0.95233154296875, 1.0594482421875, 1.16656494140625, 1.273681640625, 1.38079833984375, 1.4879150390625, 1.59503173828125, 1.7021484375, 1.80926513671875, 1.9163818359375, 2.02349853515625, 2.130615234375, 2.23773193359375, 2.3448486328125, 2.45196533203125, 2.55908203125, 2.66619873046875, 2.7733154296875, 2.88043212890625, 2.987548828125, 3.09466552734375, 3.2017822265625, 3.30889892578125, 3.416015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 12.0, 6.0, 8.0, 12.0, 13.0, 12.0, 18.0, 12.0, 18.0, 24.0, 13.0, 31.0, 29.0, 25.0, 40.0, 39.0, 44.0, 47.0, 95.0, 1758.0, 271.0, 55.0, 43.0, 34.0, 47.0, 35.0, 40.0, 31.0, 30.0, 22.0, 22.0, 24.0, 16.0, 14.0, 19.0, 17.0, 14.0, 10.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-15.578125, -15.0882568359375, -14.598388671875, -14.1085205078125, -13.61865234375, -13.1287841796875, -12.638916015625, -12.1490478515625, -11.6591796875, -11.1693115234375, -10.679443359375, -10.1895751953125, -9.69970703125, -9.2098388671875, -8.719970703125, -8.2301025390625, -7.740234375, -7.2503662109375, -6.760498046875, -6.2706298828125, -5.78076171875, -5.2908935546875, -4.801025390625, -4.3111572265625, -3.8212890625, -3.3314208984375, -2.841552734375, -2.3516845703125, -1.86181640625, -1.3719482421875, -0.882080078125, -0.3922119140625, 0.09765625, 0.5875244140625, 1.077392578125, 1.5672607421875, 2.05712890625, 2.5469970703125, 3.036865234375, 3.5267333984375, 4.0166015625, 4.5064697265625, 4.996337890625, 5.4862060546875, 5.97607421875, 6.4659423828125, 6.955810546875, 7.4456787109375, 7.935546875, 8.4254150390625, 8.915283203125, 9.4051513671875, 9.89501953125, 10.3848876953125, 10.874755859375, 11.3646240234375, 11.8544921875, 12.3443603515625, 12.834228515625, 13.3240966796875, 13.81396484375, 14.3038330078125, 14.793701171875, 15.2835693359375, 15.7734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 7.0, 9.0, 16.0, 17.0, 17.0, 11.0, 26.0, 23.0, 23.0, 36.0, 42.0, 64.0, 90.0, 136.0, 193.0, 261.0, 569.0, 1977.0, 69682.0, 3058555.0, 11667.0, 1054.0, 384.0, 230.0, 167.0, 100.0, 66.0, 53.0, 33.0, 27.0, 29.0, 17.0, 17.0, 12.0, 11.0, 10.0, 16.0, 5.0, 7.0, 10.0, 4.0, 3.0, 1.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-26.046875, -25.24072265625, -24.4345703125, -23.62841796875, -22.822265625, -22.01611328125, -21.2099609375, -20.40380859375, -19.59765625, -18.79150390625, -17.9853515625, -17.17919921875, -16.373046875, -15.56689453125, -14.7607421875, -13.95458984375, -13.1484375, -12.34228515625, -11.5361328125, -10.72998046875, -9.923828125, -9.11767578125, -8.3115234375, -7.50537109375, -6.69921875, -5.89306640625, -5.0869140625, -4.28076171875, -3.474609375, -2.66845703125, -1.8623046875, -1.05615234375, -0.25, 0.55615234375, 1.3623046875, 2.16845703125, 2.974609375, 3.78076171875, 4.5869140625, 5.39306640625, 6.19921875, 7.00537109375, 7.8115234375, 8.61767578125, 9.423828125, 10.22998046875, 11.0361328125, 11.84228515625, 12.6484375, 13.45458984375, 14.2607421875, 15.06689453125, 15.873046875, 16.67919921875, 17.4853515625, 18.29150390625, 19.09765625, 19.90380859375, 20.7099609375, 21.51611328125, 22.322265625, 23.12841796875, 23.9345703125, 24.74072265625, 25.546875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 28.0, 72.0, 155.0, 246.0, 256.0, 153.0, 69.0, 20.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.558652400970459, -4.77003812789917, -3.9814236164093018, -3.1928091049194336, -2.4041948318481445, -1.6155805587768555, -0.8269658088684082, -0.03835153579711914, 0.7502627372741699, 1.5388771295547485, 2.327491521835327, 3.1161060333251953, 3.9047203063964844, 4.693334579467773, 5.481949329376221, 6.27056360244751, 7.059177875518799, 7.847792148590088, 8.636406898498535, 9.425021171569824, 10.213635444641113, 11.002249717712402, 11.790864944458008, 12.579479217529297, 13.368093490600586, 14.156707763671875, 14.945322036743164, 15.733936309814453, 16.522550582885742, 17.31116485595703, 18.099781036376953, 18.88839340209961, 19.67700958251953, 20.46562385559082, 21.25423812866211, 22.0428524017334, 22.831466674804688, 23.620080947875977, 24.408695220947266, 25.197311401367188, 25.985923767089844, 26.774538040161133, 27.563152313232422, 28.35176658630371, 29.140380859375, 29.92899513244629, 30.717609405517578, 31.5062255859375, 32.294837951660156, 33.08345413208008, 33.872066497802734, 34.660682678222656, 35.44929504394531, 36.237911224365234, 37.02652359008789, 37.81513977050781, 38.603755950927734, 39.392372131347656, 40.18098449707031, 40.969600677490234, 41.75821304321289, 42.54682922363281, 43.33544158935547, 44.12405776977539, 44.91267013549805]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 7.0, 13.0, 19.0, 13.0, 17.0, 10.0, 14.0, 22.0, 31.0, 31.0, 35.0, 42.0, 31.0, 43.0, 36.0, 37.0, 43.0, 40.0, 39.0, 36.0, 50.0, 47.0, 28.0, 33.0, 38.0, 32.0, 23.0, 25.0, 18.0, 22.0, 16.0, 13.0, 19.0, 14.0, 14.0, 8.0, 7.0, 4.0, 3.0, 3.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.31560134887695, -49.705810546875, -48.09601974487305, -46.486228942871094, -44.876441955566406, -43.26665115356445, -41.6568603515625, -40.04706954956055, -38.437278747558594, -36.82748794555664, -35.21769714355469, -33.60791015625, -31.998119354248047, -30.388328552246094, -28.77853775024414, -27.168746948242188, -25.5589599609375, -23.949169158935547, -22.339380264282227, -20.729589462280273, -19.119800567626953, -17.510009765625, -15.900218963623047, -14.29042911529541, -12.680639266967773, -11.070849418640137, -9.4610595703125, -7.851268768310547, -6.24147891998291, -4.631689071655273, -3.0218982696533203, -1.4121084213256836, 0.1976776123046875, 1.8074676990509033, 3.417257785797119, 5.027048110961914, 6.636837959289551, 8.246627807617188, 9.85641860961914, 11.466208457946777, 13.075998306274414, 14.68578815460205, 16.295578002929688, 17.90536880493164, 19.515159606933594, 21.124948501586914, 22.734739303588867, 24.344528198242188, 25.95431900024414, 27.564109802246094, 29.173898696899414, 30.783689498901367, 32.39347839355469, 34.00326919555664, 35.613059997558594, 37.22285079956055, 38.8326416015625, 40.44243240356445, 42.052223205566406, 43.662010192871094, 45.27180099487305, 46.881591796875, 48.49138259887695, 50.101173400878906, 51.710960388183594]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 13.0, 9.0, 8.0, 18.0, 13.0, 21.0, 24.0, 17.0, 18.0, 26.0, 30.0, 27.0, 36.0, 25.0, 36.0, 36.0, 41.0, 46.0, 41.0, 40.0, 41.0, 24.0, 42.0, 43.0, 39.0, 30.0, 35.0, 29.0, 28.0, 20.0, 29.0, 17.0, 20.0, 12.0, 8.0, 7.0, 8.0, 5.0, 7.0, 1.0, 8.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.21484375, -5.0595703125, -4.904296875, -4.7490234375, -4.59375, -4.4384765625, -4.283203125, -4.1279296875, -3.97265625, -3.8173828125, -3.662109375, -3.5068359375, -3.3515625, -3.1962890625, -3.041015625, -2.8857421875, -2.73046875, -2.5751953125, -2.419921875, -2.2646484375, -2.109375, -1.9541015625, -1.798828125, -1.6435546875, -1.48828125, -1.3330078125, -1.177734375, -1.0224609375, -0.8671875, -0.7119140625, -0.556640625, -0.4013671875, -0.24609375, -0.0908203125, 0.064453125, 0.2197265625, 0.375, 0.5302734375, 0.685546875, 0.8408203125, 0.99609375, 1.1513671875, 1.306640625, 1.4619140625, 1.6171875, 1.7724609375, 1.927734375, 2.0830078125, 2.23828125, 2.3935546875, 2.548828125, 2.7041015625, 2.859375, 3.0146484375, 3.169921875, 3.3251953125, 3.48046875, 3.6357421875, 3.791015625, 3.9462890625, 4.1015625, 4.2568359375, 4.412109375, 4.5673828125, 4.72265625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 10.0, 8.0, 6.0, 9.0, 5.0, 13.0, 17.0, 17.0, 24.0, 33.0, 47.0, 65.0, 94.0, 131.0, 246.0, 446.0, 1307.0, 4643.0, 21051.0, 140324.0, 1002933.0, 2187289.0, 715552.0, 98960.0, 15395.0, 3521.0, 1027.0, 416.0, 210.0, 141.0, 90.0, 57.0, 33.0, 32.0, 21.0, 29.0, 15.0, 9.0, 10.0, 8.0, 8.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-9.953125, -9.663818359375, -9.37451171875, -9.085205078125, -8.7958984375, -8.506591796875, -8.21728515625, -7.927978515625, -7.638671875, -7.349365234375, -7.06005859375, -6.770751953125, -6.4814453125, -6.192138671875, -5.90283203125, -5.613525390625, -5.32421875, -5.034912109375, -4.74560546875, -4.456298828125, -4.1669921875, -3.877685546875, -3.58837890625, -3.299072265625, -3.009765625, -2.720458984375, -2.43115234375, -2.141845703125, -1.8525390625, -1.563232421875, -1.27392578125, -0.984619140625, -0.6953125, -0.406005859375, -0.11669921875, 0.172607421875, 0.4619140625, 0.751220703125, 1.04052734375, 1.329833984375, 1.619140625, 1.908447265625, 2.19775390625, 2.487060546875, 2.7763671875, 3.065673828125, 3.35498046875, 3.644287109375, 3.93359375, 4.222900390625, 4.51220703125, 4.801513671875, 5.0908203125, 5.380126953125, 5.66943359375, 5.958740234375, 6.248046875, 6.537353515625, 6.82666015625, 7.115966796875, 7.4052734375, 7.694580078125, 7.98388671875, 8.273193359375, 8.5625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 6.0, 14.0, 15.0, 18.0, 25.0, 30.0, 58.0, 82.0, 134.0, 225.0, 329.0, 525.0, 709.0, 622.0, 456.0, 296.0, 173.0, 121.0, 82.0, 55.0, 35.0, 14.0, 17.0, 10.0, 5.0, 6.0, 4.0, 6.0, 0.0, 4.0, 2.0, 2.0], "bins": [-29.859375, -29.19189453125, -28.5244140625, -27.85693359375, -27.189453125, -26.52197265625, -25.8544921875, -25.18701171875, -24.51953125, -23.85205078125, -23.1845703125, -22.51708984375, -21.849609375, -21.18212890625, -20.5146484375, -19.84716796875, -19.1796875, -18.51220703125, -17.8447265625, -17.17724609375, -16.509765625, -15.84228515625, -15.1748046875, -14.50732421875, -13.83984375, -13.17236328125, -12.5048828125, -11.83740234375, -11.169921875, -10.50244140625, -9.8349609375, -9.16748046875, -8.5, -7.83251953125, -7.1650390625, -6.49755859375, -5.830078125, -5.16259765625, -4.4951171875, -3.82763671875, -3.16015625, -2.49267578125, -1.8251953125, -1.15771484375, -0.490234375, 0.17724609375, 0.8447265625, 1.51220703125, 2.1796875, 2.84716796875, 3.5146484375, 4.18212890625, 4.849609375, 5.51708984375, 6.1845703125, 6.85205078125, 7.51953125, 8.18701171875, 8.8544921875, 9.52197265625, 10.189453125, 10.85693359375, 11.5244140625, 12.19189453125, 12.859375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 18.0, 28.0, 34.0, 51.0, 85.0, 126.0, 215.0, 379.0, 1186.0, 190204.0, 3998534.0, 2308.0, 451.0, 223.0, 119.0, 101.0, 55.0, 29.0, 32.0, 17.0, 16.0, 12.0, 9.0, 3.0, 2.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.71875, -59.75634765625, -56.7939453125, -53.83154296875, -50.869140625, -47.90673828125, -44.9443359375, -41.98193359375, -39.01953125, -36.05712890625, -33.0947265625, -30.13232421875, -27.169921875, -24.20751953125, -21.2451171875, -18.28271484375, -15.3203125, -12.35791015625, -9.3955078125, -6.43310546875, -3.470703125, -0.50830078125, 2.4541015625, 5.41650390625, 8.37890625, 11.34130859375, 14.3037109375, 17.26611328125, 20.228515625, 23.19091796875, 26.1533203125, 29.11572265625, 32.078125, 35.04052734375, 38.0029296875, 40.96533203125, 43.927734375, 46.89013671875, 49.8525390625, 52.81494140625, 55.77734375, 58.73974609375, 61.7021484375, 64.66455078125, 67.626953125, 70.58935546875, 73.5517578125, 76.51416015625, 79.4765625, 82.43896484375, 85.4013671875, 88.36376953125, 91.326171875, 94.28857421875, 97.2509765625, 100.21337890625, 103.17578125, 106.13818359375, 109.1005859375, 112.06298828125, 115.025390625, 117.98779296875, 120.9501953125, 123.91259765625, 126.875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 145.0, 828.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-699.7406616210938, -686.6278076171875, -673.5150146484375, -660.4021606445312, -647.2893676757812, -634.176513671875, -621.0636596679688, -607.9508666992188, -594.8380126953125, -581.7251586914062, -568.6123657226562, -555.49951171875, -542.38671875, -529.2738647460938, -516.1610107421875, -503.0482177734375, -489.93536376953125, -476.8225402832031, -463.709716796875, -450.59686279296875, -437.4840393066406, -424.3712158203125, -411.2583923339844, -398.14556884765625, -385.0327453613281, -371.919921875, -358.8070983886719, -345.6942443847656, -332.5814208984375, -319.4685974121094, -306.35577392578125, -293.242919921875, -280.13006591796875, -267.0172424316406, -253.90440368652344, -240.7915802001953, -227.67874145507812, -214.56591796875, -201.45309448242188, -188.3402557373047, -175.22744750976562, -162.1146240234375, -149.0017852783203, -135.8889617919922, -122.776123046875, -109.66329956054688, -96.55046844482422, -83.43763732910156, -70.32479858398438, -57.21196746826172, -44.09913635253906, -30.986309051513672, -17.873477935791016, -4.760650634765625, 8.352180480957031, 21.465011596679688, 34.577842712402344, 47.690673828125, 60.803504943847656, 73.91633605957031, 87.02915954589844, 100.1419906616211, 113.25482177734375, 126.3676528930664, 139.48048400878906]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 7.0, 4.0, 5.0, 6.0, 7.0, 8.0, 3.0, 5.0, 11.0, 16.0, 13.0, 19.0, 26.0, 16.0, 25.0, 27.0, 21.0, 24.0, 31.0, 32.0, 30.0, 40.0, 36.0, 34.0, 46.0, 29.0, 44.0, 43.0, 30.0, 27.0, 24.0, 32.0, 35.0, 24.0, 20.0, 25.0, 21.0, 22.0, 26.0, 21.0, 13.0, 24.0, 14.0, 9.0, 6.0, 7.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.25187301635742, -42.79163360595703, -41.331398010253906, -39.87116241455078, -38.41092300415039, -36.95068359375, -35.490447998046875, -34.03021240234375, -32.56997299194336, -31.1097354888916, -29.649497985839844, -28.189260482788086, -26.729022979736328, -25.26878547668457, -23.808547973632812, -22.348310470581055, -20.888072967529297, -19.42783546447754, -17.96759796142578, -16.507360458374023, -15.047122955322266, -13.586885452270508, -12.12664794921875, -10.666410446166992, -9.206172943115234, -7.745935440063477, -6.285697937011719, -4.825460433959961, -3.365222930908203, -1.9049854278564453, -0.4447479248046875, 1.0154895782470703, 2.4757232666015625, 3.9359607696533203, 5.396198272705078, 6.856435775756836, 8.316673278808594, 9.776910781860352, 11.23714828491211, 12.697385787963867, 14.157623291015625, 15.617860794067383, 17.07809829711914, 18.5383358001709, 19.998573303222656, 21.458810806274414, 22.919048309326172, 24.37928581237793, 25.839523315429688, 27.299760818481445, 28.759998321533203, 30.22023582458496, 31.68047332763672, 33.140708923339844, 34.600948333740234, 36.061187744140625, 37.52142333984375, 38.981658935546875, 40.441898345947266, 41.902137756347656, 43.36237335205078, 44.822608947753906, 46.2828483581543, 47.74308776855469, 49.20332336425781]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 11.0, 5.0, 5.0, 4.0, 12.0, 14.0, 16.0, 18.0, 16.0, 23.0, 29.0, 35.0, 22.0, 31.0, 23.0, 38.0, 33.0, 32.0, 42.0, 41.0, 42.0, 37.0, 34.0, 35.0, 38.0, 42.0, 42.0, 25.0, 38.0, 31.0, 32.0, 17.0, 32.0, 22.0, 12.0, 12.0, 7.0, 11.0, 5.0, 4.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.1171875, -4.9609375, -4.8046875, -4.6484375, -4.4921875, -4.3359375, -4.1796875, -4.0234375, -3.8671875, -3.7109375, -3.5546875, -3.3984375, -3.2421875, -3.0859375, -2.9296875, -2.7734375, -2.6171875, -2.4609375, -2.3046875, -2.1484375, -1.9921875, -1.8359375, -1.6796875, -1.5234375, -1.3671875, -1.2109375, -1.0546875, -0.8984375, -0.7421875, -0.5859375, -0.4296875, -0.2734375, -0.1171875, 0.0390625, 0.1953125, 0.3515625, 0.5078125, 0.6640625, 0.8203125, 0.9765625, 1.1328125, 1.2890625, 1.4453125, 1.6015625, 1.7578125, 1.9140625, 2.0703125, 2.2265625, 2.3828125, 2.5390625, 2.6953125, 2.8515625, 3.0078125, 3.1640625, 3.3203125, 3.4765625, 3.6328125, 3.7890625, 3.9453125, 4.1015625, 4.2578125, 4.4140625, 4.5703125, 4.7265625, 4.8828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 19.0, 18.0, 25.0, 33.0, 53.0, 87.0, 114.0, 147.0, 235.0, 376.0, 522.0, 759.0, 1167.0, 1637.0, 2429.0, 3604.0, 5352.0, 8212.0, 12405.0, 18742.0, 29494.0, 46679.0, 77638.0, 143872.0, 315618.0, 157232.0, 82815.0, 49397.0, 31223.0, 19552.0, 13225.0, 8544.0, 5492.0, 3875.0, 2486.0, 1793.0, 1150.0, 822.0, 556.0, 365.0, 236.0, 184.0, 127.0, 76.0, 53.0, 34.0, 30.0, 21.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.99853515625, -0.967864990234375, -0.93719482421875, -0.906524658203125, -0.8758544921875, -0.845184326171875, -0.81451416015625, -0.783843994140625, -0.753173828125, -0.722503662109375, -0.69183349609375, -0.661163330078125, -0.6304931640625, -0.599822998046875, -0.56915283203125, -0.538482666015625, -0.5078125, -0.477142333984375, -0.44647216796875, -0.415802001953125, -0.3851318359375, -0.354461669921875, -0.32379150390625, -0.293121337890625, -0.262451171875, -0.231781005859375, -0.20111083984375, -0.170440673828125, -0.1397705078125, -0.109100341796875, -0.07843017578125, -0.047760009765625, -0.01708984375, 0.013580322265625, 0.04425048828125, 0.074920654296875, 0.1055908203125, 0.136260986328125, 0.16693115234375, 0.197601318359375, 0.228271484375, 0.258941650390625, 0.28961181640625, 0.320281982421875, 0.3509521484375, 0.381622314453125, 0.41229248046875, 0.442962646484375, 0.4736328125, 0.504302978515625, 0.53497314453125, 0.565643310546875, 0.5963134765625, 0.626983642578125, 0.65765380859375, 0.688323974609375, 0.718994140625, 0.749664306640625, 0.78033447265625, 0.811004638671875, 0.8416748046875, 0.872344970703125, 0.90301513671875, 0.933685302734375, 0.96435546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 5.0, 3.0, 5.0, 13.0, 16.0, 5.0, 16.0, 15.0, 25.0, 14.0, 29.0, 25.0, 34.0, 36.0, 34.0, 41.0, 39.0, 44.0, 35.0, 36.0, 35.0, 1058.0, 41.0, 22.0, 40.0, 43.0, 37.0, 34.0, 28.0, 38.0, 29.0, 19.0, 24.0, 21.0, 16.0, 11.0, 7.0, 7.0, 9.0, 7.0, 5.0, 6.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.271484375, -3.169647216796875, -3.06781005859375, -2.965972900390625, -2.8641357421875, -2.762298583984375, -2.66046142578125, -2.558624267578125, -2.456787109375, -2.354949951171875, -2.25311279296875, -2.151275634765625, -2.0494384765625, -1.947601318359375, -1.84576416015625, -1.743927001953125, -1.64208984375, -1.540252685546875, -1.43841552734375, -1.336578369140625, -1.2347412109375, -1.132904052734375, -1.03106689453125, -0.929229736328125, -0.827392578125, -0.725555419921875, -0.62371826171875, -0.521881103515625, -0.4200439453125, -0.318206787109375, -0.21636962890625, -0.114532470703125, -0.0126953125, 0.089141845703125, 0.19097900390625, 0.292816162109375, 0.3946533203125, 0.496490478515625, 0.59832763671875, 0.700164794921875, 0.802001953125, 0.903839111328125, 1.00567626953125, 1.107513427734375, 1.2093505859375, 1.311187744140625, 1.41302490234375, 1.514862060546875, 1.61669921875, 1.718536376953125, 1.82037353515625, 1.922210693359375, 2.0240478515625, 2.125885009765625, 2.22772216796875, 2.329559326171875, 2.431396484375, 2.533233642578125, 2.63507080078125, 2.736907958984375, 2.8387451171875, 2.940582275390625, 3.04241943359375, 3.144256591796875, 3.24609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 7.0, 12.0, 12.0, 15.0, 28.0, 46.0, 80.0, 89.0, 137.0, 193.0, 316.0, 480.0, 765.0, 1166.0, 1894.0, 2911.0, 4583.0, 7319.0, 11694.0, 19406.0, 32859.0, 57100.0, 109513.0, 1335708.0, 268375.0, 105261.0, 55749.0, 31645.0, 18874.0, 11438.0, 7092.0, 4380.0, 2834.0, 1797.0, 1173.0, 748.0, 520.0, 305.0, 194.0, 128.0, 103.0, 68.0, 40.0, 29.0, 14.0, 9.0, 11.0, 9.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1376953125, -1.10211181640625, -1.0665283203125, -1.03094482421875, -0.995361328125, -0.95977783203125, -0.9241943359375, -0.88861083984375, -0.85302734375, -0.81744384765625, -0.7818603515625, -0.74627685546875, -0.710693359375, -0.67510986328125, -0.6395263671875, -0.60394287109375, -0.568359375, -0.53277587890625, -0.4971923828125, -0.46160888671875, -0.426025390625, -0.39044189453125, -0.3548583984375, -0.31927490234375, -0.28369140625, -0.24810791015625, -0.2125244140625, -0.17694091796875, -0.141357421875, -0.10577392578125, -0.0701904296875, -0.03460693359375, 0.0009765625, 0.03656005859375, 0.0721435546875, 0.10772705078125, 0.143310546875, 0.17889404296875, 0.2144775390625, 0.25006103515625, 0.28564453125, 0.32122802734375, 0.3568115234375, 0.39239501953125, 0.427978515625, 0.46356201171875, 0.4991455078125, 0.53472900390625, 0.5703125, 0.60589599609375, 0.6414794921875, 0.67706298828125, 0.712646484375, 0.74822998046875, 0.7838134765625, 0.81939697265625, 0.85498046875, 0.89056396484375, 0.9261474609375, 0.96173095703125, 0.997314453125, 1.03289794921875, 1.0684814453125, 1.10406494140625, 1.1396484375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 7.0, 10.0, 7.0, 16.0, 19.0, 15.0, 36.0, 26.0, 41.0, 37.0, 58.0, 75.0, 63.0, 78.0, 90.0, 71.0, 67.0, 63.0, 56.0, 26.0, 29.0, 20.0, 15.0, 15.0, 11.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0006504058837890625, -0.0006311535835266113, -0.0006119012832641602, -0.000592648983001709, -0.0005733966827392578, -0.0005541443824768066, -0.0005348920822143555, -0.0005156397819519043, -0.0004963874816894531, -0.00047713518142700195, -0.0004578828811645508, -0.0004386305809020996, -0.00041937828063964844, -0.00040012598037719727, -0.0003808736801147461, -0.0003616213798522949, -0.00034236907958984375, -0.0003231167793273926, -0.0003038644790649414, -0.00028461217880249023, -0.00026535987854003906, -0.0002461075782775879, -0.00022685527801513672, -0.00020760297775268555, -0.00018835067749023438, -0.0001690983772277832, -0.00014984607696533203, -0.00013059377670288086, -0.00011134147644042969, -9.208917617797852e-05, -7.283687591552734e-05, -5.358457565307617e-05, -3.4332275390625e-05, -1.5079975128173828e-05, 4.172325134277344e-06, 2.3424625396728516e-05, 4.267692565917969e-05, 6.192922592163086e-05, 8.118152618408203e-05, 0.0001004338264465332, 0.00011968612670898438, 0.00013893842697143555, 0.00015819072723388672, 0.0001774430274963379, 0.00019669532775878906, 0.00021594762802124023, 0.0002351999282836914, 0.0002544522285461426, 0.00027370452880859375, 0.0002929568290710449, 0.0003122091293334961, 0.00033146142959594727, 0.00035071372985839844, 0.0003699660301208496, 0.0003892183303833008, 0.00040847063064575195, 0.0004277229309082031, 0.0004469752311706543, 0.00046622753143310547, 0.00048547983169555664, 0.0005047321319580078, 0.000523984432220459, 0.0005432367324829102, 0.0005624890327453613, 0.0005817413330078125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 4.0, 5.0, 9.0, 13.0, 6.0, 15.0, 17.0, 27.0, 33.0, 59.0, 122.0, 182.0, 342.0, 844.0, 528441.0, 516755.0, 817.0, 358.0, 168.0, 92.0, 62.0, 47.0, 27.0, 25.0, 15.0, 17.0, 8.0, 8.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0151214599609375, -0.014633655548095703, -0.014145851135253906, -0.01365804672241211, -0.013170242309570312, -0.012682437896728516, -0.012194633483886719, -0.011706829071044922, -0.011219024658203125, -0.010731220245361328, -0.010243415832519531, -0.009755611419677734, -0.009267807006835938, -0.00878000259399414, -0.008292198181152344, -0.007804393768310547, -0.00731658935546875, -0.006828784942626953, -0.006340980529785156, -0.005853176116943359, -0.0053653717041015625, -0.004877567291259766, -0.004389762878417969, -0.003901958465576172, -0.003414154052734375, -0.002926349639892578, -0.0024385452270507812, -0.0019507408142089844, -0.0014629364013671875, -0.0009751319885253906, -0.00048732757568359375, 4.76837158203125e-07, 0.00048828125, 0.0009760856628417969, 0.0014638900756835938, 0.0019516944885253906, 0.0024394989013671875, 0.0029273033142089844, 0.0034151077270507812, 0.003902912139892578, 0.004390716552734375, 0.004878520965576172, 0.005366325378417969, 0.005854129791259766, 0.0063419342041015625, 0.006829738616943359, 0.007317543029785156, 0.007805347442626953, 0.00829315185546875, 0.008780956268310547, 0.009268760681152344, 0.00975656509399414, 0.010244369506835938, 0.010732173919677734, 0.011219978332519531, 0.011707782745361328, 0.012195587158203125, 0.012683391571044922, 0.013171195983886719, 0.013659000396728516, 0.014146804809570312, 0.01463460922241211, 0.015122413635253906, 0.015610218048095703, 0.0160980224609375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 19.0, 31.0, 64.0, 124.0, 158.0, 185.0, 160.0, 123.0, 71.0, 39.0, 15.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000505690579302609, -0.0004914581659249961, -0.00047722572344355285, -0.00046299331006594, -0.00044876086758449674, -0.0004345284542068839, -0.0004202960408292711, -0.0004060635983478278, -0.0003918311558663845, -0.0003775987424887717, -0.0003633663000073284, -0.00034913388662971556, -0.0003349014441482723, -0.00032066903077065945, -0.0003064366173930466, -0.00029220417491160333, -0.0002779717615339905, -0.0002637393481563777, -0.0002495069056749344, -0.00023527449229732156, -0.00022104204981587827, -0.00020680963643826544, -0.00019257720850873739, -0.00017834478057920933, -0.00016411235264968127, -0.0001498799247201532, -0.00013564749679062515, -0.00012141507613705471, -0.00010718264820752665, -9.29502202779986e-05, -7.871779962442815e-05, -6.44853716949001e-05, -5.0252972869202495e-05, -3.602054493967444e-05, -2.1788120648125187e-05, -7.555696356575936e-06, 6.6767315729521215e-06, 2.090915950248018e-05, 3.514158015605062e-05, 4.937400808557868e-05, 6.360643601510674e-05, 7.78388639446348e-05, 9.207129187416285e-05, 0.0001063037125277333, 0.00012053614045726135, 0.00013476857566274703, 0.00014900098904035985, 0.0001632334169698879, 0.00017746584489941597, 0.00019169827282894403, 0.00020593070075847208, 0.00022016311413608491, 0.0002343955566175282, 0.00024862796999514103, 0.00026286038337275386, 0.00027709282585419714, 0.00029132526833564043, 0.00030555768171325326, 0.00031979012419469655, 0.0003340225375723094, 0.00034825498005375266, 0.0003624873934313655, 0.0003767198068089783, 0.0003909522492904216, 0.00040518466266803443]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 15.0, 12.0, 10.0, 18.0, 13.0, 15.0, 15.0, 18.0, 25.0, 35.0, 23.0, 28.0, 39.0, 34.0, 43.0, 48.0, 54.0, 35.0, 36.0, 39.0, 36.0, 40.0, 33.0, 36.0, 28.0, 31.0, 39.0, 21.0, 25.0, 21.0, 17.0, 26.0, 16.0, 18.0, 10.0, 7.0, 10.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00024396181106567383, -0.0002355361357331276, -0.00022711046040058136, -0.00021868478506803513, -0.0002102591097354889, -0.00020183343440294266, -0.00019340775907039642, -0.0001849820837378502, -0.00017655640840530396, -0.00016813073307275772, -0.0001597050577402115, -0.00015127938240766525, -0.00014285370707511902, -0.00013442803174257278, -0.00012600235641002655, -0.00011757668107748032, -0.00010915100574493408, -0.00010072533041238785, -9.229965507984161e-05, -8.387397974729538e-05, -7.544830441474915e-05, -6.702262908220291e-05, -5.859695374965668e-05, -5.017127841711044e-05, -4.174560308456421e-05, -3.3319927752017975e-05, -2.489425241947174e-05, -1.6468577086925507e-05, -8.042901754379272e-06, 3.8277357816696167e-07, 8.808448910713196e-06, 1.723412424325943e-05, 2.5659799575805664e-05, 3.40854749083519e-05, 4.251115024089813e-05, 5.0936825573444366e-05, 5.93625009059906e-05, 6.778817623853683e-05, 7.621385157108307e-05, 8.46395269036293e-05, 9.306520223617554e-05, 0.00010149087756872177, 0.000109916552901268, 0.00011834222823381424, 0.00012676790356636047, 0.0001351935788989067, 0.00014361925423145294, 0.00015204492956399918, 0.0001604706048965454, 0.00016889628022909164, 0.00017732195556163788, 0.0001857476308941841, 0.00019417330622673035, 0.00020259898155927658, 0.00021102465689182281, 0.00021945033222436905, 0.00022787600755691528, 0.00023630168288946152, 0.00024472735822200775, 0.000253153033554554, 0.0002615787088871002, 0.00027000438421964645, 0.0002784300595521927, 0.0002868557348847389, 0.00029528141021728516]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 11.0, 5.0, 5.0, 4.0, 12.0, 14.0, 16.0, 18.0, 16.0, 23.0, 29.0, 35.0, 22.0, 31.0, 23.0, 38.0, 33.0, 32.0, 42.0, 41.0, 42.0, 37.0, 34.0, 35.0, 38.0, 42.0, 42.0, 26.0, 37.0, 31.0, 32.0, 17.0, 32.0, 22.0, 12.0, 12.0, 7.0, 11.0, 5.0, 4.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.1171875, -4.9609375, -4.8046875, -4.6484375, -4.4921875, -4.3359375, -4.1796875, -4.0234375, -3.8671875, -3.7109375, -3.5546875, -3.3984375, -3.2421875, -3.0859375, -2.9296875, -2.7734375, -2.6171875, -2.4609375, -2.3046875, -2.1484375, -1.9921875, -1.8359375, -1.6796875, -1.5234375, -1.3671875, -1.2109375, -1.0546875, -0.8984375, -0.7421875, -0.5859375, -0.4296875, -0.2734375, -0.1171875, 0.0390625, 0.1953125, 0.3515625, 0.5078125, 0.6640625, 0.8203125, 0.9765625, 1.1328125, 1.2890625, 1.4453125, 1.6015625, 1.7578125, 1.9140625, 2.0703125, 2.2265625, 2.3828125, 2.5390625, 2.6953125, 2.8515625, 3.0078125, 3.1640625, 3.3203125, 3.4765625, 3.6328125, 3.7890625, 3.9453125, 4.1015625, 4.2578125, 4.4140625, 4.5703125, 4.7265625, 4.8828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 11.0, 6.0, 5.0, 7.0, 14.0, 25.0, 37.0, 41.0, 72.0, 140.0, 200.0, 368.0, 630.0, 1094.0, 2104.0, 4019.0, 8175.0, 18180.0, 43693.0, 118562.0, 316456.0, 328423.0, 124043.0, 45689.0, 18736.0, 8651.0, 4243.0, 2136.0, 1160.0, 642.0, 382.0, 208.0, 139.0, 75.0, 55.0, 30.0, 28.0, 18.0, 10.0, 5.0, 10.0, 7.0, 5.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.212890625, -3.1156005859375, -3.018310546875, -2.9210205078125, -2.82373046875, -2.7264404296875, -2.629150390625, -2.5318603515625, -2.4345703125, -2.3372802734375, -2.239990234375, -2.1427001953125, -2.04541015625, -1.9481201171875, -1.850830078125, -1.7535400390625, -1.65625, -1.5589599609375, -1.461669921875, -1.3643798828125, -1.26708984375, -1.1697998046875, -1.072509765625, -0.9752197265625, -0.8779296875, -0.7806396484375, -0.683349609375, -0.5860595703125, -0.48876953125, -0.3914794921875, -0.294189453125, -0.1968994140625, -0.099609375, -0.0023193359375, 0.094970703125, 0.1922607421875, 0.28955078125, 0.3868408203125, 0.484130859375, 0.5814208984375, 0.6787109375, 0.7760009765625, 0.873291015625, 0.9705810546875, 1.06787109375, 1.1651611328125, 1.262451171875, 1.3597412109375, 1.45703125, 1.5543212890625, 1.651611328125, 1.7489013671875, 1.84619140625, 1.9434814453125, 2.040771484375, 2.1380615234375, 2.2353515625, 2.3326416015625, 2.429931640625, 2.5272216796875, 2.62451171875, 2.7218017578125, 2.819091796875, 2.9163818359375, 3.013671875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 7.0, 8.0, 9.0, 8.0, 14.0, 23.0, 23.0, 29.0, 30.0, 40.0, 45.0, 44.0, 54.0, 64.0, 112.0, 1773.0, 277.0, 104.0, 59.0, 49.0, 45.0, 61.0, 29.0, 28.0, 21.0, 27.0, 24.0, 8.0, 11.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.6875, -23.9345703125, -23.181640625, -22.4287109375, -21.67578125, -20.9228515625, -20.169921875, -19.4169921875, -18.6640625, -17.9111328125, -17.158203125, -16.4052734375, -15.65234375, -14.8994140625, -14.146484375, -13.3935546875, -12.640625, -11.8876953125, -11.134765625, -10.3818359375, -9.62890625, -8.8759765625, -8.123046875, -7.3701171875, -6.6171875, -5.8642578125, -5.111328125, -4.3583984375, -3.60546875, -2.8525390625, -2.099609375, -1.3466796875, -0.59375, 0.1591796875, 0.912109375, 1.6650390625, 2.41796875, 3.1708984375, 3.923828125, 4.6767578125, 5.4296875, 6.1826171875, 6.935546875, 7.6884765625, 8.44140625, 9.1943359375, 9.947265625, 10.7001953125, 11.453125, 12.2060546875, 12.958984375, 13.7119140625, 14.46484375, 15.2177734375, 15.970703125, 16.7236328125, 17.4765625, 18.2294921875, 18.982421875, 19.7353515625, 20.48828125, 21.2412109375, 21.994140625, 22.7470703125, 23.5]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 9.0, 12.0, 24.0, 27.0, 20.0, 33.0, 51.0, 92.0, 119.0, 187.0, 361.0, 1127.0, 32352.0, 3101385.0, 8301.0, 772.0, 283.0, 176.0, 109.0, 59.0, 47.0, 26.0, 24.0, 30.0, 16.0, 13.0, 8.0, 8.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.5673828125, -35.322265625, -34.0771484375, -32.83203125, -31.5869140625, -30.341796875, -29.0966796875, -27.8515625, -26.6064453125, -25.361328125, -24.1162109375, -22.87109375, -21.6259765625, -20.380859375, -19.1357421875, -17.890625, -16.6455078125, -15.400390625, -14.1552734375, -12.91015625, -11.6650390625, -10.419921875, -9.1748046875, -7.9296875, -6.6845703125, -5.439453125, -4.1943359375, -2.94921875, -1.7041015625, -0.458984375, 0.7861328125, 2.03125, 3.2763671875, 4.521484375, 5.7666015625, 7.01171875, 8.2568359375, 9.501953125, 10.7470703125, 11.9921875, 13.2373046875, 14.482421875, 15.7275390625, 16.97265625, 18.2177734375, 19.462890625, 20.7080078125, 21.953125, 23.1982421875, 24.443359375, 25.6884765625, 26.93359375, 28.1787109375, 29.423828125, 30.6689453125, 31.9140625, 33.1591796875, 34.404296875, 35.6494140625, 36.89453125, 38.1396484375, 39.384765625, 40.6298828125, 41.875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 10.0, 181.0, 631.0, 186.0, 8.0, 1.0, 0.0, 1.0], "bins": [-170.9716339111328, -168.04742431640625, -165.12322998046875, -162.1990203857422, -159.27481079101562, -156.35061645507812, -153.42640686035156, -150.502197265625, -147.57798767089844, -144.65377807617188, -141.72958374023438, -138.8053741455078, -135.88116455078125, -132.95697021484375, -130.0327606201172, -127.10855102539062, -124.18435668945312, -121.2601547241211, -118.33594512939453, -115.4117431640625, -112.48753356933594, -109.5633316040039, -106.63912963867188, -103.71492004394531, -100.79071044921875, -97.86650848388672, -94.94229888916016, -92.01809692382812, -89.09388732910156, -86.16968536376953, -83.2454833984375, -80.32127380371094, -77.39707946777344, -74.4728775024414, -71.54866790771484, -68.62446594238281, -65.70025634765625, -62.77605438232422, -59.85184860229492, -56.927642822265625, -54.00343704223633, -51.07923126220703, -48.155025482177734, -45.23081970214844, -42.306617736816406, -39.38241195678711, -36.45820617675781, -33.53400421142578, -30.60979652404785, -27.685590744018555, -24.76138687133789, -21.837181091308594, -18.912975311279297, -15.988771438598633, -13.064565658569336, -10.140361785888672, -7.216156005859375, -4.2919511795043945, -1.3677458763122559, 1.5564594268798828, 4.480664253234863, 7.404869079589844, 10.32907485961914, 13.253278732299805, 16.1774845123291]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 11.0, 9.0, 12.0, 12.0, 8.0, 14.0, 20.0, 18.0, 18.0, 29.0, 23.0, 32.0, 30.0, 33.0, 28.0, 48.0, 48.0, 43.0, 48.0, 36.0, 35.0, 34.0, 35.0, 33.0, 42.0, 29.0, 33.0, 30.0, 27.0, 29.0, 22.0, 21.0, 17.0, 23.0, 8.0, 10.0, 11.0, 4.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-55.55311584472656, -53.806236267089844, -52.05936050415039, -50.31248092651367, -48.56560516357422, -46.8187255859375, -45.07184600830078, -43.32496643066406, -41.57809066772461, -39.83121109008789, -38.08433532714844, -36.33745574951172, -34.590576171875, -32.84370040893555, -31.096820831298828, -29.349943161010742, -27.603065490722656, -25.85618782043457, -24.109310150146484, -22.362430572509766, -20.61555290222168, -18.868675231933594, -17.121795654296875, -15.374917984008789, -13.628040313720703, -11.881162643432617, -10.134284019470215, -8.387405395507812, -6.640527725219727, -4.893650054931641, -3.1467714309692383, -1.399892807006836, 0.3469810485839844, 2.0938591957092285, 3.8407373428344727, 5.587615489959717, 7.334493637084961, 9.081371307373047, 10.82824993133545, 12.575128555297852, 14.322006225585938, 16.068883895874023, 17.81576156616211, 19.562641143798828, 21.309518814086914, 23.056396484375, 24.80327606201172, 26.550153732299805, 28.29703140258789, 30.043909072875977, 31.790786743164062, 33.53766632080078, 35.2845458984375, 37.03142166137695, 38.77830123901367, 40.525177001953125, 42.272056579589844, 44.01893615722656, 45.765811920166016, 47.512691497802734, 49.25956726074219, 51.006446838378906, 52.753326416015625, 54.500205993652344, 56.2470817565918]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 11.0, 7.0, 5.0, 4.0, 15.0, 17.0, 13.0, 20.0, 28.0, 20.0, 24.0, 33.0, 26.0, 36.0, 26.0, 36.0, 39.0, 37.0, 41.0, 41.0, 30.0, 38.0, 38.0, 34.0, 42.0, 41.0, 35.0, 32.0, 26.0, 32.0, 27.0, 25.0, 19.0, 18.0, 14.0, 8.0, 7.0, 10.0, 7.0, 6.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.19921875, -5.0416259765625, -4.884033203125, -4.7264404296875, -4.56884765625, -4.4112548828125, -4.253662109375, -4.0960693359375, -3.9384765625, -3.7808837890625, -3.623291015625, -3.4656982421875, -3.30810546875, -3.1505126953125, -2.992919921875, -2.8353271484375, -2.677734375, -2.5201416015625, -2.362548828125, -2.2049560546875, -2.04736328125, -1.8897705078125, -1.732177734375, -1.5745849609375, -1.4169921875, -1.2593994140625, -1.101806640625, -0.9442138671875, -0.78662109375, -0.6290283203125, -0.471435546875, -0.3138427734375, -0.15625, 0.0013427734375, 0.158935546875, 0.3165283203125, 0.47412109375, 0.6317138671875, 0.789306640625, 0.9468994140625, 1.1044921875, 1.2620849609375, 1.419677734375, 1.5772705078125, 1.73486328125, 1.8924560546875, 2.050048828125, 2.2076416015625, 2.365234375, 2.5228271484375, 2.680419921875, 2.8380126953125, 2.99560546875, 3.1531982421875, 3.310791015625, 3.4683837890625, 3.6259765625, 3.7835693359375, 3.941162109375, 4.0987548828125, 4.25634765625, 4.4139404296875, 4.571533203125, 4.7291259765625, 4.88671875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 2.0, 6.0, 3.0, 13.0, 9.0, 16.0, 16.0, 15.0, 20.0, 24.0, 25.0, 32.0, 54.0, 69.0, 80.0, 153.0, 319.0, 911.0, 6174.0, 87355.0, 2157071.0, 1861282.0, 73500.0, 5366.0, 939.0, 278.0, 148.0, 79.0, 69.0, 42.0, 31.0, 33.0, 39.0, 18.0, 15.0, 9.0, 12.0, 8.0, 7.0, 8.0, 10.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8359375, -15.3245849609375, -14.813232421875, -14.3018798828125, -13.79052734375, -13.2791748046875, -12.767822265625, -12.2564697265625, -11.7451171875, -11.2337646484375, -10.722412109375, -10.2110595703125, -9.69970703125, -9.1883544921875, -8.677001953125, -8.1656494140625, -7.654296875, -7.1429443359375, -6.631591796875, -6.1202392578125, -5.60888671875, -5.0975341796875, -4.586181640625, -4.0748291015625, -3.5634765625, -3.0521240234375, -2.540771484375, -2.0294189453125, -1.51806640625, -1.0067138671875, -0.495361328125, 0.0159912109375, 0.52734375, 1.0386962890625, 1.550048828125, 2.0614013671875, 2.57275390625, 3.0841064453125, 3.595458984375, 4.1068115234375, 4.6181640625, 5.1295166015625, 5.640869140625, 6.1522216796875, 6.66357421875, 7.1749267578125, 7.686279296875, 8.1976318359375, 8.708984375, 9.2203369140625, 9.731689453125, 10.2430419921875, 10.75439453125, 11.2657470703125, 11.777099609375, 12.2884521484375, 12.7998046875, 13.3111572265625, 13.822509765625, 14.3338623046875, 14.84521484375, 15.3565673828125, 15.867919921875, 16.3792724609375, 16.890625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 11.0, 13.0, 24.0, 14.0, 31.0, 39.0, 39.0, 54.0, 81.0, 113.0, 134.0, 200.0, 240.0, 278.0, 378.0, 457.0, 441.0, 360.0, 319.0, 192.0, 151.0, 123.0, 88.0, 73.0, 53.0, 41.0, 23.0, 25.0, 18.0, 10.0, 9.0, 10.0, 9.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.3515625, -14.9227294921875, -14.493896484375, -14.0650634765625, -13.63623046875, -13.2073974609375, -12.778564453125, -12.3497314453125, -11.9208984375, -11.4920654296875, -11.063232421875, -10.6343994140625, -10.20556640625, -9.7767333984375, -9.347900390625, -8.9190673828125, -8.490234375, -8.0614013671875, -7.632568359375, -7.2037353515625, -6.77490234375, -6.3460693359375, -5.917236328125, -5.4884033203125, -5.0595703125, -4.6307373046875, -4.201904296875, -3.7730712890625, -3.34423828125, -2.9154052734375, -2.486572265625, -2.0577392578125, -1.62890625, -1.2000732421875, -0.771240234375, -0.3424072265625, 0.08642578125, 0.5152587890625, 0.944091796875, 1.3729248046875, 1.8017578125, 2.2305908203125, 2.659423828125, 3.0882568359375, 3.51708984375, 3.9459228515625, 4.374755859375, 4.8035888671875, 5.232421875, 5.6612548828125, 6.090087890625, 6.5189208984375, 6.94775390625, 7.3765869140625, 7.805419921875, 8.2342529296875, 8.6630859375, 9.0919189453125, 9.520751953125, 9.9495849609375, 10.37841796875, 10.8072509765625, 11.236083984375, 11.6649169921875, 12.09375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 11.0, 11.0, 16.0, 30.0, 22.0, 46.0, 44.0, 71.0, 94.0, 117.0, 160.0, 257.0, 453.0, 1635.0, 72092.0, 4100838.0, 16056.0, 1078.0, 409.0, 209.0, 152.0, 141.0, 96.0, 52.0, 39.0, 40.0, 32.0, 18.0, 16.0, 5.0, 7.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.5, -62.4443359375, -60.388671875, -58.3330078125, -56.27734375, -54.2216796875, -52.166015625, -50.1103515625, -48.0546875, -45.9990234375, -43.943359375, -41.8876953125, -39.83203125, -37.7763671875, -35.720703125, -33.6650390625, -31.609375, -29.5537109375, -27.498046875, -25.4423828125, -23.38671875, -21.3310546875, -19.275390625, -17.2197265625, -15.1640625, -13.1083984375, -11.052734375, -8.9970703125, -6.94140625, -4.8857421875, -2.830078125, -0.7744140625, 1.28125, 3.3369140625, 5.392578125, 7.4482421875, 9.50390625, 11.5595703125, 13.615234375, 15.6708984375, 17.7265625, 19.7822265625, 21.837890625, 23.8935546875, 25.94921875, 28.0048828125, 30.060546875, 32.1162109375, 34.171875, 36.2275390625, 38.283203125, 40.3388671875, 42.39453125, 44.4501953125, 46.505859375, 48.5615234375, 50.6171875, 52.6728515625, 54.728515625, 56.7841796875, 58.83984375, 60.8955078125, 62.951171875, 65.0068359375, 67.0625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 16.0, 14.0, 31.0, 50.0, 57.0, 80.0, 112.0, 125.0, 121.0, 123.0, 90.0, 68.0, 49.0, 22.0, 21.0, 12.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-72.62271118164062, -71.08028411865234, -69.53784942626953, -67.99542236328125, -66.45298767089844, -64.91056060791016, -63.368133544921875, -61.82570266723633, -60.28327178955078, -58.740840911865234, -57.19841003417969, -55.655982971191406, -54.11355209350586, -52.57112121582031, -51.02869415283203, -49.486263275146484, -47.94383239746094, -46.40140151977539, -44.858970642089844, -43.31654357910156, -41.774112701416016, -40.23168182373047, -38.68925476074219, -37.14682388305664, -35.604393005371094, -34.06196212768555, -32.51953125, -30.97710418701172, -29.434673309326172, -27.892242431640625, -26.34981346130371, -24.807384490966797, -23.264955520629883, -21.72252655029297, -20.180095672607422, -18.637664794921875, -17.09523582458496, -15.55280590057373, -14.0103759765625, -12.46794605255127, -10.925516128540039, -9.383086204528809, -7.840656280517578, -6.298226356506348, -4.755796432495117, -3.2133665084838867, -1.6709365844726562, -0.12850666046142578, 1.4139232635498047, 2.956353187561035, 4.498783111572266, 6.041213035583496, 7.583642959594727, 9.126072883605957, 10.668502807617188, 12.210932731628418, 13.753362655639648, 15.295792579650879, 16.83822250366211, 18.380653381347656, 19.92308235168457, 21.465511322021484, 23.00794219970703, 24.550373077392578, 26.092802047729492]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 0.0, 7.0, 11.0, 13.0, 11.0, 28.0, 16.0, 19.0, 21.0, 24.0, 26.0, 42.0, 43.0, 38.0, 36.0, 44.0, 27.0, 49.0, 34.0, 52.0, 41.0, 39.0, 43.0, 42.0, 42.0, 45.0, 28.0, 30.0, 22.0, 25.0, 23.0, 16.0, 12.0, 7.0, 14.0, 9.0, 10.0, 1.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.82147979736328, -55.1296501159668, -53.43782043457031, -51.74598693847656, -50.05415725708008, -48.362327575683594, -46.670494079589844, -44.97866439819336, -43.286834716796875, -41.59500503540039, -39.903175354003906, -38.211341857910156, -36.51951217651367, -34.82768249511719, -33.13584899902344, -31.444019317626953, -29.75218963623047, -28.060359954833984, -26.368528366088867, -24.67669677734375, -22.984867095947266, -21.29303741455078, -19.601205825805664, -17.909374237060547, -16.217544555664062, -14.525713920593262, -12.833883285522461, -11.14205265045166, -9.45022201538086, -7.758391380310059, -6.066560745239258, -4.374730110168457, -2.6828994750976562, -0.9910688400268555, 0.7007617950439453, 2.392592430114746, 4.084423065185547, 5.776253700256348, 7.468084335327148, 9.15991497039795, 10.85174560546875, 12.54357624053955, 14.235406875610352, 15.927237510681152, 17.619068145751953, 19.310897827148438, 21.002729415893555, 22.694561004638672, 24.386390686035156, 26.07822036743164, 27.770051956176758, 29.461883544921875, 31.15371322631836, 32.845542907714844, 34.537376403808594, 36.22920608520508, 37.92103576660156, 39.61286544799805, 41.30469512939453, 42.99652862548828, 44.688358306884766, 46.38018798828125, 48.072021484375, 49.763851165771484, 51.45568084716797]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 5.0, 4.0, 5.0, 13.0, 7.0, 10.0, 13.0, 14.0, 15.0, 11.0, 28.0, 25.0, 32.0, 23.0, 30.0, 30.0, 38.0, 31.0, 41.0, 44.0, 31.0, 48.0, 47.0, 33.0, 43.0, 42.0, 32.0, 39.0, 40.0, 26.0, 22.0, 30.0, 24.0, 22.0, 20.0, 15.0, 10.0, 9.0, 7.0, 10.0, 3.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-5.7265625, -5.562255859375, -5.39794921875, -5.233642578125, -5.0693359375, -4.905029296875, -4.74072265625, -4.576416015625, -4.412109375, -4.247802734375, -4.08349609375, -3.919189453125, -3.7548828125, -3.590576171875, -3.42626953125, -3.261962890625, -3.09765625, -2.933349609375, -2.76904296875, -2.604736328125, -2.4404296875, -2.276123046875, -2.11181640625, -1.947509765625, -1.783203125, -1.618896484375, -1.45458984375, -1.290283203125, -1.1259765625, -0.961669921875, -0.79736328125, -0.633056640625, -0.46875, -0.304443359375, -0.14013671875, 0.024169921875, 0.1884765625, 0.352783203125, 0.51708984375, 0.681396484375, 0.845703125, 1.010009765625, 1.17431640625, 1.338623046875, 1.5029296875, 1.667236328125, 1.83154296875, 1.995849609375, 2.16015625, 2.324462890625, 2.48876953125, 2.653076171875, 2.8173828125, 2.981689453125, 3.14599609375, 3.310302734375, 3.474609375, 3.638916015625, 3.80322265625, 3.967529296875, 4.1318359375, 4.296142578125, 4.46044921875, 4.624755859375, 4.7890625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 7.0, 14.0, 18.0, 31.0, 43.0, 59.0, 98.0, 132.0, 192.0, 264.0, 365.0, 526.0, 815.0, 1082.0, 1576.0, 2346.0, 3285.0, 4778.0, 7164.0, 10514.0, 15839.0, 24186.0, 37867.0, 61811.0, 114102.0, 313472.0, 208030.0, 91006.0, 52380.0, 32753.0, 20720.0, 13772.0, 9223.0, 6243.0, 4242.0, 2958.0, 1960.0, 1447.0, 996.0, 716.0, 470.0, 347.0, 225.0, 172.0, 111.0, 56.0, 52.0, 36.0, 21.0, 12.0, 13.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.9419403076171875, -0.909271240234375, -0.8766021728515625, -0.84393310546875, -0.8112640380859375, -0.778594970703125, -0.7459259033203125, -0.7132568359375, -0.6805877685546875, -0.647918701171875, -0.6152496337890625, -0.58258056640625, -0.5499114990234375, -0.517242431640625, -0.4845733642578125, -0.451904296875, -0.4192352294921875, -0.386566162109375, -0.3538970947265625, -0.32122802734375, -0.2885589599609375, -0.255889892578125, -0.2232208251953125, -0.1905517578125, -0.1578826904296875, -0.125213623046875, -0.0925445556640625, -0.05987548828125, -0.0272064208984375, 0.005462646484375, 0.0381317138671875, 0.07080078125, 0.1034698486328125, 0.136138916015625, 0.1688079833984375, 0.20147705078125, 0.2341461181640625, 0.266815185546875, 0.2994842529296875, 0.3321533203125, 0.3648223876953125, 0.397491455078125, 0.4301605224609375, 0.46282958984375, 0.4954986572265625, 0.528167724609375, 0.5608367919921875, 0.593505859375, 0.6261749267578125, 0.658843994140625, 0.6915130615234375, 0.72418212890625, 0.7568511962890625, 0.789520263671875, 0.8221893310546875, 0.8548583984375, 0.8875274658203125, 0.920196533203125, 0.9528656005859375, 0.98553466796875, 1.0182037353515625, 1.050872802734375, 1.0835418701171875, 1.1162109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 2.0, 7.0, 10.0, 6.0, 7.0, 12.0, 12.0, 19.0, 14.0, 21.0, 11.0, 25.0, 18.0, 30.0, 26.0, 38.0, 29.0, 28.0, 40.0, 34.0, 41.0, 34.0, 1066.0, 41.0, 26.0, 48.0, 28.0, 36.0, 22.0, 32.0, 33.0, 30.0, 34.0, 22.0, 26.0, 16.0, 12.0, 18.0, 19.0, 12.0, 8.0, 6.0, 3.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0], "bins": [-3.21875, -3.120452880859375, -3.02215576171875, -2.923858642578125, -2.8255615234375, -2.727264404296875, -2.62896728515625, -2.530670166015625, -2.432373046875, -2.334075927734375, -2.23577880859375, -2.137481689453125, -2.0391845703125, -1.940887451171875, -1.84259033203125, -1.744293212890625, -1.64599609375, -1.547698974609375, -1.44940185546875, -1.351104736328125, -1.2528076171875, -1.154510498046875, -1.05621337890625, -0.957916259765625, -0.859619140625, -0.761322021484375, -0.66302490234375, -0.564727783203125, -0.4664306640625, -0.368133544921875, -0.26983642578125, -0.171539306640625, -0.0732421875, 0.025054931640625, 0.12335205078125, 0.221649169921875, 0.3199462890625, 0.418243408203125, 0.51654052734375, 0.614837646484375, 0.713134765625, 0.811431884765625, 0.90972900390625, 1.008026123046875, 1.1063232421875, 1.204620361328125, 1.30291748046875, 1.401214599609375, 1.49951171875, 1.597808837890625, 1.69610595703125, 1.794403076171875, 1.8927001953125, 1.990997314453125, 2.08929443359375, 2.187591552734375, 2.285888671875, 2.384185791015625, 2.48248291015625, 2.580780029296875, 2.6790771484375, 2.777374267578125, 2.87567138671875, 2.973968505859375, 3.072265625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 11.0, 14.0, 22.0, 29.0, 26.0, 47.0, 70.0, 120.0, 175.0, 239.0, 366.0, 552.0, 907.0, 1346.0, 1999.0, 3166.0, 4859.0, 7556.0, 12023.0, 18515.0, 30346.0, 50598.0, 90673.0, 210549.0, 1382877.0, 118446.0, 62138.0, 37093.0, 22674.0, 14280.0, 9077.0, 5794.0, 3716.0, 2288.0, 1534.0, 1014.0, 637.0, 445.0, 281.0, 210.0, 143.0, 86.0, 52.0, 43.0, 37.0, 19.0, 11.0, 16.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.076171875, -1.0416717529296875, -1.007171630859375, -0.9726715087890625, -0.93817138671875, -0.9036712646484375, -0.869171142578125, -0.8346710205078125, -0.8001708984375, -0.7656707763671875, -0.731170654296875, -0.6966705322265625, -0.66217041015625, -0.6276702880859375, -0.593170166015625, -0.5586700439453125, -0.524169921875, -0.4896697998046875, -0.455169677734375, -0.4206695556640625, -0.38616943359375, -0.3516693115234375, -0.317169189453125, -0.2826690673828125, -0.2481689453125, -0.2136688232421875, -0.179168701171875, -0.1446685791015625, -0.11016845703125, -0.0756683349609375, -0.041168212890625, -0.0066680908203125, 0.02783203125, 0.0623321533203125, 0.096832275390625, 0.1313323974609375, 0.16583251953125, 0.2003326416015625, 0.234832763671875, 0.2693328857421875, 0.3038330078125, 0.3383331298828125, 0.372833251953125, 0.4073333740234375, 0.44183349609375, 0.4763336181640625, 0.510833740234375, 0.5453338623046875, 0.579833984375, 0.6143341064453125, 0.648834228515625, 0.6833343505859375, 0.71783447265625, 0.7523345947265625, 0.786834716796875, 0.8213348388671875, 0.8558349609375, 0.8903350830078125, 0.924835205078125, 0.9593353271484375, 0.99383544921875, 1.0283355712890625, 1.062835693359375, 1.0973358154296875, 1.1318359375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 5.0, 7.0, 10.0, 13.0, 15.0, 20.0, 20.0, 28.0, 30.0, 39.0, 55.0, 50.0, 74.0, 73.0, 51.0, 69.0, 55.0, 46.0, 65.0, 51.0, 43.0, 43.0, 27.0, 23.0, 14.0, 10.0, 9.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007162094116210938, -0.000693202018737793, -0.0006701946258544922, -0.0006471872329711914, -0.0006241798400878906, -0.0006011724472045898, -0.0005781650543212891, -0.0005551576614379883, -0.0005321502685546875, -0.0005091428756713867, -0.00048613548278808594, -0.00046312808990478516, -0.0004401206970214844, -0.0004171133041381836, -0.0003941059112548828, -0.00037109851837158203, -0.00034809112548828125, -0.00032508373260498047, -0.0003020763397216797, -0.0002790689468383789, -0.0002560615539550781, -0.00023305416107177734, -0.00021004676818847656, -0.00018703937530517578, -0.000164031982421875, -0.00014102458953857422, -0.00011801719665527344, -9.500980377197266e-05, -7.200241088867188e-05, -4.8995018005371094e-05, -2.5987625122070312e-05, -2.9802322387695312e-06, 2.002716064453125e-05, 4.303455352783203e-05, 6.604194641113281e-05, 8.90493392944336e-05, 0.00011205673217773438, 0.00013506412506103516, 0.00015807151794433594, 0.00018107891082763672, 0.0002040863037109375, 0.00022709369659423828, 0.00025010108947753906, 0.00027310848236083984, 0.0002961158752441406, 0.0003191232681274414, 0.0003421306610107422, 0.00036513805389404297, 0.00038814544677734375, 0.00041115283966064453, 0.0004341602325439453, 0.0004571676254272461, 0.0004801750183105469, 0.0005031824111938477, 0.0005261898040771484, 0.0005491971969604492, 0.00057220458984375, 0.0005952119827270508, 0.0006182193756103516, 0.0006412267684936523, 0.0006642341613769531, 0.0006872415542602539, 0.0007102489471435547, 0.0007332563400268555, 0.0007562637329101562]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 5.0, 7.0, 9.0, 7.0, 15.0, 8.0, 24.0, 33.0, 27.0, 48.0, 71.0, 109.0, 175.0, 382.0, 1279.0, 1031729.0, 13301.0, 595.0, 241.0, 123.0, 90.0, 58.0, 50.0, 35.0, 30.0, 20.0, 17.0, 13.0, 15.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018707275390625, -0.018117427825927734, -0.01752758026123047, -0.016937732696533203, -0.016347885131835938, -0.015758037567138672, -0.015168190002441406, -0.01457834243774414, -0.013988494873046875, -0.01339864730834961, -0.012808799743652344, -0.012218952178955078, -0.011629104614257812, -0.011039257049560547, -0.010449409484863281, -0.009859561920166016, -0.00926971435546875, -0.008679866790771484, -0.008090019226074219, -0.007500171661376953, -0.0069103240966796875, -0.006320476531982422, -0.005730628967285156, -0.005140781402587891, -0.004550933837890625, -0.003961086273193359, -0.0033712387084960938, -0.002781391143798828, -0.0021915435791015625, -0.0016016960144042969, -0.0010118484497070312, -0.0004220008850097656, 0.0001678466796875, 0.0007576942443847656, 0.0013475418090820312, 0.0019373893737792969, 0.0025272369384765625, 0.003117084503173828, 0.0037069320678710938, 0.004296779632568359, 0.004886627197265625, 0.005476474761962891, 0.006066322326660156, 0.006656169891357422, 0.0072460174560546875, 0.007835865020751953, 0.008425712585449219, 0.009015560150146484, 0.00960540771484375, 0.010195255279541016, 0.010785102844238281, 0.011374950408935547, 0.011964797973632812, 0.012554645538330078, 0.013144493103027344, 0.01373434066772461, 0.014324188232421875, 0.01491403579711914, 0.015503883361816406, 0.016093730926513672, 0.016683578491210938, 0.017273426055908203, 0.01786327362060547, 0.018453121185302734, 0.01904296875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 15.0, 51.0, 151.0, 260.0, 294.0, 157.0, 59.0, 20.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041670113569125533, -0.00038898017373867333, -0.00036125918268226087, -0.00033353822072967887, -0.0003058172296732664, -0.0002780962677206844, -0.0002503753057681024, -0.00022265432926360518, -0.00019493335275910795, -0.00016721237625461072, -0.0001394913997501135, -0.00011177043779753149, -8.404946129303426e-05, -5.6328484788537025e-05, -2.8607522835955024e-05, -8.865463314577937e-07, 2.6834430173039436e-05, 5.455540303955786e-05, 8.227637590607628e-05, 0.0001099973451346159, 0.00013771832163911313, 0.00016543929814361036, 0.00019316026009619236, 0.0002208812366006896, 0.0002486022131051868, 0.0002763231750577688, 0.0003040441661141813, 0.0003317651280667633, 0.0003594860900193453, 0.00038720708107575774, 0.00041492804302833974, 0.00044264900498092175, 0.0004703700542449951, 0.0004980910453014076, 0.0005258119781501591, 0.0005535329692065716, 0.000581253960262984, 0.0006089749513193965, 0.000636695884168148, 0.0006644168752245605, 0.000692137866280973, 0.0007198588573373854, 0.000747579790186137, 0.0007753007812425494, 0.0008030217722989619, 0.0008307427633553743, 0.0008584636962041259, 0.0008861846872605383, 0.0009139056201092899, 0.0009416266111657023, 0.0009693475440144539, 0.0009970685932785273, 0.0010247895261272788, 0.0010525104589760303, 0.0010802315082401037, 0.0011079524410888553, 0.0011356733739376068, 0.0011633943067863584, 0.0011911153560504317, 0.0012188362888991833, 0.0012465572217479348, 0.0012742782710120082, 0.0013019992038607597, 0.0013297201367095113, 0.0013574411859735847]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 11.0, 9.0, 7.0, 10.0, 17.0, 16.0, 23.0, 22.0, 19.0, 25.0, 17.0, 25.0, 28.0, 41.0, 29.0, 40.0, 34.0, 44.0, 44.0, 46.0, 37.0, 29.0, 31.0, 44.0, 42.0, 34.0, 34.0, 29.0, 26.0, 26.0, 33.0, 26.0, 18.0, 15.0, 8.0, 10.0, 7.0, 7.0, 4.0, 8.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030231475830078125, -0.00029151327908039093, -0.0002807117998600006, -0.0002699103206396103, -0.00025910884141921997, -0.00024830736219882965, -0.00023750588297843933, -0.000226704403758049, -0.0002159029245376587, -0.00020510144531726837, -0.00019429996609687805, -0.00018349848687648773, -0.0001726970076560974, -0.0001618955284357071, -0.00015109404921531677, -0.00014029256999492645, -0.00012949109077453613, -0.00011868961155414581, -0.00010788813233375549, -9.708665311336517e-05, -8.628517389297485e-05, -7.548369467258453e-05, -6.468221545219421e-05, -5.3880736231803894e-05, -4.3079257011413574e-05, -3.2277777791023254e-05, -2.1476298570632935e-05, -1.0674819350242615e-05, 1.2665987014770508e-07, 1.0928139090538025e-05, 2.1729618310928345e-05, 3.2531097531318665e-05, 4.3332576751708984e-05, 5.4134055972099304e-05, 6.493553519248962e-05, 7.573701441287994e-05, 8.653849363327026e-05, 9.733997285366058e-05, 0.0001081414520740509, 0.00011894293129444122, 0.00012974441051483154, 0.00014054588973522186, 0.00015134736895561218, 0.0001621488481760025, 0.00017295032739639282, 0.00018375180661678314, 0.00019455328583717346, 0.00020535476505756378, 0.0002161562442779541, 0.00022695772349834442, 0.00023775920271873474, 0.00024856068193912506, 0.0002593621611595154, 0.0002701636403799057, 0.000280965119600296, 0.00029176659882068634, 0.00030256807804107666, 0.000313369557261467, 0.0003241710364818573, 0.0003349725157022476, 0.00034577399492263794, 0.00035657547414302826, 0.0003673769533634186, 0.0003781784325838089, 0.0003889799118041992]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 5.0, 4.0, 5.0, 13.0, 7.0, 10.0, 13.0, 14.0, 15.0, 11.0, 28.0, 25.0, 32.0, 23.0, 30.0, 30.0, 38.0, 31.0, 41.0, 44.0, 31.0, 48.0, 47.0, 33.0, 43.0, 42.0, 32.0, 39.0, 40.0, 26.0, 22.0, 30.0, 24.0, 22.0, 20.0, 15.0, 10.0, 9.0, 7.0, 10.0, 3.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-5.7265625, -5.562255859375, -5.39794921875, -5.233642578125, -5.0693359375, -4.905029296875, -4.74072265625, -4.576416015625, -4.412109375, -4.247802734375, -4.08349609375, -3.919189453125, -3.7548828125, -3.590576171875, -3.42626953125, -3.261962890625, -3.09765625, -2.933349609375, -2.76904296875, -2.604736328125, -2.4404296875, -2.276123046875, -2.11181640625, -1.947509765625, -1.783203125, -1.618896484375, -1.45458984375, -1.290283203125, -1.1259765625, -0.961669921875, -0.79736328125, -0.633056640625, -0.46875, -0.304443359375, -0.14013671875, 0.024169921875, 0.1884765625, 0.352783203125, 0.51708984375, 0.681396484375, 0.845703125, 1.010009765625, 1.17431640625, 1.338623046875, 1.5029296875, 1.667236328125, 1.83154296875, 1.995849609375, 2.16015625, 2.324462890625, 2.48876953125, 2.653076171875, 2.8173828125, 2.981689453125, 3.14599609375, 3.310302734375, 3.474609375, 3.638916015625, 3.80322265625, 3.967529296875, 4.1318359375, 4.296142578125, 4.46044921875, 4.624755859375, 4.7890625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 1.0, 3.0, 6.0, 10.0, 13.0, 19.0, 28.0, 42.0, 41.0, 51.0, 79.0, 109.0, 119.0, 209.0, 290.0, 429.0, 614.0, 865.0, 1414.0, 2153.0, 3365.0, 5671.0, 9485.0, 17676.0, 36405.0, 90230.0, 302989.0, 378127.0, 109276.0, 41557.0, 19948.0, 10667.0, 6012.0, 3679.0, 2332.0, 1435.0, 946.0, 675.0, 463.0, 324.0, 215.0, 166.0, 118.0, 76.0, 78.0, 41.0, 36.0, 24.0, 20.0, 7.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.29296875, -4.167022705078125, -4.04107666015625, -3.915130615234375, -3.7891845703125, -3.663238525390625, -3.53729248046875, -3.411346435546875, -3.285400390625, -3.159454345703125, -3.03350830078125, -2.907562255859375, -2.7816162109375, -2.655670166015625, -2.52972412109375, -2.403778076171875, -2.27783203125, -2.151885986328125, -2.02593994140625, -1.899993896484375, -1.7740478515625, -1.648101806640625, -1.52215576171875, -1.396209716796875, -1.270263671875, -1.144317626953125, -1.01837158203125, -0.892425537109375, -0.7664794921875, -0.640533447265625, -0.51458740234375, -0.388641357421875, -0.2626953125, -0.136749267578125, -0.01080322265625, 0.115142822265625, 0.2410888671875, 0.367034912109375, 0.49298095703125, 0.618927001953125, 0.744873046875, 0.870819091796875, 0.99676513671875, 1.122711181640625, 1.2486572265625, 1.374603271484375, 1.50054931640625, 1.626495361328125, 1.75244140625, 1.878387451171875, 2.00433349609375, 2.130279541015625, 2.2562255859375, 2.382171630859375, 2.50811767578125, 2.634063720703125, 2.760009765625, 2.885955810546875, 3.01190185546875, 3.137847900390625, 3.2637939453125, 3.389739990234375, 3.51568603515625, 3.641632080078125, 3.767578125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 4.0, 14.0, 16.0, 14.0, 19.0, 18.0, 27.0, 23.0, 27.0, 18.0, 21.0, 27.0, 44.0, 44.0, 57.0, 84.0, 126.0, 1688.0, 249.0, 75.0, 41.0, 54.0, 46.0, 36.0, 35.0, 23.0, 33.0, 25.0, 17.0, 29.0, 21.0, 7.0, 14.0, 12.0, 10.0, 9.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.9375, -19.32861328125, -18.7197265625, -18.11083984375, -17.501953125, -16.89306640625, -16.2841796875, -15.67529296875, -15.06640625, -14.45751953125, -13.8486328125, -13.23974609375, -12.630859375, -12.02197265625, -11.4130859375, -10.80419921875, -10.1953125, -9.58642578125, -8.9775390625, -8.36865234375, -7.759765625, -7.15087890625, -6.5419921875, -5.93310546875, -5.32421875, -4.71533203125, -4.1064453125, -3.49755859375, -2.888671875, -2.27978515625, -1.6708984375, -1.06201171875, -0.453125, 0.15576171875, 0.7646484375, 1.37353515625, 1.982421875, 2.59130859375, 3.2001953125, 3.80908203125, 4.41796875, 5.02685546875, 5.6357421875, 6.24462890625, 6.853515625, 7.46240234375, 8.0712890625, 8.68017578125, 9.2890625, 9.89794921875, 10.5068359375, 11.11572265625, 11.724609375, 12.33349609375, 12.9423828125, 13.55126953125, 14.16015625, 14.76904296875, 15.3779296875, 15.98681640625, 16.595703125, 17.20458984375, 17.8134765625, 18.42236328125, 19.03125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 4.0, 9.0, 3.0, 7.0, 10.0, 9.0, 20.0, 14.0, 20.0, 37.0, 33.0, 41.0, 71.0, 67.0, 89.0, 153.0, 242.0, 355.0, 795.0, 5427.0, 811565.0, 2317878.0, 6760.0, 892.0, 350.0, 240.0, 172.0, 100.0, 66.0, 47.0, 45.0, 32.0, 27.0, 25.0, 19.0, 20.0, 11.0, 6.0, 8.0, 7.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.96875, -30.82861328125, -29.6884765625, -28.54833984375, -27.408203125, -26.26806640625, -25.1279296875, -23.98779296875, -22.84765625, -21.70751953125, -20.5673828125, -19.42724609375, -18.287109375, -17.14697265625, -16.0068359375, -14.86669921875, -13.7265625, -12.58642578125, -11.4462890625, -10.30615234375, -9.166015625, -8.02587890625, -6.8857421875, -5.74560546875, -4.60546875, -3.46533203125, -2.3251953125, -1.18505859375, -0.044921875, 1.09521484375, 2.2353515625, 3.37548828125, 4.515625, 5.65576171875, 6.7958984375, 7.93603515625, 9.076171875, 10.21630859375, 11.3564453125, 12.49658203125, 13.63671875, 14.77685546875, 15.9169921875, 17.05712890625, 18.197265625, 19.33740234375, 20.4775390625, 21.61767578125, 22.7578125, 23.89794921875, 25.0380859375, 26.17822265625, 27.318359375, 28.45849609375, 29.5986328125, 30.73876953125, 31.87890625, 33.01904296875, 34.1591796875, 35.29931640625, 36.439453125, 37.57958984375, 38.7197265625, 39.85986328125, 41.0]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 111.0, 642.0, 238.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.43412208557129, -24.741304397583008, -21.048486709594727, -17.355667114257812, -13.662850379943848, -9.97003173828125, -6.277214050292969, -2.5843963623046875, 1.1084213256835938, 4.801239013671875, 8.494056701660156, 12.186875343322754, 15.879693031311035, 19.572511672973633, 23.265329360961914, 26.958147048950195, 30.650964736938477, 34.34378433227539, 38.03660202026367, 41.72941970825195, 45.422237396240234, 49.115055084228516, 52.8078727722168, 56.50069046020508, 60.19350814819336, 63.88632583618164, 67.57914733886719, 71.27196502685547, 74.96478271484375, 78.65760040283203, 82.35041809082031, 86.0432357788086, 89.73604583740234, 93.42886352539062, 97.1216812133789, 100.81449890136719, 104.50731658935547, 108.20013427734375, 111.89295196533203, 115.58576965332031, 119.2785873413086, 122.97140502929688, 126.66422271728516, 130.35704040527344, 134.04986572265625, 137.74267578125, 141.4355010986328, 145.12831115722656, 148.82113647460938, 152.5139617919922, 156.20677185058594, 159.89959716796875, 163.5924072265625, 167.2852325439453, 170.97804260253906, 174.67086791992188, 178.36367797851562, 182.05650329589844, 185.7493133544922, 189.442138671875, 193.13494873046875, 196.82777404785156, 200.5205841064453, 204.21340942382812, 207.90621948242188]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 11.0, 10.0, 8.0, 9.0, 11.0, 26.0, 32.0, 24.0, 29.0, 32.0, 35.0, 30.0, 38.0, 62.0, 55.0, 51.0, 51.0, 35.0, 43.0, 49.0, 33.0, 44.0, 39.0, 34.0, 29.0, 23.0, 26.0, 19.0, 21.0, 21.0, 8.0, 10.0, 8.0, 6.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3575439453125, -65.1562728881836, -62.95500564575195, -60.75373840332031, -58.552467346191406, -56.3511962890625, -54.14992904663086, -51.94866180419922, -49.74739074707031, -47.546119689941406, -45.344852447509766, -43.143585205078125, -40.94231414794922, -38.74104309082031, -36.53977584838867, -34.33850860595703, -32.137237548828125, -29.93596839904785, -27.734699249267578, -25.533430099487305, -23.33216094970703, -21.130891799926758, -18.929622650146484, -16.72835350036621, -14.527084350585938, -12.325815200805664, -10.12454605102539, -7.923276901245117, -5.722007751464844, -3.5207386016845703, -1.3194694519042969, 0.8817996978759766, 3.08306884765625, 5.284337997436523, 7.485607147216797, 9.68687629699707, 11.888145446777344, 14.089414596557617, 16.29068374633789, 18.491952896118164, 20.693222045898438, 22.89449119567871, 25.095760345458984, 27.297029495239258, 29.49829864501953, 31.699567794799805, 33.90083694458008, 36.10210418701172, 38.303375244140625, 40.50464630126953, 42.70591354370117, 44.90718078613281, 47.10845184326172, 49.309722900390625, 51.510990142822266, 53.712257385253906, 55.91352844238281, 58.11479949951172, 60.31606674194336, 62.517333984375, 64.7186050415039, 66.91987609863281, 69.12113952636719, 71.3224105834961, 73.523681640625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 8.0, 4.0, 8.0, 10.0, 6.0, 6.0, 17.0, 12.0, 10.0, 21.0, 18.0, 29.0, 26.0, 26.0, 40.0, 29.0, 30.0, 25.0, 36.0, 43.0, 41.0, 46.0, 35.0, 42.0, 45.0, 48.0, 37.0, 30.0, 34.0, 22.0, 36.0, 22.0, 29.0, 16.0, 23.0, 18.0, 8.0, 11.0, 9.0, 5.0, 10.0, 5.0, 2.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.34112548828125, -5.1744384765625, -5.00775146484375, -4.841064453125, -4.67437744140625, -4.5076904296875, -4.34100341796875, -4.17431640625, -4.00762939453125, -3.8409423828125, -3.67425537109375, -3.507568359375, -3.34088134765625, -3.1741943359375, -3.00750732421875, -2.8408203125, -2.67413330078125, -2.5074462890625, -2.34075927734375, -2.174072265625, -2.00738525390625, -1.8406982421875, -1.67401123046875, -1.50732421875, -1.34063720703125, -1.1739501953125, -1.00726318359375, -0.840576171875, -0.67388916015625, -0.5072021484375, -0.34051513671875, -0.173828125, -0.00714111328125, 0.1595458984375, 0.32623291015625, 0.492919921875, 0.65960693359375, 0.8262939453125, 0.99298095703125, 1.15966796875, 1.32635498046875, 1.4930419921875, 1.65972900390625, 1.826416015625, 1.99310302734375, 2.1597900390625, 2.32647705078125, 2.4931640625, 2.65985107421875, 2.8265380859375, 2.99322509765625, 3.159912109375, 3.32659912109375, 3.4932861328125, 3.65997314453125, 3.82666015625, 3.99334716796875, 4.1600341796875, 4.32672119140625, 4.493408203125, 4.66009521484375, 4.8267822265625, 4.99346923828125, 5.16015625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 11.0, 22.0, 30.0, 32.0, 43.0, 67.0, 98.0, 145.0, 224.0, 415.0, 791.0, 1761.0, 4149.0, 11716.0, 41057.0, 175818.0, 707016.0, 1643338.0, 1154409.0, 341356.0, 79142.0, 20518.0, 6844.0, 2622.0, 1156.0, 537.0, 310.0, 178.0, 134.0, 93.0, 51.0, 50.0, 33.0, 19.0, 27.0, 21.0, 7.0, 11.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0234375, -6.808837890625, -6.59423828125, -6.379638671875, -6.1650390625, -5.950439453125, -5.73583984375, -5.521240234375, -5.306640625, -5.092041015625, -4.87744140625, -4.662841796875, -4.4482421875, -4.233642578125, -4.01904296875, -3.804443359375, -3.58984375, -3.375244140625, -3.16064453125, -2.946044921875, -2.7314453125, -2.516845703125, -2.30224609375, -2.087646484375, -1.873046875, -1.658447265625, -1.44384765625, -1.229248046875, -1.0146484375, -0.800048828125, -0.58544921875, -0.370849609375, -0.15625, 0.058349609375, 0.27294921875, 0.487548828125, 0.7021484375, 0.916748046875, 1.13134765625, 1.345947265625, 1.560546875, 1.775146484375, 1.98974609375, 2.204345703125, 2.4189453125, 2.633544921875, 2.84814453125, 3.062744140625, 3.27734375, 3.491943359375, 3.70654296875, 3.921142578125, 4.1357421875, 4.350341796875, 4.56494140625, 4.779541015625, 4.994140625, 5.208740234375, 5.42333984375, 5.637939453125, 5.8525390625, 6.067138671875, 6.28173828125, 6.496337890625, 6.7109375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 5.0, 11.0, 13.0, 9.0, 21.0, 24.0, 35.0, 44.0, 38.0, 57.0, 69.0, 84.0, 108.0, 119.0, 172.0, 236.0, 285.0, 294.0, 379.0, 383.0, 370.0, 284.0, 191.0, 172.0, 143.0, 111.0, 80.0, 63.0, 49.0, 53.0, 39.0, 34.0, 24.0, 12.0, 14.0, 6.0, 8.0, 9.0, 4.0, 5.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.0394287109375, -9.680419921875, -9.3214111328125, -8.96240234375, -8.6033935546875, -8.244384765625, -7.8853759765625, -7.5263671875, -7.1673583984375, -6.808349609375, -6.4493408203125, -6.09033203125, -5.7313232421875, -5.372314453125, -5.0133056640625, -4.654296875, -4.2952880859375, -3.936279296875, -3.5772705078125, -3.21826171875, -2.8592529296875, -2.500244140625, -2.1412353515625, -1.7822265625, -1.4232177734375, -1.064208984375, -0.7052001953125, -0.34619140625, 0.0128173828125, 0.371826171875, 0.7308349609375, 1.08984375, 1.4488525390625, 1.807861328125, 2.1668701171875, 2.52587890625, 2.8848876953125, 3.243896484375, 3.6029052734375, 3.9619140625, 4.3209228515625, 4.679931640625, 5.0389404296875, 5.39794921875, 5.7569580078125, 6.115966796875, 6.4749755859375, 6.833984375, 7.1929931640625, 7.552001953125, 7.9110107421875, 8.27001953125, 8.6290283203125, 8.988037109375, 9.3470458984375, 9.7060546875, 10.0650634765625, 10.424072265625, 10.7830810546875, 11.14208984375, 11.5010986328125, 11.860107421875, 12.2191162109375, 12.578125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 3.0, 12.0, 6.0, 15.0, 21.0, 36.0, 24.0, 42.0, 62.0, 71.0, 98.0, 142.0, 181.0, 359.0, 758.0, 11647.0, 4042625.0, 135471.0, 1423.0, 424.0, 251.0, 155.0, 111.0, 76.0, 70.0, 35.0, 40.0, 30.0, 24.0, 17.0, 13.0, 9.0, 9.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.28125, -58.25146484375, -56.2216796875, -54.19189453125, -52.162109375, -50.13232421875, -48.1025390625, -46.07275390625, -44.04296875, -42.01318359375, -39.9833984375, -37.95361328125, -35.923828125, -33.89404296875, -31.8642578125, -29.83447265625, -27.8046875, -25.77490234375, -23.7451171875, -21.71533203125, -19.685546875, -17.65576171875, -15.6259765625, -13.59619140625, -11.56640625, -9.53662109375, -7.5068359375, -5.47705078125, -3.447265625, -1.41748046875, 0.6123046875, 2.64208984375, 4.671875, 6.70166015625, 8.7314453125, 10.76123046875, 12.791015625, 14.82080078125, 16.8505859375, 18.88037109375, 20.91015625, 22.93994140625, 24.9697265625, 26.99951171875, 29.029296875, 31.05908203125, 33.0888671875, 35.11865234375, 37.1484375, 39.17822265625, 41.2080078125, 43.23779296875, 45.267578125, 47.29736328125, 49.3271484375, 51.35693359375, 53.38671875, 55.41650390625, 57.4462890625, 59.47607421875, 61.505859375, 63.53564453125, 65.5654296875, 67.59521484375, 69.625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 33.0, 116.0, 319.0, 329.0, 155.0, 42.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-201.307861328125, -196.52037048339844, -191.73287963867188, -186.9453887939453, -182.15789794921875, -177.37039184570312, -172.58290100097656, -167.79541015625, -163.00791931152344, -158.22042846679688, -153.4329376220703, -148.64544677734375, -143.85794067382812, -139.07044982910156, -134.282958984375, -129.49546813964844, -124.70797729492188, -119.92048645019531, -115.13299560546875, -110.34549713134766, -105.5580062866211, -100.77051544189453, -95.98301696777344, -91.19552612304688, -86.40803527832031, -81.62054443359375, -76.83305358886719, -72.0455551147461, -67.25806427001953, -62.47057342529297, -57.68307876586914, -52.89558410644531, -48.10809326171875, -43.32060241699219, -38.53310775756836, -33.74561309814453, -28.95812225341797, -24.170629501342773, -19.383136749267578, -14.59564208984375, -9.808151245117188, -5.020658493041992, -0.23316574096679688, 4.554327011108398, 9.341819763183594, 14.129312515258789, 18.916805267333984, 23.704299926757812, 28.491790771484375, 33.27928161621094, 38.066776275634766, 42.854270935058594, 47.641761779785156, 52.42925262451172, 57.21674728393555, 62.004241943359375, 66.79173278808594, 71.5792236328125, 76.36671447753906, 81.15421295166016, 85.94170379638672, 90.72919464111328, 95.51669311523438, 100.30418395996094, 105.0916748046875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 11.0, 9.0, 17.0, 11.0, 12.0, 18.0, 22.0, 29.0, 19.0, 29.0, 45.0, 31.0, 37.0, 38.0, 32.0, 25.0, 33.0, 30.0, 44.0, 47.0, 34.0, 41.0, 42.0, 38.0, 29.0, 26.0, 36.0, 29.0, 33.0, 22.0, 15.0, 12.0, 12.0, 15.0, 13.0, 10.0, 3.0, 8.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-49.47991943359375, -48.05036926269531, -46.62081527709961, -45.19126510620117, -43.761714935302734, -42.33216094970703, -40.902610778808594, -39.473060607910156, -38.04351043701172, -36.61396026611328, -35.18440628051758, -33.75485610961914, -32.3253059387207, -30.895753860473633, -29.466201782226562, -28.036651611328125, -26.607097625732422, -25.17754554748535, -23.747995376586914, -22.318443298339844, -20.888893127441406, -19.459341049194336, -18.029788970947266, -16.600238800048828, -15.170686721801758, -13.741135597229004, -12.31158447265625, -10.88203239440918, -9.452481269836426, -8.022930145263672, -6.593378067016602, -5.163826942443848, -3.734272003173828, -2.304720640182495, -0.8751692771911621, 0.55438232421875, 1.983933448791504, 3.413484573364258, 4.843036651611328, 6.272587776184082, 7.702138900756836, 9.13169002532959, 10.561241149902344, 11.990793228149414, 13.420344352722168, 14.849895477294922, 16.279447555541992, 17.708999633789062, 19.1385498046875, 20.56810188293457, 21.997652053833008, 23.427204132080078, 24.856754302978516, 26.286306381225586, 27.715858459472656, 29.145408630371094, 30.574960708618164, 32.004512786865234, 33.43406295776367, 34.863616943359375, 36.29316711425781, 37.72271728515625, 39.15226745605469, 40.58182144165039, 42.01137161254883]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 4.0, 8.0, 14.0, 6.0, 9.0, 8.0, 12.0, 17.0, 16.0, 27.0, 25.0, 32.0, 32.0, 25.0, 38.0, 36.0, 38.0, 35.0, 31.0, 46.0, 54.0, 45.0, 30.0, 33.0, 41.0, 36.0, 31.0, 34.0, 24.0, 27.0, 30.0, 19.0, 21.0, 16.0, 13.0, 14.0, 7.0, 8.0, 8.0, 8.0, 3.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.3828125, -5.216552734375, -5.05029296875, -4.884033203125, -4.7177734375, -4.551513671875, -4.38525390625, -4.218994140625, -4.052734375, -3.886474609375, -3.72021484375, -3.553955078125, -3.3876953125, -3.221435546875, -3.05517578125, -2.888916015625, -2.72265625, -2.556396484375, -2.39013671875, -2.223876953125, -2.0576171875, -1.891357421875, -1.72509765625, -1.558837890625, -1.392578125, -1.226318359375, -1.06005859375, -0.893798828125, -0.7275390625, -0.561279296875, -0.39501953125, -0.228759765625, -0.0625, 0.103759765625, 0.27001953125, 0.436279296875, 0.6025390625, 0.768798828125, 0.93505859375, 1.101318359375, 1.267578125, 1.433837890625, 1.60009765625, 1.766357421875, 1.9326171875, 2.098876953125, 2.26513671875, 2.431396484375, 2.59765625, 2.763916015625, 2.93017578125, 3.096435546875, 3.2626953125, 3.428955078125, 3.59521484375, 3.761474609375, 3.927734375, 4.093994140625, 4.26025390625, 4.426513671875, 4.5927734375, 4.759033203125, 4.92529296875, 5.091552734375, 5.2578125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 7.0, 3.0, 5.0, 11.0, 16.0, 24.0, 19.0, 36.0, 60.0, 99.0, 114.0, 158.0, 238.0, 319.0, 512.0, 716.0, 994.0, 1551.0, 2211.0, 3349.0, 4922.0, 7106.0, 10843.0, 16269.0, 25304.0, 40373.0, 66660.0, 122402.0, 330217.0, 184785.0, 86911.0, 50771.0, 31286.0, 20206.0, 13115.0, 8635.0, 5760.0, 3994.0, 2710.0, 1865.0, 1229.0, 858.0, 608.0, 377.0, 259.0, 205.0, 125.0, 108.0, 66.0, 53.0, 35.0, 21.0, 16.0, 8.0, 8.0, 11.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.0517578125, -1.01861572265625, -0.9854736328125, -0.95233154296875, -0.919189453125, -0.88604736328125, -0.8529052734375, -0.81976318359375, -0.78662109375, -0.75347900390625, -0.7203369140625, -0.68719482421875, -0.654052734375, -0.62091064453125, -0.5877685546875, -0.55462646484375, -0.521484375, -0.48834228515625, -0.4552001953125, -0.42205810546875, -0.388916015625, -0.35577392578125, -0.3226318359375, -0.28948974609375, -0.25634765625, -0.22320556640625, -0.1900634765625, -0.15692138671875, -0.123779296875, -0.09063720703125, -0.0574951171875, -0.02435302734375, 0.0087890625, 0.04193115234375, 0.0750732421875, 0.10821533203125, 0.141357421875, 0.17449951171875, 0.2076416015625, 0.24078369140625, 0.27392578125, 0.30706787109375, 0.3402099609375, 0.37335205078125, 0.406494140625, 0.43963623046875, 0.4727783203125, 0.50592041015625, 0.5390625, 0.57220458984375, 0.6053466796875, 0.63848876953125, 0.671630859375, 0.70477294921875, 0.7379150390625, 0.77105712890625, 0.80419921875, 0.83734130859375, 0.8704833984375, 0.90362548828125, 0.936767578125, 0.96990966796875, 1.0030517578125, 1.03619384765625, 1.0693359375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 6.0, 10.0, 5.0, 9.0, 11.0, 18.0, 22.0, 12.0, 22.0, 18.0, 28.0, 21.0, 30.0, 28.0, 41.0, 21.0, 46.0, 31.0, 28.0, 39.0, 36.0, 1050.0, 33.0, 26.0, 36.0, 36.0, 35.0, 32.0, 29.0, 35.0, 29.0, 25.0, 25.0, 21.0, 15.0, 12.0, 15.0, 14.0, 12.0, 11.0, 15.0, 5.0, 6.0, 10.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.09765625, -2.995635986328125, -2.89361572265625, -2.791595458984375, -2.6895751953125, -2.587554931640625, -2.48553466796875, -2.383514404296875, -2.281494140625, -2.179473876953125, -2.07745361328125, -1.975433349609375, -1.8734130859375, -1.771392822265625, -1.66937255859375, -1.567352294921875, -1.46533203125, -1.363311767578125, -1.26129150390625, -1.159271240234375, -1.0572509765625, -0.955230712890625, -0.85321044921875, -0.751190185546875, -0.649169921875, -0.547149658203125, -0.44512939453125, -0.343109130859375, -0.2410888671875, -0.139068603515625, -0.03704833984375, 0.064971923828125, 0.1669921875, 0.269012451171875, 0.37103271484375, 0.473052978515625, 0.5750732421875, 0.677093505859375, 0.77911376953125, 0.881134033203125, 0.983154296875, 1.085174560546875, 1.18719482421875, 1.289215087890625, 1.3912353515625, 1.493255615234375, 1.59527587890625, 1.697296142578125, 1.79931640625, 1.901336669921875, 2.00335693359375, 2.105377197265625, 2.2073974609375, 2.309417724609375, 2.41143798828125, 2.513458251953125, 2.615478515625, 2.717498779296875, 2.81951904296875, 2.921539306640625, 3.0235595703125, 3.125579833984375, 3.22760009765625, 3.329620361328125, 3.431640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 7.0, 9.0, 25.0, 15.0, 29.0, 51.0, 60.0, 105.0, 155.0, 230.0, 322.0, 503.0, 808.0, 1172.0, 1868.0, 2811.0, 4437.0, 6971.0, 10549.0, 16403.0, 26009.0, 42312.0, 72534.0, 138670.0, 1386850.0, 171501.0, 83764.0, 47840.0, 29267.0, 18321.0, 11837.0, 7576.0, 4895.0, 3225.0, 2060.0, 1339.0, 889.0, 564.0, 356.0, 258.0, 174.0, 120.0, 73.0, 54.0, 38.0, 28.0, 12.0, 14.0, 10.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.2041015625, -1.1682891845703125, -1.132476806640625, -1.0966644287109375, -1.06085205078125, -1.0250396728515625, -0.989227294921875, -0.9534149169921875, -0.9176025390625, -0.8817901611328125, -0.845977783203125, -0.8101654052734375, -0.77435302734375, -0.7385406494140625, -0.702728271484375, -0.6669158935546875, -0.631103515625, -0.5952911376953125, -0.559478759765625, -0.5236663818359375, -0.48785400390625, -0.4520416259765625, -0.416229248046875, -0.3804168701171875, -0.3446044921875, -0.3087921142578125, -0.272979736328125, -0.2371673583984375, -0.20135498046875, -0.1655426025390625, -0.129730224609375, -0.0939178466796875, -0.05810546875, -0.0222930908203125, 0.013519287109375, 0.0493316650390625, 0.08514404296875, 0.1209564208984375, 0.156768798828125, 0.1925811767578125, 0.2283935546875, 0.2642059326171875, 0.300018310546875, 0.3358306884765625, 0.37164306640625, 0.4074554443359375, 0.443267822265625, 0.4790802001953125, 0.514892578125, 0.5507049560546875, 0.586517333984375, 0.6223297119140625, 0.65814208984375, 0.6939544677734375, 0.729766845703125, 0.7655792236328125, 0.8013916015625, 0.8372039794921875, 0.873016357421875, 0.9088287353515625, 0.94464111328125, 0.9804534912109375, 1.016265869140625, 1.0520782470703125, 1.087890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 2.0, 2.0, 2.0, 10.0, 8.0, 12.0, 14.0, 16.0, 26.0, 48.0, 56.0, 66.0, 89.0, 98.0, 103.0, 102.0, 87.0, 74.0, 52.0, 32.0, 20.0, 27.0, 16.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013437271118164062, -0.0013077855110168457, -0.0012718439102172852, -0.0012359023094177246, -0.001199960708618164, -0.0011640191078186035, -0.001128077507019043, -0.0010921359062194824, -0.0010561943054199219, -0.0010202527046203613, -0.0009843111038208008, -0.0009483695030212402, -0.0009124279022216797, -0.0008764863014221191, -0.0008405447006225586, -0.000804603099822998, -0.0007686614990234375, -0.000732719898223877, -0.0006967782974243164, -0.0006608366966247559, -0.0006248950958251953, -0.0005889534950256348, -0.0005530118942260742, -0.0005170702934265137, -0.0004811286926269531, -0.0004451870918273926, -0.00040924549102783203, -0.0003733038902282715, -0.00033736228942871094, -0.0003014206886291504, -0.00026547908782958984, -0.0002295374870300293, -0.00019359588623046875, -0.0001576542854309082, -0.00012171268463134766, -8.577108383178711e-05, -4.982948303222656e-05, -1.3887882232666016e-05, 2.205371856689453e-05, 5.799531936645508e-05, 9.393692016601562e-05, 0.00012987852096557617, 0.00016582012176513672, 0.00020176172256469727, 0.0002377033233642578, 0.00027364492416381836, 0.0003095865249633789, 0.00034552812576293945, 0.0003814697265625, 0.00041741132736206055, 0.0004533529281616211, 0.0004892945289611816, 0.0005252361297607422, 0.0005611777305603027, 0.0005971193313598633, 0.0006330609321594238, 0.0006690025329589844, 0.0007049441337585449, 0.0007408857345581055, 0.000776827335357666, 0.0008127689361572266, 0.0008487105369567871, 0.0008846521377563477, 0.0009205937385559082, 0.0009565353393554688]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 10.0, 9.0, 12.0, 23.0, 24.0, 45.0, 73.0, 96.0, 198.0, 412.0, 2152.0, 1042495.0, 2058.0, 414.0, 200.0, 100.0, 67.0, 36.0, 33.0, 22.0, 12.0, 3.0, 11.0, 7.0, 6.0, 5.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02252197265625, -0.02173161506652832, -0.02094125747680664, -0.02015089988708496, -0.01936054229736328, -0.0185701847076416, -0.017779827117919922, -0.016989469528198242, -0.016199111938476562, -0.015408754348754883, -0.014618396759033203, -0.013828039169311523, -0.013037681579589844, -0.012247323989868164, -0.011456966400146484, -0.010666608810424805, -0.009876251220703125, -0.009085893630981445, -0.008295536041259766, -0.007505178451538086, -0.006714820861816406, -0.0059244632720947266, -0.005134105682373047, -0.004343748092651367, -0.0035533905029296875, -0.002763032913208008, -0.001972675323486328, -0.0011823177337646484, -0.00039196014404296875, 0.00039839744567871094, 0.0011887550354003906, 0.0019791126251220703, 0.00276947021484375, 0.0035598278045654297, 0.004350185394287109, 0.005140542984008789, 0.005930900573730469, 0.0067212581634521484, 0.007511615753173828, 0.008301973342895508, 0.009092330932617188, 0.009882688522338867, 0.010673046112060547, 0.011463403701782227, 0.012253761291503906, 0.013044118881225586, 0.013834476470947266, 0.014624834060668945, 0.015415191650390625, 0.016205549240112305, 0.016995906829833984, 0.017786264419555664, 0.018576622009277344, 0.019366979598999023, 0.020157337188720703, 0.020947694778442383, 0.021738052368164062, 0.022528409957885742, 0.023318767547607422, 0.0241091251373291, 0.02489948272705078, 0.02568984031677246, 0.02648019790649414, 0.02727055549621582, 0.0280609130859375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 41.0, 175.0, 409.0, 280.0, 89.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015047903871163726, -0.0014614592073485255, -0.0014181279111653566, -0.0013747967313975096, -0.0013314655516296625, -0.0012881343718618155, -0.0012448030756786466, -0.0012014718959107995, -0.0011581405997276306, -0.0011148094199597836, -0.0010714781237766147, -0.0010281469440087676, -0.0009848157642409205, -0.0009414845262654126, -0.0008981532882899046, -0.0008548221085220575, -0.0008114909287542105, -0.0007681596907787025, -0.0007248285110108554, -0.0006814972730353475, -0.0006381660932675004, -0.0005948348552919924, -0.0005515036173164845, -0.0005081724375486374, -0.0004648411995731294, -0.0004215099907014519, -0.0003781787818297744, -0.0003348475438542664, -0.0002915163349825889, -0.00024818512611091137, -0.0002048538881354034, -0.00016152267926372588, -0.00011819135397672653, -7.48601378290914e-05, -3.152892168145627e-05, 1.1802301742136478e-05, 5.5133510613813996e-05, 9.846471948549151e-05, 0.0001417959574609995, 0.000185127166332677, 0.00022845837520435452, 0.00027178958407603204, 0.00031512079294770956, 0.00035845203092321754, 0.00040178323979489505, 0.00044511444866657257, 0.0004884456866420805, 0.0005317769246175885, 0.0005751081043854356, 0.0006184393423609436, 0.0006617705221287906, 0.0007051017601042986, 0.0007484329398721457, 0.0007917641778476536, 0.0008350954158231616, 0.0008784265955910087, 0.0009217578335665166, 0.0009650890715420246, 0.0010084202513098717, 0.0010517514310777187, 0.0010950827272608876, 0.0011384139070287347, 0.0011817452032119036, 0.0012250763829797506, 0.0012684075627475977]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 5.0, 7.0, 8.0, 5.0, 12.0, 16.0, 13.0, 19.0, 21.0, 23.0, 25.0, 24.0, 30.0, 31.0, 37.0, 31.0, 38.0, 42.0, 30.0, 43.0, 34.0, 41.0, 56.0, 34.0, 34.0, 26.0, 32.0, 24.0, 28.0, 29.0, 18.0, 19.0, 22.0, 23.0, 10.0, 16.0, 11.0, 17.0, 8.0, 15.0, 10.0, 4.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00038868188858032227, -0.0003760606050491333, -0.00036343932151794434, -0.00035081803798675537, -0.0003381967544555664, -0.00032557547092437744, -0.0003129541873931885, -0.0003003329038619995, -0.00028771162033081055, -0.0002750903367996216, -0.0002624690532684326, -0.00024984776973724365, -0.0002372264862060547, -0.00022460520267486572, -0.00021198391914367676, -0.0001993626356124878, -0.00018674135208129883, -0.00017412006855010986, -0.0001614987850189209, -0.00014887750148773193, -0.00013625621795654297, -0.000123634934425354, -0.00011101365089416504, -9.839236736297607e-05, -8.577108383178711e-05, -7.314980030059814e-05, -6.052851676940918e-05, -4.7907233238220215e-05, -3.528594970703125e-05, -2.2664666175842285e-05, -1.004338264465332e-05, 2.5779008865356445e-06, 1.519918441772461e-05, 2.7820467948913574e-05, 4.044175148010254e-05, 5.3063035011291504e-05, 6.568431854248047e-05, 7.830560207366943e-05, 9.09268856048584e-05, 0.00010354816913604736, 0.00011616945266723633, 0.0001287907361984253, 0.00014141201972961426, 0.00015403330326080322, 0.0001666545867919922, 0.00017927587032318115, 0.00019189715385437012, 0.00020451843738555908, 0.00021713972091674805, 0.000229761004447937, 0.00024238228797912598, 0.00025500357151031494, 0.0002676248550415039, 0.00028024613857269287, 0.00029286742210388184, 0.0003054887056350708, 0.00031810998916625977, 0.00033073127269744873, 0.0003433525562286377, 0.00035597383975982666, 0.0003685951232910156, 0.0003812164068222046, 0.00039383769035339355, 0.0004064589738845825, 0.0004190802574157715]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 4.0, 8.0, 14.0, 6.0, 9.0, 8.0, 12.0, 17.0, 16.0, 27.0, 25.0, 32.0, 32.0, 25.0, 38.0, 36.0, 38.0, 35.0, 31.0, 47.0, 53.0, 45.0, 30.0, 33.0, 41.0, 36.0, 31.0, 34.0, 24.0, 27.0, 30.0, 19.0, 21.0, 16.0, 13.0, 14.0, 7.0, 8.0, 8.0, 8.0, 3.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.3828125, -5.216552734375, -5.05029296875, -4.884033203125, -4.7177734375, -4.551513671875, -4.38525390625, -4.218994140625, -4.052734375, -3.886474609375, -3.72021484375, -3.553955078125, -3.3876953125, -3.221435546875, -3.05517578125, -2.888916015625, -2.72265625, -2.556396484375, -2.39013671875, -2.223876953125, -2.0576171875, -1.891357421875, -1.72509765625, -1.558837890625, -1.392578125, -1.226318359375, -1.06005859375, -0.893798828125, -0.7275390625, -0.561279296875, -0.39501953125, -0.228759765625, -0.0625, 0.103759765625, 0.27001953125, 0.436279296875, 0.6025390625, 0.768798828125, 0.93505859375, 1.101318359375, 1.267578125, 1.433837890625, 1.60009765625, 1.766357421875, 1.9326171875, 2.098876953125, 2.26513671875, 2.431396484375, 2.59765625, 2.763916015625, 2.93017578125, 3.096435546875, 3.2626953125, 3.428955078125, 3.59521484375, 3.761474609375, 3.927734375, 4.093994140625, 4.26025390625, 4.426513671875, 4.5927734375, 4.759033203125, 4.92529296875, 5.091552734375, 5.2578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 7.0, 5.0, 5.0, 10.0, 14.0, 10.0, 17.0, 27.0, 30.0, 44.0, 68.0, 112.0, 143.0, 239.0, 349.0, 555.0, 969.0, 1670.0, 3303.0, 6719.0, 15321.0, 38271.0, 106269.0, 313499.0, 358642.0, 124488.0, 44438.0, 17422.0, 7574.0, 3608.0, 1888.0, 1050.0, 602.0, 387.0, 228.0, 175.0, 108.0, 88.0, 60.0, 34.0, 27.0, 15.0, 11.0, 22.0, 6.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0], "bins": [-4.14453125, -4.01531982421875, -3.8861083984375, -3.75689697265625, -3.627685546875, -3.49847412109375, -3.3692626953125, -3.24005126953125, -3.11083984375, -2.98162841796875, -2.8524169921875, -2.72320556640625, -2.593994140625, -2.46478271484375, -2.3355712890625, -2.20635986328125, -2.0771484375, -1.94793701171875, -1.8187255859375, -1.68951416015625, -1.560302734375, -1.43109130859375, -1.3018798828125, -1.17266845703125, -1.04345703125, -0.91424560546875, -0.7850341796875, -0.65582275390625, -0.526611328125, -0.39739990234375, -0.2681884765625, -0.13897705078125, -0.009765625, 0.11944580078125, 0.2486572265625, 0.37786865234375, 0.507080078125, 0.63629150390625, 0.7655029296875, 0.89471435546875, 1.02392578125, 1.15313720703125, 1.2823486328125, 1.41156005859375, 1.540771484375, 1.66998291015625, 1.7991943359375, 1.92840576171875, 2.0576171875, 2.18682861328125, 2.3160400390625, 2.44525146484375, 2.574462890625, 2.70367431640625, 2.8328857421875, 2.96209716796875, 3.09130859375, 3.22052001953125, 3.3497314453125, 3.47894287109375, 3.608154296875, 3.73736572265625, 3.8665771484375, 3.99578857421875, 4.125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 6.0, 4.0, 10.0, 8.0, 9.0, 16.0, 14.0, 16.0, 26.0, 16.0, 28.0, 32.0, 37.0, 33.0, 52.0, 54.0, 92.0, 179.0, 1771.0, 181.0, 69.0, 38.0, 43.0, 34.0, 44.0, 40.0, 30.0, 25.0, 20.0, 26.0, 18.0, 19.0, 12.0, 16.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.28125, -19.6376953125, -18.994140625, -18.3505859375, -17.70703125, -17.0634765625, -16.419921875, -15.7763671875, -15.1328125, -14.4892578125, -13.845703125, -13.2021484375, -12.55859375, -11.9150390625, -11.271484375, -10.6279296875, -9.984375, -9.3408203125, -8.697265625, -8.0537109375, -7.41015625, -6.7666015625, -6.123046875, -5.4794921875, -4.8359375, -4.1923828125, -3.548828125, -2.9052734375, -2.26171875, -1.6181640625, -0.974609375, -0.3310546875, 0.3125, 0.9560546875, 1.599609375, 2.2431640625, 2.88671875, 3.5302734375, 4.173828125, 4.8173828125, 5.4609375, 6.1044921875, 6.748046875, 7.3916015625, 8.03515625, 8.6787109375, 9.322265625, 9.9658203125, 10.609375, 11.2529296875, 11.896484375, 12.5400390625, 13.18359375, 13.8271484375, 14.470703125, 15.1142578125, 15.7578125, 16.4013671875, 17.044921875, 17.6884765625, 18.33203125, 18.9755859375, 19.619140625, 20.2626953125, 20.90625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 3.0, 4.0, 6.0, 10.0, 21.0, 13.0, 23.0, 19.0, 40.0, 33.0, 26.0, 55.0, 74.0, 115.0, 147.0, 237.0, 325.0, 772.0, 6548.0, 2970723.0, 162668.0, 2381.0, 537.0, 266.0, 174.0, 114.0, 81.0, 69.0, 43.0, 34.0, 33.0, 18.0, 15.0, 16.0, 13.0, 15.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -38.95458984375, -37.6904296875, -36.42626953125, -35.162109375, -33.89794921875, -32.6337890625, -31.36962890625, -30.10546875, -28.84130859375, -27.5771484375, -26.31298828125, -25.048828125, -23.78466796875, -22.5205078125, -21.25634765625, -19.9921875, -18.72802734375, -17.4638671875, -16.19970703125, -14.935546875, -13.67138671875, -12.4072265625, -11.14306640625, -9.87890625, -8.61474609375, -7.3505859375, -6.08642578125, -4.822265625, -3.55810546875, -2.2939453125, -1.02978515625, 0.234375, 1.49853515625, 2.7626953125, 4.02685546875, 5.291015625, 6.55517578125, 7.8193359375, 9.08349609375, 10.34765625, 11.61181640625, 12.8759765625, 14.14013671875, 15.404296875, 16.66845703125, 17.9326171875, 19.19677734375, 20.4609375, 21.72509765625, 22.9892578125, 24.25341796875, 25.517578125, 26.78173828125, 28.0458984375, 29.31005859375, 30.57421875, 31.83837890625, 33.1025390625, 34.36669921875, 35.630859375, 36.89501953125, 38.1591796875, 39.42333984375, 40.6875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 12.0, 44.0, 114.0, 278.0, 297.0, 170.0, 79.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.69017791748047, -69.30968475341797, -67.92918395996094, -66.54869079589844, -65.16819763183594, -63.78770065307617, -62.407203674316406, -61.026710510253906, -59.646217346191406, -58.26572036743164, -56.88522720336914, -55.504730224609375, -54.124237060546875, -52.74374008178711, -51.363243103027344, -49.982749938964844, -48.60225296020508, -47.22175598144531, -45.84126281738281, -44.46076583862305, -43.08027267456055, -41.69977569580078, -40.31928253173828, -38.938785552978516, -37.55828857421875, -36.177791595458984, -34.797298431396484, -33.41680145263672, -32.03630828857422, -30.655811309814453, -29.27531623840332, -27.894821166992188, -26.514328002929688, -25.133832931518555, -23.753337860107422, -22.372840881347656, -20.992347717285156, -19.61185073852539, -18.231355667114258, -16.850860595703125, -15.470365524291992, -14.08987045288086, -12.709375381469727, -11.328879356384277, -9.948384284973145, -8.567889213562012, -7.1873931884765625, -5.80689811706543, -4.426403045654297, -3.045907735824585, -1.665412425994873, -0.28491687774658203, 1.0955781936645508, 2.4760732650756836, 3.856569290161133, 5.237064361572266, 6.617559432983398, 7.998054504394531, 9.378549575805664, 10.759045600891113, 12.139540672302246, 13.520035743713379, 14.900531768798828, 16.28102684020996, 17.661521911621094]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 7.0, 9.0, 14.0, 15.0, 23.0, 16.0, 22.0, 18.0, 27.0, 20.0, 31.0, 36.0, 34.0, 43.0, 38.0, 47.0, 37.0, 51.0, 40.0, 35.0, 33.0, 40.0, 47.0, 30.0, 38.0, 33.0, 22.0, 28.0, 26.0, 19.0, 15.0, 21.0, 13.0, 13.0, 10.0, 7.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-43.83641815185547, -42.401363372802734, -40.96630859375, -39.53125, -38.096195220947266, -36.66114044189453, -35.22608184814453, -33.7910270690918, -32.35597229003906, -30.920917510986328, -29.48586082458496, -28.050804138183594, -26.61574935913086, -25.180694580078125, -23.745637893676758, -22.31058120727539, -20.875526428222656, -19.440471649169922, -18.005414962768555, -16.570358276367188, -15.135303497314453, -13.700247764587402, -12.265192031860352, -10.8301362991333, -9.39508056640625, -7.960024833679199, -6.524969100952148, -5.089913368225098, -3.654857635498047, -2.219801902770996, -0.7847461700439453, 0.6503095626831055, 2.085369110107422, 3.5204248428344727, 4.955480575561523, 6.390536308288574, 7.825592041015625, 9.260647773742676, 10.695703506469727, 12.130759239196777, 13.565814971923828, 15.000870704650879, 16.43592643737793, 17.870983123779297, 19.30603790283203, 20.741092681884766, 22.176149368286133, 23.6112060546875, 25.046260833740234, 26.48131561279297, 27.916372299194336, 29.351428985595703, 30.786483764648438, 32.22153854370117, 33.656593322753906, 35.091651916503906, 36.52670669555664, 37.961761474609375, 39.396820068359375, 40.83187484741211, 42.266929626464844, 43.70198440551758, 45.13703918457031, 46.57209777832031, 48.00715255737305]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 8.0, 6.0, 13.0, 7.0, 14.0, 14.0, 13.0, 16.0, 27.0, 30.0, 37.0, 22.0, 32.0, 39.0, 36.0, 36.0, 48.0, 37.0, 55.0, 34.0, 43.0, 36.0, 34.0, 42.0, 34.0, 25.0, 34.0, 31.0, 28.0, 22.0, 24.0, 14.0, 17.0, 11.0, 5.0, 10.0, 8.0, 10.0, 5.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.91015625, -5.7354736328125, -5.560791015625, -5.3861083984375, -5.21142578125, -5.0367431640625, -4.862060546875, -4.6873779296875, -4.5126953125, -4.3380126953125, -4.163330078125, -3.9886474609375, -3.81396484375, -3.6392822265625, -3.464599609375, -3.2899169921875, -3.115234375, -2.9405517578125, -2.765869140625, -2.5911865234375, -2.41650390625, -2.2418212890625, -2.067138671875, -1.8924560546875, -1.7177734375, -1.5430908203125, -1.368408203125, -1.1937255859375, -1.01904296875, -0.8443603515625, -0.669677734375, -0.4949951171875, -0.3203125, -0.1456298828125, 0.029052734375, 0.2037353515625, 0.37841796875, 0.5531005859375, 0.727783203125, 0.9024658203125, 1.0771484375, 1.2518310546875, 1.426513671875, 1.6011962890625, 1.77587890625, 1.9505615234375, 2.125244140625, 2.2999267578125, 2.474609375, 2.6492919921875, 2.823974609375, 2.9986572265625, 3.17333984375, 3.3480224609375, 3.522705078125, 3.6973876953125, 3.8720703125, 4.0467529296875, 4.221435546875, 4.3961181640625, 4.57080078125, 4.7454833984375, 4.920166015625, 5.0948486328125, 5.26953125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 9.0, 10.0, 4.0, 13.0, 17.0, 21.0, 22.0, 25.0, 38.0, 38.0, 59.0, 83.0, 101.0, 186.0, 409.0, 2530.0, 371033.0, 3785579.0, 32109.0, 1060.0, 285.0, 160.0, 108.0, 60.0, 39.0, 43.0, 34.0, 24.0, 32.0, 18.0, 19.0, 10.0, 8.0, 7.0, 11.0, 5.0, 10.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 5.0, 2.0, 0.0, 2.0, 1.0], "bins": [-33.21875, -32.221435546875, -31.22412109375, -30.226806640625, -29.2294921875, -28.232177734375, -27.23486328125, -26.237548828125, -25.240234375, -24.242919921875, -23.24560546875, -22.248291015625, -21.2509765625, -20.253662109375, -19.25634765625, -18.259033203125, -17.26171875, -16.264404296875, -15.26708984375, -14.269775390625, -13.2724609375, -12.275146484375, -11.27783203125, -10.280517578125, -9.283203125, -8.285888671875, -7.28857421875, -6.291259765625, -5.2939453125, -4.296630859375, -3.29931640625, -2.302001953125, -1.3046875, -0.307373046875, 0.68994140625, 1.687255859375, 2.6845703125, 3.681884765625, 4.67919921875, 5.676513671875, 6.673828125, 7.671142578125, 8.66845703125, 9.665771484375, 10.6630859375, 11.660400390625, 12.65771484375, 13.655029296875, 14.65234375, 15.649658203125, 16.64697265625, 17.644287109375, 18.6416015625, 19.638916015625, 20.63623046875, 21.633544921875, 22.630859375, 23.628173828125, 24.62548828125, 25.622802734375, 26.6201171875, 27.617431640625, 28.61474609375, 29.612060546875, 30.609375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 7.0, 23.0, 50.0, 101.0, 156.0, 295.0, 517.0, 823.0, 872.0, 551.0, 313.0, 179.0, 91.0, 49.0, 24.0, 13.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.625, -35.793701171875, -34.96240234375, -34.131103515625, -33.2998046875, -32.468505859375, -31.63720703125, -30.805908203125, -29.974609375, -29.143310546875, -28.31201171875, -27.480712890625, -26.6494140625, -25.818115234375, -24.98681640625, -24.155517578125, -23.32421875, -22.492919921875, -21.66162109375, -20.830322265625, -19.9990234375, -19.167724609375, -18.33642578125, -17.505126953125, -16.673828125, -15.842529296875, -15.01123046875, -14.179931640625, -13.3486328125, -12.517333984375, -11.68603515625, -10.854736328125, -10.0234375, -9.192138671875, -8.36083984375, -7.529541015625, -6.6982421875, -5.866943359375, -5.03564453125, -4.204345703125, -3.373046875, -2.541748046875, -1.71044921875, -0.879150390625, -0.0478515625, 0.783447265625, 1.61474609375, 2.446044921875, 3.27734375, 4.108642578125, 4.93994140625, 5.771240234375, 6.6025390625, 7.433837890625, 8.26513671875, 9.096435546875, 9.927734375, 10.759033203125, 11.59033203125, 12.421630859375, 13.2529296875, 14.084228515625, 14.91552734375, 15.746826171875, 16.578125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 9.0, 19.0, 38.0, 49.0, 90.0, 142.0, 254.0, 562.0, 1971.0, 4016367.0, 172659.0, 1095.0, 434.0, 248.0, 118.0, 93.0, 60.0, 27.0, 20.0, 10.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.1875, -93.697265625, -90.20703125, -86.716796875, -83.2265625, -79.736328125, -76.24609375, -72.755859375, -69.265625, -65.775390625, -62.28515625, -58.794921875, -55.3046875, -51.814453125, -48.32421875, -44.833984375, -41.34375, -37.853515625, -34.36328125, -30.873046875, -27.3828125, -23.892578125, -20.40234375, -16.912109375, -13.421875, -9.931640625, -6.44140625, -2.951171875, 0.5390625, 4.029296875, 7.51953125, 11.009765625, 14.5, 17.990234375, 21.48046875, 24.970703125, 28.4609375, 31.951171875, 35.44140625, 38.931640625, 42.421875, 45.912109375, 49.40234375, 52.892578125, 56.3828125, 59.873046875, 63.36328125, 66.853515625, 70.34375, 73.833984375, 77.32421875, 80.814453125, 84.3046875, 87.794921875, 91.28515625, 94.775390625, 98.265625, 101.755859375, 105.24609375, 108.736328125, 112.2265625, 115.716796875, 119.20703125, 122.697265625, 126.1875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 90.0, 259.0, 397.0, 225.0, 32.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.6233825683594, -267.1060791015625, -261.5887756347656, -256.07147216796875, -250.55416870117188, -245.036865234375, -239.51956176757812, -234.00225830078125, -228.48495483398438, -222.9676513671875, -217.45034790039062, -211.93304443359375, -206.41574096679688, -200.8984375, -195.38113403320312, -189.86383056640625, -184.34652709960938, -178.8292236328125, -173.31192016601562, -167.79461669921875, -162.27731323242188, -156.760009765625, -151.24270629882812, -145.72540283203125, -140.20811462402344, -134.69081115722656, -129.1735076904297, -123.65620422363281, -118.13890075683594, -112.62159729003906, -107.10429382324219, -101.58699035644531, -96.0696792602539, -90.55237579345703, -85.03507232666016, -79.51776885986328, -74.0004653930664, -68.48316192626953, -62.96586227416992, -57.44855880737305, -51.93125534057617, -46.4139518737793, -40.89664840698242, -35.37934875488281, -29.862043380737305, -24.34473991394043, -18.827438354492188, -13.310134887695312, -7.7928314208984375, -2.2755284309387207, 3.241774559020996, 8.759077072143555, 14.27638053894043, 19.793684005737305, 25.310985565185547, 30.828289031982422, 36.3455924987793, 41.86289596557617, 47.38019943237305, 52.897499084472656, 58.41480255126953, 63.932106018066406, 69.44940948486328, 74.96671295166016, 80.48401641845703]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 8.0, 2.0, 3.0, 3.0, 6.0, 11.0, 15.0, 14.0, 9.0, 18.0, 17.0, 19.0, 23.0, 18.0, 18.0, 27.0, 18.0, 32.0, 40.0, 28.0, 27.0, 34.0, 36.0, 33.0, 46.0, 40.0, 45.0, 46.0, 42.0, 37.0, 30.0, 31.0, 27.0, 21.0, 22.0, 27.0, 23.0, 18.0, 15.0, 16.0, 14.0, 10.0, 8.0, 4.0, 11.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-43.35927963256836, -42.06420135498047, -40.769126892089844, -39.47405242919922, -38.17897415161133, -36.88389587402344, -35.58882141113281, -34.29374694824219, -32.9986686706543, -31.70359230041504, -30.40851593017578, -29.113439559936523, -27.818363189697266, -26.523286819458008, -25.22821044921875, -23.933134078979492, -22.638057708740234, -21.342981338500977, -20.04790496826172, -18.75282859802246, -17.457752227783203, -16.162675857543945, -14.867599487304688, -13.57252311706543, -12.277446746826172, -10.982370376586914, -9.687294006347656, -8.392217636108398, -7.097141265869141, -5.802064895629883, -4.506988525390625, -3.211912155151367, -1.916839599609375, -0.6217632293701172, 0.6733131408691406, 1.9683895111083984, 3.2634658813476562, 4.558542251586914, 5.853618621826172, 7.14869499206543, 8.443771362304688, 9.738847732543945, 11.033924102783203, 12.329000473022461, 13.624076843261719, 14.919153213500977, 16.214229583740234, 17.509305953979492, 18.80438232421875, 20.099458694458008, 21.394535064697266, 22.689611434936523, 23.98468780517578, 25.27976417541504, 26.574840545654297, 27.869916915893555, 29.164993286132812, 30.46006965637207, 31.755146026611328, 33.05022430419922, 34.345298767089844, 35.64037322998047, 36.93545150756836, 38.23052978515625, 39.525604248046875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 12.0, 11.0, 10.0, 7.0, 6.0, 17.0, 16.0, 16.0, 20.0, 23.0, 22.0, 35.0, 40.0, 35.0, 28.0, 34.0, 48.0, 48.0, 48.0, 37.0, 50.0, 49.0, 42.0, 28.0, 47.0, 34.0, 32.0, 25.0, 34.0, 18.0, 17.0, 23.0, 13.0, 11.0, 12.0, 9.0, 8.0, 7.0, 3.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.70703125, -5.52484130859375, -5.3426513671875, -5.16046142578125, -4.978271484375, -4.79608154296875, -4.6138916015625, -4.43170166015625, -4.24951171875, -4.06732177734375, -3.8851318359375, -3.70294189453125, -3.520751953125, -3.33856201171875, -3.1563720703125, -2.97418212890625, -2.7919921875, -2.60980224609375, -2.4276123046875, -2.24542236328125, -2.063232421875, -1.88104248046875, -1.6988525390625, -1.51666259765625, -1.33447265625, -1.15228271484375, -0.9700927734375, -0.78790283203125, -0.605712890625, -0.42352294921875, -0.2413330078125, -0.05914306640625, 0.123046875, 0.30523681640625, 0.4874267578125, 0.66961669921875, 0.851806640625, 1.03399658203125, 1.2161865234375, 1.39837646484375, 1.58056640625, 1.76275634765625, 1.9449462890625, 2.12713623046875, 2.309326171875, 2.49151611328125, 2.6737060546875, 2.85589599609375, 3.0380859375, 3.22027587890625, 3.4024658203125, 3.58465576171875, 3.766845703125, 3.94903564453125, 4.1312255859375, 4.31341552734375, 4.49560546875, 4.67779541015625, 4.8599853515625, 5.04217529296875, 5.224365234375, 5.40655517578125, 5.5887451171875, 5.77093505859375, 5.953125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 12.0, 21.0, 31.0, 27.0, 51.0, 55.0, 107.0, 121.0, 193.0, 260.0, 365.0, 528.0, 719.0, 1071.0, 1422.0, 2157.0, 3013.0, 4061.0, 5880.0, 8492.0, 12240.0, 18285.0, 27879.0, 42395.0, 69504.0, 126402.0, 304391.0, 178194.0, 86608.0, 52057.0, 32929.0, 21592.0, 14492.0, 9831.0, 6831.0, 4828.0, 3311.0, 2337.0, 1646.0, 1172.0, 864.0, 642.0, 440.0, 339.0, 239.0, 173.0, 101.0, 71.0, 52.0, 43.0, 25.0, 21.0, 17.0, 6.0, 3.0, 5.0, 2.0, 1.0], "bins": [-1.064453125, -1.0319061279296875, -0.999359130859375, -0.9668121337890625, -0.93426513671875, -0.9017181396484375, -0.869171142578125, -0.8366241455078125, -0.8040771484375, -0.7715301513671875, -0.738983154296875, -0.7064361572265625, -0.67388916015625, -0.6413421630859375, -0.608795166015625, -0.5762481689453125, -0.543701171875, -0.5111541748046875, -0.478607177734375, -0.4460601806640625, -0.41351318359375, -0.3809661865234375, -0.348419189453125, -0.3158721923828125, -0.2833251953125, -0.2507781982421875, -0.218231201171875, -0.1856842041015625, -0.15313720703125, -0.1205902099609375, -0.088043212890625, -0.0554962158203125, -0.02294921875, 0.0095977783203125, 0.042144775390625, 0.0746917724609375, 0.10723876953125, 0.1397857666015625, 0.172332763671875, 0.2048797607421875, 0.2374267578125, 0.2699737548828125, 0.302520751953125, 0.3350677490234375, 0.36761474609375, 0.4001617431640625, 0.432708740234375, 0.4652557373046875, 0.497802734375, 0.5303497314453125, 0.562896728515625, 0.5954437255859375, 0.62799072265625, 0.6605377197265625, 0.693084716796875, 0.7256317138671875, 0.7581787109375, 0.7907257080078125, 0.823272705078125, 0.8558197021484375, 0.88836669921875, 0.9209136962890625, 0.953460693359375, 0.9860076904296875, 1.0185546875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 7.0, 7.0, 8.0, 12.0, 14.0, 15.0, 11.0, 18.0, 14.0, 22.0, 18.0, 22.0, 35.0, 29.0, 34.0, 39.0, 36.0, 41.0, 41.0, 41.0, 1080.0, 35.0, 30.0, 35.0, 34.0, 31.0, 32.0, 34.0, 38.0, 20.0, 28.0, 26.0, 20.0, 15.0, 24.0, 18.0, 11.0, 12.0, 6.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.353515625, -3.244903564453125, -3.13629150390625, -3.027679443359375, -2.9190673828125, -2.810455322265625, -2.70184326171875, -2.593231201171875, -2.484619140625, -2.376007080078125, -2.26739501953125, -2.158782958984375, -2.0501708984375, -1.941558837890625, -1.83294677734375, -1.724334716796875, -1.61572265625, -1.507110595703125, -1.39849853515625, -1.289886474609375, -1.1812744140625, -1.072662353515625, -0.96405029296875, -0.855438232421875, -0.746826171875, -0.638214111328125, -0.52960205078125, -0.420989990234375, -0.3123779296875, -0.203765869140625, -0.09515380859375, 0.013458251953125, 0.1220703125, 0.230682373046875, 0.33929443359375, 0.447906494140625, 0.5565185546875, 0.665130615234375, 0.77374267578125, 0.882354736328125, 0.990966796875, 1.099578857421875, 1.20819091796875, 1.316802978515625, 1.4254150390625, 1.534027099609375, 1.64263916015625, 1.751251220703125, 1.85986328125, 1.968475341796875, 2.07708740234375, 2.185699462890625, 2.2943115234375, 2.402923583984375, 2.51153564453125, 2.620147705078125, 2.728759765625, 2.837371826171875, 2.94598388671875, 3.054595947265625, 3.1632080078125, 3.271820068359375, 3.38043212890625, 3.489044189453125, 3.59765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 12.0, 10.0, 16.0, 36.0, 33.0, 63.0, 74.0, 139.0, 184.0, 293.0, 453.0, 703.0, 1070.0, 1664.0, 2605.0, 4160.0, 6495.0, 10436.0, 16651.0, 26987.0, 45913.0, 82725.0, 182324.0, 1418716.0, 130575.0, 65891.0, 37874.0, 22658.0, 14138.0, 8893.0, 5612.0, 3452.0, 2215.0, 1391.0, 908.0, 580.0, 395.0, 264.0, 164.0, 113.0, 82.0, 50.0, 36.0, 27.0, 16.0, 13.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2685546875, -1.2304840087890625, -1.192413330078125, -1.1543426513671875, -1.11627197265625, -1.0782012939453125, -1.040130615234375, -1.0020599365234375, -0.9639892578125, -0.9259185791015625, -0.887847900390625, -0.8497772216796875, -0.81170654296875, -0.7736358642578125, -0.735565185546875, -0.6974945068359375, -0.659423828125, -0.6213531494140625, -0.583282470703125, -0.5452117919921875, -0.50714111328125, -0.4690704345703125, -0.430999755859375, -0.3929290771484375, -0.3548583984375, -0.3167877197265625, -0.278717041015625, -0.2406463623046875, -0.20257568359375, -0.1645050048828125, -0.126434326171875, -0.0883636474609375, -0.05029296875, -0.0122222900390625, 0.025848388671875, 0.0639190673828125, 0.10198974609375, 0.1400604248046875, 0.178131103515625, 0.2162017822265625, 0.2542724609375, 0.2923431396484375, 0.330413818359375, 0.3684844970703125, 0.40655517578125, 0.4446258544921875, 0.482696533203125, 0.5207672119140625, 0.558837890625, 0.5969085693359375, 0.634979248046875, 0.6730499267578125, 0.71112060546875, 0.7491912841796875, 0.787261962890625, 0.8253326416015625, 0.8634033203125, 0.9014739990234375, 0.939544677734375, 0.9776153564453125, 1.01568603515625, 1.0537567138671875, 1.091827392578125, 1.1298980712890625, 1.16796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 7.0, 6.0, 2.0, 15.0, 13.0, 17.0, 13.0, 12.0, 27.0, 39.0, 36.0, 39.0, 45.0, 56.0, 75.0, 70.0, 81.0, 69.0, 64.0, 58.0, 40.0, 41.0, 25.0, 36.0, 22.0, 30.0, 10.0, 8.0, 9.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0007328987121582031, -0.0007079541683197021, -0.0006830096244812012, -0.0006580650806427002, -0.0006331205368041992, -0.0006081759929656982, -0.0005832314491271973, -0.0005582869052886963, -0.0005333423614501953, -0.0005083978176116943, -0.00048345327377319336, -0.0004585087299346924, -0.0004335641860961914, -0.00040861964225769043, -0.00038367509841918945, -0.0003587305545806885, -0.0003337860107421875, -0.0003088414669036865, -0.00028389692306518555, -0.00025895237922668457, -0.0002340078353881836, -0.00020906329154968262, -0.00018411874771118164, -0.00015917420387268066, -0.0001342296600341797, -0.00010928511619567871, -8.434057235717773e-05, -5.939602851867676e-05, -3.445148468017578e-05, -9.506940841674805e-06, 1.5437602996826172e-05, 4.038214683532715e-05, 6.532669067382812e-05, 9.02712345123291e-05, 0.00011521577835083008, 0.00014016032218933105, 0.00016510486602783203, 0.000190049409866333, 0.00021499395370483398, 0.00023993849754333496, 0.00026488304138183594, 0.0002898275852203369, 0.0003147721290588379, 0.00033971667289733887, 0.00036466121673583984, 0.0003896057605743408, 0.0004145503044128418, 0.0004394948482513428, 0.00046443939208984375, 0.0004893839359283447, 0.0005143284797668457, 0.0005392730236053467, 0.0005642175674438477, 0.0005891621112823486, 0.0006141066551208496, 0.0006390511989593506, 0.0006639957427978516, 0.0006889402866363525, 0.0007138848304748535, 0.0007388293743133545, 0.0007637739181518555, 0.0007887184619903564, 0.0008136630058288574, 0.0008386075496673584, 0.0008635520935058594]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 7.0, 7.0, 6.0, 10.0, 17.0, 18.0, 26.0, 28.0, 53.0, 67.0, 95.0, 196.0, 389.0, 1143.0, 429043.0, 615341.0, 1138.0, 393.0, 180.0, 107.0, 72.0, 49.0, 29.0, 22.0, 26.0, 19.0, 14.0, 6.0, 5.0, 9.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.019927978515625, -0.01934218406677246, -0.018756389617919922, -0.018170595169067383, -0.017584800720214844, -0.016999006271362305, -0.016413211822509766, -0.015827417373657227, -0.015241622924804688, -0.014655828475952148, -0.01407003402709961, -0.01348423957824707, -0.012898445129394531, -0.012312650680541992, -0.011726856231689453, -0.011141061782836914, -0.010555267333984375, -0.009969472885131836, -0.009383678436279297, -0.008797883987426758, -0.008212089538574219, -0.00762629508972168, -0.007040500640869141, -0.0064547061920166016, -0.0058689117431640625, -0.0052831172943115234, -0.004697322845458984, -0.004111528396606445, -0.0035257339477539062, -0.002939939498901367, -0.002354145050048828, -0.001768350601196289, -0.00118255615234375, -0.0005967617034912109, -1.0967254638671875e-05, 0.0005748271942138672, 0.0011606216430664062, 0.0017464160919189453, 0.0023322105407714844, 0.0029180049896240234, 0.0035037994384765625, 0.0040895938873291016, 0.004675388336181641, 0.00526118278503418, 0.005846977233886719, 0.006432771682739258, 0.007018566131591797, 0.007604360580444336, 0.008190155029296875, 0.008775949478149414, 0.009361743927001953, 0.009947538375854492, 0.010533332824707031, 0.01111912727355957, 0.01170492172241211, 0.012290716171264648, 0.012876510620117188, 0.013462305068969727, 0.014048099517822266, 0.014633893966674805, 0.015219688415527344, 0.015805482864379883, 0.016391277313232422, 0.01697707176208496, 0.0175628662109375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 30.0, 129.0, 293.0, 324.0, 163.0, 54.0, 14.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008617144194431603, -0.0008229134255088866, -0.0007841124897822738, -0.000745311495848, -0.0007065105019137263, -0.0006677095079794526, -0.0006289085140451789, -0.0005901075783185661, -0.0005513065843842924, -0.0005125055904500186, -0.0004737046256195754, -0.0004349036607891321, -0.0003961026668548584, -0.0003573016729205847, -0.0003185007080901414, -0.00027969974325969815, -0.00024089874932542443, -0.00020209776994306594, -0.00016329679056070745, -0.00012449581117834896, -8.569483179599047e-05, -4.6893852413631976e-05, -8.092873031273484e-06, 3.070809179916978e-05, 6.95090857334435e-05, 0.00010831006511580199, 0.00014711104449816048, 0.00018591202388051897, 0.00022471300326287746, 0.0002635139971971512, 0.00030231496202759445, 0.0003411159268580377, 0.00037991697899997234, 0.00041871797293424606, 0.0004575189377646893, 0.0004963199025951326, 0.0005351208965294063, 0.00057392189046368, 0.0006127228261902928, 0.0006515238201245666, 0.0006903248140588403, 0.000729125807993114, 0.0007679268019273877, 0.0008067277376540005, 0.0008455287315882742, 0.000884329725522548, 0.0009231306612491608, 0.0009619316551834345, 0.0010007326491177082, 0.001039533643051982, 0.0010783346369862556, 0.0011171356309205294, 0.001155936624854803, 0.001194737502373755, 0.0012335384963080287, 0.0012723394902423024, 0.0013111404841765761, 0.0013499414781108499, 0.0013887424720451236, 0.0014275434659793973, 0.0014663443434983492, 0.001505145337432623, 0.0015439463313668966, 0.0015827473253011703, 0.001621548319235444]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 15.0, 11.0, 13.0, 15.0, 18.0, 18.0, 21.0, 22.0, 28.0, 34.0, 31.0, 43.0, 50.0, 47.0, 42.0, 40.0, 34.0, 39.0, 31.0, 47.0, 32.0, 38.0, 28.0, 34.0, 34.0, 18.0, 24.0, 22.0, 28.0, 12.0, 20.0, 15.0, 15.0, 12.0, 7.0, 5.0, 3.0, 9.0, 3.0, 0.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0003362894058227539, -0.000324886292219162, -0.00031348317861557007, -0.00030208006501197815, -0.00029067695140838623, -0.0002792738378047943, -0.0002678707242012024, -0.0002564676105976105, -0.00024506449699401855, -0.00023366138339042664, -0.00022225826978683472, -0.0002108551561832428, -0.00019945204257965088, -0.00018804892897605896, -0.00017664581537246704, -0.00016524270176887512, -0.0001538395881652832, -0.00014243647456169128, -0.00013103336095809937, -0.00011963024735450745, -0.00010822713375091553, -9.682402014732361e-05, -8.542090654373169e-05, -7.401779294013977e-05, -6.261467933654785e-05, -5.121156573295593e-05, -3.9808452129364014e-05, -2.8405338525772095e-05, -1.7002224922180176e-05, -5.599111318588257e-06, 5.804002285003662e-06, 1.720711588859558e-05, 2.86102294921875e-05, 4.001334309577942e-05, 5.141645669937134e-05, 6.281957030296326e-05, 7.422268390655518e-05, 8.56257975101471e-05, 9.702891111373901e-05, 0.00010843202471733093, 0.00011983513832092285, 0.00013123825192451477, 0.0001426413655281067, 0.0001540444791316986, 0.00016544759273529053, 0.00017685070633888245, 0.00018825381994247437, 0.00019965693354606628, 0.0002110600471496582, 0.00022246316075325012, 0.00023386627435684204, 0.00024526938796043396, 0.0002566725015640259, 0.0002680756151676178, 0.0002794787287712097, 0.00029088184237480164, 0.00030228495597839355, 0.0003136880695819855, 0.0003250911831855774, 0.0003364942967891693, 0.00034789741039276123, 0.00035930052399635315, 0.00037070363759994507, 0.000382106751203537, 0.0003935098648071289]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 12.0, 11.0, 10.0, 7.0, 6.0, 17.0, 16.0, 16.0, 20.0, 23.0, 22.0, 35.0, 40.0, 35.0, 28.0, 34.0, 48.0, 48.0, 48.0, 37.0, 50.0, 49.0, 42.0, 28.0, 47.0, 34.0, 32.0, 25.0, 34.0, 18.0, 17.0, 23.0, 13.0, 11.0, 12.0, 9.0, 8.0, 7.0, 3.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.70703125, -5.52484130859375, -5.3426513671875, -5.16046142578125, -4.978271484375, -4.79608154296875, -4.6138916015625, -4.43170166015625, -4.24951171875, -4.06732177734375, -3.8851318359375, -3.70294189453125, -3.520751953125, -3.33856201171875, -3.1563720703125, -2.97418212890625, -2.7919921875, -2.60980224609375, -2.4276123046875, -2.24542236328125, -2.063232421875, -1.88104248046875, -1.6988525390625, -1.51666259765625, -1.33447265625, -1.15228271484375, -0.9700927734375, -0.78790283203125, -0.605712890625, -0.42352294921875, -0.2413330078125, -0.05914306640625, 0.123046875, 0.30523681640625, 0.4874267578125, 0.66961669921875, 0.851806640625, 1.03399658203125, 1.2161865234375, 1.39837646484375, 1.58056640625, 1.76275634765625, 1.9449462890625, 2.12713623046875, 2.309326171875, 2.49151611328125, 2.6737060546875, 2.85589599609375, 3.0380859375, 3.22027587890625, 3.4024658203125, 3.58465576171875, 3.766845703125, 3.94903564453125, 4.1312255859375, 4.31341552734375, 4.49560546875, 4.67779541015625, 4.8599853515625, 5.04217529296875, 5.224365234375, 5.40655517578125, 5.5887451171875, 5.77093505859375, 5.953125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 6.0, 13.0, 10.0, 24.0, 34.0, 47.0, 91.0, 105.0, 205.0, 362.0, 545.0, 1018.0, 1673.0, 2956.0, 5309.0, 9446.0, 17809.0, 35583.0, 78999.0, 214480.0, 400945.0, 155878.0, 61178.0, 28509.0, 14819.0, 7982.0, 4329.0, 2591.0, 1423.0, 886.0, 472.0, 314.0, 178.0, 129.0, 84.0, 37.0, 21.0, 20.0, 11.0, 10.0, 13.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.05859375, -3.94378662109375, -3.8289794921875, -3.71417236328125, -3.599365234375, -3.48455810546875, -3.3697509765625, -3.25494384765625, -3.14013671875, -3.02532958984375, -2.9105224609375, -2.79571533203125, -2.680908203125, -2.56610107421875, -2.4512939453125, -2.33648681640625, -2.2216796875, -2.10687255859375, -1.9920654296875, -1.87725830078125, -1.762451171875, -1.64764404296875, -1.5328369140625, -1.41802978515625, -1.30322265625, -1.18841552734375, -1.0736083984375, -0.95880126953125, -0.843994140625, -0.72918701171875, -0.6143798828125, -0.49957275390625, -0.384765625, -0.26995849609375, -0.1551513671875, -0.04034423828125, 0.074462890625, 0.18927001953125, 0.3040771484375, 0.41888427734375, 0.53369140625, 0.64849853515625, 0.7633056640625, 0.87811279296875, 0.992919921875, 1.10772705078125, 1.2225341796875, 1.33734130859375, 1.4521484375, 1.56695556640625, 1.6817626953125, 1.79656982421875, 1.911376953125, 2.02618408203125, 2.1409912109375, 2.25579833984375, 2.37060546875, 2.48541259765625, 2.6002197265625, 2.71502685546875, 2.829833984375, 2.94464111328125, 3.0594482421875, 3.17425537109375, 3.2890625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 5.0, 9.0, 8.0, 7.0, 15.0, 12.0, 20.0, 16.0, 23.0, 13.0, 25.0, 38.0, 30.0, 30.0, 40.0, 38.0, 41.0, 38.0, 76.0, 207.0, 1709.0, 140.0, 65.0, 49.0, 48.0, 29.0, 37.0, 32.0, 25.0, 36.0, 28.0, 23.0, 17.0, 16.0, 14.0, 17.0, 11.0, 15.0, 13.0, 10.0, 8.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.203125, -17.62353515625, -17.0439453125, -16.46435546875, -15.884765625, -15.30517578125, -14.7255859375, -14.14599609375, -13.56640625, -12.98681640625, -12.4072265625, -11.82763671875, -11.248046875, -10.66845703125, -10.0888671875, -9.50927734375, -8.9296875, -8.35009765625, -7.7705078125, -7.19091796875, -6.611328125, -6.03173828125, -5.4521484375, -4.87255859375, -4.29296875, -3.71337890625, -3.1337890625, -2.55419921875, -1.974609375, -1.39501953125, -0.8154296875, -0.23583984375, 0.34375, 0.92333984375, 1.5029296875, 2.08251953125, 2.662109375, 3.24169921875, 3.8212890625, 4.40087890625, 4.98046875, 5.56005859375, 6.1396484375, 6.71923828125, 7.298828125, 7.87841796875, 8.4580078125, 9.03759765625, 9.6171875, 10.19677734375, 10.7763671875, 11.35595703125, 11.935546875, 12.51513671875, 13.0947265625, 13.67431640625, 14.25390625, 14.83349609375, 15.4130859375, 15.99267578125, 16.572265625, 17.15185546875, 17.7314453125, 18.31103515625, 18.890625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 4.0, 13.0, 24.0, 41.0, 61.0, 66.0, 104.0, 181.0, 346.0, 914.0, 33981.0, 3105784.0, 2986.0, 534.0, 276.0, 125.0, 79.0, 56.0, 34.0, 30.0, 13.0, 16.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-85.6875, -83.2578125, -80.828125, -78.3984375, -75.96875, -73.5390625, -71.109375, -68.6796875, -66.25, -63.8203125, -61.390625, -58.9609375, -56.53125, -54.1015625, -51.671875, -49.2421875, -46.8125, -44.3828125, -41.953125, -39.5234375, -37.09375, -34.6640625, -32.234375, -29.8046875, -27.375, -24.9453125, -22.515625, -20.0859375, -17.65625, -15.2265625, -12.796875, -10.3671875, -7.9375, -5.5078125, -3.078125, -0.6484375, 1.78125, 4.2109375, 6.640625, 9.0703125, 11.5, 13.9296875, 16.359375, 18.7890625, 21.21875, 23.6484375, 26.078125, 28.5078125, 30.9375, 33.3671875, 35.796875, 38.2265625, 40.65625, 43.0859375, 45.515625, 47.9453125, 50.375, 52.8046875, 55.234375, 57.6640625, 60.09375, 62.5234375, 64.953125, 67.3828125, 69.8125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 751.0, 259.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-352.3639221191406, -345.4296569824219, -338.49542236328125, -331.5611572265625, -324.6269226074219, -317.6926574707031, -310.7584228515625, -303.82415771484375, -296.8899230957031, -289.9556579589844, -283.02142333984375, -276.087158203125, -269.1529235839844, -262.2186584472656, -255.284423828125, -248.35015869140625, -241.41590881347656, -234.48165893554688, -227.5474090576172, -220.6131591796875, -213.6789093017578, -206.74465942382812, -199.81039428710938, -192.87615966796875, -185.94189453125, -179.0076446533203, -172.07339477539062, -165.13914489746094, -158.20489501953125, -151.27064514160156, -144.33639526367188, -137.40213012695312, -130.46791076660156, -123.53366088867188, -116.59941101074219, -109.6651611328125, -102.73091125488281, -95.79666137695312, -88.8624038696289, -81.92815399169922, -74.99390411376953, -68.05965423583984, -61.125404357910156, -54.1911506652832, -47.256900787353516, -40.32265090942383, -33.388397216796875, -26.454147338867188, -19.5198974609375, -12.585646629333496, -5.651395797729492, 1.2828559875488281, 8.217105865478516, 15.151355743408203, 22.085609436035156, 29.019859313964844, 35.95410919189453, 42.88835906982422, 49.822608947753906, 56.75686264038086, 63.69111251831055, 70.6253662109375, 77.55961608886719, 84.49386596679688, 91.42811584472656]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 11.0, 8.0, 15.0, 22.0, 22.0, 32.0, 36.0, 28.0, 30.0, 39.0, 33.0, 41.0, 40.0, 29.0, 44.0, 39.0, 42.0, 46.0, 40.0, 43.0, 35.0, 39.0, 32.0, 24.0, 37.0, 32.0, 27.0, 24.0, 19.0, 20.0, 16.0, 8.0, 6.0, 7.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.190879821777344, -55.32159423828125, -53.45230484008789, -51.5830192565918, -49.71372985839844, -47.844444274902344, -45.97515869140625, -44.10586929321289, -42.23657989501953, -40.36729431152344, -38.49800491333008, -36.628719329833984, -34.759429931640625, -32.89014434814453, -31.020856857299805, -29.151569366455078, -27.282283782958984, -25.412996292114258, -23.54370880126953, -21.674423217773438, -19.805133819580078, -17.935848236083984, -16.066560745239258, -14.197273254394531, -12.327985763549805, -10.458698272705078, -8.589410781860352, -6.720124244689941, -4.850836753845215, -2.9815492630004883, -1.1122627258300781, 0.7570247650146484, 2.6263160705566406, 4.495603561401367, 6.3648905754089355, 8.234177589416504, 10.10346508026123, 11.972752571105957, 13.842039108276367, 15.711326599121094, 17.58061408996582, 19.449901580810547, 21.319189071655273, 23.1884765625, 25.057762145996094, 26.927051544189453, 28.796337127685547, 30.665624618530273, 32.534912109375, 34.404197692871094, 36.27348709106445, 38.14277267456055, 40.012062072753906, 41.88134765625, 43.750633239746094, 45.61992263793945, 47.48921203613281, 49.358497619628906, 51.227787017822266, 53.09707260131836, 54.96636199951172, 56.83564758300781, 58.704933166503906, 60.574222564697266, 62.44350814819336]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 8.0, 13.0, 7.0, 5.0, 8.0, 17.0, 12.0, 17.0, 17.0, 19.0, 27.0, 23.0, 33.0, 36.0, 31.0, 32.0, 38.0, 53.0, 54.0, 43.0, 37.0, 46.0, 43.0, 43.0, 38.0, 31.0, 42.0, 33.0, 27.0, 21.0, 18.0, 20.0, 24.0, 8.0, 13.0, 16.0, 8.0, 5.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.8671875, -5.6787109375, -5.490234375, -5.3017578125, -5.11328125, -4.9248046875, -4.736328125, -4.5478515625, -4.359375, -4.1708984375, -3.982421875, -3.7939453125, -3.60546875, -3.4169921875, -3.228515625, -3.0400390625, -2.8515625, -2.6630859375, -2.474609375, -2.2861328125, -2.09765625, -1.9091796875, -1.720703125, -1.5322265625, -1.34375, -1.1552734375, -0.966796875, -0.7783203125, -0.58984375, -0.4013671875, -0.212890625, -0.0244140625, 0.1640625, 0.3525390625, 0.541015625, 0.7294921875, 0.91796875, 1.1064453125, 1.294921875, 1.4833984375, 1.671875, 1.8603515625, 2.048828125, 2.2373046875, 2.42578125, 2.6142578125, 2.802734375, 2.9912109375, 3.1796875, 3.3681640625, 3.556640625, 3.7451171875, 3.93359375, 4.1220703125, 4.310546875, 4.4990234375, 4.6875, 4.8759765625, 5.064453125, 5.2529296875, 5.44140625, 5.6298828125, 5.818359375, 6.0068359375, 6.1953125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 13.0, 9.0, 22.0, 20.0, 29.0, 39.0, 35.0, 43.0, 66.0, 79.0, 111.0, 171.0, 244.0, 428.0, 808.0, 1902.0, 5651.0, 22898.0, 126413.0, 685004.0, 1870659.0, 1171653.0, 251237.0, 41704.0, 9314.0, 2931.0, 1175.0, 576.0, 308.0, 175.0, 126.0, 94.0, 58.0, 55.0, 57.0, 34.0, 23.0, 22.0, 19.0, 22.0, 10.0, 5.0, 6.0, 6.0, 3.0, 1.0, 8.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.703125, -7.4346923828125, -7.166259765625, -6.8978271484375, -6.62939453125, -6.3609619140625, -6.092529296875, -5.8240966796875, -5.5556640625, -5.2872314453125, -5.018798828125, -4.7503662109375, -4.48193359375, -4.2135009765625, -3.945068359375, -3.6766357421875, -3.408203125, -3.1397705078125, -2.871337890625, -2.6029052734375, -2.33447265625, -2.0660400390625, -1.797607421875, -1.5291748046875, -1.2607421875, -0.9923095703125, -0.723876953125, -0.4554443359375, -0.18701171875, 0.0814208984375, 0.349853515625, 0.6182861328125, 0.88671875, 1.1551513671875, 1.423583984375, 1.6920166015625, 1.96044921875, 2.2288818359375, 2.497314453125, 2.7657470703125, 3.0341796875, 3.3026123046875, 3.571044921875, 3.8394775390625, 4.10791015625, 4.3763427734375, 4.644775390625, 4.9132080078125, 5.181640625, 5.4500732421875, 5.718505859375, 5.9869384765625, 6.25537109375, 6.5238037109375, 6.792236328125, 7.0606689453125, 7.3291015625, 7.5975341796875, 7.865966796875, 8.1343994140625, 8.40283203125, 8.6712646484375, 8.939697265625, 9.2081298828125, 9.4765625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 14.0, 11.0, 18.0, 30.0, 50.0, 60.0, 75.0, 93.0, 150.0, 244.0, 320.0, 499.0, 563.0, 538.0, 434.0, 294.0, 207.0, 153.0, 97.0, 65.0, 47.0, 34.0, 17.0, 21.0, 10.0, 6.0, 9.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -11.9688720703125, -11.445556640625, -10.9222412109375, -10.39892578125, -9.8756103515625, -9.352294921875, -8.8289794921875, -8.3056640625, -7.7823486328125, -7.259033203125, -6.7357177734375, -6.21240234375, -5.6890869140625, -5.165771484375, -4.6424560546875, -4.119140625, -3.5958251953125, -3.072509765625, -2.5491943359375, -2.02587890625, -1.5025634765625, -0.979248046875, -0.4559326171875, 0.0673828125, 0.5906982421875, 1.114013671875, 1.6373291015625, 2.16064453125, 2.6839599609375, 3.207275390625, 3.7305908203125, 4.25390625, 4.7772216796875, 5.300537109375, 5.8238525390625, 6.34716796875, 6.8704833984375, 7.393798828125, 7.9171142578125, 8.4404296875, 8.9637451171875, 9.487060546875, 10.0103759765625, 10.53369140625, 11.0570068359375, 11.580322265625, 12.1036376953125, 12.626953125, 13.1502685546875, 13.673583984375, 14.1968994140625, 14.72021484375, 15.2435302734375, 15.766845703125, 16.2901611328125, 16.8134765625, 17.3367919921875, 17.860107421875, 18.3834228515625, 18.90673828125, 19.4300537109375, 19.953369140625, 20.4766845703125, 21.0]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 3.0, 6.0, 7.0, 6.0, 6.0, 6.0, 14.0, 12.0, 16.0, 17.0, 39.0, 41.0, 51.0, 59.0, 73.0, 86.0, 118.0, 220.0, 389.0, 807.0, 3516.0, 1209847.0, 2971695.0, 5079.0, 905.0, 400.0, 245.0, 143.0, 96.0, 82.0, 61.0, 53.0, 29.0, 34.0, 26.0, 18.0, 18.0, 14.0, 7.0, 5.0, 10.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-66.375, -64.48193359375, -62.5888671875, -60.69580078125, -58.802734375, -56.90966796875, -55.0166015625, -53.12353515625, -51.23046875, -49.33740234375, -47.4443359375, -45.55126953125, -43.658203125, -41.76513671875, -39.8720703125, -37.97900390625, -36.0859375, -34.19287109375, -32.2998046875, -30.40673828125, -28.513671875, -26.62060546875, -24.7275390625, -22.83447265625, -20.94140625, -19.04833984375, -17.1552734375, -15.26220703125, -13.369140625, -11.47607421875, -9.5830078125, -7.68994140625, -5.796875, -3.90380859375, -2.0107421875, -0.11767578125, 1.775390625, 3.66845703125, 5.5615234375, 7.45458984375, 9.34765625, 11.24072265625, 13.1337890625, 15.02685546875, 16.919921875, 18.81298828125, 20.7060546875, 22.59912109375, 24.4921875, 26.38525390625, 28.2783203125, 30.17138671875, 32.064453125, 33.95751953125, 35.8505859375, 37.74365234375, 39.63671875, 41.52978515625, 43.4228515625, 45.31591796875, 47.208984375, 49.10205078125, 50.9951171875, 52.88818359375, 54.78125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 15.0, 126.0, 368.0, 389.0, 93.0, 17.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.28854370117188, -106.04094696044922, -99.79335021972656, -93.5457534790039, -87.29815673828125, -81.0505599975586, -74.80296325683594, -68.55536651611328, -62.307769775390625, -56.06017303466797, -49.81257629394531, -43.564979553222656, -37.3173828125, -31.069786071777344, -24.822189331054688, -18.57459259033203, -12.326995849609375, -6.079399108886719, 0.1681976318359375, 6.415794372558594, 12.66339111328125, 18.910987854003906, 25.158584594726562, 31.40618133544922, 37.653778076171875, 43.90137481689453, 50.14897155761719, 56.396568298339844, 62.6441650390625, 68.89176177978516, 75.13935852050781, 81.38695526123047, 87.63455200195312, 93.88214874267578, 100.12974548339844, 106.3773422241211, 112.62493896484375, 118.8725357055664, 125.12013244628906, 131.36773681640625, 137.61532592773438, 143.8629150390625, 150.1105194091797, 156.35812377929688, 162.605712890625, 168.85330200195312, 175.1009063720703, 181.3485107421875, 187.59609985351562, 193.84368896484375, 200.09129333496094, 206.33889770507812, 212.58648681640625, 218.83407592773438, 225.08168029785156, 231.32928466796875, 237.57687377929688, 243.824462890625, 250.0720672607422, 256.3196716308594, 262.5672607421875, 268.8148498535156, 275.06243896484375, 281.31005859375, 287.5576477050781]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 11.0, 11.0, 11.0, 14.0, 19.0, 13.0, 19.0, 23.0, 34.0, 31.0, 35.0, 40.0, 48.0, 36.0, 39.0, 56.0, 37.0, 48.0, 40.0, 55.0, 29.0, 38.0, 35.0, 27.0, 25.0, 23.0, 26.0, 27.0, 13.0, 15.0, 16.0, 12.0, 14.0, 9.0, 9.0, 12.0, 7.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.56770324707031, -35.167823791503906, -33.767940521240234, -32.36806106567383, -30.968181610107422, -29.568300247192383, -28.168418884277344, -26.768539428710938, -25.3686580657959, -23.96877670288086, -22.568897247314453, -21.169015884399414, -19.769134521484375, -18.36925506591797, -16.96937370300293, -15.569493293762207, -14.169612884521484, -12.769732475280762, -11.369852066040039, -9.969970703125, -8.570090293884277, -7.170209884643555, -5.770328521728516, -4.370448112487793, -2.9705677032470703, -1.5706870555877686, -0.1708064079284668, 1.229074478149414, 2.6289548873901367, 4.028835296630859, 5.428716659545898, 6.828597068786621, 8.228477478027344, 9.628357887268066, 11.028238296508789, 12.428119659423828, 13.82800006866455, 15.227880477905273, 16.627761840820312, 18.02764129638672, 19.427522659301758, 20.827404022216797, 22.227283477783203, 23.627164840698242, 25.02704620361328, 26.426925659179688, 27.826807022094727, 29.226688385009766, 30.626567840576172, 32.02644729614258, 33.42633056640625, 34.826210021972656, 36.22608947753906, 37.62596893310547, 39.02585220336914, 40.42573165893555, 41.82561492919922, 43.225494384765625, 44.6253776550293, 46.0252571105957, 47.42513656616211, 48.82501983642578, 50.22489929199219, 51.624778747558594, 53.024658203125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 3.0, 3.0, 11.0, 7.0, 9.0, 7.0, 16.0, 12.0, 17.0, 24.0, 16.0, 36.0, 29.0, 31.0, 25.0, 40.0, 32.0, 39.0, 37.0, 47.0, 45.0, 45.0, 38.0, 50.0, 39.0, 34.0, 34.0, 31.0, 31.0, 30.0, 26.0, 23.0, 25.0, 22.0, 13.0, 13.0, 6.0, 8.0, 8.0, 8.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.59765625, -5.41156005859375, -5.2254638671875, -5.03936767578125, -4.853271484375, -4.66717529296875, -4.4810791015625, -4.29498291015625, -4.10888671875, -3.92279052734375, -3.7366943359375, -3.55059814453125, -3.364501953125, -3.17840576171875, -2.9923095703125, -2.80621337890625, -2.6201171875, -2.43402099609375, -2.2479248046875, -2.06182861328125, -1.875732421875, -1.68963623046875, -1.5035400390625, -1.31744384765625, -1.13134765625, -0.94525146484375, -0.7591552734375, -0.57305908203125, -0.386962890625, -0.20086669921875, -0.0147705078125, 0.17132568359375, 0.357421875, 0.54351806640625, 0.7296142578125, 0.91571044921875, 1.101806640625, 1.28790283203125, 1.4739990234375, 1.66009521484375, 1.84619140625, 2.03228759765625, 2.2183837890625, 2.40447998046875, 2.590576171875, 2.77667236328125, 2.9627685546875, 3.14886474609375, 3.3349609375, 3.52105712890625, 3.7071533203125, 3.89324951171875, 4.079345703125, 4.26544189453125, 4.4515380859375, 4.63763427734375, 4.82373046875, 5.00982666015625, 5.1959228515625, 5.38201904296875, 5.568115234375, 5.75421142578125, 5.9403076171875, 6.12640380859375, 6.3125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 8.0, 10.0, 14.0, 16.0, 32.0, 51.0, 74.0, 109.0, 151.0, 206.0, 349.0, 501.0, 661.0, 1038.0, 1501.0, 2158.0, 3136.0, 4768.0, 7005.0, 10809.0, 16717.0, 26297.0, 41885.0, 68604.0, 126733.0, 317079.0, 185973.0, 88668.0, 51940.0, 32210.0, 20543.0, 13278.0, 8527.0, 5676.0, 3795.0, 2482.0, 1733.0, 1183.0, 816.0, 573.0, 398.0, 269.0, 181.0, 112.0, 110.0, 59.0, 39.0, 24.0, 27.0, 13.0, 5.0, 8.0, 3.0, 2.0, 1.0, 3.0], "bins": [-1.2216796875, -1.185455322265625, -1.14923095703125, -1.113006591796875, -1.0767822265625, -1.040557861328125, -1.00433349609375, -0.968109130859375, -0.931884765625, -0.895660400390625, -0.85943603515625, -0.823211669921875, -0.7869873046875, -0.750762939453125, -0.71453857421875, -0.678314208984375, -0.64208984375, -0.605865478515625, -0.56964111328125, -0.533416748046875, -0.4971923828125, -0.460968017578125, -0.42474365234375, -0.388519287109375, -0.352294921875, -0.316070556640625, -0.27984619140625, -0.243621826171875, -0.2073974609375, -0.171173095703125, -0.13494873046875, -0.098724365234375, -0.0625, -0.026275634765625, 0.00994873046875, 0.046173095703125, 0.0823974609375, 0.118621826171875, 0.15484619140625, 0.191070556640625, 0.227294921875, 0.263519287109375, 0.29974365234375, 0.335968017578125, 0.3721923828125, 0.408416748046875, 0.44464111328125, 0.480865478515625, 0.51708984375, 0.553314208984375, 0.58953857421875, 0.625762939453125, 0.6619873046875, 0.698211669921875, 0.73443603515625, 0.770660400390625, 0.806884765625, 0.843109130859375, 0.87933349609375, 0.915557861328125, 0.9517822265625, 0.988006591796875, 1.02423095703125, 1.060455322265625, 1.0966796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 7.0, 11.0, 10.0, 21.0, 15.0, 13.0, 25.0, 17.0, 27.0, 40.0, 26.0, 28.0, 34.0, 41.0, 26.0, 41.0, 38.0, 38.0, 49.0, 1065.0, 25.0, 27.0, 29.0, 34.0, 33.0, 38.0, 27.0, 27.0, 31.0, 21.0, 20.0, 18.0, 16.0, 16.0, 12.0, 14.0, 11.0, 4.0, 4.0, 9.0, 5.0, 1.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-3.931640625, -3.819610595703125, -3.70758056640625, -3.595550537109375, -3.4835205078125, -3.371490478515625, -3.25946044921875, -3.147430419921875, -3.035400390625, -2.923370361328125, -2.81134033203125, -2.699310302734375, -2.5872802734375, -2.475250244140625, -2.36322021484375, -2.251190185546875, -2.13916015625, -2.027130126953125, -1.91510009765625, -1.803070068359375, -1.6910400390625, -1.579010009765625, -1.46697998046875, -1.354949951171875, -1.242919921875, -1.130889892578125, -1.01885986328125, -0.906829833984375, -0.7947998046875, -0.682769775390625, -0.57073974609375, -0.458709716796875, -0.3466796875, -0.234649658203125, -0.12261962890625, -0.010589599609375, 0.1014404296875, 0.213470458984375, 0.32550048828125, 0.437530517578125, 0.549560546875, 0.661590576171875, 0.77362060546875, 0.885650634765625, 0.9976806640625, 1.109710693359375, 1.22174072265625, 1.333770751953125, 1.44580078125, 1.557830810546875, 1.66986083984375, 1.781890869140625, 1.8939208984375, 2.005950927734375, 2.11798095703125, 2.230010986328125, 2.342041015625, 2.454071044921875, 2.56610107421875, 2.678131103515625, 2.7901611328125, 2.902191162109375, 3.01422119140625, 3.126251220703125, 3.23828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 12.0, 21.0, 35.0, 39.0, 56.0, 90.0, 132.0, 168.0, 273.0, 400.0, 637.0, 904.0, 1368.0, 2154.0, 3291.0, 5140.0, 8052.0, 12666.0, 20384.0, 32712.0, 55174.0, 100516.0, 253003.0, 1340451.0, 107877.0, 58764.0, 34797.0, 21115.0, 13216.0, 8286.0, 5479.0, 3397.0, 2198.0, 1481.0, 956.0, 629.0, 398.0, 272.0, 176.0, 129.0, 78.0, 67.0, 40.0, 24.0, 21.0, 10.0, 12.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1357421875, -1.096649169921875, -1.05755615234375, -1.018463134765625, -0.9793701171875, -0.940277099609375, -0.90118408203125, -0.862091064453125, -0.822998046875, -0.783905029296875, -0.74481201171875, -0.705718994140625, -0.6666259765625, -0.627532958984375, -0.58843994140625, -0.549346923828125, -0.51025390625, -0.471160888671875, -0.43206787109375, -0.392974853515625, -0.3538818359375, -0.314788818359375, -0.27569580078125, -0.236602783203125, -0.197509765625, -0.158416748046875, -0.11932373046875, -0.080230712890625, -0.0411376953125, -0.002044677734375, 0.03704833984375, 0.076141357421875, 0.115234375, 0.154327392578125, 0.19342041015625, 0.232513427734375, 0.2716064453125, 0.310699462890625, 0.34979248046875, 0.388885498046875, 0.427978515625, 0.467071533203125, 0.50616455078125, 0.545257568359375, 0.5843505859375, 0.623443603515625, 0.66253662109375, 0.701629638671875, 0.74072265625, 0.779815673828125, 0.81890869140625, 0.858001708984375, 0.8970947265625, 0.936187744140625, 0.97528076171875, 1.014373779296875, 1.053466796875, 1.092559814453125, 1.13165283203125, 1.170745849609375, 1.2098388671875, 1.248931884765625, 1.28802490234375, 1.327117919921875, 1.3662109375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 5.0, 7.0, 19.0, 12.0, 16.0, 20.0, 25.0, 33.0, 43.0, 48.0, 71.0, 62.0, 78.0, 78.0, 65.0, 60.0, 71.0, 48.0, 39.0, 46.0, 25.0, 22.0, 21.0, 20.0, 7.0, 5.0, 12.0, 6.0, 6.0, 5.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008034706115722656, -0.0007776468992233276, -0.0007518231868743896, -0.0007259994745254517, -0.0007001757621765137, -0.0006743520498275757, -0.0006485283374786377, -0.0006227046251296997, -0.0005968809127807617, -0.0005710572004318237, -0.0005452334880828857, -0.0005194097757339478, -0.0004935860633850098, -0.0004677623510360718, -0.0004419386386871338, -0.0004161149263381958, -0.0003902912139892578, -0.0003644675016403198, -0.00033864378929138184, -0.00031282007694244385, -0.00028699636459350586, -0.00026117265224456787, -0.00023534893989562988, -0.0002095252275466919, -0.0001837015151977539, -0.00015787780284881592, -0.00013205409049987793, -0.00010623037815093994, -8.040666580200195e-05, -5.4582953453063965e-05, -2.8759241104125977e-05, -2.9355287551879883e-06, 2.288818359375e-05, 4.871189594268799e-05, 7.453560829162598e-05, 0.00010035932064056396, 0.00012618303298950195, 0.00015200674533843994, 0.00017783045768737793, 0.00020365417003631592, 0.0002294778823852539, 0.0002553015947341919, 0.0002811253070831299, 0.00030694901943206787, 0.00033277273178100586, 0.00035859644412994385, 0.00038442015647888184, 0.0004102438688278198, 0.0004360675811767578, 0.0004618912935256958, 0.0004877150058746338, 0.0005135387182235718, 0.0005393624305725098, 0.0005651861429214478, 0.0005910098552703857, 0.0006168335676193237, 0.0006426572799682617, 0.0006684809923171997, 0.0006943047046661377, 0.0007201284170150757, 0.0007459521293640137, 0.0007717758417129517, 0.0007975995540618896, 0.0008234232664108276, 0.0008492469787597656]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 8.0, 12.0, 17.0, 17.0, 26.0, 28.0, 48.0, 74.0, 98.0, 205.0, 490.0, 1600.0, 994404.0, 49785.0, 858.0, 329.0, 163.0, 103.0, 75.0, 37.0, 39.0, 20.0, 12.0, 15.0, 13.0, 8.0, 9.0, 7.0, 7.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01898193359375, -0.018403053283691406, -0.017824172973632812, -0.01724529266357422, -0.016666412353515625, -0.01608753204345703, -0.015508651733398438, -0.014929771423339844, -0.01435089111328125, -0.013772010803222656, -0.013193130493164062, -0.012614250183105469, -0.012035369873046875, -0.011456489562988281, -0.010877609252929688, -0.010298728942871094, -0.0097198486328125, -0.009140968322753906, -0.008562088012695312, -0.007983207702636719, -0.007404327392578125, -0.006825447082519531, -0.0062465667724609375, -0.005667686462402344, -0.00508880615234375, -0.004509925842285156, -0.0039310455322265625, -0.0033521652221679688, -0.002773284912109375, -0.0021944046020507812, -0.0016155242919921875, -0.0010366439819335938, -0.000457763671875, 0.00012111663818359375, 0.0006999969482421875, 0.0012788772583007812, 0.001857757568359375, 0.0024366378784179688, 0.0030155181884765625, 0.0035943984985351562, 0.00417327880859375, 0.004752159118652344, 0.0053310394287109375, 0.005909919738769531, 0.006488800048828125, 0.007067680358886719, 0.0076465606689453125, 0.008225440979003906, 0.0088043212890625, 0.009383201599121094, 0.009962081909179688, 0.010540962219238281, 0.011119842529296875, 0.011698722839355469, 0.012277603149414062, 0.012856483459472656, 0.01343536376953125, 0.014014244079589844, 0.014593124389648438, 0.015172004699707031, 0.015750885009765625, 0.01632976531982422, 0.016908645629882812, 0.017487525939941406, 0.01806640625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 20.0, 145.0, 462.0, 306.0, 73.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002582227170933038, -0.00020389042038004845, -0.0001495581236667931, -9.522581240162253e-05, -4.089351568836719e-05, 1.3438781024888158e-05, 6.777109229005873e-05, 0.00012210337445139885, 0.00017643568571656942, 0.00023076798242982477, 0.0002851002791430801, 0.0003394325904082507, 0.0003937648725695908, 0.0004480971838347614, 0.000502429495099932, 0.0005567617481574416, 0.0006110940594226122, 0.0006654263706877828, 0.0007197586819529533, 0.0007740909932181239, 0.0008284232462756336, 0.0008827555575408041, 0.0009370878688059747, 0.0009914201218634844, 0.0010457525495439768, 0.0011000848608091474, 0.001154417172074318, 0.0012087494833394885, 0.001263081794604659, 0.0013174139894545078, 0.0013717464171350002, 0.001426078611984849, 0.0014804109232500196, 0.0015347432345151901, 0.0015890755457803607, 0.0016434078570455313, 0.0016977401683107018, 0.0017520724795758724, 0.0018064046744257212, 0.0018607369856908917, 0.0019150692969560623, 0.001969401491805911, 0.0020237339194864035, 0.002078066114336252, 0.0021323985420167446, 0.0021867307368665934, 0.0022410631645470858, 0.0022953953593969345, 0.002349727787077427, 0.0024040599819272757, 0.002458392409607768, 0.002512724604457617, 0.002567057032138109, 0.002621389226987958, 0.0026757216546684504, 0.002730053849518299, 0.002784386044368148, 0.0028387182392179966, 0.002893050666898489, 0.0029473828617483377, 0.00300171528942883, 0.003056047484278679, 0.0031103799119591713, 0.00316471210680902, 0.0032190445344895124]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 6.0, 5.0, 11.0, 13.0, 10.0, 16.0, 11.0, 21.0, 26.0, 26.0, 32.0, 30.0, 32.0, 33.0, 42.0, 38.0, 46.0, 40.0, 46.0, 42.0, 50.0, 36.0, 54.0, 44.0, 28.0, 40.0, 16.0, 31.0, 35.0, 22.0, 19.0, 7.0, 14.0, 14.0, 14.0, 14.0, 7.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00041979551315307617, -0.00040724407881498337, -0.00039469264447689056, -0.00038214121013879776, -0.00036958977580070496, -0.00035703834146261215, -0.00034448690712451935, -0.00033193547278642654, -0.00031938403844833374, -0.00030683260411024094, -0.00029428116977214813, -0.00028172973543405533, -0.0002691783010959625, -0.0002566268667578697, -0.00024407543241977692, -0.0002315239980816841, -0.0002189725637435913, -0.0002064211294054985, -0.0001938696950674057, -0.0001813182607293129, -0.0001687668263912201, -0.0001562153920531273, -0.00014366395771503448, -0.00013111252337694168, -0.00011856108903884888, -0.00010600965470075607, -9.345822036266327e-05, -8.090678602457047e-05, -6.835535168647766e-05, -5.580391734838486e-05, -4.325248301029205e-05, -3.070104867219925e-05, -1.8149614334106445e-05, -5.598179996013641e-06, 6.953254342079163e-06, 1.9504688680171967e-05, 3.205612301826477e-05, 4.4607557356357574e-05, 5.715899169445038e-05, 6.971042603254318e-05, 8.226186037063599e-05, 9.481329470872879e-05, 0.0001073647290468216, 0.0001199161633849144, 0.0001324675977230072, 0.0001450190320611, 0.0001575704663991928, 0.00017012190073728561, 0.00018267333507537842, 0.00019522476941347122, 0.00020777620375156403, 0.00022032763808965683, 0.00023287907242774963, 0.00024543050676584244, 0.00025798194110393524, 0.00027053337544202805, 0.00028308480978012085, 0.00029563624411821365, 0.00030818767845630646, 0.00032073911279439926, 0.00033329054713249207, 0.00034584198147058487, 0.0003583934158086777, 0.0003709448501467705, 0.0003834962844848633]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 3.0, 3.0, 11.0, 7.0, 9.0, 7.0, 16.0, 12.0, 17.0, 24.0, 16.0, 36.0, 29.0, 31.0, 25.0, 40.0, 32.0, 39.0, 37.0, 47.0, 45.0, 45.0, 38.0, 50.0, 39.0, 35.0, 33.0, 31.0, 31.0, 30.0, 26.0, 23.0, 25.0, 22.0, 13.0, 13.0, 6.0, 8.0, 8.0, 8.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.59765625, -5.41156005859375, -5.2254638671875, -5.03936767578125, -4.853271484375, -4.66717529296875, -4.4810791015625, -4.29498291015625, -4.10888671875, -3.92279052734375, -3.7366943359375, -3.55059814453125, -3.364501953125, -3.17840576171875, -2.9923095703125, -2.80621337890625, -2.6201171875, -2.43402099609375, -2.2479248046875, -2.06182861328125, -1.875732421875, -1.68963623046875, -1.5035400390625, -1.31744384765625, -1.13134765625, -0.94525146484375, -0.7591552734375, -0.57305908203125, -0.386962890625, -0.20086669921875, -0.0147705078125, 0.17132568359375, 0.357421875, 0.54351806640625, 0.7296142578125, 0.91571044921875, 1.101806640625, 1.28790283203125, 1.4739990234375, 1.66009521484375, 1.84619140625, 2.03228759765625, 2.2183837890625, 2.40447998046875, 2.590576171875, 2.77667236328125, 2.9627685546875, 3.14886474609375, 3.3349609375, 3.52105712890625, 3.7071533203125, 3.89324951171875, 4.079345703125, 4.26544189453125, 4.4515380859375, 4.63763427734375, 4.82373046875, 5.00982666015625, 5.1959228515625, 5.38201904296875, 5.568115234375, 5.75421142578125, 5.9403076171875, 6.12640380859375, 6.3125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 3.0, 12.0, 11.0, 21.0, 24.0, 28.0, 48.0, 35.0, 55.0, 104.0, 125.0, 160.0, 260.0, 385.0, 613.0, 920.0, 1547.0, 2781.0, 4902.0, 9182.0, 17682.0, 35249.0, 72272.0, 165338.0, 326491.0, 222456.0, 95077.0, 44350.0, 22428.0, 11425.0, 6094.0, 3339.0, 1855.0, 1154.0, 675.0, 418.0, 285.0, 203.0, 134.0, 105.0, 89.0, 63.0, 34.0, 30.0, 22.0, 17.0, 12.0, 15.0, 7.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.484375, -3.374359130859375, -3.26434326171875, -3.154327392578125, -3.0443115234375, -2.934295654296875, -2.82427978515625, -2.714263916015625, -2.604248046875, -2.494232177734375, -2.38421630859375, -2.274200439453125, -2.1641845703125, -2.054168701171875, -1.94415283203125, -1.834136962890625, -1.72412109375, -1.614105224609375, -1.50408935546875, -1.394073486328125, -1.2840576171875, -1.174041748046875, -1.06402587890625, -0.954010009765625, -0.843994140625, -0.733978271484375, -0.62396240234375, -0.513946533203125, -0.4039306640625, -0.293914794921875, -0.18389892578125, -0.073883056640625, 0.0361328125, 0.146148681640625, 0.25616455078125, 0.366180419921875, 0.4761962890625, 0.586212158203125, 0.69622802734375, 0.806243896484375, 0.916259765625, 1.026275634765625, 1.13629150390625, 1.246307373046875, 1.3563232421875, 1.466339111328125, 1.57635498046875, 1.686370849609375, 1.79638671875, 1.906402587890625, 2.01641845703125, 2.126434326171875, 2.2364501953125, 2.346466064453125, 2.45648193359375, 2.566497802734375, 2.676513671875, 2.786529541015625, 2.89654541015625, 3.006561279296875, 3.1165771484375, 3.226593017578125, 3.33660888671875, 3.446624755859375, 3.556640625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 5.0, 7.0, 6.0, 18.0, 20.0, 20.0, 22.0, 26.0, 34.0, 28.0, 32.0, 38.0, 36.0, 61.0, 69.0, 68.0, 336.0, 1610.0, 119.0, 67.0, 50.0, 47.0, 35.0, 37.0, 40.0, 34.0, 25.0, 30.0, 22.0, 16.0, 14.0, 19.0, 13.0, 11.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 5.0, 2.0], "bins": [-28.75, -28.017333984375, -27.28466796875, -26.552001953125, -25.8193359375, -25.086669921875, -24.35400390625, -23.621337890625, -22.888671875, -22.156005859375, -21.42333984375, -20.690673828125, -19.9580078125, -19.225341796875, -18.49267578125, -17.760009765625, -17.02734375, -16.294677734375, -15.56201171875, -14.829345703125, -14.0966796875, -13.364013671875, -12.63134765625, -11.898681640625, -11.166015625, -10.433349609375, -9.70068359375, -8.968017578125, -8.2353515625, -7.502685546875, -6.77001953125, -6.037353515625, -5.3046875, -4.572021484375, -3.83935546875, -3.106689453125, -2.3740234375, -1.641357421875, -0.90869140625, -0.176025390625, 0.556640625, 1.289306640625, 2.02197265625, 2.754638671875, 3.4873046875, 4.219970703125, 4.95263671875, 5.685302734375, 6.41796875, 7.150634765625, 7.88330078125, 8.615966796875, 9.3486328125, 10.081298828125, 10.81396484375, 11.546630859375, 12.279296875, 13.011962890625, 13.74462890625, 14.477294921875, 15.2099609375, 15.942626953125, 16.67529296875, 17.407958984375, 18.140625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 1.0, 2.0, 6.0, 4.0, 9.0, 10.0, 20.0, 21.0, 23.0, 42.0, 41.0, 52.0, 89.0, 110.0, 146.0, 210.0, 291.0, 590.0, 2933.0, 842304.0, 2293761.0, 3314.0, 639.0, 298.0, 221.0, 134.0, 109.0, 83.0, 68.0, 44.0, 25.0, 32.0, 14.0, 9.0, 5.0, 16.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-48.375, -46.5166015625, -44.658203125, -42.7998046875, -40.94140625, -39.0830078125, -37.224609375, -35.3662109375, -33.5078125, -31.6494140625, -29.791015625, -27.9326171875, -26.07421875, -24.2158203125, -22.357421875, -20.4990234375, -18.640625, -16.7822265625, -14.923828125, -13.0654296875, -11.20703125, -9.3486328125, -7.490234375, -5.6318359375, -3.7734375, -1.9150390625, -0.056640625, 1.8017578125, 3.66015625, 5.5185546875, 7.376953125, 9.2353515625, 11.09375, 12.9521484375, 14.810546875, 16.6689453125, 18.52734375, 20.3857421875, 22.244140625, 24.1025390625, 25.9609375, 27.8193359375, 29.677734375, 31.5361328125, 33.39453125, 35.2529296875, 37.111328125, 38.9697265625, 40.828125, 42.6865234375, 44.544921875, 46.4033203125, 48.26171875, 50.1201171875, 51.978515625, 53.8369140625, 55.6953125, 57.5537109375, 59.412109375, 61.2705078125, 63.12890625, 64.9873046875, 66.845703125, 68.7041015625, 70.5625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 52.0, 701.0, 253.0, 12.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.227364540100098, -8.376840591430664, -3.526315689086914, 1.3242082595825195, 6.1747331619262695, 11.02525806427002, 15.875781059265137, 20.726306915283203, 25.576831817626953, 30.427356719970703, 35.27788162231445, 40.12840270996094, 44.97892761230469, 49.82945251464844, 54.67997741699219, 59.53050231933594, 64.38102722167969, 69.23155212402344, 74.08207702636719, 78.93260192871094, 83.78312683105469, 88.63365173339844, 93.48417663574219, 98.33470153808594, 103.18521881103516, 108.0357437133789, 112.88626861572266, 117.7367935180664, 122.58731842041016, 127.4378433227539, 132.28836059570312, 137.13888549804688, 141.9894256591797, 146.83995056152344, 151.6904754638672, 156.54100036621094, 161.3915252685547, 166.24205017089844, 171.0925750732422, 175.94309997558594, 180.7936248779297, 185.64414978027344, 190.4946746826172, 195.34519958496094, 200.1957244873047, 205.04624938964844, 209.8967742919922, 214.74729919433594, 219.59780883789062, 224.44833374023438, 229.29885864257812, 234.14938354492188, 238.99990844726562, 243.85043334960938, 248.70095825195312, 253.55148315429688, 258.4020080566406, 263.2525329589844, 268.1030578613281, 272.9535827636719, 277.8041076660156, 282.6546325683594, 287.5051574707031, 292.3556823730469, 297.2062072753906]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 7.0, 8.0, 10.0, 5.0, 6.0, 18.0, 11.0, 13.0, 10.0, 20.0, 19.0, 18.0, 20.0, 24.0, 23.0, 35.0, 16.0, 21.0, 37.0, 35.0, 39.0, 42.0, 39.0, 36.0, 40.0, 39.0, 31.0, 35.0, 30.0, 38.0, 35.0, 28.0, 22.0, 20.0, 22.0, 21.0, 19.0, 14.0, 17.0, 13.0, 12.0, 11.0, 6.0, 5.0, 9.0, 3.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.94728088378906, -48.46657180786133, -46.98585891723633, -45.505149841308594, -44.024436950683594, -42.54372787475586, -41.063018798828125, -39.582305908203125, -38.101593017578125, -36.62088394165039, -35.14017105102539, -33.659461975097656, -32.178749084472656, -30.698040008544922, -29.217329025268555, -27.736618041992188, -26.255908966064453, -24.775197982788086, -23.29448699951172, -21.813777923583984, -20.333065032958984, -18.85235595703125, -17.371644973754883, -15.890933990478516, -14.410223007202148, -12.929512023925781, -11.448801040649414, -9.968091011047363, -8.487380027770996, -7.006669044494629, -5.525959014892578, -4.045248031616211, -2.5645408630371094, -1.0838301181793213, 0.3968806266784668, 1.8775911331176758, 3.358302116394043, 4.83901309967041, 6.319723129272461, 7.800434112548828, 9.281145095825195, 10.761856079101562, 12.24256706237793, 13.72327709197998, 15.203988075256348, 16.68470001220703, 18.165409088134766, 19.646120071411133, 21.1268310546875, 22.607542037963867, 24.088253021240234, 25.56896209716797, 27.04967498779297, 28.530384063720703, 30.01109504699707, 31.491806030273438, 32.97251892089844, 34.45322799682617, 35.93394088745117, 37.414649963378906, 38.895362854003906, 40.37607192993164, 41.856781005859375, 43.337493896484375, 44.81820297241211]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 10.0, 4.0, 9.0, 9.0, 17.0, 12.0, 9.0, 18.0, 18.0, 31.0, 29.0, 40.0, 21.0, 35.0, 34.0, 30.0, 43.0, 39.0, 48.0, 53.0, 53.0, 36.0, 31.0, 32.0, 44.0, 38.0, 29.0, 24.0, 29.0, 26.0, 35.0, 20.0, 11.0, 14.0, 7.0, 6.0, 6.0, 12.0, 10.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.1484375, -5.953857421875, -5.75927734375, -5.564697265625, -5.3701171875, -5.175537109375, -4.98095703125, -4.786376953125, -4.591796875, -4.397216796875, -4.20263671875, -4.008056640625, -3.8134765625, -3.618896484375, -3.42431640625, -3.229736328125, -3.03515625, -2.840576171875, -2.64599609375, -2.451416015625, -2.2568359375, -2.062255859375, -1.86767578125, -1.673095703125, -1.478515625, -1.283935546875, -1.08935546875, -0.894775390625, -0.7001953125, -0.505615234375, -0.31103515625, -0.116455078125, 0.078125, 0.272705078125, 0.46728515625, 0.661865234375, 0.8564453125, 1.051025390625, 1.24560546875, 1.440185546875, 1.634765625, 1.829345703125, 2.02392578125, 2.218505859375, 2.4130859375, 2.607666015625, 2.80224609375, 2.996826171875, 3.19140625, 3.385986328125, 3.58056640625, 3.775146484375, 3.9697265625, 4.164306640625, 4.35888671875, 4.553466796875, 4.748046875, 4.942626953125, 5.13720703125, 5.331787109375, 5.5263671875, 5.720947265625, 5.91552734375, 6.110107421875, 6.3046875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 11.0, 4.0, 9.0, 9.0, 12.0, 13.0, 17.0, 19.0, 22.0, 26.0, 28.0, 41.0, 60.0, 87.0, 113.0, 239.0, 825.0, 7810.0, 717563.0, 3396857.0, 67003.0, 2408.0, 467.0, 202.0, 108.0, 61.0, 47.0, 36.0, 35.0, 20.0, 18.0, 17.0, 13.0, 15.0, 11.0, 14.0, 6.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-25.140625, -24.336669921875, -23.53271484375, -22.728759765625, -21.9248046875, -21.120849609375, -20.31689453125, -19.512939453125, -18.708984375, -17.905029296875, -17.10107421875, -16.297119140625, -15.4931640625, -14.689208984375, -13.88525390625, -13.081298828125, -12.27734375, -11.473388671875, -10.66943359375, -9.865478515625, -9.0615234375, -8.257568359375, -7.45361328125, -6.649658203125, -5.845703125, -5.041748046875, -4.23779296875, -3.433837890625, -2.6298828125, -1.825927734375, -1.02197265625, -0.218017578125, 0.5859375, 1.389892578125, 2.19384765625, 2.997802734375, 3.8017578125, 4.605712890625, 5.40966796875, 6.213623046875, 7.017578125, 7.821533203125, 8.62548828125, 9.429443359375, 10.2333984375, 11.037353515625, 11.84130859375, 12.645263671875, 13.44921875, 14.253173828125, 15.05712890625, 15.861083984375, 16.6650390625, 17.468994140625, 18.27294921875, 19.076904296875, 19.880859375, 20.684814453125, 21.48876953125, 22.292724609375, 23.0966796875, 23.900634765625, 24.70458984375, 25.508544921875, 26.3125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 18.0, 20.0, 19.0, 21.0, 38.0, 31.0, 32.0, 60.0, 54.0, 100.0, 113.0, 142.0, 202.0, 243.0, 308.0, 368.0, 359.0, 381.0, 343.0, 262.0, 181.0, 171.0, 137.0, 100.0, 77.0, 61.0, 49.0, 37.0, 34.0, 24.0, 22.0, 12.0, 8.0, 6.0, 5.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.0625, -10.72412109375, -10.3857421875, -10.04736328125, -9.708984375, -9.37060546875, -9.0322265625, -8.69384765625, -8.35546875, -8.01708984375, -7.6787109375, -7.34033203125, -7.001953125, -6.66357421875, -6.3251953125, -5.98681640625, -5.6484375, -5.31005859375, -4.9716796875, -4.63330078125, -4.294921875, -3.95654296875, -3.6181640625, -3.27978515625, -2.94140625, -2.60302734375, -2.2646484375, -1.92626953125, -1.587890625, -1.24951171875, -0.9111328125, -0.57275390625, -0.234375, 0.10400390625, 0.4423828125, 0.78076171875, 1.119140625, 1.45751953125, 1.7958984375, 2.13427734375, 2.47265625, 2.81103515625, 3.1494140625, 3.48779296875, 3.826171875, 4.16455078125, 4.5029296875, 4.84130859375, 5.1796875, 5.51806640625, 5.8564453125, 6.19482421875, 6.533203125, 6.87158203125, 7.2099609375, 7.54833984375, 7.88671875, 8.22509765625, 8.5634765625, 8.90185546875, 9.240234375, 9.57861328125, 9.9169921875, 10.25537109375, 10.59375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 13.0, 7.0, 9.0, 17.0, 26.0, 27.0, 36.0, 54.0, 64.0, 123.0, 168.0, 264.0, 508.0, 1912.0, 3573581.0, 615016.0, 1270.0, 448.0, 242.0, 147.0, 101.0, 71.0, 45.0, 35.0, 25.0, 19.0, 12.0, 13.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.3125, -83.689453125, -81.06640625, -78.443359375, -75.8203125, -73.197265625, -70.57421875, -67.951171875, -65.328125, -62.705078125, -60.08203125, -57.458984375, -54.8359375, -52.212890625, -49.58984375, -46.966796875, -44.34375, -41.720703125, -39.09765625, -36.474609375, -33.8515625, -31.228515625, -28.60546875, -25.982421875, -23.359375, -20.736328125, -18.11328125, -15.490234375, -12.8671875, -10.244140625, -7.62109375, -4.998046875, -2.375, 0.248046875, 2.87109375, 5.494140625, 8.1171875, 10.740234375, 13.36328125, 15.986328125, 18.609375, 21.232421875, 23.85546875, 26.478515625, 29.1015625, 31.724609375, 34.34765625, 36.970703125, 39.59375, 42.216796875, 44.83984375, 47.462890625, 50.0859375, 52.708984375, 55.33203125, 57.955078125, 60.578125, 63.201171875, 65.82421875, 68.447265625, 71.0703125, 73.693359375, 76.31640625, 78.939453125, 81.5625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 31.0, 59.0, 111.0, 165.0, 197.0, 198.0, 124.0, 64.0, 25.0, 13.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.72490692138672, -73.26342010498047, -70.80193328857422, -68.34044647216797, -65.87895965576172, -63.41747283935547, -60.95598602294922, -58.49449920654297, -56.03301239013672, -53.57152557373047, -51.11003875732422, -48.64855194091797, -46.18706512451172, -43.72557830810547, -41.26409149169922, -38.80260467529297, -36.34111785888672, -33.87963104248047, -31.41814422607422, -28.95665740966797, -26.49517059326172, -24.03368377685547, -21.57219696044922, -19.11071014404297, -16.64922332763672, -14.187736511230469, -11.726249694824219, -9.264762878417969, -6.803276062011719, -4.341789245605469, -1.8803024291992188, 0.5811843872070312, 3.0426788330078125, 5.5041656494140625, 7.9656524658203125, 10.427139282226562, 12.888626098632812, 15.350112915039062, 17.811599731445312, 20.273086547851562, 22.734573364257812, 25.196060180664062, 27.657546997070312, 30.119033813476562, 32.58052062988281, 35.04200744628906, 37.50349426269531, 39.96498107910156, 42.42646789550781, 44.88795471191406, 47.34944152832031, 49.81092834472656, 52.27241516113281, 54.73390197753906, 57.19538879394531, 59.65687561035156, 62.11836242675781, 64.57984924316406, 67.04133605957031, 69.50282287597656, 71.96430969238281, 74.42579650878906, 76.88728332519531, 79.34877014160156, 81.81025695800781]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 10.0, 11.0, 12.0, 15.0, 16.0, 20.0, 30.0, 26.0, 40.0, 40.0, 30.0, 36.0, 45.0, 40.0, 45.0, 52.0, 42.0, 56.0, 49.0, 32.0, 56.0, 44.0, 41.0, 34.0, 26.0, 18.0, 31.0, 19.0, 14.0, 19.0, 8.0, 16.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.960670471191406, -46.42705535888672, -44.89344024658203, -43.359825134277344, -41.82620620727539, -40.2925910949707, -38.758975982666016, -37.22536087036133, -35.69174575805664, -34.15813064575195, -32.624515533447266, -31.090898513793945, -29.557283401489258, -28.023666381835938, -26.49005126953125, -24.956436157226562, -23.422819137573242, -21.889204025268555, -20.355587005615234, -18.821971893310547, -17.28835678100586, -15.754740715026855, -14.221124649047852, -12.687509536743164, -11.15389347076416, -9.620277404785156, -8.086662292480469, -6.553046226501465, -5.019430637359619, -3.4858150482177734, -1.9521989822387695, -0.41858386993408203, 1.1150321960449219, 2.6486477851867676, 4.182263374328613, 5.715879440307617, 7.249495029449463, 8.783110618591309, 10.316726684570312, 11.850341796875, 13.383957862854004, 14.917573928833008, 16.451189041137695, 17.984806060791016, 19.518421173095703, 21.05203628540039, 22.585651397705078, 24.119266510009766, 25.652883529663086, 27.186498641967773, 28.720115661621094, 30.25373077392578, 31.78734588623047, 33.320960998535156, 34.854576110839844, 36.38819122314453, 37.921810150146484, 39.45542526245117, 40.98904037475586, 42.52265930175781, 44.0562744140625, 45.58988952636719, 47.123504638671875, 48.65711975097656, 50.19073486328125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 4.0, 3.0, 6.0, 10.0, 16.0, 11.0, 12.0, 13.0, 21.0, 22.0, 19.0, 31.0, 41.0, 31.0, 34.0, 33.0, 44.0, 46.0, 39.0, 43.0, 42.0, 36.0, 45.0, 46.0, 34.0, 47.0, 39.0, 26.0, 32.0, 28.0, 27.0, 15.0, 25.0, 12.0, 6.0, 8.0, 7.0, 8.0, 7.0, 4.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.63946533203125, -5.4468994140625, -5.25433349609375, -5.061767578125, -4.86920166015625, -4.6766357421875, -4.48406982421875, -4.29150390625, -4.09893798828125, -3.9063720703125, -3.71380615234375, -3.521240234375, -3.32867431640625, -3.1361083984375, -2.94354248046875, -2.7509765625, -2.55841064453125, -2.3658447265625, -2.17327880859375, -1.980712890625, -1.78814697265625, -1.5955810546875, -1.40301513671875, -1.21044921875, -1.01788330078125, -0.8253173828125, -0.63275146484375, -0.440185546875, -0.24761962890625, -0.0550537109375, 0.13751220703125, 0.330078125, 0.52264404296875, 0.7152099609375, 0.90777587890625, 1.100341796875, 1.29290771484375, 1.4854736328125, 1.67803955078125, 1.87060546875, 2.06317138671875, 2.2557373046875, 2.44830322265625, 2.640869140625, 2.83343505859375, 3.0260009765625, 3.21856689453125, 3.4111328125, 3.60369873046875, 3.7962646484375, 3.98883056640625, 4.181396484375, 4.37396240234375, 4.5665283203125, 4.75909423828125, 4.95166015625, 5.14422607421875, 5.3367919921875, 5.52935791015625, 5.721923828125, 5.91448974609375, 6.1070556640625, 6.29962158203125, 6.4921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 14.0, 13.0, 20.0, 29.0, 40.0, 59.0, 97.0, 156.0, 193.0, 278.0, 413.0, 572.0, 782.0, 1160.0, 1698.0, 2398.0, 3537.0, 5309.0, 7885.0, 11997.0, 18313.0, 29133.0, 47420.0, 81477.0, 157613.0, 325393.0, 148188.0, 77555.0, 45656.0, 28009.0, 17889.0, 11609.0, 7377.0, 5128.0, 3411.0, 2312.0, 1647.0, 1159.0, 772.0, 554.0, 400.0, 262.0, 202.0, 154.0, 85.0, 80.0, 37.0, 25.0, 16.0, 15.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1103515625, -1.0738983154296875, -1.037445068359375, -1.0009918212890625, -0.96453857421875, -0.9280853271484375, -0.891632080078125, -0.8551788330078125, -0.8187255859375, -0.7822723388671875, -0.745819091796875, -0.7093658447265625, -0.67291259765625, -0.6364593505859375, -0.600006103515625, -0.5635528564453125, -0.527099609375, -0.4906463623046875, -0.454193115234375, -0.4177398681640625, -0.38128662109375, -0.3448333740234375, -0.308380126953125, -0.2719268798828125, -0.2354736328125, -0.1990203857421875, -0.162567138671875, -0.1261138916015625, -0.08966064453125, -0.0532073974609375, -0.016754150390625, 0.0196990966796875, 0.05615234375, 0.0926055908203125, 0.129058837890625, 0.1655120849609375, 0.20196533203125, 0.2384185791015625, 0.274871826171875, 0.3113250732421875, 0.3477783203125, 0.3842315673828125, 0.420684814453125, 0.4571380615234375, 0.49359130859375, 0.5300445556640625, 0.566497802734375, 0.6029510498046875, 0.639404296875, 0.6758575439453125, 0.712310791015625, 0.7487640380859375, 0.78521728515625, 0.8216705322265625, 0.858123779296875, 0.8945770263671875, 0.9310302734375, 0.9674835205078125, 1.003936767578125, 1.0403900146484375, 1.07684326171875, 1.1132965087890625, 1.149749755859375, 1.1862030029296875, 1.22265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 6.0, 17.0, 10.0, 11.0, 23.0, 18.0, 23.0, 26.0, 38.0, 28.0, 45.0, 37.0, 29.0, 46.0, 48.0, 44.0, 1070.0, 43.0, 27.0, 44.0, 43.0, 42.0, 32.0, 34.0, 34.0, 28.0, 34.0, 17.0, 18.0, 25.0, 21.0, 12.0, 8.0, 4.0, 6.0, 9.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.986328125, -3.856292724609375, -3.72625732421875, -3.596221923828125, -3.4661865234375, -3.336151123046875, -3.20611572265625, -3.076080322265625, -2.946044921875, -2.816009521484375, -2.68597412109375, -2.555938720703125, -2.4259033203125, -2.295867919921875, -2.16583251953125, -2.035797119140625, -1.90576171875, -1.775726318359375, -1.64569091796875, -1.515655517578125, -1.3856201171875, -1.255584716796875, -1.12554931640625, -0.995513916015625, -0.865478515625, -0.735443115234375, -0.60540771484375, -0.475372314453125, -0.3453369140625, -0.215301513671875, -0.08526611328125, 0.044769287109375, 0.1748046875, 0.304840087890625, 0.43487548828125, 0.564910888671875, 0.6949462890625, 0.824981689453125, 0.95501708984375, 1.085052490234375, 1.215087890625, 1.345123291015625, 1.47515869140625, 1.605194091796875, 1.7352294921875, 1.865264892578125, 1.99530029296875, 2.125335693359375, 2.25537109375, 2.385406494140625, 2.51544189453125, 2.645477294921875, 2.7755126953125, 2.905548095703125, 3.03558349609375, 3.165618896484375, 3.295654296875, 3.425689697265625, 3.55572509765625, 3.685760498046875, 3.8157958984375, 3.945831298828125, 4.07586669921875, 4.205902099609375, 4.3359375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 7.0, 20.0, 34.0, 37.0, 74.0, 89.0, 169.0, 242.0, 371.0, 608.0, 998.0, 1596.0, 2773.0, 4560.0, 7823.0, 13239.0, 22984.0, 40447.0, 74946.0, 162310.0, 1445963.0, 153056.0, 71603.0, 39110.0, 22164.0, 12917.0, 7708.0, 4456.0, 2672.0, 1578.0, 969.0, 561.0, 369.0, 241.0, 153.0, 96.0, 53.0, 49.0, 21.0, 20.0, 12.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.4779205322265625, -1.432403564453125, -1.3868865966796875, -1.34136962890625, -1.2958526611328125, -1.250335693359375, -1.2048187255859375, -1.1593017578125, -1.1137847900390625, -1.068267822265625, -1.0227508544921875, -0.97723388671875, -0.9317169189453125, -0.886199951171875, -0.8406829833984375, -0.795166015625, -0.7496490478515625, -0.704132080078125, -0.6586151123046875, -0.61309814453125, -0.5675811767578125, -0.522064208984375, -0.4765472412109375, -0.4310302734375, -0.3855133056640625, -0.339996337890625, -0.2944793701171875, -0.24896240234375, -0.2034454345703125, -0.157928466796875, -0.1124114990234375, -0.06689453125, -0.0213775634765625, 0.024139404296875, 0.0696563720703125, 0.11517333984375, 0.1606903076171875, 0.206207275390625, 0.2517242431640625, 0.2972412109375, 0.3427581787109375, 0.388275146484375, 0.4337921142578125, 0.47930908203125, 0.5248260498046875, 0.570343017578125, 0.6158599853515625, 0.661376953125, 0.7068939208984375, 0.752410888671875, 0.7979278564453125, 0.84344482421875, 0.8889617919921875, 0.934478759765625, 0.9799957275390625, 1.0255126953125, 1.0710296630859375, 1.116546630859375, 1.1620635986328125, 1.20758056640625, 1.2530975341796875, 1.298614501953125, 1.3441314697265625, 1.3896484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 9.0, 10.0, 13.0, 13.0, 19.0, 19.0, 24.0, 33.0, 44.0, 47.0, 51.0, 69.0, 76.0, 90.0, 79.0, 71.0, 67.0, 50.0, 49.0, 30.0, 30.0, 18.0, 16.0, 11.0, 11.0, 8.0, 11.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007634162902832031, -0.0007360652089118958, -0.0007087141275405884, -0.000681363046169281, -0.0006540119647979736, -0.0006266608834266663, -0.0005993098020553589, -0.0005719587206840515, -0.0005446076393127441, -0.0005172565579414368, -0.0004899054765701294, -0.000462554395198822, -0.00043520331382751465, -0.0004078522324562073, -0.0003805011510848999, -0.00035315006971359253, -0.00032579898834228516, -0.0002984479069709778, -0.0002710968255996704, -0.00024374574422836304, -0.00021639466285705566, -0.0001890435814857483, -0.00016169250011444092, -0.00013434141874313354, -0.00010699033737182617, -7.96392560005188e-05, -5.2288174629211426e-05, -2.4937093257904053e-05, 2.4139881134033203e-06, 2.9765069484710693e-05, 5.7116150856018066e-05, 8.446723222732544e-05, 0.00011181831359863281, 0.00013916939496994019, 0.00016652047634124756, 0.00019387155771255493, 0.0002212226390838623, 0.0002485737204551697, 0.00027592480182647705, 0.0003032758831977844, 0.0003306269645690918, 0.00035797804594039917, 0.00038532912731170654, 0.0004126802086830139, 0.0004400312900543213, 0.00046738237142562866, 0.000494733452796936, 0.0005220845341682434, 0.0005494356155395508, 0.0005767866969108582, 0.0006041377782821655, 0.0006314888596534729, 0.0006588399410247803, 0.0006861910223960876, 0.000713542103767395, 0.0007408931851387024, 0.0007682442665100098, 0.0007955953478813171, 0.0008229464292526245, 0.0008502975106239319, 0.0008776485919952393, 0.0009049996733665466, 0.000932350754737854, 0.0009597018361091614, 0.0009870529174804688]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 6.0, 5.0, 11.0, 8.0, 17.0, 17.0, 24.0, 31.0, 50.0, 71.0, 120.0, 271.0, 874.0, 114985.0, 929927.0, 1281.0, 365.0, 152.0, 78.0, 57.0, 45.0, 29.0, 15.0, 22.0, 18.0, 9.0, 10.0, 10.0, 9.0, 7.0, 3.0, 7.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.024871826171875, -0.024219512939453125, -0.02356719970703125, -0.022914886474609375, -0.0222625732421875, -0.021610260009765625, -0.02095794677734375, -0.020305633544921875, -0.0196533203125, -0.019001007080078125, -0.01834869384765625, -0.017696380615234375, -0.0170440673828125, -0.016391754150390625, -0.01573944091796875, -0.015087127685546875, -0.014434814453125, -0.013782501220703125, -0.01313018798828125, -0.012477874755859375, -0.0118255615234375, -0.011173248291015625, -0.01052093505859375, -0.009868621826171875, -0.00921630859375, -0.008563995361328125, -0.00791168212890625, -0.007259368896484375, -0.0066070556640625, -0.005954742431640625, -0.00530242919921875, -0.004650115966796875, -0.003997802734375, -0.003345489501953125, -0.00269317626953125, -0.002040863037109375, -0.0013885498046875, -0.000736236572265625, -8.392333984375e-05, 0.000568389892578125, 0.001220703125, 0.001873016357421875, 0.00252532958984375, 0.003177642822265625, 0.0038299560546875, 0.004482269287109375, 0.00513458251953125, 0.005786895751953125, 0.006439208984375, 0.007091522216796875, 0.00774383544921875, 0.008396148681640625, 0.0090484619140625, 0.009700775146484375, 0.01035308837890625, 0.011005401611328125, 0.01165771484375, 0.012310028076171875, 0.01296234130859375, 0.013614654541015625, 0.0142669677734375, 0.014919281005859375, 0.01557159423828125, 0.016223907470703125, 0.016876220703125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 34.0, 310.0, 498.0, 154.0, 16.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009861517464742064, -0.0009172761347144842, -0.0008484005811624229, -0.0007795249694027007, -0.0007106494158506393, -0.0006417738040909171, -0.0005728981923311949, -0.0005040225805714726, -0.0004351470270194113, -0.00036627144436351955, -0.0002973958617076278, -0.00022852024994790554, -0.00015964466729201376, -9.076908463612199e-05, -2.1893472876399755e-05, 4.698210977949202e-05, 0.0001158576924353838, 0.00018473327509127557, 0.00025360885774716735, 0.0003224844695068896, 0.00039136005216278136, 0.00046023563481867313, 0.0005291112465783954, 0.0005979868583381176, 0.0006668624118901789, 0.0007357380236499012, 0.0008046135772019625, 0.0008734891889616847, 0.0009423648007214069, 0.0010112402960658073, 0.0010801160242408514, 0.0011489915195852518, 0.0012178672477602959, 0.001286742859520018, 0.0013556184712797403, 0.0014244939666241407, 0.001493369578383863, 0.0015622451901435852, 0.0016311208019033074, 0.0016999964136630297, 0.00176887190900743, 0.0018377475207671523, 0.0019066231325268745, 0.001975498627871275, 0.002044374356046319, 0.0021132498513907194, 0.0021821255795657635, 0.002251001074910164, 0.0023198765702545643, 0.0023887520655989647, 0.0024576277937740088, 0.002526503289118409, 0.002595379017293453, 0.0026642545126378536, 0.002733130007982254, 0.002802005736157298, 0.002870881464332342, 0.0029397569596767426, 0.0030086326878517866, 0.003077508183196187, 0.003146383911371231, 0.0032152594067156315, 0.003284134902060032, 0.003353010630235076, 0.0034218861255794764]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 4.0, 3.0, 10.0, 5.0, 10.0, 14.0, 12.0, 19.0, 20.0, 21.0, 11.0, 23.0, 25.0, 29.0, 41.0, 32.0, 40.0, 38.0, 31.0, 35.0, 43.0, 45.0, 31.0, 40.0, 39.0, 38.0, 36.0, 31.0, 44.0, 35.0, 29.0, 24.0, 18.0, 26.0, 18.0, 14.0, 8.0, 8.0, 8.0, 6.0, 9.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0004063844680786133, -0.0003941524773836136, -0.0003819204866886139, -0.0003696884959936142, -0.0003574565052986145, -0.0003452245146036148, -0.0003329925239086151, -0.0003207605332136154, -0.0003085285425186157, -0.00029629655182361603, -0.00028406456112861633, -0.00027183257043361664, -0.00025960057973861694, -0.00024736858904361725, -0.00023513659834861755, -0.00022290460765361786, -0.00021067261695861816, -0.00019844062626361847, -0.00018620863556861877, -0.00017397664487361908, -0.00016174465417861938, -0.0001495126634836197, -0.00013728067278862, -0.0001250486820936203, -0.0001128166913986206, -0.00010058470070362091, -8.835271000862122e-05, -7.612071931362152e-05, -6.388872861862183e-05, -5.165673792362213e-05, -3.9424747228622437e-05, -2.7192756533622742e-05, -1.4960765838623047e-05, -2.728775143623352e-06, 9.503215551376343e-06, 2.1735206246376038e-05, 3.396719694137573e-05, 4.619918763637543e-05, 5.843117833137512e-05, 7.066316902637482e-05, 8.289515972137451e-05, 9.51271504163742e-05, 0.0001073591411113739, 0.0001195911318063736, 0.0001318231225013733, 0.00014405511319637299, 0.00015628710389137268, 0.00016851909458637238, 0.00018075108528137207, 0.00019298307597637177, 0.00020521506667137146, 0.00021744705736637115, 0.00022967904806137085, 0.00024191103875637054, 0.00025414302945137024, 0.00026637502014636993, 0.00027860701084136963, 0.0002908390015363693, 0.000303070992231369, 0.0003153029829263687, 0.0003275349736213684, 0.0003397669643163681, 0.0003519989550113678, 0.0003642309457063675, 0.0003764629364013672]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 4.0, 3.0, 6.0, 10.0, 16.0, 11.0, 12.0, 13.0, 21.0, 22.0, 19.0, 31.0, 41.0, 31.0, 34.0, 33.0, 44.0, 46.0, 39.0, 43.0, 42.0, 36.0, 45.0, 46.0, 34.0, 47.0, 39.0, 26.0, 32.0, 28.0, 27.0, 15.0, 25.0, 12.0, 6.0, 8.0, 7.0, 8.0, 7.0, 4.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.63946533203125, -5.4468994140625, -5.25433349609375, -5.061767578125, -4.86920166015625, -4.6766357421875, -4.48406982421875, -4.29150390625, -4.09893798828125, -3.9063720703125, -3.71380615234375, -3.521240234375, -3.32867431640625, -3.1361083984375, -2.94354248046875, -2.7509765625, -2.55841064453125, -2.3658447265625, -2.17327880859375, -1.980712890625, -1.78814697265625, -1.5955810546875, -1.40301513671875, -1.21044921875, -1.01788330078125, -0.8253173828125, -0.63275146484375, -0.440185546875, -0.24761962890625, -0.0550537109375, 0.13751220703125, 0.330078125, 0.52264404296875, 0.7152099609375, 0.90777587890625, 1.100341796875, 1.29290771484375, 1.4854736328125, 1.67803955078125, 1.87060546875, 2.06317138671875, 2.2557373046875, 2.44830322265625, 2.640869140625, 2.83343505859375, 3.0260009765625, 3.21856689453125, 3.4111328125, 3.60369873046875, 3.7962646484375, 3.98883056640625, 4.181396484375, 4.37396240234375, 4.5665283203125, 4.75909423828125, 4.95166015625, 5.14422607421875, 5.3367919921875, 5.52935791015625, 5.721923828125, 5.91448974609375, 6.1070556640625, 6.29962158203125, 6.4921875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 19.0, 13.0, 37.0, 27.0, 48.0, 61.0, 80.0, 124.0, 175.0, 238.0, 344.0, 480.0, 711.0, 1202.0, 1987.0, 4151.0, 9971.0, 30580.0, 114472.0, 440673.0, 322779.0, 81524.0, 22779.0, 7726.0, 3362.0, 1688.0, 1075.0, 678.0, 418.0, 265.0, 238.0, 144.0, 132.0, 88.0, 66.0, 39.0, 32.0, 22.0, 11.0, 14.0, 17.0, 11.0, 9.0, 12.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.12890625, -5.92376708984375, -5.7186279296875, -5.51348876953125, -5.308349609375, -5.10321044921875, -4.8980712890625, -4.69293212890625, -4.48779296875, -4.28265380859375, -4.0775146484375, -3.87237548828125, -3.667236328125, -3.46209716796875, -3.2569580078125, -3.05181884765625, -2.8466796875, -2.64154052734375, -2.4364013671875, -2.23126220703125, -2.026123046875, -1.82098388671875, -1.6158447265625, -1.41070556640625, -1.20556640625, -1.00042724609375, -0.7952880859375, -0.59014892578125, -0.385009765625, -0.17987060546875, 0.0252685546875, 0.23040771484375, 0.435546875, 0.64068603515625, 0.8458251953125, 1.05096435546875, 1.256103515625, 1.46124267578125, 1.6663818359375, 1.87152099609375, 2.07666015625, 2.28179931640625, 2.4869384765625, 2.69207763671875, 2.897216796875, 3.10235595703125, 3.3074951171875, 3.51263427734375, 3.7177734375, 3.92291259765625, 4.1280517578125, 4.33319091796875, 4.538330078125, 4.74346923828125, 4.9486083984375, 5.15374755859375, 5.35888671875, 5.56402587890625, 5.7691650390625, 5.97430419921875, 6.179443359375, 6.38458251953125, 6.5897216796875, 6.79486083984375, 7.0]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 2.0, 4.0, 2.0, 2.0, 7.0, 10.0, 7.0, 14.0, 10.0, 19.0, 14.0, 27.0, 17.0, 23.0, 43.0, 32.0, 22.0, 42.0, 47.0, 47.0, 61.0, 100.0, 1499.0, 416.0, 122.0, 54.0, 52.0, 40.0, 39.0, 36.0, 28.0, 41.0, 28.0, 24.0, 19.0, 16.0, 16.0, 11.0, 12.0, 8.0, 4.0, 12.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.875, -17.279052734375, -16.68310546875, -16.087158203125, -15.4912109375, -14.895263671875, -14.29931640625, -13.703369140625, -13.107421875, -12.511474609375, -11.91552734375, -11.319580078125, -10.7236328125, -10.127685546875, -9.53173828125, -8.935791015625, -8.33984375, -7.743896484375, -7.14794921875, -6.552001953125, -5.9560546875, -5.360107421875, -4.76416015625, -4.168212890625, -3.572265625, -2.976318359375, -2.38037109375, -1.784423828125, -1.1884765625, -0.592529296875, 0.00341796875, 0.599365234375, 1.1953125, 1.791259765625, 2.38720703125, 2.983154296875, 3.5791015625, 4.175048828125, 4.77099609375, 5.366943359375, 5.962890625, 6.558837890625, 7.15478515625, 7.750732421875, 8.3466796875, 8.942626953125, 9.53857421875, 10.134521484375, 10.73046875, 11.326416015625, 11.92236328125, 12.518310546875, 13.1142578125, 13.710205078125, 14.30615234375, 14.902099609375, 15.498046875, 16.093994140625, 16.68994140625, 17.285888671875, 17.8818359375, 18.477783203125, 19.07373046875, 19.669677734375, 20.265625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 9.0, 10.0, 12.0, 11.0, 18.0, 31.0, 31.0, 38.0, 41.0, 75.0, 92.0, 108.0, 173.0, 278.0, 350.0, 749.0, 7313.0, 3074677.0, 58878.0, 1373.0, 445.0, 290.0, 179.0, 122.0, 97.0, 64.0, 45.0, 46.0, 29.0, 22.0, 26.0, 12.0, 14.0, 10.0, 7.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.1640625, -41.546875, -39.9296875, -38.3125, -36.6953125, -35.078125, -33.4609375, -31.84375, -30.2265625, -28.609375, -26.9921875, -25.375, -23.7578125, -22.140625, -20.5234375, -18.90625, -17.2890625, -15.671875, -14.0546875, -12.4375, -10.8203125, -9.203125, -7.5859375, -5.96875, -4.3515625, -2.734375, -1.1171875, 0.5, 2.1171875, 3.734375, 5.3515625, 6.96875, 8.5859375, 10.203125, 11.8203125, 13.4375, 15.0546875, 16.671875, 18.2890625, 19.90625, 21.5234375, 23.140625, 24.7578125, 26.375, 27.9921875, 29.609375, 31.2265625, 32.84375, 34.4609375, 36.078125, 37.6953125, 39.3125, 40.9296875, 42.546875, 44.1640625, 45.78125, 47.3984375, 49.015625, 50.6328125, 52.25, 53.8671875, 55.484375, 57.1015625, 58.71875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 29.0, 55.0, 123.0, 222.0, 223.0, 187.0, 103.0, 47.0, 8.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.461393356323242, -14.111532211303711, -12.761670112609863, -11.411808013916016, -10.061946868896484, -8.712085723876953, -7.3622236251831055, -6.012361526489258, -4.662500381469727, -3.312638759613037, -1.9627771377563477, -0.6129155158996582, 0.7369461059570312, 2.0868077278137207, 3.43666934967041, 4.786531448364258, 6.136392593383789, 7.4862542152404785, 8.836115837097168, 10.185977935791016, 11.535839080810547, 12.885700225830078, 14.235562324523926, 15.585424423217773, 16.935285568237305, 18.285146713256836, 19.635009765625, 20.98487091064453, 22.334732055664062, 23.684593200683594, 25.034454345703125, 26.38431739807129, 27.734176635742188, 29.08403778076172, 30.43389892578125, 31.783761978149414, 33.13362121582031, 34.48348617553711, 35.83334732055664, 37.18320846557617, 38.5330696105957, 39.882930755615234, 41.232791900634766, 42.5826530456543, 43.932518005371094, 45.282379150390625, 46.632240295410156, 47.98210144042969, 49.33196258544922, 50.68182373046875, 52.03168487548828, 53.38154602050781, 54.731407165527344, 56.08127212524414, 57.43113327026367, 58.7809944152832, 60.130855560302734, 61.480716705322266, 62.8305778503418, 64.1804428100586, 65.53030395507812, 66.88016510009766, 68.23002624511719, 69.57988739013672, 70.92974853515625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 16.0, 11.0, 15.0, 19.0, 14.0, 20.0, 28.0, 32.0, 26.0, 36.0, 30.0, 35.0, 40.0, 37.0, 40.0, 42.0, 28.0, 38.0, 42.0, 49.0, 33.0, 41.0, 41.0, 31.0, 33.0, 26.0, 30.0, 23.0, 18.0, 17.0, 15.0, 18.0, 11.0, 9.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-64.16007995605469, -62.35831069946289, -60.55654525756836, -58.75477600097656, -56.95301055908203, -55.151241302490234, -53.34947204589844, -51.547706604003906, -49.74593734741211, -47.94416809082031, -46.14240264892578, -44.340633392333984, -42.53886413574219, -40.737098693847656, -38.93532943725586, -37.13356018066406, -35.33179473876953, -33.530025482177734, -31.728260040283203, -29.926490783691406, -28.124723434448242, -26.322956085205078, -24.52118682861328, -22.719419479370117, -20.917652130126953, -19.11588478088379, -17.314117431640625, -15.512348175048828, -13.710580825805664, -11.9088134765625, -10.10704517364502, -8.305276870727539, -6.503505706787109, -4.701737880706787, -2.899970054626465, -1.0982022285461426, 0.7035655975341797, 2.5053329467773438, 4.307101249694824, 6.108869552612305, 7.910636901855469, 9.712404251098633, 11.514172554016113, 13.315940856933594, 15.117708206176758, 16.919475555419922, 18.72124481201172, 20.523012161254883, 22.324779510498047, 24.12654685974121, 25.928314208984375, 27.730083465576172, 29.531850814819336, 31.3336181640625, 33.1353874206543, 34.937156677246094, 36.738922119140625, 38.54069137573242, 40.34245681762695, 42.14422607421875, 43.94599151611328, 45.74776077270508, 47.549530029296875, 49.351295471191406, 51.1530647277832]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 2.0, 5.0, 8.0, 9.0, 10.0, 12.0, 12.0, 13.0, 17.0, 22.0, 15.0, 11.0, 32.0, 34.0, 30.0, 39.0, 22.0, 42.0, 32.0, 44.0, 44.0, 41.0, 33.0, 46.0, 37.0, 43.0, 31.0, 42.0, 29.0, 42.0, 24.0, 26.0, 23.0, 23.0, 14.0, 16.0, 10.0, 13.0, 7.0, 7.0, 8.0, 2.0, 7.0, 2.0, 5.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.85546875, -5.66107177734375, -5.4666748046875, -5.27227783203125, -5.077880859375, -4.88348388671875, -4.6890869140625, -4.49468994140625, -4.30029296875, -4.10589599609375, -3.9114990234375, -3.71710205078125, -3.522705078125, -3.32830810546875, -3.1339111328125, -2.93951416015625, -2.7451171875, -2.55072021484375, -2.3563232421875, -2.16192626953125, -1.967529296875, -1.77313232421875, -1.5787353515625, -1.38433837890625, -1.18994140625, -0.99554443359375, -0.8011474609375, -0.60675048828125, -0.412353515625, -0.21795654296875, -0.0235595703125, 0.17083740234375, 0.365234375, 0.55963134765625, 0.7540283203125, 0.94842529296875, 1.142822265625, 1.33721923828125, 1.5316162109375, 1.72601318359375, 1.92041015625, 2.11480712890625, 2.3092041015625, 2.50360107421875, 2.697998046875, 2.89239501953125, 3.0867919921875, 3.28118896484375, 3.4755859375, 3.66998291015625, 3.8643798828125, 4.05877685546875, 4.253173828125, 4.44757080078125, 4.6419677734375, 4.83636474609375, 5.03076171875, 5.22515869140625, 5.4195556640625, 5.61395263671875, 5.808349609375, 6.00274658203125, 6.1971435546875, 6.39154052734375, 6.5859375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 6.0, 9.0, 14.0, 8.0, 16.0, 14.0, 19.0, 14.0, 21.0, 28.0, 35.0, 26.0, 39.0, 62.0, 112.0, 337.0, 1114.0, 8489.0, 553961.0, 3474777.0, 149352.0, 4299.0, 830.0, 265.0, 97.0, 61.0, 51.0, 30.0, 23.0, 22.0, 25.0, 16.0, 23.0, 10.0, 10.0, 4.0, 4.0, 6.0, 8.0, 4.0, 7.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.46875, -21.728759765625, -20.98876953125, -20.248779296875, -19.5087890625, -18.768798828125, -18.02880859375, -17.288818359375, -16.548828125, -15.808837890625, -15.06884765625, -14.328857421875, -13.5888671875, -12.848876953125, -12.10888671875, -11.368896484375, -10.62890625, -9.888916015625, -9.14892578125, -8.408935546875, -7.6689453125, -6.928955078125, -6.18896484375, -5.448974609375, -4.708984375, -3.968994140625, -3.22900390625, -2.489013671875, -1.7490234375, -1.009033203125, -0.26904296875, 0.470947265625, 1.2109375, 1.950927734375, 2.69091796875, 3.430908203125, 4.1708984375, 4.910888671875, 5.65087890625, 6.390869140625, 7.130859375, 7.870849609375, 8.61083984375, 9.350830078125, 10.0908203125, 10.830810546875, 11.57080078125, 12.310791015625, 13.05078125, 13.790771484375, 14.53076171875, 15.270751953125, 16.0107421875, 16.750732421875, 17.49072265625, 18.230712890625, 18.970703125, 19.710693359375, 20.45068359375, 21.190673828125, 21.9306640625, 22.670654296875, 23.41064453125, 24.150634765625, 24.890625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 12.0, 18.0, 10.0, 35.0, 39.0, 59.0, 89.0, 120.0, 171.0, 245.0, 346.0, 489.0, 580.0, 518.0, 413.0, 290.0, 201.0, 137.0, 79.0, 66.0, 32.0, 30.0, 32.0, 13.0, 17.0, 8.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.28125, -14.78173828125, -14.2822265625, -13.78271484375, -13.283203125, -12.78369140625, -12.2841796875, -11.78466796875, -11.28515625, -10.78564453125, -10.2861328125, -9.78662109375, -9.287109375, -8.78759765625, -8.2880859375, -7.78857421875, -7.2890625, -6.78955078125, -6.2900390625, -5.79052734375, -5.291015625, -4.79150390625, -4.2919921875, -3.79248046875, -3.29296875, -2.79345703125, -2.2939453125, -1.79443359375, -1.294921875, -0.79541015625, -0.2958984375, 0.20361328125, 0.703125, 1.20263671875, 1.7021484375, 2.20166015625, 2.701171875, 3.20068359375, 3.7001953125, 4.19970703125, 4.69921875, 5.19873046875, 5.6982421875, 6.19775390625, 6.697265625, 7.19677734375, 7.6962890625, 8.19580078125, 8.6953125, 9.19482421875, 9.6943359375, 10.19384765625, 10.693359375, 11.19287109375, 11.6923828125, 12.19189453125, 12.69140625, 13.19091796875, 13.6904296875, 14.18994140625, 14.689453125, 15.18896484375, 15.6884765625, 16.18798828125, 16.6875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 9.0, 6.0, 16.0, 20.0, 13.0, 28.0, 32.0, 38.0, 51.0, 74.0, 99.0, 95.0, 165.0, 197.0, 297.0, 466.0, 919.0, 12254.0, 4100498.0, 76050.0, 1271.0, 501.0, 319.0, 179.0, 147.0, 118.0, 109.0, 62.0, 46.0, 57.0, 36.0, 31.0, 14.0, 9.0, 8.0, 14.0, 11.0, 3.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-70.9375, -68.8896484375, -66.841796875, -64.7939453125, -62.74609375, -60.6982421875, -58.650390625, -56.6025390625, -54.5546875, -52.5068359375, -50.458984375, -48.4111328125, -46.36328125, -44.3154296875, -42.267578125, -40.2197265625, -38.171875, -36.1240234375, -34.076171875, -32.0283203125, -29.98046875, -27.9326171875, -25.884765625, -23.8369140625, -21.7890625, -19.7412109375, -17.693359375, -15.6455078125, -13.59765625, -11.5498046875, -9.501953125, -7.4541015625, -5.40625, -3.3583984375, -1.310546875, 0.7373046875, 2.78515625, 4.8330078125, 6.880859375, 8.9287109375, 10.9765625, 13.0244140625, 15.072265625, 17.1201171875, 19.16796875, 21.2158203125, 23.263671875, 25.3115234375, 27.359375, 29.4072265625, 31.455078125, 33.5029296875, 35.55078125, 37.5986328125, 39.646484375, 41.6943359375, 43.7421875, 45.7900390625, 47.837890625, 49.8857421875, 51.93359375, 53.9814453125, 56.029296875, 58.0771484375, 60.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 83.0, 641.0, 276.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.81945037841797, -117.58995056152344, -108.36045837402344, -99.13096618652344, -89.9014663696289, -80.67196655273438, -71.44247436523438, -62.212974548339844, -52.983482360839844, -43.75398635864258, -34.52449035644531, -25.294994354248047, -16.06549835205078, -6.836002349853516, 2.39349365234375, 11.622993469238281, 20.85248565673828, 30.081981658935547, 39.31147766113281, 48.54097366333008, 57.770469665527344, 66.99996948242188, 76.22946166992188, 85.4589614868164, 94.6884536743164, 103.91795349121094, 113.14744567871094, 122.37693786621094, 131.6064453125, 140.8359375, 150.0654296875, 159.294921875, 168.5244140625, 177.75390625, 186.9833984375, 196.21290588378906, 205.44239807128906, 214.67189025878906, 223.90139770507812, 233.13088989257812, 242.36038208007812, 251.58987426757812, 260.8193664550781, 270.0488586425781, 279.27838134765625, 288.50787353515625, 297.73736572265625, 306.96685791015625, 316.19635009765625, 325.42584228515625, 334.65533447265625, 343.88482666015625, 353.11431884765625, 362.3438415527344, 371.5733337402344, 380.8028259277344, 390.0323181152344, 399.2618103027344, 408.4913024902344, 417.7207946777344, 426.9503173828125, 436.1798095703125, 445.4093017578125, 454.6387939453125, 463.8682861328125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 11.0, 10.0, 8.0, 15.0, 13.0, 32.0, 20.0, 44.0, 33.0, 35.0, 49.0, 51.0, 35.0, 51.0, 39.0, 42.0, 65.0, 52.0, 43.0, 39.0, 31.0, 37.0, 29.0, 32.0, 20.0, 32.0, 23.0, 10.0, 8.0, 10.0, 7.0, 15.0, 12.0, 10.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.55354309082031, -41.105613708496094, -39.657684326171875, -38.209754943847656, -36.76182174682617, -35.31389236450195, -33.865962982177734, -32.418033599853516, -30.970102310180664, -29.522172927856445, -28.074241638183594, -26.626312255859375, -25.178382873535156, -23.730451583862305, -22.282522201538086, -20.834590911865234, -19.386661529541016, -17.938732147216797, -16.490800857543945, -15.042871475219727, -13.594941139221191, -12.147010803222656, -10.699081420898438, -9.251151084899902, -7.803220748901367, -6.355290412902832, -4.907360553741455, -3.459430694580078, -2.011500358581543, -0.5635700225830078, 0.8843593597412109, 2.332289695739746, 3.7802200317382812, 5.228150367736816, 6.676080226898193, 8.12401008605957, 9.571940422058105, 11.01987075805664, 12.46780014038086, 13.915730476379395, 15.36366081237793, 16.81159019470215, 18.259521484375, 19.70745086669922, 21.155380249023438, 22.60331153869629, 24.051240921020508, 25.49917221069336, 26.947101593017578, 28.395030975341797, 29.84296226501465, 31.290891647338867, 32.73882293701172, 34.18675231933594, 35.634681701660156, 37.082611083984375, 38.530540466308594, 39.97846984863281, 41.42639923095703, 42.87432861328125, 44.322261810302734, 45.77019119262695, 47.21812057495117, 48.66604995727539, 50.113983154296875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 13.0, 7.0, 14.0, 13.0, 13.0, 24.0, 17.0, 18.0, 20.0, 29.0, 34.0, 32.0, 36.0, 37.0, 42.0, 50.0, 43.0, 52.0, 43.0, 42.0, 43.0, 38.0, 42.0, 41.0, 42.0, 37.0, 26.0, 27.0, 23.0, 15.0, 16.0, 7.0, 8.0, 10.0, 9.0, 7.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.69384765625, -5.4814453125, -5.26904296875, -5.056640625, -4.84423828125, -4.6318359375, -4.41943359375, -4.20703125, -3.99462890625, -3.7822265625, -3.56982421875, -3.357421875, -3.14501953125, -2.9326171875, -2.72021484375, -2.5078125, -2.29541015625, -2.0830078125, -1.87060546875, -1.658203125, -1.44580078125, -1.2333984375, -1.02099609375, -0.80859375, -0.59619140625, -0.3837890625, -0.17138671875, 0.041015625, 0.25341796875, 0.4658203125, 0.67822265625, 0.890625, 1.10302734375, 1.3154296875, 1.52783203125, 1.740234375, 1.95263671875, 2.1650390625, 2.37744140625, 2.58984375, 2.80224609375, 3.0146484375, 3.22705078125, 3.439453125, 3.65185546875, 3.8642578125, 4.07666015625, 4.2890625, 4.50146484375, 4.7138671875, 4.92626953125, 5.138671875, 5.35107421875, 5.5634765625, 5.77587890625, 5.98828125, 6.20068359375, 6.4130859375, 6.62548828125, 6.837890625, 7.05029296875, 7.2626953125, 7.47509765625, 7.6875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 8.0, 10.0, 19.0, 16.0, 37.0, 44.0, 79.0, 132.0, 200.0, 273.0, 444.0, 647.0, 1069.0, 1698.0, 2749.0, 4690.0, 8014.0, 13688.0, 24337.0, 44946.0, 87487.0, 194466.0, 369349.0, 141710.0, 68294.0, 35839.0, 19799.0, 11498.0, 6586.0, 4089.0, 2392.0, 1396.0, 964.0, 617.0, 368.0, 211.0, 132.0, 86.0, 64.0, 38.0, 24.0, 17.0, 11.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.40545654296875, -1.3558349609375, -1.30621337890625, -1.256591796875, -1.20697021484375, -1.1573486328125, -1.10772705078125, -1.05810546875, -1.00848388671875, -0.9588623046875, -0.90924072265625, -0.859619140625, -0.80999755859375, -0.7603759765625, -0.71075439453125, -0.6611328125, -0.61151123046875, -0.5618896484375, -0.51226806640625, -0.462646484375, -0.41302490234375, -0.3634033203125, -0.31378173828125, -0.26416015625, -0.21453857421875, -0.1649169921875, -0.11529541015625, -0.065673828125, -0.01605224609375, 0.0335693359375, 0.08319091796875, 0.1328125, 0.18243408203125, 0.2320556640625, 0.28167724609375, 0.331298828125, 0.38092041015625, 0.4305419921875, 0.48016357421875, 0.52978515625, 0.57940673828125, 0.6290283203125, 0.67864990234375, 0.728271484375, 0.77789306640625, 0.8275146484375, 0.87713623046875, 0.9267578125, 0.97637939453125, 1.0260009765625, 1.07562255859375, 1.125244140625, 1.17486572265625, 1.2244873046875, 1.27410888671875, 1.32373046875, 1.37335205078125, 1.4229736328125, 1.47259521484375, 1.522216796875, 1.57183837890625, 1.6214599609375, 1.67108154296875, 1.720703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 6.0, 5.0, 2.0, 1.0, 6.0, 6.0, 3.0, 13.0, 12.0, 12.0, 26.0, 15.0, 14.0, 20.0, 19.0, 19.0, 24.0, 18.0, 17.0, 22.0, 35.0, 36.0, 50.0, 30.0, 40.0, 28.0, 1060.0, 36.0, 23.0, 39.0, 35.0, 29.0, 33.0, 24.0, 34.0, 30.0, 24.0, 28.0, 24.0, 20.0, 19.0, 14.0, 17.0, 12.0, 11.0, 8.0, 7.0, 7.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0], "bins": [-3.818359375, -3.707550048828125, -3.59674072265625, -3.485931396484375, -3.3751220703125, -3.264312744140625, -3.15350341796875, -3.042694091796875, -2.931884765625, -2.821075439453125, -2.71026611328125, -2.599456787109375, -2.4886474609375, -2.377838134765625, -2.26702880859375, -2.156219482421875, -2.04541015625, -1.934600830078125, -1.82379150390625, -1.712982177734375, -1.6021728515625, -1.491363525390625, -1.38055419921875, -1.269744873046875, -1.158935546875, -1.048126220703125, -0.93731689453125, -0.826507568359375, -0.7156982421875, -0.604888916015625, -0.49407958984375, -0.383270263671875, -0.2724609375, -0.161651611328125, -0.05084228515625, 0.059967041015625, 0.1707763671875, 0.281585693359375, 0.39239501953125, 0.503204345703125, 0.614013671875, 0.724822998046875, 0.83563232421875, 0.946441650390625, 1.0572509765625, 1.168060302734375, 1.27886962890625, 1.389678955078125, 1.50048828125, 1.611297607421875, 1.72210693359375, 1.832916259765625, 1.9437255859375, 2.054534912109375, 2.16534423828125, 2.276153564453125, 2.386962890625, 2.497772216796875, 2.60858154296875, 2.719390869140625, 2.8302001953125, 2.941009521484375, 3.05181884765625, 3.162628173828125, 3.2734375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 5.0, 11.0, 16.0, 20.0, 36.0, 45.0, 66.0, 83.0, 125.0, 192.0, 268.0, 407.0, 624.0, 921.0, 1421.0, 2124.0, 3279.0, 4938.0, 7593.0, 11549.0, 17681.0, 27102.0, 43213.0, 74531.0, 146825.0, 1391054.0, 158255.0, 77629.0, 45158.0, 28457.0, 18500.0, 12140.0, 7831.0, 5145.0, 3315.0, 2192.0, 1454.0, 983.0, 638.0, 437.0, 279.0, 195.0, 106.0, 104.0, 60.0, 36.0, 27.0, 23.0, 14.0, 8.0, 9.0, 8.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.14453125, -1.1057891845703125, -1.067047119140625, -1.0283050537109375, -0.98956298828125, -0.9508209228515625, -0.912078857421875, -0.8733367919921875, -0.8345947265625, -0.7958526611328125, -0.757110595703125, -0.7183685302734375, -0.67962646484375, -0.6408843994140625, -0.602142333984375, -0.5634002685546875, -0.524658203125, -0.4859161376953125, -0.447174072265625, -0.4084320068359375, -0.36968994140625, -0.3309478759765625, -0.292205810546875, -0.2534637451171875, -0.2147216796875, -0.1759796142578125, -0.137237548828125, -0.0984954833984375, -0.05975341796875, -0.0210113525390625, 0.017730712890625, 0.0564727783203125, 0.09521484375, 0.1339569091796875, 0.172698974609375, 0.2114410400390625, 0.25018310546875, 0.2889251708984375, 0.327667236328125, 0.3664093017578125, 0.4051513671875, 0.4438934326171875, 0.482635498046875, 0.5213775634765625, 0.56011962890625, 0.5988616943359375, 0.637603759765625, 0.6763458251953125, 0.715087890625, 0.7538299560546875, 0.792572021484375, 0.8313140869140625, 0.87005615234375, 0.9087982177734375, 0.947540283203125, 0.9862823486328125, 1.0250244140625, 1.0637664794921875, 1.102508544921875, 1.1412506103515625, 1.17999267578125, 1.2187347412109375, 1.257476806640625, 1.2962188720703125, 1.3349609375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 8.0, 10.0, 19.0, 13.0, 20.0, 23.0, 38.0, 33.0, 39.0, 38.0, 38.0, 55.0, 54.0, 68.0, 54.0, 70.0, 61.0, 47.0, 53.0, 46.0, 36.0, 38.0, 24.0, 18.0, 23.0, 15.0, 12.0, 9.0, 8.0, 2.0, 6.0, 10.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009284019470214844, -0.0009005740284919739, -0.0008727461099624634, -0.0008449181914329529, -0.0008170902729034424, -0.0007892623543739319, -0.0007614344358444214, -0.0007336065173149109, -0.0007057785987854004, -0.0006779506802558899, -0.0006501227617263794, -0.0006222948431968689, -0.0005944669246673584, -0.0005666390061378479, -0.0005388110876083374, -0.0005109831690788269, -0.0004831552505493164, -0.0004553273320198059, -0.0004274994134902954, -0.0003996714949607849, -0.0003718435764312744, -0.0003440156579017639, -0.0003161877393722534, -0.0002883598208427429, -0.0002605319023132324, -0.00023270398378372192, -0.00020487606525421143, -0.00017704814672470093, -0.00014922022819519043, -0.00012139230966567993, -9.356439113616943e-05, -6.573647260665894e-05, -3.790855407714844e-05, -1.008063554763794e-05, 1.774728298187256e-05, 4.557520151138306e-05, 7.340312004089355e-05, 0.00010123103857040405, 0.00012905895709991455, 0.00015688687562942505, 0.00018471479415893555, 0.00021254271268844604, 0.00024037063121795654, 0.00026819854974746704, 0.00029602646827697754, 0.00032385438680648804, 0.00035168230533599854, 0.00037951022386550903, 0.00040733814239501953, 0.00043516606092453003, 0.00046299397945404053, 0.000490821897983551, 0.0005186498165130615, 0.000546477735042572, 0.0005743056535720825, 0.000602133572101593, 0.0006299614906311035, 0.000657789409160614, 0.0006856173276901245, 0.000713445246219635, 0.0007412731647491455, 0.000769101083278656, 0.0007969290018081665, 0.000824756920337677, 0.0008525848388671875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 5.0, 6.0, 12.0, 8.0, 11.0, 13.0, 21.0, 24.0, 33.0, 31.0, 64.0, 73.0, 86.0, 136.0, 334.0, 1161.0, 820975.0, 223806.0, 977.0, 295.0, 108.0, 83.0, 46.0, 45.0, 44.0, 26.0, 22.0, 23.0, 19.0, 13.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203094482421875, -0.019652843475341797, -0.018996238708496094, -0.01833963394165039, -0.017683029174804688, -0.017026424407958984, -0.01636981964111328, -0.015713214874267578, -0.015056610107421875, -0.014400005340576172, -0.013743400573730469, -0.013086795806884766, -0.012430191040039062, -0.01177358627319336, -0.011116981506347656, -0.010460376739501953, -0.00980377197265625, -0.009147167205810547, -0.008490562438964844, -0.00783395767211914, -0.0071773529052734375, -0.006520748138427734, -0.005864143371582031, -0.005207538604736328, -0.004550933837890625, -0.003894329071044922, -0.0032377243041992188, -0.0025811195373535156, -0.0019245147705078125, -0.0012679100036621094, -0.0006113052368164062, 4.5299530029296875e-05, 0.000701904296875, 0.0013585090637207031, 0.0020151138305664062, 0.0026717185974121094, 0.0033283233642578125, 0.003984928131103516, 0.004641532897949219, 0.005298137664794922, 0.005954742431640625, 0.006611347198486328, 0.007267951965332031, 0.007924556732177734, 0.008581161499023438, 0.00923776626586914, 0.009894371032714844, 0.010550975799560547, 0.01120758056640625, 0.011864185333251953, 0.012520790100097656, 0.01317739486694336, 0.013833999633789062, 0.014490604400634766, 0.015147209167480469, 0.015803813934326172, 0.016460418701171875, 0.017117023468017578, 0.01777362823486328, 0.018430233001708984, 0.019086837768554688, 0.01974344253540039, 0.020400047302246094, 0.021056652069091797, 0.0217132568359375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 103.0, 674.0, 226.0, 11.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008886405848897994, -0.0007964096730574965, -0.0007041788194328547, -0.0006119479658082128, -0.00051971705397591, -0.0004274861712474376, -0.00033525528851896524, -0.00024302437668666244, -0.00015079352306202054, -5.856264033354819e-05, 3.3668242394924164e-05, 0.00012589912512339652, 0.00021813000785186887, 0.0003103608905803412, 0.00040259177330881357, 0.0004948226851411164, 0.0005870535387657583, 0.0006792844505980611, 0.000771515304222703, 0.0008637461578473449, 0.0009559770696796477, 0.0010482079815119505, 0.0011404388351365924, 0.0012326696887612343, 0.001324900658801198, 0.00141713151242584, 0.0015093623660504818, 0.0016015933360904455, 0.0016938241897150874, 0.0017860550433397293, 0.001878286013379693, 0.0019705169834196568, 0.002062747720628977, 0.0021549786906689405, 0.0022472094278782606, 0.0023394403979182243, 0.0024316711351275444, 0.002523902105167508, 0.002616133075207472, 0.002708363812416792, 0.0028005947824567556, 0.0028928257524967194, 0.0029850564897060394, 0.003077287459746003, 0.003169518429785967, 0.003261749166995287, 0.0033539801370352507, 0.0034462111070752144, 0.0035384418442845345, 0.003630672814324498, 0.0037229035515338182, 0.003815134521573782, 0.003907365258783102, 0.003999596461653709, 0.0040918271988630295, 0.0041840579360723495, 0.00427628867328167, 0.00436851941049099, 0.004460750613361597, 0.004552981350570917, 0.004645212087780237, 0.004737443290650845, 0.004829674027860165, 0.004921904765069485, 0.005014135967940092]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 7.0, 6.0, 4.0, 10.0, 11.0, 11.0, 15.0, 13.0, 18.0, 26.0, 30.0, 33.0, 33.0, 39.0, 39.0, 34.0, 45.0, 26.0, 44.0, 43.0, 55.0, 40.0, 44.0, 31.0, 45.0, 33.0, 33.0, 31.0, 33.0, 36.0, 23.0, 14.0, 14.0, 13.0, 16.0, 13.0, 7.0, 9.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.000512242317199707, -0.000497656874358654, -0.000483071431517601, -0.000468485988676548, -0.000453900545835495, -0.000439315102994442, -0.000424729660153389, -0.00041014421731233597, -0.00039555877447128296, -0.00038097333163022995, -0.00036638788878917694, -0.00035180244594812393, -0.0003372170031070709, -0.0003226315602660179, -0.0003080461174249649, -0.0002934606745839119, -0.0002788752317428589, -0.0002642897889018059, -0.00024970434606075287, -0.00023511890321969986, -0.00022053346037864685, -0.00020594801753759384, -0.00019136257469654083, -0.00017677713185548782, -0.00016219168901443481, -0.0001476062461733818, -0.0001330208033323288, -0.00011843536049127579, -0.00010384991765022278, -8.926447480916977e-05, -7.467903196811676e-05, -6.009358912706375e-05, -4.550814628601074e-05, -3.092270344495773e-05, -1.6337260603904724e-05, -1.751817762851715e-06, 1.2833625078201294e-05, 2.7419067919254303e-05, 4.200451076030731e-05, 5.658995360136032e-05, 7.117539644241333e-05, 8.576083928346634e-05, 0.00010034628212451935, 0.00011493172496557236, 0.00012951716780662537, 0.00014410261064767838, 0.00015868805348873138, 0.0001732734963297844, 0.0001878589391708374, 0.0002024443820118904, 0.00021702982485294342, 0.00023161526769399643, 0.00024620071053504944, 0.00026078615337610245, 0.00027537159621715546, 0.00028995703905820847, 0.0003045424818992615, 0.0003191279247403145, 0.0003337133675813675, 0.0003482988104224205, 0.0003628842532634735, 0.0003774696961045265, 0.00039205513894557953, 0.00040664058178663254, 0.00042122602462768555]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 13.0, 7.0, 14.0, 13.0, 13.0, 24.0, 17.0, 18.0, 20.0, 29.0, 34.0, 32.0, 36.0, 37.0, 42.0, 50.0, 43.0, 52.0, 43.0, 42.0, 43.0, 38.0, 42.0, 41.0, 42.0, 37.0, 26.0, 27.0, 23.0, 15.0, 16.0, 7.0, 8.0, 10.0, 9.0, 7.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.69384765625, -5.4814453125, -5.26904296875, -5.056640625, -4.84423828125, -4.6318359375, -4.41943359375, -4.20703125, -3.99462890625, -3.7822265625, -3.56982421875, -3.357421875, -3.14501953125, -2.9326171875, -2.72021484375, -2.5078125, -2.29541015625, -2.0830078125, -1.87060546875, -1.658203125, -1.44580078125, -1.2333984375, -1.02099609375, -0.80859375, -0.59619140625, -0.3837890625, -0.17138671875, 0.041015625, 0.25341796875, 0.4658203125, 0.67822265625, 0.890625, 1.10302734375, 1.3154296875, 1.52783203125, 1.740234375, 1.95263671875, 2.1650390625, 2.37744140625, 2.58984375, 2.80224609375, 3.0146484375, 3.22705078125, 3.439453125, 3.65185546875, 3.8642578125, 4.07666015625, 4.2890625, 4.50146484375, 4.7138671875, 4.92626953125, 5.138671875, 5.35107421875, 5.5634765625, 5.77587890625, 5.98828125, 6.20068359375, 6.4130859375, 6.62548828125, 6.837890625, 7.05029296875, 7.2626953125, 7.47509765625, 7.6875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 3.0, 10.0, 11.0, 10.0, 21.0, 35.0, 34.0, 45.0, 74.0, 100.0, 137.0, 210.0, 290.0, 382.0, 616.0, 959.0, 1531.0, 2780.0, 5851.0, 13081.0, 33527.0, 94596.0, 266809.0, 388737.0, 149876.0, 51971.0, 19356.0, 8178.0, 3800.0, 2085.0, 1106.0, 691.0, 485.0, 316.0, 236.0, 159.0, 109.0, 92.0, 70.0, 53.0, 35.0, 26.0, 17.0, 12.0, 6.0, 7.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-4.79296875, -4.65289306640625, -4.5128173828125, -4.37274169921875, -4.232666015625, -4.09259033203125, -3.9525146484375, -3.81243896484375, -3.67236328125, -3.53228759765625, -3.3922119140625, -3.25213623046875, -3.112060546875, -2.97198486328125, -2.8319091796875, -2.69183349609375, -2.5517578125, -2.41168212890625, -2.2716064453125, -2.13153076171875, -1.991455078125, -1.85137939453125, -1.7113037109375, -1.57122802734375, -1.43115234375, -1.29107666015625, -1.1510009765625, -1.01092529296875, -0.870849609375, -0.73077392578125, -0.5906982421875, -0.45062255859375, -0.310546875, -0.17047119140625, -0.0303955078125, 0.10968017578125, 0.249755859375, 0.38983154296875, 0.5299072265625, 0.66998291015625, 0.81005859375, 0.95013427734375, 1.0902099609375, 1.23028564453125, 1.370361328125, 1.51043701171875, 1.6505126953125, 1.79058837890625, 1.9306640625, 2.07073974609375, 2.2108154296875, 2.35089111328125, 2.490966796875, 2.63104248046875, 2.7711181640625, 2.91119384765625, 3.05126953125, 3.19134521484375, 3.3314208984375, 3.47149658203125, 3.611572265625, 3.75164794921875, 3.8917236328125, 4.03179931640625, 4.171875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 9.0, 5.0, 14.0, 13.0, 21.0, 23.0, 26.0, 29.0, 19.0, 27.0, 22.0, 36.0, 51.0, 47.0, 51.0, 80.0, 201.0, 1603.0, 231.0, 79.0, 52.0, 41.0, 43.0, 38.0, 43.0, 29.0, 37.0, 15.0, 21.0, 16.0, 18.0, 13.0, 15.0, 11.0, 12.0, 8.0, 5.0, 8.0, 7.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-18.328125, -17.7275390625, -17.126953125, -16.5263671875, -15.92578125, -15.3251953125, -14.724609375, -14.1240234375, -13.5234375, -12.9228515625, -12.322265625, -11.7216796875, -11.12109375, -10.5205078125, -9.919921875, -9.3193359375, -8.71875, -8.1181640625, -7.517578125, -6.9169921875, -6.31640625, -5.7158203125, -5.115234375, -4.5146484375, -3.9140625, -3.3134765625, -2.712890625, -2.1123046875, -1.51171875, -0.9111328125, -0.310546875, 0.2900390625, 0.890625, 1.4912109375, 2.091796875, 2.6923828125, 3.29296875, 3.8935546875, 4.494140625, 5.0947265625, 5.6953125, 6.2958984375, 6.896484375, 7.4970703125, 8.09765625, 8.6982421875, 9.298828125, 9.8994140625, 10.5, 11.1005859375, 11.701171875, 12.3017578125, 12.90234375, 13.5029296875, 14.103515625, 14.7041015625, 15.3046875, 15.9052734375, 16.505859375, 17.1064453125, 17.70703125, 18.3076171875, 18.908203125, 19.5087890625, 20.109375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 9.0, 11.0, 11.0, 15.0, 19.0, 31.0, 45.0, 68.0, 84.0, 151.0, 225.0, 384.0, 698.0, 7991.0, 3129964.0, 4462.0, 601.0, 345.0, 208.0, 136.0, 81.0, 55.0, 47.0, 21.0, 16.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.625, -96.0595703125, -93.494140625, -90.9287109375, -88.36328125, -85.7978515625, -83.232421875, -80.6669921875, -78.1015625, -75.5361328125, -72.970703125, -70.4052734375, -67.83984375, -65.2744140625, -62.708984375, -60.1435546875, -57.578125, -55.0126953125, -52.447265625, -49.8818359375, -47.31640625, -44.7509765625, -42.185546875, -39.6201171875, -37.0546875, -34.4892578125, -31.923828125, -29.3583984375, -26.79296875, -24.2275390625, -21.662109375, -19.0966796875, -16.53125, -13.9658203125, -11.400390625, -8.8349609375, -6.26953125, -3.7041015625, -1.138671875, 1.4267578125, 3.9921875, 6.5576171875, 9.123046875, 11.6884765625, 14.25390625, 16.8193359375, 19.384765625, 21.9501953125, 24.515625, 27.0810546875, 29.646484375, 32.2119140625, 34.77734375, 37.3427734375, 39.908203125, 42.4736328125, 45.0390625, 47.6044921875, 50.169921875, 52.7353515625, 55.30078125, 57.8662109375, 60.431640625, 62.9970703125, 65.5625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 21.0, 43.0, 69.0, 109.0, 141.0, 168.0, 153.0, 130.0, 75.0, 38.0, 27.0, 14.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.906025886535645, -11.10049057006836, -10.294955253601074, -9.489419937133789, -8.683884620666504, -7.878349781036377, -7.072814464569092, -6.267279148101807, -5.4617438316345215, -4.656208515167236, -3.850673198699951, -3.045138120651245, -2.23960280418396, -1.434067726135254, -0.6285324096679688, 0.1770029067993164, 0.9825382232666016, 1.7880735397338867, 2.593608856201172, 3.399143934249878, 4.204679489135742, 5.010214328765869, 5.815749645233154, 6.6212849617004395, 7.426820278167725, 8.232355117797852, 9.037890434265137, 9.843425750732422, 10.648961067199707, 11.454496383666992, 12.260031700134277, 13.065567016601562, 13.871103286743164, 14.67663860321045, 15.482173919677734, 16.287708282470703, 17.093244552612305, 17.898778915405273, 18.704315185546875, 19.509849548339844, 20.315385818481445, 21.120920181274414, 21.926456451416016, 22.731990814208984, 23.537527084350586, 24.343061447143555, 25.148597717285156, 25.954132080078125, 26.759666442871094, 27.565200805664062, 28.370737075805664, 29.176271438598633, 29.981807708740234, 30.787342071533203, 31.592878341674805, 32.398414611816406, 33.203948974609375, 34.009483337402344, 34.81501770019531, 35.62055587768555, 36.426090240478516, 37.231624603271484, 38.03715896606445, 38.84269714355469, 39.648231506347656]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 7.0, 8.0, 13.0, 6.0, 15.0, 17.0, 21.0, 19.0, 25.0, 27.0, 40.0, 37.0, 29.0, 23.0, 38.0, 49.0, 41.0, 46.0, 48.0, 44.0, 36.0, 30.0, 35.0, 38.0, 38.0, 23.0, 29.0, 25.0, 20.0, 19.0, 17.0, 25.0, 18.0, 15.0, 14.0, 6.0, 8.0, 6.0, 6.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-57.65232849121094, -55.96324920654297, -54.274166107177734, -52.585086822509766, -50.89600372314453, -49.20692443847656, -47.517845153808594, -45.82876205444336, -44.13968276977539, -42.45060348510742, -40.76152038574219, -39.07244110107422, -37.383358001708984, -35.694278717041016, -34.00519561767578, -32.31611633300781, -30.62703514099121, -28.93795394897461, -27.248872756958008, -25.559791564941406, -23.870712280273438, -22.181631088256836, -20.492549896240234, -18.803470611572266, -17.11438751220703, -15.42530632019043, -13.736226081848145, -12.047144889831543, -10.358064651489258, -8.668983459472656, -6.979902267456055, -5.2908220291137695, -3.6017417907714844, -1.9126609563827515, -0.22358012199401855, 1.465500831604004, 3.1545815467834473, 4.843662261962891, 6.532743453979492, 8.221823692321777, 9.910904884338379, 11.59998607635498, 13.289066314697266, 14.978147506713867, 16.66722869873047, 18.356307983398438, 20.045391082763672, 21.73447036743164, 23.423551559448242, 25.112632751464844, 26.801713943481445, 28.490795135498047, 30.179874420166016, 31.868955612182617, 33.55803680419922, 35.24711608886719, 36.93619918823242, 38.62527847290039, 40.314361572265625, 42.003440856933594, 43.69252395629883, 45.3816032409668, 47.07068634033203, 48.759765625, 50.44884490966797]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 9.0, 11.0, 6.0, 13.0, 11.0, 19.0, 15.0, 17.0, 19.0, 23.0, 23.0, 31.0, 30.0, 43.0, 43.0, 36.0, 40.0, 46.0, 47.0, 60.0, 39.0, 41.0, 54.0, 41.0, 45.0, 32.0, 31.0, 32.0, 35.0, 24.0, 12.0, 15.0, 9.0, 9.0, 12.0, 8.0, 7.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.3370361328125, -6.103759765625, -5.8704833984375, -5.63720703125, -5.4039306640625, -5.170654296875, -4.9373779296875, -4.7041015625, -4.4708251953125, -4.237548828125, -4.0042724609375, -3.77099609375, -3.5377197265625, -3.304443359375, -3.0711669921875, -2.837890625, -2.6046142578125, -2.371337890625, -2.1380615234375, -1.90478515625, -1.6715087890625, -1.438232421875, -1.2049560546875, -0.9716796875, -0.7384033203125, -0.505126953125, -0.2718505859375, -0.03857421875, 0.1947021484375, 0.427978515625, 0.6612548828125, 0.89453125, 1.1278076171875, 1.361083984375, 1.5943603515625, 1.82763671875, 2.0609130859375, 2.294189453125, 2.5274658203125, 2.7607421875, 2.9940185546875, 3.227294921875, 3.4605712890625, 3.69384765625, 3.9271240234375, 4.160400390625, 4.3936767578125, 4.626953125, 4.8602294921875, 5.093505859375, 5.3267822265625, 5.56005859375, 5.7933349609375, 6.026611328125, 6.2598876953125, 6.4931640625, 6.7264404296875, 6.959716796875, 7.1929931640625, 7.42626953125, 7.6595458984375, 7.892822265625, 8.1260986328125, 8.359375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 6.0, 10.0, 15.0, 7.0, 11.0, 12.0, 22.0, 29.0, 26.0, 33.0, 59.0, 70.0, 106.0, 242.0, 553.0, 2251.0, 26724.0, 1248446.0, 2802605.0, 106865.0, 4541.0, 832.0, 317.0, 151.0, 97.0, 60.0, 39.0, 30.0, 28.0, 20.0, 15.0, 9.0, 13.0, 10.0, 4.0, 3.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.48193359375, -16.8388671875, -16.19580078125, -15.552734375, -14.90966796875, -14.2666015625, -13.62353515625, -12.98046875, -12.33740234375, -11.6943359375, -11.05126953125, -10.408203125, -9.76513671875, -9.1220703125, -8.47900390625, -7.8359375, -7.19287109375, -6.5498046875, -5.90673828125, -5.263671875, -4.62060546875, -3.9775390625, -3.33447265625, -2.69140625, -2.04833984375, -1.4052734375, -0.76220703125, -0.119140625, 0.52392578125, 1.1669921875, 1.81005859375, 2.453125, 3.09619140625, 3.7392578125, 4.38232421875, 5.025390625, 5.66845703125, 6.3115234375, 6.95458984375, 7.59765625, 8.24072265625, 8.8837890625, 9.52685546875, 10.169921875, 10.81298828125, 11.4560546875, 12.09912109375, 12.7421875, 13.38525390625, 14.0283203125, 14.67138671875, 15.314453125, 15.95751953125, 16.6005859375, 17.24365234375, 17.88671875, 18.52978515625, 19.1728515625, 19.81591796875, 20.458984375, 21.10205078125, 21.7451171875, 22.38818359375, 23.03125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 7.0, 15.0, 14.0, 20.0, 26.0, 30.0, 40.0, 47.0, 69.0, 98.0, 117.0, 151.0, 229.0, 292.0, 349.0, 464.0, 435.0, 368.0, 312.0, 211.0, 196.0, 121.0, 100.0, 80.0, 50.0, 51.0, 39.0, 27.0, 24.0, 15.0, 14.0, 13.0, 8.0, 10.0, 3.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-11.875, -11.505126953125, -11.13525390625, -10.765380859375, -10.3955078125, -10.025634765625, -9.65576171875, -9.285888671875, -8.916015625, -8.546142578125, -8.17626953125, -7.806396484375, -7.4365234375, -7.066650390625, -6.69677734375, -6.326904296875, -5.95703125, -5.587158203125, -5.21728515625, -4.847412109375, -4.4775390625, -4.107666015625, -3.73779296875, -3.367919921875, -2.998046875, -2.628173828125, -2.25830078125, -1.888427734375, -1.5185546875, -1.148681640625, -0.77880859375, -0.408935546875, -0.0390625, 0.330810546875, 0.70068359375, 1.070556640625, 1.4404296875, 1.810302734375, 2.18017578125, 2.550048828125, 2.919921875, 3.289794921875, 3.65966796875, 4.029541015625, 4.3994140625, 4.769287109375, 5.13916015625, 5.509033203125, 5.87890625, 6.248779296875, 6.61865234375, 6.988525390625, 7.3583984375, 7.728271484375, 8.09814453125, 8.468017578125, 8.837890625, 9.207763671875, 9.57763671875, 9.947509765625, 10.3173828125, 10.687255859375, 11.05712890625, 11.427001953125, 11.796875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 7.0, 5.0, 12.0, 10.0, 12.0, 17.0, 24.0, 34.0, 36.0, 34.0, 46.0, 72.0, 84.0, 103.0, 110.0, 170.0, 234.0, 352.0, 642.0, 3151.0, 3119095.0, 1065999.0, 2115.0, 594.0, 355.0, 228.0, 167.0, 116.0, 80.0, 63.0, 56.0, 61.0, 41.0, 34.0, 18.0, 13.0, 17.0, 13.0, 14.0, 7.0, 9.0, 4.0, 6.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-65.6875, -63.69287109375, -61.6982421875, -59.70361328125, -57.708984375, -55.71435546875, -53.7197265625, -51.72509765625, -49.73046875, -47.73583984375, -45.7412109375, -43.74658203125, -41.751953125, -39.75732421875, -37.7626953125, -35.76806640625, -33.7734375, -31.77880859375, -29.7841796875, -27.78955078125, -25.794921875, -23.80029296875, -21.8056640625, -19.81103515625, -17.81640625, -15.82177734375, -13.8271484375, -11.83251953125, -9.837890625, -7.84326171875, -5.8486328125, -3.85400390625, -1.859375, 0.13525390625, 2.1298828125, 4.12451171875, 6.119140625, 8.11376953125, 10.1083984375, 12.10302734375, 14.09765625, 16.09228515625, 18.0869140625, 20.08154296875, 22.076171875, 24.07080078125, 26.0654296875, 28.06005859375, 30.0546875, 32.04931640625, 34.0439453125, 36.03857421875, 38.033203125, 40.02783203125, 42.0224609375, 44.01708984375, 46.01171875, 48.00634765625, 50.0009765625, 51.99560546875, 53.990234375, 55.98486328125, 57.9794921875, 59.97412109375, 61.96875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 36.0, 142.0, 365.0, 339.0, 109.0, 20.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.16841888427734, -66.35317993164062, -61.53794860839844, -56.72270965576172, -51.907474517822266, -47.09223937988281, -42.277000427246094, -37.46176528930664, -32.64653015136719, -27.831295013427734, -23.01605796813965, -18.200820922851562, -13.38558578491211, -8.570350646972656, -3.7551136016845703, 1.0601234436035156, 5.875358581542969, 10.690594673156738, 15.505830764770508, 20.321067810058594, 25.136302947998047, 29.9515380859375, 34.76677703857422, 39.58201217651367, 44.397247314453125, 49.21248245239258, 54.02771759033203, 58.84295654296875, 63.6581916809082, 68.47342681884766, 73.28866577148438, 78.10389709472656, 82.91912841796875, 87.73436737060547, 92.54959869384766, 97.36483764648438, 102.18006896972656, 106.99530792236328, 111.810546875, 116.62577819824219, 121.4410171508789, 126.25625610351562, 131.0714874267578, 135.88671875, 140.70196533203125, 145.51719665527344, 150.33242797851562, 155.14767456054688, 159.96290588378906, 164.77813720703125, 169.5933837890625, 174.4086151123047, 179.22384643554688, 184.03909301757812, 188.8543243408203, 193.6695556640625, 198.48480224609375, 203.30003356933594, 208.1152801513672, 212.93051147460938, 217.74574279785156, 222.56097412109375, 227.376220703125, 232.1914520263672, 237.00668334960938]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 7.0, 7.0, 10.0, 10.0, 6.0, 15.0, 16.0, 14.0, 24.0, 27.0, 18.0, 18.0, 30.0, 22.0, 31.0, 31.0, 21.0, 38.0, 36.0, 42.0, 48.0, 39.0, 31.0, 39.0, 40.0, 28.0, 31.0, 25.0, 34.0, 26.0, 17.0, 27.0, 19.0, 15.0, 12.0, 26.0, 15.0, 7.0, 12.0, 16.0, 7.0, 7.0, 7.0, 6.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-38.872467041015625, -37.699764251708984, -36.52706527709961, -35.35436248779297, -34.18165969848633, -33.00895690917969, -31.836257934570312, -30.663555145263672, -29.490854263305664, -28.318153381347656, -27.145450592041016, -25.972749710083008, -24.800048828125, -23.62734603881836, -22.45464515686035, -21.281944274902344, -20.109241485595703, -18.936540603637695, -17.763837814331055, -16.591136932373047, -15.418435096740723, -14.245733261108398, -13.07303237915039, -11.900330543518066, -10.727628707885742, -9.554926872253418, -8.382225036621094, -7.209524154663086, -6.036822319030762, -4.8641204833984375, -3.6914191246032715, -2.5187177658081055, -1.3460121154785156, -0.1733105182647705, 0.9993910789489746, 2.1720926761627197, 3.344794273376465, 4.517496109008789, 5.690197467803955, 6.862898826599121, 8.035600662231445, 9.20830249786377, 10.381004333496094, 11.553705215454102, 12.726407051086426, 13.89910888671875, 15.071809768676758, 16.244510650634766, 17.417213439941406, 18.589914321899414, 19.762617111206055, 20.935317993164062, 22.108020782470703, 23.28072166442871, 24.45342254638672, 25.62612533569336, 26.798826217651367, 27.971527099609375, 29.144229888916016, 30.316930770874023, 31.48963165283203, 32.66233444213867, 33.83503723144531, 35.00773620605469, 36.18043899536133]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 11.0, 11.0, 9.0, 12.0, 20.0, 15.0, 19.0, 26.0, 25.0, 21.0, 39.0, 25.0, 33.0, 46.0, 34.0, 51.0, 40.0, 42.0, 42.0, 38.0, 30.0, 40.0, 43.0, 46.0, 39.0, 41.0, 32.0, 23.0, 18.0, 14.0, 20.0, 15.0, 17.0, 9.0, 8.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.3125, -6.10650634765625, -5.9005126953125, -5.69451904296875, -5.488525390625, -5.28253173828125, -5.0765380859375, -4.87054443359375, -4.66455078125, -4.45855712890625, -4.2525634765625, -4.04656982421875, -3.840576171875, -3.63458251953125, -3.4285888671875, -3.22259521484375, -3.0166015625, -2.81060791015625, -2.6046142578125, -2.39862060546875, -2.192626953125, -1.98663330078125, -1.7806396484375, -1.57464599609375, -1.36865234375, -1.16265869140625, -0.9566650390625, -0.75067138671875, -0.544677734375, -0.33868408203125, -0.1326904296875, 0.07330322265625, 0.279296875, 0.48529052734375, 0.6912841796875, 0.89727783203125, 1.103271484375, 1.30926513671875, 1.5152587890625, 1.72125244140625, 1.92724609375, 2.13323974609375, 2.3392333984375, 2.54522705078125, 2.751220703125, 2.95721435546875, 3.1632080078125, 3.36920166015625, 3.5751953125, 3.78118896484375, 3.9871826171875, 4.19317626953125, 4.399169921875, 4.60516357421875, 4.8111572265625, 5.01715087890625, 5.22314453125, 5.42913818359375, 5.6351318359375, 5.84112548828125, 6.047119140625, 6.25311279296875, 6.4591064453125, 6.66510009765625, 6.87109375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 10.0, 5.0, 10.0, 24.0, 27.0, 42.0, 53.0, 87.0, 112.0, 168.0, 224.0, 394.0, 583.0, 875.0, 1393.0, 2156.0, 3345.0, 4969.0, 7621.0, 12387.0, 19793.0, 32905.0, 57465.0, 104355.0, 235196.0, 288020.0, 116812.0, 63541.0, 36648.0, 22147.0, 13238.0, 8680.0, 5544.0, 3366.0, 2138.0, 1418.0, 954.0, 616.0, 395.0, 279.0, 170.0, 127.0, 76.0, 57.0, 38.0, 30.0, 22.0, 16.0, 15.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 4.0], "bins": [-1.3837890625, -1.3392791748046875, -1.294769287109375, -1.2502593994140625, -1.20574951171875, -1.1612396240234375, -1.116729736328125, -1.0722198486328125, -1.0277099609375, -0.9832000732421875, -0.938690185546875, -0.8941802978515625, -0.84967041015625, -0.8051605224609375, -0.760650634765625, -0.7161407470703125, -0.671630859375, -0.6271209716796875, -0.582611083984375, -0.5381011962890625, -0.49359130859375, -0.4490814208984375, -0.404571533203125, -0.3600616455078125, -0.3155517578125, -0.2710418701171875, -0.226531982421875, -0.1820220947265625, -0.13751220703125, -0.0930023193359375, -0.048492431640625, -0.0039825439453125, 0.04052734375, 0.0850372314453125, 0.129547119140625, 0.1740570068359375, 0.21856689453125, 0.2630767822265625, 0.307586669921875, 0.3520965576171875, 0.3966064453125, 0.4411163330078125, 0.485626220703125, 0.5301361083984375, 0.57464599609375, 0.6191558837890625, 0.663665771484375, 0.7081756591796875, 0.752685546875, 0.7971954345703125, 0.841705322265625, 0.8862152099609375, 0.93072509765625, 0.9752349853515625, 1.019744873046875, 1.0642547607421875, 1.1087646484375, 1.1532745361328125, 1.197784423828125, 1.2422943115234375, 1.28680419921875, 1.3313140869140625, 1.375823974609375, 1.4203338623046875, 1.46484375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 9.0, 12.0, 16.0, 18.0, 13.0, 16.0, 23.0, 32.0, 26.0, 30.0, 34.0, 35.0, 39.0, 41.0, 35.0, 49.0, 1075.0, 48.0, 45.0, 43.0, 43.0, 43.0, 24.0, 35.0, 37.0, 22.0, 27.0, 33.0, 16.0, 11.0, 20.0, 12.0, 10.0, 3.0, 6.0, 6.0, 6.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6953125, -4.55718994140625, -4.4190673828125, -4.28094482421875, -4.142822265625, -4.00469970703125, -3.8665771484375, -3.72845458984375, -3.59033203125, -3.45220947265625, -3.3140869140625, -3.17596435546875, -3.037841796875, -2.89971923828125, -2.7615966796875, -2.62347412109375, -2.4853515625, -2.34722900390625, -2.2091064453125, -2.07098388671875, -1.932861328125, -1.79473876953125, -1.6566162109375, -1.51849365234375, -1.38037109375, -1.24224853515625, -1.1041259765625, -0.96600341796875, -0.827880859375, -0.68975830078125, -0.5516357421875, -0.41351318359375, -0.275390625, -0.13726806640625, 0.0008544921875, 0.13897705078125, 0.277099609375, 0.41522216796875, 0.5533447265625, 0.69146728515625, 0.82958984375, 0.96771240234375, 1.1058349609375, 1.24395751953125, 1.382080078125, 1.52020263671875, 1.6583251953125, 1.79644775390625, 1.9345703125, 2.07269287109375, 2.2108154296875, 2.34893798828125, 2.487060546875, 2.62518310546875, 2.7633056640625, 2.90142822265625, 3.03955078125, 3.17767333984375, 3.3157958984375, 3.45391845703125, 3.592041015625, 3.73016357421875, 3.8682861328125, 4.00640869140625, 4.14453125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 11.0, 10.0, 18.0, 32.0, 51.0, 64.0, 101.0, 139.0, 228.0, 337.0, 546.0, 888.0, 1441.0, 2214.0, 3811.0, 6013.0, 10010.0, 16827.0, 28448.0, 50540.0, 98943.0, 289148.0, 1358886.0, 103008.0, 52302.0, 29435.0, 17201.0, 10246.0, 6221.0, 3767.0, 2284.0, 1431.0, 900.0, 574.0, 357.0, 244.0, 162.0, 103.0, 63.0, 41.0, 27.0, 17.0, 15.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4066162109375, -1.358154296875, -1.3096923828125, -1.26123046875, -1.2127685546875, -1.164306640625, -1.1158447265625, -1.0673828125, -1.0189208984375, -0.970458984375, -0.9219970703125, -0.87353515625, -0.8250732421875, -0.776611328125, -0.7281494140625, -0.6796875, -0.6312255859375, -0.582763671875, -0.5343017578125, -0.48583984375, -0.4373779296875, -0.388916015625, -0.3404541015625, -0.2919921875, -0.2435302734375, -0.195068359375, -0.1466064453125, -0.09814453125, -0.0496826171875, -0.001220703125, 0.0472412109375, 0.095703125, 0.1441650390625, 0.192626953125, 0.2410888671875, 0.28955078125, 0.3380126953125, 0.386474609375, 0.4349365234375, 0.4833984375, 0.5318603515625, 0.580322265625, 0.6287841796875, 0.67724609375, 0.7257080078125, 0.774169921875, 0.8226318359375, 0.87109375, 0.9195556640625, 0.968017578125, 1.0164794921875, 1.06494140625, 1.1134033203125, 1.161865234375, 1.2103271484375, 1.2587890625, 1.3072509765625, 1.355712890625, 1.4041748046875, 1.45263671875, 1.5010986328125, 1.549560546875, 1.5980224609375, 1.646484375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 5.0, 6.0, 3.0, 12.0, 9.0, 11.0, 21.0, 27.0, 33.0, 41.0, 56.0, 58.0, 53.0, 75.0, 90.0, 97.0, 72.0, 62.0, 58.0, 52.0, 28.0, 36.0, 18.0, 21.0, 15.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001033782958984375, -0.0010012835264205933, -0.0009687840938568115, -0.0009362846612930298, -0.000903785228729248, -0.0008712857961654663, -0.0008387863636016846, -0.0008062869310379028, -0.0007737874984741211, -0.0007412880659103394, -0.0007087886333465576, -0.0006762892007827759, -0.0006437897682189941, -0.0006112903356552124, -0.0005787909030914307, -0.0005462914705276489, -0.0005137920379638672, -0.00048129260540008545, -0.0004487931728363037, -0.00041629374027252197, -0.00038379430770874023, -0.0003512948751449585, -0.00031879544258117676, -0.000286296010017395, -0.0002537965774536133, -0.00022129714488983154, -0.0001887977123260498, -0.00015629827976226807, -0.00012379884719848633, -9.129941463470459e-05, -5.879998207092285e-05, -2.6300549507141113e-05, 6.198883056640625e-06, 3.869831562042236e-05, 7.11977481842041e-05, 0.00010369718074798584, 0.00013619661331176758, 0.00016869604587554932, 0.00020119547843933105, 0.0002336949110031128, 0.00026619434356689453, 0.00029869377613067627, 0.000331193208694458, 0.00036369264125823975, 0.0003961920738220215, 0.0004286915063858032, 0.00046119093894958496, 0.0004936903715133667, 0.0005261898040771484, 0.0005586892366409302, 0.0005911886692047119, 0.0006236881017684937, 0.0006561875343322754, 0.0006886869668960571, 0.0007211863994598389, 0.0007536858320236206, 0.0007861852645874023, 0.0008186846971511841, 0.0008511841297149658, 0.0008836835622787476, 0.0009161829948425293, 0.000948682427406311, 0.0009811818599700928, 0.0010136812925338745, 0.0010461807250976562]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 6.0, 14.0, 13.0, 23.0, 30.0, 48.0, 61.0, 72.0, 170.0, 450.0, 4340.0, 1040852.0, 1686.0, 314.0, 152.0, 90.0, 52.0, 40.0, 40.0, 18.0, 14.0, 11.0, 6.0, 5.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02838134765625, -0.027504920959472656, -0.026628494262695312, -0.02575206756591797, -0.024875640869140625, -0.02399921417236328, -0.023122787475585938, -0.022246360778808594, -0.02136993408203125, -0.020493507385253906, -0.019617080688476562, -0.01874065399169922, -0.017864227294921875, -0.01698780059814453, -0.016111373901367188, -0.015234947204589844, -0.0143585205078125, -0.013482093811035156, -0.012605667114257812, -0.011729240417480469, -0.010852813720703125, -0.009976387023925781, -0.009099960327148438, -0.008223533630371094, -0.00734710693359375, -0.006470680236816406, -0.0055942535400390625, -0.004717826843261719, -0.003841400146484375, -0.0029649734497070312, -0.0020885467529296875, -0.0012121200561523438, -0.000335693359375, 0.0005407333374023438, 0.0014171600341796875, 0.0022935867309570312, 0.003170013427734375, 0.004046440124511719, 0.0049228668212890625, 0.005799293518066406, 0.00667572021484375, 0.007552146911621094, 0.008428573608398438, 0.009305000305175781, 0.010181427001953125, 0.011057853698730469, 0.011934280395507812, 0.012810707092285156, 0.0136871337890625, 0.014563560485839844, 0.015439987182617188, 0.01631641387939453, 0.017192840576171875, 0.01806926727294922, 0.018945693969726562, 0.019822120666503906, 0.02069854736328125, 0.021574974060058594, 0.022451400756835938, 0.02332782745361328, 0.024204254150390625, 0.02508068084716797, 0.025957107543945312, 0.026833534240722656, 0.0277099609375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 15.0, 661.0, 335.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.007261773105710745, -0.007136218249797821, -0.0070106638595461845, -0.006885109003633261, -0.006759554147720337, -0.006633999291807413, -0.006508444435894489, -0.006382890045642853, -0.006257335189729929, -0.006131780333817005, -0.006006225943565369, -0.005880671087652445, -0.005755116231739521, -0.005629561375826597, -0.005504006519913673, -0.005378452129662037, -0.005252897273749113, -0.005127342417836189, -0.005001788027584553, -0.004876233171671629, -0.004750678315758705, -0.004625123459845781, -0.0044995686039328575, -0.004374014213681221, -0.004248459357768297, -0.004122904501855373, -0.003997350111603737, -0.003871795255690813, -0.0037462403997778893, -0.0036206855438649654, -0.0034951309207826853, -0.003369576297700405, -0.003244021674618125, -0.003118467051535845, -0.002992912195622921, -0.002867357339709997, -0.002741802716627717, -0.002616248093545437, -0.002490693237632513, -0.0023651383817195892, -0.002239583758637309, -0.002114029135555029, -0.001988474279642105, -0.0018629195401445031, -0.0017373648006469011, -0.0016118100611492991, -0.0014862553216516972, -0.0013607005821540952, -0.0012351458426564932, -0.0011095911031588912, -0.0009840363636612892, -0.0008584816241636872, -0.0007329268846660852, -0.0006073721451684833, -0.00048181740567088127, -0.0003562626661732793, -0.0002307079848833382, -0.00010515324538573623, 2.040149411186576e-05, 0.00014595623360946774, 0.00027151097310706973, 0.0003970657126046717, 0.0005226204521022737, 0.0006481751915998757, 0.0007737299310974777]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 5.0, 9.0, 15.0, 17.0, 13.0, 17.0, 20.0, 27.0, 26.0, 19.0, 40.0, 30.0, 32.0, 38.0, 48.0, 32.0, 42.0, 33.0, 32.0, 40.0, 43.0, 47.0, 30.0, 34.0, 29.0, 35.0, 26.0, 34.0, 25.0, 28.0, 24.0, 19.0, 16.0, 15.0, 14.0, 5.0, 5.0, 4.0, 3.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00041735172271728516, -0.0004031714051961899, -0.0003889910876750946, -0.00037481077015399933, -0.00036063045263290405, -0.0003464501351118088, -0.0003322698175907135, -0.0003180895000696182, -0.00030390918254852295, -0.0002897288650274277, -0.0002755485475063324, -0.0002613682299852371, -0.00024718791246414185, -0.00023300759494304657, -0.0002188272774219513, -0.00020464695990085602, -0.00019046664237976074, -0.00017628632485866547, -0.0001621060073375702, -0.00014792568981647491, -0.00013374537229537964, -0.00011956505477428436, -0.00010538473725318909, -9.120441973209381e-05, -7.702410221099854e-05, -6.284378468990326e-05, -4.8663467168807983e-05, -3.448314964771271e-05, -2.030283212661743e-05, -6.122514605522156e-06, 8.05780291557312e-06, 2.2238120436668396e-05, 3.641843795776367e-05, 5.059875547885895e-05, 6.477907299995422e-05, 7.89593905210495e-05, 9.313970804214478e-05, 0.00010732002556324005, 0.00012150034308433533, 0.0001356806606054306, 0.00014986097812652588, 0.00016404129564762115, 0.00017822161316871643, 0.0001924019306898117, 0.00020658224821090698, 0.00022076256573200226, 0.00023494288325309753, 0.0002491232007741928, 0.0002633035182952881, 0.00027748383581638336, 0.00029166415333747864, 0.0003058444708585739, 0.0003200247883796692, 0.00033420510590076447, 0.00034838542342185974, 0.000362565740942955, 0.0003767460584640503, 0.00039092637598514557, 0.00040510669350624084, 0.0004192870110273361, 0.0004334673285484314, 0.00044764764606952667, 0.00046182796359062195, 0.0004760082811117172, 0.0004901885986328125]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 11.0, 11.0, 9.0, 12.0, 20.0, 15.0, 19.0, 26.0, 25.0, 21.0, 39.0, 25.0, 33.0, 46.0, 34.0, 51.0, 40.0, 42.0, 42.0, 38.0, 30.0, 40.0, 43.0, 46.0, 39.0, 41.0, 32.0, 23.0, 18.0, 14.0, 20.0, 15.0, 17.0, 9.0, 8.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.3125, -6.10650634765625, -5.9005126953125, -5.69451904296875, -5.488525390625, -5.28253173828125, -5.0765380859375, -4.87054443359375, -4.66455078125, -4.45855712890625, -4.2525634765625, -4.04656982421875, -3.840576171875, -3.63458251953125, -3.4285888671875, -3.22259521484375, -3.0166015625, -2.81060791015625, -2.6046142578125, -2.39862060546875, -2.192626953125, -1.98663330078125, -1.7806396484375, -1.57464599609375, -1.36865234375, -1.16265869140625, -0.9566650390625, -0.75067138671875, -0.544677734375, -0.33868408203125, -0.1326904296875, 0.07330322265625, 0.279296875, 0.48529052734375, 0.6912841796875, 0.89727783203125, 1.103271484375, 1.30926513671875, 1.5152587890625, 1.72125244140625, 1.92724609375, 2.13323974609375, 2.3392333984375, 2.54522705078125, 2.751220703125, 2.95721435546875, 3.1632080078125, 3.36920166015625, 3.5751953125, 3.78118896484375, 3.9871826171875, 4.19317626953125, 4.399169921875, 4.60516357421875, 4.8111572265625, 5.01715087890625, 5.22314453125, 5.42913818359375, 5.6351318359375, 5.84112548828125, 6.047119140625, 6.25311279296875, 6.4591064453125, 6.66510009765625, 6.87109375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 10.0, 12.0, 12.0, 15.0, 14.0, 28.0, 40.0, 39.0, 72.0, 92.0, 126.0, 179.0, 302.0, 538.0, 1159.0, 3024.0, 8850.0, 31376.0, 140905.0, 572979.0, 222702.0, 46725.0, 12196.0, 3902.0, 1432.0, 679.0, 367.0, 257.0, 167.0, 96.0, 81.0, 38.0, 29.0, 28.0, 25.0, 13.0, 10.0, 3.0, 5.0, 4.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.15234375, -5.9515380859375, -5.750732421875, -5.5499267578125, -5.34912109375, -5.1483154296875, -4.947509765625, -4.7467041015625, -4.5458984375, -4.3450927734375, -4.144287109375, -3.9434814453125, -3.74267578125, -3.5418701171875, -3.341064453125, -3.1402587890625, -2.939453125, -2.7386474609375, -2.537841796875, -2.3370361328125, -2.13623046875, -1.9354248046875, -1.734619140625, -1.5338134765625, -1.3330078125, -1.1322021484375, -0.931396484375, -0.7305908203125, -0.52978515625, -0.3289794921875, -0.128173828125, 0.0726318359375, 0.2734375, 0.4742431640625, 0.675048828125, 0.8758544921875, 1.07666015625, 1.2774658203125, 1.478271484375, 1.6790771484375, 1.8798828125, 2.0806884765625, 2.281494140625, 2.4822998046875, 2.68310546875, 2.8839111328125, 3.084716796875, 3.2855224609375, 3.486328125, 3.6871337890625, 3.887939453125, 4.0887451171875, 4.28955078125, 4.4903564453125, 4.691162109375, 4.8919677734375, 5.0927734375, 5.2935791015625, 5.494384765625, 5.6951904296875, 5.89599609375, 6.0968017578125, 6.297607421875, 6.4984130859375, 6.69921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 4.0, 9.0, 10.0, 11.0, 7.0, 10.0, 11.0, 19.0, 17.0, 22.0, 25.0, 22.0, 24.0, 25.0, 40.0, 33.0, 23.0, 31.0, 57.0, 69.0, 247.0, 1662.0, 165.0, 54.0, 48.0, 36.0, 39.0, 27.0, 36.0, 35.0, 29.0, 22.0, 27.0, 22.0, 10.0, 21.0, 19.0, 15.0, 12.0, 4.0, 9.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0], "bins": [-20.484375, -19.888427734375, -19.29248046875, -18.696533203125, -18.1005859375, -17.504638671875, -16.90869140625, -16.312744140625, -15.716796875, -15.120849609375, -14.52490234375, -13.928955078125, -13.3330078125, -12.737060546875, -12.14111328125, -11.545166015625, -10.94921875, -10.353271484375, -9.75732421875, -9.161376953125, -8.5654296875, -7.969482421875, -7.37353515625, -6.777587890625, -6.181640625, -5.585693359375, -4.98974609375, -4.393798828125, -3.7978515625, -3.201904296875, -2.60595703125, -2.010009765625, -1.4140625, -0.818115234375, -0.22216796875, 0.373779296875, 0.9697265625, 1.565673828125, 2.16162109375, 2.757568359375, 3.353515625, 3.949462890625, 4.54541015625, 5.141357421875, 5.7373046875, 6.333251953125, 6.92919921875, 7.525146484375, 8.12109375, 8.717041015625, 9.31298828125, 9.908935546875, 10.5048828125, 11.100830078125, 11.69677734375, 12.292724609375, 12.888671875, 13.484619140625, 14.08056640625, 14.676513671875, 15.2724609375, 15.868408203125, 16.46435546875, 17.060302734375, 17.65625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 15.0, 20.0, 62.0, 195.0, 604.0, 65266.0, 3078459.0, 725.0, 211.0, 77.0, 48.0, 15.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.5, -188.029296875, -181.55859375, -175.087890625, -168.6171875, -162.146484375, -155.67578125, -149.205078125, -142.734375, -136.263671875, -129.79296875, -123.322265625, -116.8515625, -110.380859375, -103.91015625, -97.439453125, -90.96875, -84.498046875, -78.02734375, -71.556640625, -65.0859375, -58.615234375, -52.14453125, -45.673828125, -39.203125, -32.732421875, -26.26171875, -19.791015625, -13.3203125, -6.849609375, -0.37890625, 6.091796875, 12.5625, 19.033203125, 25.50390625, 31.974609375, 38.4453125, 44.916015625, 51.38671875, 57.857421875, 64.328125, 70.798828125, 77.26953125, 83.740234375, 90.2109375, 96.681640625, 103.15234375, 109.623046875, 116.09375, 122.564453125, 129.03515625, 135.505859375, 141.9765625, 148.447265625, 154.91796875, 161.388671875, 167.859375, 174.330078125, 180.80078125, 187.271484375, 193.7421875, 200.212890625, 206.68359375, 213.154296875, 219.625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 945.0, 70.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.8262710571289, -60.81092071533203, -51.79556655883789, -42.78021240234375, -33.764862060546875, -24.74951171875, -15.73415756225586, -6.718803405761719, 2.2965469360351562, 11.311899185180664, 20.327251434326172, 29.34260368347168, 38.35795593261719, 47.37330627441406, 56.3886604309082, 65.40401458740234, 74.41936492919922, 83.4347152709961, 92.4500732421875, 101.46542358398438, 110.48077392578125, 119.49612426757812, 128.511474609375, 137.52682495117188, 146.54217529296875, 155.55752563476562, 164.5728759765625, 173.58822631835938, 182.60357666015625, 191.61892700195312, 200.63429260253906, 209.64964294433594, 218.66497802734375, 227.68032836914062, 236.6956787109375, 245.71102905273438, 254.72637939453125, 263.7417297363281, 272.757080078125, 281.7724609375, 290.78778076171875, 299.8031311035156, 308.8184814453125, 317.8338317871094, 326.84918212890625, 335.8645324707031, 344.8798828125, 353.895263671875, 362.9106140136719, 371.92596435546875, 380.9413146972656, 389.9566650390625, 398.9720153808594, 407.98736572265625, 417.0027160644531, 426.01806640625, 435.033447265625, 444.0487976074219, 453.06414794921875, 462.0794982910156, 471.0948486328125, 480.1101989746094, 489.12554931640625, 498.14093017578125, 507.15625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 8.0, 10.0, 7.0, 14.0, 18.0, 15.0, 27.0, 27.0, 19.0, 27.0, 41.0, 37.0, 35.0, 39.0, 45.0, 35.0, 33.0, 37.0, 43.0, 39.0, 42.0, 36.0, 39.0, 31.0, 31.0, 37.0, 32.0, 32.0, 21.0, 13.0, 17.0, 27.0, 14.0, 14.0, 12.0, 7.0, 8.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-61.813053131103516, -59.95393753051758, -58.094825744628906, -56.23571014404297, -54.37659454345703, -52.517478942871094, -50.65836715698242, -48.799251556396484, -46.94013977050781, -45.081024169921875, -43.2219123840332, -41.362796783447266, -39.50368118286133, -37.644569396972656, -35.78545379638672, -33.92633819580078, -32.067222595214844, -30.20810890197754, -28.3489933013916, -26.489879608154297, -24.63076400756836, -22.771650314331055, -20.91253662109375, -19.053421020507812, -17.194307327270508, -15.335192680358887, -13.476078033447266, -11.616964340209961, -9.75784969329834, -7.898735046386719, -6.039621353149414, -4.180506706237793, -2.3213958740234375, -0.4622814655303955, 1.3968329429626465, 3.2559471130371094, 5.1150617599487305, 6.974176406860352, 8.833290100097656, 10.692404747009277, 12.551519393920898, 14.41063404083252, 16.26974868774414, 18.128862380981445, 19.98797607421875, 21.847091674804688, 23.706205368041992, 25.565319061279297, 27.424434661865234, 29.28354835510254, 31.142663955688477, 33.00177764892578, 34.86089324951172, 36.720008850097656, 38.57912063598633, 40.438236236572266, 42.29734802246094, 44.156463623046875, 46.01557540893555, 47.874691009521484, 49.73380661010742, 51.592918395996094, 53.45203399658203, 55.31114959716797, 57.170265197753906]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 4.0, 7.0, 9.0, 7.0, 11.0, 14.0, 12.0, 18.0, 17.0, 21.0, 26.0, 24.0, 24.0, 27.0, 20.0, 35.0, 44.0, 48.0, 48.0, 44.0, 42.0, 35.0, 24.0, 49.0, 38.0, 37.0, 47.0, 51.0, 28.0, 28.0, 28.0, 25.0, 19.0, 13.0, 19.0, 18.0, 8.0, 8.0, 4.0, 4.0, 1.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.5625, -6.34930419921875, -6.1361083984375, -5.92291259765625, -5.709716796875, -5.49652099609375, -5.2833251953125, -5.07012939453125, -4.85693359375, -4.64373779296875, -4.4305419921875, -4.21734619140625, -4.004150390625, -3.79095458984375, -3.5777587890625, -3.36456298828125, -3.1513671875, -2.93817138671875, -2.7249755859375, -2.51177978515625, -2.298583984375, -2.08538818359375, -1.8721923828125, -1.65899658203125, -1.44580078125, -1.23260498046875, -1.0194091796875, -0.80621337890625, -0.593017578125, -0.37982177734375, -0.1666259765625, 0.04656982421875, 0.259765625, 0.47296142578125, 0.6861572265625, 0.89935302734375, 1.112548828125, 1.32574462890625, 1.5389404296875, 1.75213623046875, 1.96533203125, 2.17852783203125, 2.3917236328125, 2.60491943359375, 2.818115234375, 3.03131103515625, 3.2445068359375, 3.45770263671875, 3.6708984375, 3.88409423828125, 4.0972900390625, 4.31048583984375, 4.523681640625, 4.73687744140625, 4.9500732421875, 5.16326904296875, 5.37646484375, 5.58966064453125, 5.8028564453125, 6.01605224609375, 6.229248046875, 6.44244384765625, 6.6556396484375, 6.86883544921875, 7.08203125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 8.0, 6.0, 12.0, 16.0, 15.0, 32.0, 33.0, 24.0, 33.0, 39.0, 48.0, 58.0, 85.0, 120.0, 152.0, 239.0, 418.0, 1141.0, 5454.0, 77965.0, 1922531.0, 2079853.0, 97568.0, 5805.0, 1210.0, 441.0, 242.0, 177.0, 139.0, 88.0, 63.0, 62.0, 38.0, 34.0, 23.0, 24.0, 13.0, 20.0, 4.0, 12.0, 10.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.171875, -16.618408203125, -16.06494140625, -15.511474609375, -14.9580078125, -14.404541015625, -13.85107421875, -13.297607421875, -12.744140625, -12.190673828125, -11.63720703125, -11.083740234375, -10.5302734375, -9.976806640625, -9.42333984375, -8.869873046875, -8.31640625, -7.762939453125, -7.20947265625, -6.656005859375, -6.1025390625, -5.549072265625, -4.99560546875, -4.442138671875, -3.888671875, -3.335205078125, -2.78173828125, -2.228271484375, -1.6748046875, -1.121337890625, -0.56787109375, -0.014404296875, 0.5390625, 1.092529296875, 1.64599609375, 2.199462890625, 2.7529296875, 3.306396484375, 3.85986328125, 4.413330078125, 4.966796875, 5.520263671875, 6.07373046875, 6.627197265625, 7.1806640625, 7.734130859375, 8.28759765625, 8.841064453125, 9.39453125, 9.947998046875, 10.50146484375, 11.054931640625, 11.6083984375, 12.161865234375, 12.71533203125, 13.268798828125, 13.822265625, 14.375732421875, 14.92919921875, 15.482666015625, 16.0361328125, 16.589599609375, 17.14306640625, 17.696533203125, 18.25]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 7.0, 5.0, 11.0, 7.0, 10.0, 17.0, 16.0, 19.0, 13.0, 28.0, 45.0, 71.0, 65.0, 92.0, 124.0, 149.0, 202.0, 252.0, 315.0, 382.0, 404.0, 376.0, 313.0, 258.0, 202.0, 138.0, 113.0, 93.0, 71.0, 42.0, 53.0, 42.0, 23.0, 20.0, 22.0, 16.0, 16.0, 5.0, 11.0, 5.0, 4.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9617919921875, -10.634521484375, -10.3072509765625, -9.97998046875, -9.6527099609375, -9.325439453125, -8.9981689453125, -8.6708984375, -8.3436279296875, -8.016357421875, -7.6890869140625, -7.36181640625, -7.0345458984375, -6.707275390625, -6.3800048828125, -6.052734375, -5.7254638671875, -5.398193359375, -5.0709228515625, -4.74365234375, -4.4163818359375, -4.089111328125, -3.7618408203125, -3.4345703125, -3.1072998046875, -2.780029296875, -2.4527587890625, -2.12548828125, -1.7982177734375, -1.470947265625, -1.1436767578125, -0.81640625, -0.4891357421875, -0.161865234375, 0.1654052734375, 0.49267578125, 0.8199462890625, 1.147216796875, 1.4744873046875, 1.8017578125, 2.1290283203125, 2.456298828125, 2.7835693359375, 3.11083984375, 3.4381103515625, 3.765380859375, 4.0926513671875, 4.419921875, 4.7471923828125, 5.074462890625, 5.4017333984375, 5.72900390625, 6.0562744140625, 6.383544921875, 6.7108154296875, 7.0380859375, 7.3653564453125, 7.692626953125, 8.0198974609375, 8.34716796875, 8.6744384765625, 9.001708984375, 9.3289794921875, 9.65625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 3.0, 9.0, 14.0, 11.0, 12.0, 26.0, 18.0, 24.0, 44.0, 43.0, 47.0, 70.0, 62.0, 97.0, 107.0, 138.0, 179.0, 221.0, 291.0, 490.0, 1271.0, 260193.0, 3923213.0, 5439.0, 602.0, 396.0, 250.0, 201.0, 157.0, 138.0, 110.0, 78.0, 64.0, 60.0, 45.0, 23.0, 31.0, 16.0, 19.0, 15.0, 14.0, 12.0, 9.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-61.625, -59.7119140625, -57.798828125, -55.8857421875, -53.97265625, -52.0595703125, -50.146484375, -48.2333984375, -46.3203125, -44.4072265625, -42.494140625, -40.5810546875, -38.66796875, -36.7548828125, -34.841796875, -32.9287109375, -31.015625, -29.1025390625, -27.189453125, -25.2763671875, -23.36328125, -21.4501953125, -19.537109375, -17.6240234375, -15.7109375, -13.7978515625, -11.884765625, -9.9716796875, -8.05859375, -6.1455078125, -4.232421875, -2.3193359375, -0.40625, 1.5068359375, 3.419921875, 5.3330078125, 7.24609375, 9.1591796875, 11.072265625, 12.9853515625, 14.8984375, 16.8115234375, 18.724609375, 20.6376953125, 22.55078125, 24.4638671875, 26.376953125, 28.2900390625, 30.203125, 32.1162109375, 34.029296875, 35.9423828125, 37.85546875, 39.7685546875, 41.681640625, 43.5947265625, 45.5078125, 47.4208984375, 49.333984375, 51.2470703125, 53.16015625, 55.0732421875, 56.986328125, 58.8994140625, 60.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 27.0, 134.0, 363.0, 343.0, 119.0, 22.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.414926528930664, -23.65823745727539, -18.90155029296875, -14.144862174987793, -9.388174057006836, -4.631486892700195, 0.12520217895507812, 4.881891250610352, 9.638578414916992, 14.39526653289795, 19.151954650878906, 23.908641815185547, 28.66533088684082, 33.422019958496094, 38.178707122802734, 42.935394287109375, 47.69208526611328, 52.44877243041992, 57.20545959472656, 61.96215057373047, 66.71884155273438, 71.47552490234375, 76.23221588134766, 80.98890686035156, 85.74559020996094, 90.50228118896484, 95.25896453857422, 100.01565551757812, 104.7723388671875, 109.5290298461914, 114.28572082519531, 119.04240417480469, 123.79910278320312, 128.5557861328125, 133.31248474121094, 138.0691680908203, 142.8258514404297, 147.58255004882812, 152.3392333984375, 157.09591674804688, 161.85260009765625, 166.60928344726562, 171.36598205566406, 176.12266540527344, 180.8793487548828, 185.63604736328125, 190.39273071289062, 195.1494140625, 199.90611267089844, 204.6627960205078, 209.41949462890625, 214.17617797851562, 218.932861328125, 223.68954467773438, 228.4462432861328, 233.2029266357422, 237.95962524414062, 242.71630859375, 247.47300720214844, 252.2296905517578, 256.98638916015625, 261.7430725097656, 266.499755859375, 271.2564392089844, 276.01312255859375]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 6.0, 13.0, 10.0, 14.0, 18.0, 13.0, 16.0, 19.0, 25.0, 28.0, 23.0, 34.0, 34.0, 33.0, 42.0, 36.0, 40.0, 49.0, 36.0, 61.0, 32.0, 39.0, 28.0, 36.0, 30.0, 33.0, 31.0, 22.0, 24.0, 21.0, 18.0, 21.0, 18.0, 16.0, 14.0, 10.0, 12.0, 11.0, 6.0, 7.0, 1.0, 1.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.67071533203125, -35.43153381347656, -34.192352294921875, -32.95316696166992, -31.713985443115234, -30.474803924560547, -29.235620498657227, -27.996437072753906, -26.75725555419922, -25.51807403564453, -24.27889060974121, -23.03970718383789, -21.800525665283203, -20.561344146728516, -19.322160720825195, -18.082977294921875, -16.843795776367188, -15.604613304138184, -14.36543083190918, -13.126248359680176, -11.887065887451172, -10.647883415222168, -9.408700942993164, -8.16951847076416, -6.930335998535156, -5.691153526306152, -4.451971054077148, -3.2127885818481445, -1.9736061096191406, -0.7344236373901367, 0.5047588348388672, 1.743941307067871, 2.983123779296875, 4.222306251525879, 5.461488723754883, 6.700671195983887, 7.939853668212891, 9.179036140441895, 10.418218612670898, 11.657401084899902, 12.896583557128906, 14.13576602935791, 15.374948501586914, 16.614131927490234, 17.853313446044922, 19.09249496459961, 20.33167839050293, 21.57086181640625, 22.810043334960938, 24.049224853515625, 25.288408279418945, 26.527591705322266, 27.766773223876953, 29.00595474243164, 30.24513816833496, 31.48432159423828, 32.72350311279297, 33.962684631347656, 35.201866149902344, 36.4410514831543, 37.680233001708984, 38.91941452026367, 40.158599853515625, 41.39778137207031, 42.636962890625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 10.0, 10.0, 9.0, 13.0, 10.0, 14.0, 22.0, 25.0, 21.0, 29.0, 26.0, 30.0, 32.0, 30.0, 40.0, 35.0, 31.0, 54.0, 41.0, 33.0, 51.0, 37.0, 41.0, 41.0, 37.0, 28.0, 27.0, 28.0, 38.0, 26.0, 27.0, 26.0, 18.0, 10.0, 8.0, 5.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-7.1328125, -6.921875, -6.7109375, -6.5, -6.2890625, -6.078125, -5.8671875, -5.65625, -5.4453125, -5.234375, -5.0234375, -4.8125, -4.6015625, -4.390625, -4.1796875, -3.96875, -3.7578125, -3.546875, -3.3359375, -3.125, -2.9140625, -2.703125, -2.4921875, -2.28125, -2.0703125, -1.859375, -1.6484375, -1.4375, -1.2265625, -1.015625, -0.8046875, -0.59375, -0.3828125, -0.171875, 0.0390625, 0.25, 0.4609375, 0.671875, 0.8828125, 1.09375, 1.3046875, 1.515625, 1.7265625, 1.9375, 2.1484375, 2.359375, 2.5703125, 2.78125, 2.9921875, 3.203125, 3.4140625, 3.625, 3.8359375, 4.046875, 4.2578125, 4.46875, 4.6796875, 4.890625, 5.1015625, 5.3125, 5.5234375, 5.734375, 5.9453125, 6.15625, 6.3671875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 4.0, 6.0, 4.0, 10.0, 11.0, 18.0, 33.0, 30.0, 66.0, 99.0, 157.0, 216.0, 352.0, 568.0, 897.0, 1380.0, 2082.0, 3204.0, 5123.0, 8052.0, 13009.0, 20373.0, 32732.0, 53482.0, 95354.0, 215805.0, 310198.0, 118067.0, 64341.0, 38195.0, 24124.0, 14915.0, 9494.0, 5792.0, 3699.0, 2319.0, 1480.0, 930.0, 676.0, 446.0, 243.0, 179.0, 124.0, 119.0, 46.0, 42.0, 25.0, 19.0, 10.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.306640625, -1.2633209228515625, -1.220001220703125, -1.1766815185546875, -1.13336181640625, -1.0900421142578125, -1.046722412109375, -1.0034027099609375, -0.9600830078125, -0.9167633056640625, -0.873443603515625, -0.8301239013671875, -0.78680419921875, -0.7434844970703125, -0.700164794921875, -0.6568450927734375, -0.613525390625, -0.5702056884765625, -0.526885986328125, -0.4835662841796875, -0.44024658203125, -0.3969268798828125, -0.353607177734375, -0.3102874755859375, -0.2669677734375, -0.2236480712890625, -0.180328369140625, -0.1370086669921875, -0.09368896484375, -0.0503692626953125, -0.007049560546875, 0.0362701416015625, 0.07958984375, 0.1229095458984375, 0.166229248046875, 0.2095489501953125, 0.25286865234375, 0.2961883544921875, 0.339508056640625, 0.3828277587890625, 0.4261474609375, 0.4694671630859375, 0.512786865234375, 0.5561065673828125, 0.59942626953125, 0.6427459716796875, 0.686065673828125, 0.7293853759765625, 0.772705078125, 0.8160247802734375, 0.859344482421875, 0.9026641845703125, 0.94598388671875, 0.9893035888671875, 1.032623291015625, 1.0759429931640625, 1.1192626953125, 1.1625823974609375, 1.205902099609375, 1.2492218017578125, 1.29254150390625, 1.3358612060546875, 1.379180908203125, 1.4225006103515625, 1.4658203125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 9.0, 4.0, 11.0, 13.0, 17.0, 18.0, 25.0, 20.0, 37.0, 23.0, 33.0, 28.0, 34.0, 37.0, 42.0, 36.0, 45.0, 44.0, 1059.0, 28.0, 54.0, 34.0, 33.0, 47.0, 28.0, 25.0, 28.0, 31.0, 20.0, 29.0, 18.0, 19.0, 14.0, 8.0, 11.0, 12.0, 7.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.0234375, -3.899566650390625, -3.77569580078125, -3.651824951171875, -3.5279541015625, -3.404083251953125, -3.28021240234375, -3.156341552734375, -3.032470703125, -2.908599853515625, -2.78472900390625, -2.660858154296875, -2.5369873046875, -2.413116455078125, -2.28924560546875, -2.165374755859375, -2.04150390625, -1.917633056640625, -1.79376220703125, -1.669891357421875, -1.5460205078125, -1.422149658203125, -1.29827880859375, -1.174407958984375, -1.050537109375, -0.926666259765625, -0.80279541015625, -0.678924560546875, -0.5550537109375, -0.431182861328125, -0.30731201171875, -0.183441162109375, -0.0595703125, 0.064300537109375, 0.18817138671875, 0.312042236328125, 0.4359130859375, 0.559783935546875, 0.68365478515625, 0.807525634765625, 0.931396484375, 1.055267333984375, 1.17913818359375, 1.303009033203125, 1.4268798828125, 1.550750732421875, 1.67462158203125, 1.798492431640625, 1.92236328125, 2.046234130859375, 2.17010498046875, 2.293975830078125, 2.4178466796875, 2.541717529296875, 2.66558837890625, 2.789459228515625, 2.913330078125, 3.037200927734375, 3.16107177734375, 3.284942626953125, 3.4088134765625, 3.532684326171875, 3.65655517578125, 3.780426025390625, 3.904296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 17.0, 21.0, 37.0, 32.0, 62.0, 111.0, 122.0, 199.0, 282.0, 459.0, 660.0, 982.0, 1514.0, 2388.0, 3602.0, 5801.0, 9365.0, 15164.0, 25383.0, 42229.0, 75931.0, 164295.0, 1425873.0, 148510.0, 71558.0, 39756.0, 23805.0, 14513.0, 8786.0, 5580.0, 3528.0, 2241.0, 1485.0, 938.0, 641.0, 408.0, 273.0, 171.0, 117.0, 97.0, 54.0, 38.0, 26.0, 17.0, 14.0, 14.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.3623046875, -1.3189849853515625, -1.275665283203125, -1.2323455810546875, -1.18902587890625, -1.1457061767578125, -1.102386474609375, -1.0590667724609375, -1.0157470703125, -0.9724273681640625, -0.929107666015625, -0.8857879638671875, -0.84246826171875, -0.7991485595703125, -0.755828857421875, -0.7125091552734375, -0.669189453125, -0.6258697509765625, -0.582550048828125, -0.5392303466796875, -0.49591064453125, -0.4525909423828125, -0.409271240234375, -0.3659515380859375, -0.3226318359375, -0.2793121337890625, -0.235992431640625, -0.1926727294921875, -0.14935302734375, -0.1060333251953125, -0.062713623046875, -0.0193939208984375, 0.02392578125, 0.0672454833984375, 0.110565185546875, 0.1538848876953125, 0.19720458984375, 0.2405242919921875, 0.283843994140625, 0.3271636962890625, 0.3704833984375, 0.4138031005859375, 0.457122802734375, 0.5004425048828125, 0.54376220703125, 0.5870819091796875, 0.630401611328125, 0.6737213134765625, 0.717041015625, 0.7603607177734375, 0.803680419921875, 0.8470001220703125, 0.89031982421875, 0.9336395263671875, 0.976959228515625, 1.0202789306640625, 1.0635986328125, 1.1069183349609375, 1.150238037109375, 1.1935577392578125, 1.23687744140625, 1.2801971435546875, 1.323516845703125, 1.3668365478515625, 1.41015625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 3.0, 6.0, 2.0, 14.0, 15.0, 23.0, 16.0, 22.0, 25.0, 44.0, 35.0, 50.0, 43.0, 44.0, 62.0, 74.0, 66.0, 55.0, 63.0, 50.0, 49.0, 37.0, 29.0, 38.0, 20.0, 16.0, 14.0, 17.0, 10.0, 7.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006680488586425781, -0.0006473064422607422, -0.0006265640258789062, -0.0006058216094970703, -0.0005850791931152344, -0.0005643367767333984, -0.0005435943603515625, -0.0005228519439697266, -0.0005021095275878906, -0.0004813671112060547, -0.00046062469482421875, -0.0004398822784423828, -0.0004191398620605469, -0.00039839744567871094, -0.000377655029296875, -0.00035691261291503906, -0.0003361701965332031, -0.0003154277801513672, -0.00029468536376953125, -0.0002739429473876953, -0.0002532005310058594, -0.00023245811462402344, -0.0002117156982421875, -0.00019097328186035156, -0.00017023086547851562, -0.0001494884490966797, -0.00012874603271484375, -0.00010800361633300781, -8.726119995117188e-05, -6.651878356933594e-05, -4.57763671875e-05, -2.5033950805664062e-05, -4.291534423828125e-06, 1.6450881958007812e-05, 3.719329833984375e-05, 5.793571472167969e-05, 7.867813110351562e-05, 9.942054748535156e-05, 0.0001201629638671875, 0.00014090538024902344, 0.00016164779663085938, 0.0001823902130126953, 0.00020313262939453125, 0.0002238750457763672, 0.0002446174621582031, 0.00026535987854003906, 0.000286102294921875, 0.00030684471130371094, 0.0003275871276855469, 0.0003483295440673828, 0.00036907196044921875, 0.0003898143768310547, 0.0004105567932128906, 0.00043129920959472656, 0.0004520416259765625, 0.00047278404235839844, 0.0004935264587402344, 0.0005142688751220703, 0.0005350112915039062, 0.0005557537078857422, 0.0005764961242675781, 0.0005972385406494141, 0.00061798095703125, 0.0006387233734130859, 0.0006594657897949219]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 4.0, 1.0, 6.0, 5.0, 4.0, 4.0, 5.0, 8.0, 18.0, 10.0, 15.0, 25.0, 20.0, 36.0, 48.0, 52.0, 73.0, 121.0, 194.0, 467.0, 1651.0, 870635.0, 173109.0, 1037.0, 358.0, 190.0, 82.0, 83.0, 49.0, 42.0, 44.0, 35.0, 21.0, 31.0, 13.0, 14.0, 10.0, 6.0, 8.0, 5.0, 7.0, 2.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0130615234375, -0.01259303092956543, -0.01212453842163086, -0.011656045913696289, -0.011187553405761719, -0.010719060897827148, -0.010250568389892578, -0.009782075881958008, -0.009313583374023438, -0.008845090866088867, -0.008376598358154297, -0.007908105850219727, -0.007439613342285156, -0.006971120834350586, -0.006502628326416016, -0.006034135818481445, -0.005565643310546875, -0.005097150802612305, -0.004628658294677734, -0.004160165786743164, -0.0036916732788085938, -0.0032231807708740234, -0.002754688262939453, -0.002286195755004883, -0.0018177032470703125, -0.0013492107391357422, -0.0008807182312011719, -0.00041222572326660156, 5.626678466796875e-05, 0.0005247592926025391, 0.0009932518005371094, 0.0014617443084716797, 0.00193023681640625, 0.0023987293243408203, 0.0028672218322753906, 0.003335714340209961, 0.0038042068481445312, 0.0042726993560791016, 0.004741191864013672, 0.005209684371948242, 0.0056781768798828125, 0.006146669387817383, 0.006615161895751953, 0.0070836544036865234, 0.007552146911621094, 0.008020639419555664, 0.008489131927490234, 0.008957624435424805, 0.009426116943359375, 0.009894609451293945, 0.010363101959228516, 0.010831594467163086, 0.011300086975097656, 0.011768579483032227, 0.012237071990966797, 0.012705564498901367, 0.013174057006835938, 0.013642549514770508, 0.014111042022705078, 0.014579534530639648, 0.015048027038574219, 0.015516519546508789, 0.01598501205444336, 0.01645350456237793, 0.0169219970703125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 15.0, 29.0, 67.0, 97.0, 112.0, 142.0, 142.0, 135.0, 104.0, 72.0, 35.0, 24.0, 9.0, 7.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006525710341520607, -0.0006367276073433459, -0.000620884180534631, -0.0006050408119335771, -0.0005891973851248622, -0.0005733539583161473, -0.0005575105315074325, -0.0005416671046987176, -0.0005258236778900027, -0.0005099802510812879, -0.000494136824272573, -0.0004782934265676886, -0.0004624500288628042, -0.0004466066020540893, -0.00043076317524537444, -0.0004149197484366596, -0.0003990763798356056, -0.00038323295302689075, -0.00036738955532200634, -0.0003515461285132915, -0.00033570273080840707, -0.0003198593039996922, -0.00030401587719097733, -0.00028817245038226247, -0.00027232905267737806, -0.0002564856258686632, -0.00024064222816377878, -0.00022479880135506392, -0.00020895538909826428, -0.00019311197684146464, -0.00017726855003274977, -0.00016142513777595013, -0.00014558175462298095, -0.00012973834236618131, -0.00011389492283342406, -9.805150330066681e-05, -8.220809104386717e-05, -6.636467878706753e-05, -5.052125925431028e-05, -3.467783972155303e-05, -1.883442746475339e-05, -2.991011569974944e-06, 1.2852404324803501e-05, 2.8695820219581947e-05, 4.453923611436039e-05, 6.038264837116003e-05, 7.622606790391728e-05, 9.206948743667454e-05, 0.00010791289969347417, 0.0001237563119502738, 0.00013959972420707345, 0.00015544315101578832, 0.00017128656327258795, 0.0001871299755293876, 0.00020297340233810246, 0.0002188168145949021, 0.00023466022685170174, 0.0002505036536604166, 0.000266347051365301, 0.0002821904781740159, 0.0002980338758789003, 0.00031387730268761516, 0.00032972072949633, 0.0003455641563050449, 0.0003614075540099293]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 7.0, 5.0, 11.0, 7.0, 11.0, 10.0, 19.0, 12.0, 20.0, 26.0, 19.0, 37.0, 33.0, 30.0, 41.0, 34.0, 42.0, 37.0, 42.0, 38.0, 49.0, 52.0, 48.0, 39.0, 40.0, 33.0, 29.0, 31.0, 33.0, 43.0, 18.0, 28.0, 17.0, 15.0, 12.0, 6.0, 5.0, 10.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003628730773925781, -0.0003516189754009247, -0.00034036487340927124, -0.0003291107714176178, -0.00031785666942596436, -0.0003066025674343109, -0.00029534846544265747, -0.00028409436345100403, -0.0002728402614593506, -0.00026158615946769714, -0.0002503320574760437, -0.00023907795548439026, -0.00022782385349273682, -0.00021656975150108337, -0.00020531564950942993, -0.0001940615475177765, -0.00018280744552612305, -0.0001715533435344696, -0.00016029924154281616, -0.00014904513955116272, -0.00013779103755950928, -0.00012653693556785583, -0.00011528283357620239, -0.00010402873158454895, -9.277462959289551e-05, -8.152052760124207e-05, -7.026642560958862e-05, -5.901232361793518e-05, -4.775822162628174e-05, -3.6504119634628296e-05, -2.5250017642974854e-05, -1.3995915651321411e-05, -2.7418136596679688e-06, 8.512288331985474e-06, 1.9766390323638916e-05, 3.102049231529236e-05, 4.22745943069458e-05, 5.352869629859924e-05, 6.478279829025269e-05, 7.603690028190613e-05, 8.729100227355957e-05, 9.854510426521301e-05, 0.00010979920625686646, 0.0001210533082485199, 0.00013230741024017334, 0.00014356151223182678, 0.00015481561422348022, 0.00016606971621513367, 0.0001773238182067871, 0.00018857792019844055, 0.000199832022190094, 0.00021108612418174744, 0.00022234022617340088, 0.00023359432816505432, 0.00024484843015670776, 0.0002561025321483612, 0.00026735663414001465, 0.0002786107361316681, 0.00028986483812332153, 0.000301118940114975, 0.0003123730421066284, 0.00032362714409828186, 0.0003348812460899353, 0.00034613534808158875, 0.0003573894500732422]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 10.0, 10.0, 9.0, 13.0, 10.0, 14.0, 22.0, 25.0, 21.0, 29.0, 26.0, 30.0, 32.0, 30.0, 40.0, 35.0, 31.0, 53.0, 42.0, 33.0, 51.0, 37.0, 41.0, 41.0, 37.0, 28.0, 27.0, 28.0, 38.0, 26.0, 27.0, 26.0, 18.0, 10.0, 8.0, 5.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-7.1328125, -6.921875, -6.7109375, -6.5, -6.2890625, -6.078125, -5.8671875, -5.65625, -5.4453125, -5.234375, -5.0234375, -4.8125, -4.6015625, -4.390625, -4.1796875, -3.96875, -3.7578125, -3.546875, -3.3359375, -3.125, -2.9140625, -2.703125, -2.4921875, -2.28125, -2.0703125, -1.859375, -1.6484375, -1.4375, -1.2265625, -1.015625, -0.8046875, -0.59375, -0.3828125, -0.171875, 0.0390625, 0.25, 0.4609375, 0.671875, 0.8828125, 1.09375, 1.3046875, 1.515625, 1.7265625, 1.9375, 2.1484375, 2.359375, 2.5703125, 2.78125, 2.9921875, 3.203125, 3.4140625, 3.625, 3.8359375, 4.046875, 4.2578125, 4.46875, 4.6796875, 4.890625, 5.1015625, 5.3125, 5.5234375, 5.734375, 5.9453125, 6.15625, 6.3671875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 6.0, 2.0, 4.0, 12.0, 10.0, 25.0, 17.0, 20.0, 38.0, 46.0, 71.0, 123.0, 215.0, 334.0, 616.0, 1274.0, 2637.0, 5816.0, 14086.0, 35912.0, 104954.0, 331680.0, 367267.0, 116074.0, 39928.0, 15117.0, 6383.0, 2903.0, 1362.0, 646.0, 340.0, 196.0, 131.0, 79.0, 50.0, 44.0, 38.0, 21.0, 16.0, 13.0, 15.0, 7.0, 4.0, 8.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.61834716796875, -4.4593505859375, -4.30035400390625, -4.141357421875, -3.98236083984375, -3.8233642578125, -3.66436767578125, -3.50537109375, -3.34637451171875, -3.1873779296875, -3.02838134765625, -2.869384765625, -2.71038818359375, -2.5513916015625, -2.39239501953125, -2.2333984375, -2.07440185546875, -1.9154052734375, -1.75640869140625, -1.597412109375, -1.43841552734375, -1.2794189453125, -1.12042236328125, -0.96142578125, -0.80242919921875, -0.6434326171875, -0.48443603515625, -0.325439453125, -0.16644287109375, -0.0074462890625, 0.15155029296875, 0.310546875, 0.46954345703125, 0.6285400390625, 0.78753662109375, 0.946533203125, 1.10552978515625, 1.2645263671875, 1.42352294921875, 1.58251953125, 1.74151611328125, 1.9005126953125, 2.05950927734375, 2.218505859375, 2.37750244140625, 2.5364990234375, 2.69549560546875, 2.8544921875, 3.01348876953125, 3.1724853515625, 3.33148193359375, 3.490478515625, 3.64947509765625, 3.8084716796875, 3.96746826171875, 4.12646484375, 4.28546142578125, 4.4444580078125, 4.60345458984375, 4.762451171875, 4.92144775390625, 5.0804443359375, 5.23944091796875, 5.3984375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 10.0, 9.0, 13.0, 14.0, 25.0, 24.0, 23.0, 25.0, 34.0, 31.0, 45.0, 43.0, 51.0, 68.0, 102.0, 1748.0, 299.0, 84.0, 57.0, 51.0, 41.0, 33.0, 35.0, 35.0, 24.0, 18.0, 20.0, 14.0, 17.0, 7.0, 10.0, 12.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.828125, -25.98486328125, -25.1416015625, -24.29833984375, -23.455078125, -22.61181640625, -21.7685546875, -20.92529296875, -20.08203125, -19.23876953125, -18.3955078125, -17.55224609375, -16.708984375, -15.86572265625, -15.0224609375, -14.17919921875, -13.3359375, -12.49267578125, -11.6494140625, -10.80615234375, -9.962890625, -9.11962890625, -8.2763671875, -7.43310546875, -6.58984375, -5.74658203125, -4.9033203125, -4.06005859375, -3.216796875, -2.37353515625, -1.5302734375, -0.68701171875, 0.15625, 0.99951171875, 1.8427734375, 2.68603515625, 3.529296875, 4.37255859375, 5.2158203125, 6.05908203125, 6.90234375, 7.74560546875, 8.5888671875, 9.43212890625, 10.275390625, 11.11865234375, 11.9619140625, 12.80517578125, 13.6484375, 14.49169921875, 15.3349609375, 16.17822265625, 17.021484375, 17.86474609375, 18.7080078125, 19.55126953125, 20.39453125, 21.23779296875, 22.0810546875, 22.92431640625, 23.767578125, 24.61083984375, 25.4541015625, 26.29736328125, 27.140625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 3.0, 12.0, 14.0, 12.0, 16.0, 18.0, 41.0, 33.0, 38.0, 68.0, 121.0, 103.0, 144.0, 222.0, 373.0, 838.0, 52508.0, 3087371.0, 2181.0, 558.0, 298.0, 164.0, 141.0, 99.0, 82.0, 59.0, 41.0, 44.0, 23.0, 21.0, 16.0, 8.0, 9.0, 8.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1875, -63.1650390625, -61.142578125, -59.1201171875, -57.09765625, -55.0751953125, -53.052734375, -51.0302734375, -49.0078125, -46.9853515625, -44.962890625, -42.9404296875, -40.91796875, -38.8955078125, -36.873046875, -34.8505859375, -32.828125, -30.8056640625, -28.783203125, -26.7607421875, -24.73828125, -22.7158203125, -20.693359375, -18.6708984375, -16.6484375, -14.6259765625, -12.603515625, -10.5810546875, -8.55859375, -6.5361328125, -4.513671875, -2.4912109375, -0.46875, 1.5537109375, 3.576171875, 5.5986328125, 7.62109375, 9.6435546875, 11.666015625, 13.6884765625, 15.7109375, 17.7333984375, 19.755859375, 21.7783203125, 23.80078125, 25.8232421875, 27.845703125, 29.8681640625, 31.890625, 33.9130859375, 35.935546875, 37.9580078125, 39.98046875, 42.0029296875, 44.025390625, 46.0478515625, 48.0703125, 50.0927734375, 52.115234375, 54.1376953125, 56.16015625, 58.1826171875, 60.205078125, 62.2275390625, 64.25]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [250.0, 769.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.894426345825195, -1.428757667541504, 8.036911010742188, 17.502580642700195, 26.96824836730957, 36.43391418457031, 45.89958953857422, 55.365257263183594, 64.83092498779297, 74.29659271240234, 83.76226043701172, 93.22793579101562, 102.693603515625, 112.15927124023438, 121.62493896484375, 131.09060668945312, 140.5562744140625, 150.02194213867188, 159.48760986328125, 168.95327758789062, 178.4189453125, 187.88461303710938, 197.35028076171875, 206.81594848632812, 216.2816162109375, 225.74728393554688, 235.21295166015625, 244.67861938476562, 254.144287109375, 263.6099548339844, 273.07562255859375, 282.5412902832031, 292.0069885253906, 301.47265625, 310.9383239746094, 320.40399169921875, 329.8696594238281, 339.3353271484375, 348.8009948730469, 358.26666259765625, 367.7323303222656, 377.197998046875, 386.6636657714844, 396.12933349609375, 405.5950012207031, 415.0606689453125, 424.5263366699219, 433.99200439453125, 443.45770263671875, 452.9233703613281, 462.3890380859375, 471.8547058105469, 481.32037353515625, 490.7860412597656, 500.251708984375, 509.7173767089844, 519.1830444335938, 528.6487426757812, 538.1143798828125, 547.580078125, 557.0457153320312, 566.5114135742188, 575.97705078125, 585.4427490234375, 594.9083862304688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 10.0, 10.0, 12.0, 9.0, 15.0, 15.0, 18.0, 19.0, 25.0, 23.0, 40.0, 30.0, 36.0, 39.0, 38.0, 43.0, 35.0, 42.0, 53.0, 36.0, 39.0, 40.0, 34.0, 32.0, 31.0, 38.0, 20.0, 32.0, 27.0, 17.0, 17.0, 18.0, 21.0, 14.0, 8.0, 6.0, 9.0, 7.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-65.78682708740234, -63.929779052734375, -62.07273483276367, -60.21569061279297, -58.358642578125, -56.50159454345703, -54.64455032348633, -52.787506103515625, -50.930458068847656, -49.07341003417969, -47.216365814208984, -45.35932159423828, -43.50227355957031, -41.645225524902344, -39.78818130493164, -37.93113708496094, -36.07408905029297, -34.217041015625, -32.3599967956543, -30.50295066833496, -28.645904541015625, -26.78885841369629, -24.931812286376953, -23.074766159057617, -21.21772003173828, -19.360673904418945, -17.50362777709961, -15.646581649780273, -13.789535522460938, -11.932489395141602, -10.075443267822266, -8.21839714050293, -6.361354827880859, -4.504308700561523, -2.6472625732421875, -0.7902164459228516, 1.0668296813964844, 2.9238758087158203, 4.780921936035156, 6.637968063354492, 8.495014190673828, 10.352060317993164, 12.2091064453125, 14.066152572631836, 15.923198699951172, 17.780244827270508, 19.637290954589844, 21.49433708190918, 23.351383209228516, 25.20842933654785, 27.065475463867188, 28.922521591186523, 30.77956771850586, 32.63661193847656, 34.49365997314453, 36.3507080078125, 38.2077522277832, 40.064796447753906, 41.921844482421875, 43.778892517089844, 45.63593673706055, 47.49298095703125, 49.35002899169922, 51.20707702636719, 53.06412124633789]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 11.0, 5.0, 6.0, 10.0, 14.0, 8.0, 19.0, 15.0, 21.0, 23.0, 25.0, 27.0, 32.0, 30.0, 46.0, 28.0, 33.0, 46.0, 31.0, 48.0, 32.0, 44.0, 60.0, 41.0, 36.0, 35.0, 33.0, 35.0, 34.0, 27.0, 33.0, 23.0, 23.0, 25.0, 11.0, 11.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.12322998046875, -6.8948974609375, -6.66656494140625, -6.438232421875, -6.20989990234375, -5.9815673828125, -5.75323486328125, -5.52490234375, -5.29656982421875, -5.0682373046875, -4.83990478515625, -4.611572265625, -4.38323974609375, -4.1549072265625, -3.92657470703125, -3.6982421875, -3.46990966796875, -3.2415771484375, -3.01324462890625, -2.784912109375, -2.55657958984375, -2.3282470703125, -2.09991455078125, -1.87158203125, -1.64324951171875, -1.4149169921875, -1.18658447265625, -0.958251953125, -0.72991943359375, -0.5015869140625, -0.27325439453125, -0.044921875, 0.18341064453125, 0.4117431640625, 0.64007568359375, 0.868408203125, 1.09674072265625, 1.3250732421875, 1.55340576171875, 1.78173828125, 2.01007080078125, 2.2384033203125, 2.46673583984375, 2.695068359375, 2.92340087890625, 3.1517333984375, 3.38006591796875, 3.6083984375, 3.83673095703125, 4.0650634765625, 4.29339599609375, 4.521728515625, 4.75006103515625, 4.9783935546875, 5.20672607421875, 5.43505859375, 5.66339111328125, 5.8917236328125, 6.12005615234375, 6.348388671875, 6.57672119140625, 6.8050537109375, 7.03338623046875, 7.26171875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 5.0, 8.0, 6.0, 13.0, 6.0, 19.0, 28.0, 24.0, 23.0, 27.0, 34.0, 55.0, 91.0, 148.0, 300.0, 775.0, 3236.0, 66435.0, 3276919.0, 833318.0, 10277.0, 1472.0, 467.0, 192.0, 96.0, 72.0, 43.0, 36.0, 26.0, 25.0, 31.0, 15.0, 14.0, 6.0, 11.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.75, -26.951416015625, -26.15283203125, -25.354248046875, -24.5556640625, -23.757080078125, -22.95849609375, -22.159912109375, -21.361328125, -20.562744140625, -19.76416015625, -18.965576171875, -18.1669921875, -17.368408203125, -16.56982421875, -15.771240234375, -14.97265625, -14.174072265625, -13.37548828125, -12.576904296875, -11.7783203125, -10.979736328125, -10.18115234375, -9.382568359375, -8.583984375, -7.785400390625, -6.98681640625, -6.188232421875, -5.3896484375, -4.591064453125, -3.79248046875, -2.993896484375, -2.1953125, -1.396728515625, -0.59814453125, 0.200439453125, 0.9990234375, 1.797607421875, 2.59619140625, 3.394775390625, 4.193359375, 4.991943359375, 5.79052734375, 6.589111328125, 7.3876953125, 8.186279296875, 8.98486328125, 9.783447265625, 10.58203125, 11.380615234375, 12.17919921875, 12.977783203125, 13.7763671875, 14.574951171875, 15.37353515625, 16.172119140625, 16.970703125, 17.769287109375, 18.56787109375, 19.366455078125, 20.1650390625, 20.963623046875, 21.76220703125, 22.560791015625, 23.359375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 8.0, 9.0, 20.0, 16.0, 24.0, 42.0, 66.0, 78.0, 118.0, 186.0, 276.0, 405.0, 595.0, 571.0, 464.0, 340.0, 269.0, 154.0, 116.0, 100.0, 50.0, 55.0, 32.0, 16.0, 15.0, 15.0, 12.0, 9.0, 3.0, 6.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.625, -12.144775390625, -11.66455078125, -11.184326171875, -10.7041015625, -10.223876953125, -9.74365234375, -9.263427734375, -8.783203125, -8.302978515625, -7.82275390625, -7.342529296875, -6.8623046875, -6.382080078125, -5.90185546875, -5.421630859375, -4.94140625, -4.461181640625, -3.98095703125, -3.500732421875, -3.0205078125, -2.540283203125, -2.06005859375, -1.579833984375, -1.099609375, -0.619384765625, -0.13916015625, 0.341064453125, 0.8212890625, 1.301513671875, 1.78173828125, 2.261962890625, 2.7421875, 3.222412109375, 3.70263671875, 4.182861328125, 4.6630859375, 5.143310546875, 5.62353515625, 6.103759765625, 6.583984375, 7.064208984375, 7.54443359375, 8.024658203125, 8.5048828125, 8.985107421875, 9.46533203125, 9.945556640625, 10.42578125, 10.906005859375, 11.38623046875, 11.866455078125, 12.3466796875, 12.826904296875, 13.30712890625, 13.787353515625, 14.267578125, 14.747802734375, 15.22802734375, 15.708251953125, 16.1884765625, 16.668701171875, 17.14892578125, 17.629150390625, 18.109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 8.0, 24.0, 19.0, 27.0, 22.0, 42.0, 61.0, 70.0, 110.0, 127.0, 159.0, 174.0, 261.0, 391.0, 665.0, 10677.0, 4166867.0, 12489.0, 734.0, 356.0, 255.0, 170.0, 145.0, 115.0, 81.0, 55.0, 54.0, 17.0, 17.0, 26.0, 13.0, 10.0, 7.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-93.625, -91.060546875, -88.49609375, -85.931640625, -83.3671875, -80.802734375, -78.23828125, -75.673828125, -73.109375, -70.544921875, -67.98046875, -65.416015625, -62.8515625, -60.287109375, -57.72265625, -55.158203125, -52.59375, -50.029296875, -47.46484375, -44.900390625, -42.3359375, -39.771484375, -37.20703125, -34.642578125, -32.078125, -29.513671875, -26.94921875, -24.384765625, -21.8203125, -19.255859375, -16.69140625, -14.126953125, -11.5625, -8.998046875, -6.43359375, -3.869140625, -1.3046875, 1.259765625, 3.82421875, 6.388671875, 8.953125, 11.517578125, 14.08203125, 16.646484375, 19.2109375, 21.775390625, 24.33984375, 26.904296875, 29.46875, 32.033203125, 34.59765625, 37.162109375, 39.7265625, 42.291015625, 44.85546875, 47.419921875, 49.984375, 52.548828125, 55.11328125, 57.677734375, 60.2421875, 62.806640625, 65.37109375, 67.935546875, 70.5]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 16.0, 102.0, 360.0, 414.0, 113.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.88794708251953, -78.63007354736328, -73.3721923828125, -68.11431884765625, -62.856441497802734, -57.59856414794922, -52.34069061279297, -47.08281326293945, -41.82493591308594, -36.56705856323242, -31.30918312072754, -26.051307678222656, -20.79343032836914, -15.535552978515625, -10.277677536010742, -5.019802093505859, 0.23807525634765625, 5.4959516525268555, 10.753828048706055, 16.011703491210938, 21.269580841064453, 26.52745819091797, 31.78533363342285, 37.043209075927734, 42.30108642578125, 47.558963775634766, 52.81684112548828, 58.07471466064453, 63.33259201049805, 68.59046936035156, 73.84834289550781, 79.10621643066406, 84.36410522460938, 89.62197875976562, 94.8798599243164, 100.13773345947266, 105.39561462402344, 110.65348815917969, 115.91136169433594, 121.16923522949219, 126.42711639404297, 131.68499755859375, 136.94287109375, 142.20074462890625, 147.4586181640625, 152.71649169921875, 157.97438049316406, 163.2322540283203, 168.49012756347656, 173.7480010986328, 179.00587463378906, 184.26376342773438, 189.52163696289062, 194.77951049804688, 200.03738403320312, 205.29525756835938, 210.55313110351562, 215.81100463867188, 221.06887817382812, 226.32676696777344, 231.5846405029297, 236.84251403808594, 242.1003875732422, 247.35826110839844, 252.61614990234375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 6.0, 7.0, 7.0, 8.0, 10.0, 10.0, 12.0, 13.0, 15.0, 17.0, 23.0, 38.0, 23.0, 32.0, 26.0, 28.0, 45.0, 25.0, 45.0, 41.0, 35.0, 31.0, 36.0, 46.0, 47.0, 28.0, 25.0, 46.0, 31.0, 35.0, 23.0, 19.0, 16.0, 22.0, 14.0, 16.0, 11.0, 15.0, 13.0, 7.0, 5.0, 5.0, 4.0, 10.0, 5.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 5.0], "bins": [-39.92527770996094, -38.73172378540039, -37.53817367553711, -36.34461975097656, -35.15106964111328, -33.957515716552734, -32.76396179199219, -31.570409774780273, -30.37685775756836, -29.183305740356445, -27.98975372314453, -26.796199798583984, -25.60264778137207, -24.409095764160156, -23.21554183959961, -22.021989822387695, -20.82843780517578, -19.634885787963867, -18.441333770751953, -17.247779846191406, -16.054227828979492, -14.860675811767578, -13.667122840881348, -12.473569869995117, -11.280017852783203, -10.086465835571289, -8.892912864685059, -7.699360370635986, -6.505807876586914, -5.312255382537842, -4.1187028884887695, -2.925149917602539, -1.731597900390625, -0.5380454063415527, 0.6555070877075195, 1.8490595817565918, 3.042612075805664, 4.236164569854736, 5.429717063903809, 6.623270034790039, 7.816822052001953, 9.010374069213867, 10.203927040100098, 11.397480010986328, 12.591032028198242, 13.784584045410156, 14.978137016296387, 16.171689987182617, 17.36524200439453, 18.558794021606445, 19.75234603881836, 20.945899963378906, 22.13945198059082, 23.333003997802734, 24.52655792236328, 25.720109939575195, 26.91366195678711, 28.107213973999023, 29.300765991210938, 30.494319915771484, 31.6878719329834, 32.88142395019531, 34.07497787475586, 35.268531799316406, 36.46208190917969]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 14.0, 10.0, 8.0, 15.0, 18.0, 15.0, 26.0, 21.0, 28.0, 33.0, 24.0, 34.0, 37.0, 24.0, 46.0, 26.0, 46.0, 40.0, 46.0, 50.0, 46.0, 31.0, 45.0, 35.0, 30.0, 35.0, 33.0, 28.0, 23.0, 22.0, 19.0, 23.0, 17.0, 11.0, 5.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.3203125, -7.1068115234375, -6.893310546875, -6.6798095703125, -6.46630859375, -6.2528076171875, -6.039306640625, -5.8258056640625, -5.6123046875, -5.3988037109375, -5.185302734375, -4.9718017578125, -4.75830078125, -4.5447998046875, -4.331298828125, -4.1177978515625, -3.904296875, -3.6907958984375, -3.477294921875, -3.2637939453125, -3.05029296875, -2.8367919921875, -2.623291015625, -2.4097900390625, -2.1962890625, -1.9827880859375, -1.769287109375, -1.5557861328125, -1.34228515625, -1.1287841796875, -0.915283203125, -0.7017822265625, -0.48828125, -0.2747802734375, -0.061279296875, 0.1522216796875, 0.36572265625, 0.5792236328125, 0.792724609375, 1.0062255859375, 1.2197265625, 1.4332275390625, 1.646728515625, 1.8602294921875, 2.07373046875, 2.2872314453125, 2.500732421875, 2.7142333984375, 2.927734375, 3.1412353515625, 3.354736328125, 3.5682373046875, 3.78173828125, 3.9952392578125, 4.208740234375, 4.4222412109375, 4.6357421875, 4.8492431640625, 5.062744140625, 5.2762451171875, 5.48974609375, 5.7032470703125, 5.916748046875, 6.1302490234375, 6.34375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 6.0, 4.0, 8.0, 12.0, 23.0, 31.0, 58.0, 64.0, 112.0, 168.0, 207.0, 325.0, 560.0, 721.0, 1117.0, 1641.0, 2546.0, 3879.0, 5845.0, 9047.0, 14342.0, 22882.0, 36683.0, 61125.0, 109902.0, 292002.0, 237221.0, 99040.0, 55891.0, 33952.0, 20936.0, 13383.0, 8579.0, 5495.0, 3588.0, 2404.0, 1599.0, 1023.0, 688.0, 454.0, 297.0, 244.0, 161.0, 95.0, 68.0, 47.0, 28.0, 19.0, 18.0, 12.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.349609375, -1.3073272705078125, -1.265045166015625, -1.2227630615234375, -1.18048095703125, -1.1381988525390625, -1.095916748046875, -1.0536346435546875, -1.0113525390625, -0.9690704345703125, -0.926788330078125, -0.8845062255859375, -0.84222412109375, -0.7999420166015625, -0.757659912109375, -0.7153778076171875, -0.673095703125, -0.6308135986328125, -0.588531494140625, -0.5462493896484375, -0.50396728515625, -0.4616851806640625, -0.419403076171875, -0.3771209716796875, -0.3348388671875, -0.2925567626953125, -0.250274658203125, -0.2079925537109375, -0.16571044921875, -0.1234283447265625, -0.081146240234375, -0.0388641357421875, 0.00341796875, 0.0457000732421875, 0.087982177734375, 0.1302642822265625, 0.17254638671875, 0.2148284912109375, 0.257110595703125, 0.2993927001953125, 0.3416748046875, 0.3839569091796875, 0.426239013671875, 0.4685211181640625, 0.51080322265625, 0.5530853271484375, 0.595367431640625, 0.6376495361328125, 0.679931640625, 0.7222137451171875, 0.764495849609375, 0.8067779541015625, 0.84906005859375, 0.8913421630859375, 0.933624267578125, 0.9759063720703125, 1.0181884765625, 1.0604705810546875, 1.102752685546875, 1.1450347900390625, 1.18731689453125, 1.2295989990234375, 1.271881103515625, 1.3141632080078125, 1.3564453125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 7.0, 12.0, 12.0, 12.0, 16.0, 18.0, 23.0, 22.0, 21.0, 21.0, 37.0, 31.0, 33.0, 42.0, 46.0, 39.0, 42.0, 39.0, 1069.0, 44.0, 25.0, 49.0, 40.0, 29.0, 34.0, 25.0, 26.0, 22.0, 18.0, 22.0, 21.0, 23.0, 19.0, 16.0, 14.0, 12.0, 6.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.52734375, -4.3922119140625, -4.257080078125, -4.1219482421875, -3.98681640625, -3.8516845703125, -3.716552734375, -3.5814208984375, -3.4462890625, -3.3111572265625, -3.176025390625, -3.0408935546875, -2.90576171875, -2.7706298828125, -2.635498046875, -2.5003662109375, -2.365234375, -2.2301025390625, -2.094970703125, -1.9598388671875, -1.82470703125, -1.6895751953125, -1.554443359375, -1.4193115234375, -1.2841796875, -1.1490478515625, -1.013916015625, -0.8787841796875, -0.74365234375, -0.6085205078125, -0.473388671875, -0.3382568359375, -0.203125, -0.0679931640625, 0.067138671875, 0.2022705078125, 0.33740234375, 0.4725341796875, 0.607666015625, 0.7427978515625, 0.8779296875, 1.0130615234375, 1.148193359375, 1.2833251953125, 1.41845703125, 1.5535888671875, 1.688720703125, 1.8238525390625, 1.958984375, 2.0941162109375, 2.229248046875, 2.3643798828125, 2.49951171875, 2.6346435546875, 2.769775390625, 2.9049072265625, 3.0400390625, 3.1751708984375, 3.310302734375, 3.4454345703125, 3.58056640625, 3.7156982421875, 3.850830078125, 3.9859619140625, 4.12109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 11.0, 18.0, 20.0, 31.0, 36.0, 89.0, 97.0, 169.0, 236.0, 402.0, 580.0, 947.0, 1506.0, 2344.0, 3861.0, 6089.0, 10012.0, 16034.0, 25786.0, 43241.0, 79449.0, 176148.0, 1428676.0, 137278.0, 66479.0, 37223.0, 22747.0, 14077.0, 8956.0, 5477.0, 3420.0, 2085.0, 1297.0, 808.0, 525.0, 332.0, 226.0, 149.0, 82.0, 62.0, 34.0, 32.0, 24.0, 11.0, 10.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.388275146484375, -1.34100341796875, -1.293731689453125, -1.2464599609375, -1.199188232421875, -1.15191650390625, -1.104644775390625, -1.057373046875, -1.010101318359375, -0.96282958984375, -0.915557861328125, -0.8682861328125, -0.821014404296875, -0.77374267578125, -0.726470947265625, -0.67919921875, -0.631927490234375, -0.58465576171875, -0.537384033203125, -0.4901123046875, -0.442840576171875, -0.39556884765625, -0.348297119140625, -0.301025390625, -0.253753662109375, -0.20648193359375, -0.159210205078125, -0.1119384765625, -0.064666748046875, -0.01739501953125, 0.029876708984375, 0.0771484375, 0.124420166015625, 0.17169189453125, 0.218963623046875, 0.2662353515625, 0.313507080078125, 0.36077880859375, 0.408050537109375, 0.455322265625, 0.502593994140625, 0.54986572265625, 0.597137451171875, 0.6444091796875, 0.691680908203125, 0.73895263671875, 0.786224365234375, 0.83349609375, 0.880767822265625, 0.92803955078125, 0.975311279296875, 1.0225830078125, 1.069854736328125, 1.11712646484375, 1.164398193359375, 1.211669921875, 1.258941650390625, 1.30621337890625, 1.353485107421875, 1.4007568359375, 1.448028564453125, 1.49530029296875, 1.542572021484375, 1.58984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 8.0, 7.0, 5.0, 12.0, 13.0, 27.0, 17.0, 40.0, 43.0, 55.0, 70.0, 99.0, 91.0, 85.0, 86.0, 61.0, 50.0, 64.0, 31.0, 35.0, 22.0, 17.0, 9.0, 9.0, 8.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008935928344726562, -0.0008617788553237915, -0.0008299648761749268, -0.000798150897026062, -0.0007663369178771973, -0.0007345229387283325, -0.0007027089595794678, -0.000670894980430603, -0.0006390810012817383, -0.0006072670221328735, -0.0005754530429840088, -0.000543639063835144, -0.0005118250846862793, -0.00048001110553741455, -0.0004481971263885498, -0.00041638314723968506, -0.0003845691680908203, -0.00035275518894195557, -0.0003209412097930908, -0.0002891272306442261, -0.00025731325149536133, -0.00022549927234649658, -0.00019368529319763184, -0.0001618713140487671, -0.00013005733489990234, -9.82433557510376e-05, -6.642937660217285e-05, -3.4615397453308105e-05, -2.8014183044433594e-06, 2.9012560844421387e-05, 6.082653999328613e-05, 9.264051914215088e-05, 0.00012445449829101562, 0.00015626847743988037, 0.00018808245658874512, 0.00021989643573760986, 0.0002517104148864746, 0.00028352439403533936, 0.0003153383731842041, 0.00034715235233306885, 0.0003789663314819336, 0.00041078031063079834, 0.0004425942897796631, 0.00047440826892852783, 0.0005062222480773926, 0.0005380362272262573, 0.0005698502063751221, 0.0006016641855239868, 0.0006334781646728516, 0.0006652921438217163, 0.0006971061229705811, 0.0007289201021194458, 0.0007607340812683105, 0.0007925480604171753, 0.00082436203956604, 0.0008561760187149048, 0.0008879899978637695, 0.0009198039770126343, 0.000951617956161499, 0.0009834319353103638, 0.0010152459144592285, 0.0010470598936080933, 0.001078873872756958, 0.0011106878519058228, 0.0011425018310546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 5.0, 6.0, 4.0, 13.0, 10.0, 24.0, 25.0, 31.0, 44.0, 76.0, 98.0, 146.0, 370.0, 1669.0, 1035529.0, 9303.0, 596.0, 204.0, 115.0, 77.0, 52.0, 38.0, 29.0, 19.0, 15.0, 9.0, 4.0, 8.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0273590087890625, -0.026613235473632812, -0.025867462158203125, -0.025121688842773438, -0.02437591552734375, -0.023630142211914062, -0.022884368896484375, -0.022138595581054688, -0.021392822265625, -0.020647048950195312, -0.019901275634765625, -0.019155502319335938, -0.01840972900390625, -0.017663955688476562, -0.016918182373046875, -0.016172409057617188, -0.0154266357421875, -0.014680862426757812, -0.013935089111328125, -0.013189315795898438, -0.01244354248046875, -0.011697769165039062, -0.010951995849609375, -0.010206222534179688, -0.00946044921875, -0.008714675903320312, -0.007968902587890625, -0.0072231292724609375, -0.00647735595703125, -0.0057315826416015625, -0.004985809326171875, -0.0042400360107421875, -0.0034942626953125, -0.0027484893798828125, -0.002002716064453125, -0.0012569427490234375, -0.00051116943359375, 0.0002346038818359375, 0.000980377197265625, 0.0017261505126953125, 0.002471923828125, 0.0032176971435546875, 0.003963470458984375, 0.0047092437744140625, 0.00545501708984375, 0.0062007904052734375, 0.006946563720703125, 0.0076923370361328125, 0.0084381103515625, 0.009183883666992188, 0.009929656982421875, 0.010675430297851562, 0.01142120361328125, 0.012166976928710938, 0.012912750244140625, 0.013658523559570312, 0.014404296875, 0.015150070190429688, 0.015895843505859375, 0.016641616821289062, 0.01738739013671875, 0.018133163452148438, 0.018878936767578125, 0.019624710083007812, 0.0203704833984375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 31.0, 266.0, 545.0, 157.0, 14.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006333711207844317, -0.0005657888832502067, -0.0004982065875083208, -0.0004306243499740958, -0.00036304211243987083, -0.00029545987490564585, -0.0002278776082675904, -0.00016029534162953496, -9.271310409530997e-05, -2.5130852009169757e-05, 4.245140007697046e-05, 0.00011003365216311067, 0.0001776159042492509, 0.0002451981417834759, 0.0003127804084215313, 0.00038036267505958676, 0.00044794491259381175, 0.0005155271501280367, 0.0005831094458699226, 0.0006506916834041476, 0.0007182739209383726, 0.0007858561584725976, 0.0008534383960068226, 0.0009210206917487085, 0.0009886028710752726, 0.0010561851086094975, 0.0011237673461437225, 0.0011913495836779475, 0.0012589318212121725, 0.0013265141751617193, 0.0013940964126959443, 0.0014616786502301693, 0.0015292607713490725, 0.0015968430088832974, 0.0016644252464175224, 0.0017320074839517474, 0.0017995897214859724, 0.0018671720754355192, 0.0019347543129697442, 0.002002336550503969, 0.002069918904453516, 0.002137501258403063, 0.002205083379521966, 0.002272665733471513, 0.002340247854590416, 0.0024078302085399628, 0.002475412329658866, 0.0025429946836084127, 0.002610576804727316, 0.0026781591586768627, 0.002745741279795766, 0.0028133236337453127, 0.002880905754864216, 0.0029484881088137627, 0.003016070229932666, 0.0030836525838822126, 0.003151234705001116, 0.0032188170589506626, 0.0032863991800695658, 0.0033539815340191126, 0.0034215636551380157, 0.0034891460090875626, 0.0035567281302064657, 0.0036243104841560125, 0.0036918928381055593]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 4.0, 6.0, 10.0, 5.0, 11.0, 12.0, 19.0, 14.0, 17.0, 25.0, 24.0, 30.0, 38.0, 31.0, 44.0, 36.0, 43.0, 50.0, 44.0, 47.0, 35.0, 45.0, 37.0, 39.0, 39.0, 46.0, 31.0, 33.0, 21.0, 32.0, 18.0, 27.0, 23.0, 14.0, 8.0, 15.0, 6.0, 10.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044846534729003906, -0.00043472088873386383, -0.0004209764301776886, -0.00040723197162151337, -0.00039348751306533813, -0.0003797430545091629, -0.00036599859595298767, -0.00035225413739681244, -0.0003385096788406372, -0.000324765220284462, -0.00031102076172828674, -0.0002972763031721115, -0.0002835318446159363, -0.00026978738605976105, -0.0002560429275035858, -0.00024229846894741058, -0.00022855401039123535, -0.00021480955183506012, -0.0002010650932788849, -0.00018732063472270966, -0.00017357617616653442, -0.0001598317176103592, -0.00014608725905418396, -0.00013234280049800873, -0.0001185983419418335, -0.00010485388338565826, -9.110942482948303e-05, -7.73649662733078e-05, -6.362050771713257e-05, -4.9876049160957336e-05, -3.6131590604782104e-05, -2.2387132048606873e-05, -8.64267349243164e-06, 5.101785063743591e-06, 1.8846243619918823e-05, 3.2590702176094055e-05, 4.633516073226929e-05, 6.007961928844452e-05, 7.382407784461975e-05, 8.756853640079498e-05, 0.00010131299495697021, 0.00011505745351314545, 0.00012880191206932068, 0.0001425463706254959, 0.00015629082918167114, 0.00017003528773784637, 0.0001837797462940216, 0.00019752420485019684, 0.00021126866340637207, 0.0002250131219625473, 0.00023875758051872253, 0.00025250203907489777, 0.000266246497631073, 0.00027999095618724823, 0.00029373541474342346, 0.0003074798732995987, 0.0003212243318557739, 0.00033496879041194916, 0.0003487132489681244, 0.0003624577075242996, 0.00037620216608047485, 0.0003899466246366501, 0.0004036910831928253, 0.00041743554174900055, 0.0004311800003051758]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 14.0, 10.0, 8.0, 15.0, 18.0, 15.0, 26.0, 21.0, 28.0, 33.0, 24.0, 34.0, 37.0, 24.0, 46.0, 26.0, 46.0, 40.0, 46.0, 50.0, 46.0, 31.0, 45.0, 35.0, 30.0, 35.0, 33.0, 28.0, 23.0, 22.0, 19.0, 23.0, 17.0, 11.0, 5.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.3203125, -7.1068115234375, -6.893310546875, -6.6798095703125, -6.46630859375, -6.2528076171875, -6.039306640625, -5.8258056640625, -5.6123046875, -5.3988037109375, -5.185302734375, -4.9718017578125, -4.75830078125, -4.5447998046875, -4.331298828125, -4.1177978515625, -3.904296875, -3.6907958984375, -3.477294921875, -3.2637939453125, -3.05029296875, -2.8367919921875, -2.623291015625, -2.4097900390625, -2.1962890625, -1.9827880859375, -1.769287109375, -1.5557861328125, -1.34228515625, -1.1287841796875, -0.915283203125, -0.7017822265625, -0.48828125, -0.2747802734375, -0.061279296875, 0.1522216796875, 0.36572265625, 0.5792236328125, 0.792724609375, 1.0062255859375, 1.2197265625, 1.4332275390625, 1.646728515625, 1.8602294921875, 2.07373046875, 2.2872314453125, 2.500732421875, 2.7142333984375, 2.927734375, 3.1412353515625, 3.354736328125, 3.5682373046875, 3.78173828125, 3.9952392578125, 4.208740234375, 4.4222412109375, 4.6357421875, 4.8492431640625, 5.062744140625, 5.2762451171875, 5.48974609375, 5.7032470703125, 5.916748046875, 6.1302490234375, 6.34375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 10.0, 15.0, 19.0, 15.0, 18.0, 38.0, 33.0, 47.0, 79.0, 96.0, 135.0, 195.0, 310.0, 480.0, 1058.0, 2872.0, 8993.0, 32828.0, 132748.0, 515193.0, 266012.0, 62327.0, 16533.0, 4938.0, 1691.0, 693.0, 362.0, 208.0, 185.0, 99.0, 76.0, 65.0, 50.0, 29.0, 32.0, 17.0, 10.0, 13.0, 5.0, 15.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.1328125, -7.898681640625, -7.66455078125, -7.430419921875, -7.1962890625, -6.962158203125, -6.72802734375, -6.493896484375, -6.259765625, -6.025634765625, -5.79150390625, -5.557373046875, -5.3232421875, -5.089111328125, -4.85498046875, -4.620849609375, -4.38671875, -4.152587890625, -3.91845703125, -3.684326171875, -3.4501953125, -3.216064453125, -2.98193359375, -2.747802734375, -2.513671875, -2.279541015625, -2.04541015625, -1.811279296875, -1.5771484375, -1.343017578125, -1.10888671875, -0.874755859375, -0.640625, -0.406494140625, -0.17236328125, 0.061767578125, 0.2958984375, 0.530029296875, 0.76416015625, 0.998291015625, 1.232421875, 1.466552734375, 1.70068359375, 1.934814453125, 2.1689453125, 2.403076171875, 2.63720703125, 2.871337890625, 3.10546875, 3.339599609375, 3.57373046875, 3.807861328125, 4.0419921875, 4.276123046875, 4.51025390625, 4.744384765625, 4.978515625, 5.212646484375, 5.44677734375, 5.680908203125, 5.9150390625, 6.149169921875, 6.38330078125, 6.617431640625, 6.8515625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 9.0, 11.0, 7.0, 7.0, 8.0, 12.0, 13.0, 24.0, 22.0, 24.0, 42.0, 40.0, 38.0, 40.0, 51.0, 43.0, 86.0, 278.0, 1701.0, 140.0, 57.0, 39.0, 46.0, 52.0, 41.0, 25.0, 33.0, 24.0, 15.0, 19.0, 14.0, 25.0, 18.0, 7.0, 8.0, 10.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.610107421875, -18.89208984375, -18.174072265625, -17.4560546875, -16.738037109375, -16.02001953125, -15.302001953125, -14.583984375, -13.865966796875, -13.14794921875, -12.429931640625, -11.7119140625, -10.993896484375, -10.27587890625, -9.557861328125, -8.83984375, -8.121826171875, -7.40380859375, -6.685791015625, -5.9677734375, -5.249755859375, -4.53173828125, -3.813720703125, -3.095703125, -2.377685546875, -1.65966796875, -0.941650390625, -0.2236328125, 0.494384765625, 1.21240234375, 1.930419921875, 2.6484375, 3.366455078125, 4.08447265625, 4.802490234375, 5.5205078125, 6.238525390625, 6.95654296875, 7.674560546875, 8.392578125, 9.110595703125, 9.82861328125, 10.546630859375, 11.2646484375, 11.982666015625, 12.70068359375, 13.418701171875, 14.13671875, 14.854736328125, 15.57275390625, 16.290771484375, 17.0087890625, 17.726806640625, 18.44482421875, 19.162841796875, 19.880859375, 20.598876953125, 21.31689453125, 22.034912109375, 22.7529296875, 23.470947265625, 24.18896484375, 24.906982421875, 25.625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 9.0, 9.0, 14.0, 10.0, 25.0, 37.0, 35.0, 35.0, 44.0, 55.0, 93.0, 122.0, 136.0, 237.0, 311.0, 564.0, 2221.0, 2128167.0, 1009792.0, 2067.0, 532.0, 331.0, 219.0, 150.0, 106.0, 85.0, 59.0, 55.0, 41.0, 18.0, 21.0, 14.0, 11.0, 20.0, 11.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.15625, -50.57470703125, -48.9931640625, -47.41162109375, -45.830078125, -44.24853515625, -42.6669921875, -41.08544921875, -39.50390625, -37.92236328125, -36.3408203125, -34.75927734375, -33.177734375, -31.59619140625, -30.0146484375, -28.43310546875, -26.8515625, -25.27001953125, -23.6884765625, -22.10693359375, -20.525390625, -18.94384765625, -17.3623046875, -15.78076171875, -14.19921875, -12.61767578125, -11.0361328125, -9.45458984375, -7.873046875, -6.29150390625, -4.7099609375, -3.12841796875, -1.546875, 0.03466796875, 1.6162109375, 3.19775390625, 4.779296875, 6.36083984375, 7.9423828125, 9.52392578125, 11.10546875, 12.68701171875, 14.2685546875, 15.85009765625, 17.431640625, 19.01318359375, 20.5947265625, 22.17626953125, 23.7578125, 25.33935546875, 26.9208984375, 28.50244140625, 30.083984375, 31.66552734375, 33.2470703125, 34.82861328125, 36.41015625, 37.99169921875, 39.5732421875, 41.15478515625, 42.736328125, 44.31787109375, 45.8994140625, 47.48095703125, 49.0625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 650.0, 363.0], "bins": [-341.5059814453125, -336.0758056640625, -330.6456298828125, -325.2154541015625, -319.7853088378906, -314.3551330566406, -308.9249572753906, -303.4947814941406, -298.0646057128906, -292.6344299316406, -287.2042541503906, -281.77410888671875, -276.34393310546875, -270.91375732421875, -265.48358154296875, -260.05340576171875, -254.6232452392578, -249.1930694580078, -243.76290893554688, -238.33273315429688, -232.90255737304688, -227.47238159179688, -222.04222106933594, -216.61204528808594, -211.181884765625, -205.751708984375, -200.32154846191406, -194.89137268066406, -189.46119689941406, -184.03103637695312, -178.60086059570312, -173.17068481445312, -167.74050903320312, -162.31033325195312, -156.8801727294922, -151.4499969482422, -146.0198211669922, -140.58966064453125, -135.15948486328125, -129.72930908203125, -124.29913330078125, -118.86896514892578, -113.43878936767578, -108.00862121582031, -102.57844543457031, -97.14827728271484, -91.71810913085938, -86.28793334960938, -80.8577651977539, -75.42759704589844, -69.99742126464844, -64.56725311279297, -59.137081146240234, -53.7069091796875, -48.27674102783203, -42.8465690612793, -37.41639709472656, -31.986225128173828, -26.556055068969727, -21.125885009765625, -15.69571304321289, -10.265541076660156, -4.8353729248046875, 0.5947990417480469, 6.024970054626465]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 12.0, 18.0, 24.0, 19.0, 19.0, 18.0, 27.0, 28.0, 28.0, 28.0, 30.0, 50.0, 39.0, 36.0, 45.0, 51.0, 47.0, 37.0, 50.0, 47.0, 42.0, 28.0, 49.0, 26.0, 25.0, 27.0, 26.0, 16.0, 20.0, 15.0, 9.0, 13.0, 8.0, 7.0, 10.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.000572204589844, -48.26482009887695, -46.52906799316406, -44.79331970214844, -43.05756759643555, -41.321815490722656, -39.586063385009766, -37.850311279296875, -36.11456298828125, -34.37881088256836, -32.64305877685547, -30.90730857849121, -29.171558380126953, -27.435806274414062, -25.700054168701172, -23.96430206298828, -22.22854995727539, -20.4927978515625, -18.757047653198242, -17.02129554748535, -15.285544395446777, -13.549793243408203, -11.814041137695312, -10.078289985656738, -8.342538833618164, -6.60678768157959, -4.871036052703857, -3.135284423828125, -1.3995332717895508, 0.33621788024902344, 2.071969985961914, 3.8077211380004883, 5.543468475341797, 7.279219627380371, 9.014970779418945, 10.750722885131836, 12.48647403717041, 14.222225189208984, 15.957977294921875, 17.693729400634766, 19.429479598999023, 21.165231704711914, 22.900981903076172, 24.636734008789062, 26.372486114501953, 28.10823631286621, 29.8439884185791, 31.57973861694336, 33.31549072265625, 35.05124282836914, 36.78699493408203, 38.522743225097656, 40.25849533081055, 41.99424743652344, 43.72999954223633, 45.46575164794922, 47.201499938964844, 48.937252044677734, 50.673004150390625, 52.40875244140625, 54.14450454711914, 55.88025665283203, 57.61600875854492, 59.35176086425781, 61.0875129699707]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 7.0, 6.0, 7.0, 17.0, 12.0, 12.0, 21.0, 20.0, 14.0, 29.0, 34.0, 22.0, 24.0, 34.0, 40.0, 26.0, 34.0, 45.0, 33.0, 48.0, 52.0, 43.0, 40.0, 41.0, 34.0, 37.0, 27.0, 32.0, 33.0, 26.0, 25.0, 14.0, 24.0, 21.0, 18.0, 13.0, 9.0, 5.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.7109375, -7.49066162109375, -7.2703857421875, -7.05010986328125, -6.829833984375, -6.60955810546875, -6.3892822265625, -6.16900634765625, -5.94873046875, -5.72845458984375, -5.5081787109375, -5.28790283203125, -5.067626953125, -4.84735107421875, -4.6270751953125, -4.40679931640625, -4.1865234375, -3.96624755859375, -3.7459716796875, -3.52569580078125, -3.305419921875, -3.08514404296875, -2.8648681640625, -2.64459228515625, -2.42431640625, -2.20404052734375, -1.9837646484375, -1.76348876953125, -1.543212890625, -1.32293701171875, -1.1026611328125, -0.88238525390625, -0.662109375, -0.44183349609375, -0.2215576171875, -0.00128173828125, 0.218994140625, 0.43927001953125, 0.6595458984375, 0.87982177734375, 1.10009765625, 1.32037353515625, 1.5406494140625, 1.76092529296875, 1.981201171875, 2.20147705078125, 2.4217529296875, 2.64202880859375, 2.8623046875, 3.08258056640625, 3.3028564453125, 3.52313232421875, 3.743408203125, 3.96368408203125, 4.1839599609375, 4.40423583984375, 4.62451171875, 4.84478759765625, 5.0650634765625, 5.28533935546875, 5.505615234375, 5.72589111328125, 5.9461669921875, 6.16644287109375, 6.38671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 7.0, 8.0, 10.0, 17.0, 18.0, 18.0, 19.0, 20.0, 35.0, 46.0, 70.0, 85.0, 137.0, 201.0, 389.0, 985.0, 4635.0, 258992.0, 3760622.0, 162136.0, 3963.0, 814.0, 389.0, 194.0, 125.0, 83.0, 72.0, 27.0, 37.0, 23.0, 22.0, 22.0, 11.0, 12.0, 12.0, 5.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-30.171875, -29.34423828125, -28.5166015625, -27.68896484375, -26.861328125, -26.03369140625, -25.2060546875, -24.37841796875, -23.55078125, -22.72314453125, -21.8955078125, -21.06787109375, -20.240234375, -19.41259765625, -18.5849609375, -17.75732421875, -16.9296875, -16.10205078125, -15.2744140625, -14.44677734375, -13.619140625, -12.79150390625, -11.9638671875, -11.13623046875, -10.30859375, -9.48095703125, -8.6533203125, -7.82568359375, -6.998046875, -6.17041015625, -5.3427734375, -4.51513671875, -3.6875, -2.85986328125, -2.0322265625, -1.20458984375, -0.376953125, 0.45068359375, 1.2783203125, 2.10595703125, 2.93359375, 3.76123046875, 4.5888671875, 5.41650390625, 6.244140625, 7.07177734375, 7.8994140625, 8.72705078125, 9.5546875, 10.38232421875, 11.2099609375, 12.03759765625, 12.865234375, 13.69287109375, 14.5205078125, 15.34814453125, 16.17578125, 17.00341796875, 17.8310546875, 18.65869140625, 19.486328125, 20.31396484375, 21.1416015625, 21.96923828125, 22.796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 11.0, 14.0, 21.0, 31.0, 46.0, 66.0, 90.0, 148.0, 184.0, 267.0, 345.0, 476.0, 550.0, 534.0, 378.0, 262.0, 172.0, 142.0, 89.0, 73.0, 38.0, 37.0, 27.0, 17.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.072998046875, -9.64599609375, -9.218994140625, -8.7919921875, -8.364990234375, -7.93798828125, -7.510986328125, -7.083984375, -6.656982421875, -6.22998046875, -5.802978515625, -5.3759765625, -4.948974609375, -4.52197265625, -4.094970703125, -3.66796875, -3.240966796875, -2.81396484375, -2.386962890625, -1.9599609375, -1.532958984375, -1.10595703125, -0.678955078125, -0.251953125, 0.175048828125, 0.60205078125, 1.029052734375, 1.4560546875, 1.883056640625, 2.31005859375, 2.737060546875, 3.1640625, 3.591064453125, 4.01806640625, 4.445068359375, 4.8720703125, 5.299072265625, 5.72607421875, 6.153076171875, 6.580078125, 7.007080078125, 7.43408203125, 7.861083984375, 8.2880859375, 8.715087890625, 9.14208984375, 9.569091796875, 9.99609375, 10.423095703125, 10.85009765625, 11.277099609375, 11.7041015625, 12.131103515625, 12.55810546875, 12.985107421875, 13.412109375, 13.839111328125, 14.26611328125, 14.693115234375, 15.1201171875, 15.547119140625, 15.97412109375, 16.401123046875, 16.828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 4.0, 4.0, 5.0, 12.0, 21.0, 20.0, 24.0, 51.0, 57.0, 85.0, 84.0, 106.0, 158.0, 229.0, 288.0, 461.0, 1168.0, 831054.0, 3357114.0, 1551.0, 508.0, 348.0, 226.0, 166.0, 133.0, 106.0, 65.0, 60.0, 44.0, 39.0, 22.0, 16.0, 18.0, 11.0, 6.0, 2.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-101.8125, -99.1376953125, -96.462890625, -93.7880859375, -91.11328125, -88.4384765625, -85.763671875, -83.0888671875, -80.4140625, -77.7392578125, -75.064453125, -72.3896484375, -69.71484375, -67.0400390625, -64.365234375, -61.6904296875, -59.015625, -56.3408203125, -53.666015625, -50.9912109375, -48.31640625, -45.6416015625, -42.966796875, -40.2919921875, -37.6171875, -34.9423828125, -32.267578125, -29.5927734375, -26.91796875, -24.2431640625, -21.568359375, -18.8935546875, -16.21875, -13.5439453125, -10.869140625, -8.1943359375, -5.51953125, -2.8447265625, -0.169921875, 2.5048828125, 5.1796875, 7.8544921875, 10.529296875, 13.2041015625, 15.87890625, 18.5537109375, 21.228515625, 23.9033203125, 26.578125, 29.2529296875, 31.927734375, 34.6025390625, 37.27734375, 39.9521484375, 42.626953125, 45.3017578125, 47.9765625, 50.6513671875, 53.326171875, 56.0009765625, 58.67578125, 61.3505859375, 64.025390625, 66.7001953125, 69.375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 248.0, 562.0, 183.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.7583999633789, -98.92786407470703, -92.09733581542969, -85.26679992675781, -78.43626403808594, -71.60572814941406, -64.77519989013672, -57.944664001464844, -51.114131927490234, -44.283599853515625, -37.45306396484375, -30.62253189086914, -23.7919979095459, -16.961463928222656, -10.130931854248047, -3.300395965576172, 3.5301361083984375, 10.36067008972168, 17.191204071044922, 24.02173614501953, 30.852270126342773, 37.682804107666016, 44.513336181640625, 51.3438720703125, 58.17440414428711, 65.00493621826172, 71.8354721069336, 78.66600036621094, 85.49653625488281, 92.32707214355469, 99.15760803222656, 105.98814392089844, 112.81867980957031, 119.64921569824219, 126.47974395751953, 133.31027221679688, 140.14080810546875, 146.97134399414062, 153.8018798828125, 160.63241577148438, 167.46295166015625, 174.29348754882812, 181.1240234375, 187.95455932617188, 194.7850799560547, 201.61561584472656, 208.44615173339844, 215.2766876220703, 222.10720825195312, 228.937744140625, 235.76828002929688, 242.59881591796875, 249.42933654785156, 256.2598876953125, 263.09039306640625, 269.92095947265625, 276.7514953613281, 283.58203125, 290.4125671386719, 297.24310302734375, 304.0736389160156, 310.9041748046875, 317.73468017578125, 324.56524658203125, 331.395751953125]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 8.0, 7.0, 8.0, 8.0, 14.0, 23.0, 13.0, 23.0, 22.0, 18.0, 25.0, 30.0, 30.0, 35.0, 33.0, 48.0, 31.0, 43.0, 46.0, 39.0, 41.0, 35.0, 42.0, 33.0, 29.0, 35.0, 35.0, 29.0, 16.0, 38.0, 22.0, 22.0, 28.0, 14.0, 9.0, 9.0, 5.0, 15.0, 5.0, 4.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.08770751953125, -34.915348052978516, -33.74299240112305, -32.57063293457031, -31.39827537536621, -30.22591781616211, -29.053560256958008, -27.881202697753906, -26.708843231201172, -25.53648567199707, -24.36412811279297, -23.191768646240234, -22.019411087036133, -20.84705352783203, -19.67469596862793, -18.502338409423828, -17.329980850219727, -16.157623291015625, -14.985264778137207, -13.812907218933105, -12.640548706054688, -11.468191146850586, -10.295833587646484, -9.123475074768066, -7.951117515563965, -6.778759479522705, -5.606401443481445, -4.434043884277344, -3.261685848236084, -2.089327812194824, -0.9169702529907227, 0.2553882598876953, 1.4277458190917969, 2.6001038551330566, 3.7724616527557373, 4.944819450378418, 6.117177486419678, 7.2895355224609375, 8.461893081665039, 9.634251594543457, 10.806609153747559, 11.97896671295166, 13.151325225830078, 14.32368278503418, 15.496040344238281, 16.668399810791016, 17.840755462646484, 19.01311492919922, 20.18547248840332, 21.357830047607422, 22.530187606811523, 23.702545166015625, 24.87490463256836, 26.04726219177246, 27.219619750976562, 28.391979217529297, 29.564334869384766, 30.736692428588867, 31.90904998779297, 33.0814094543457, 34.25376510620117, 35.426124572753906, 36.598480224609375, 37.77083969116211, 38.943199157714844]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 8.0, 8.0, 23.0, 14.0, 21.0, 15.0, 16.0, 21.0, 24.0, 29.0, 24.0, 30.0, 38.0, 41.0, 41.0, 27.0, 42.0, 50.0, 41.0, 46.0, 39.0, 40.0, 44.0, 30.0, 31.0, 43.0, 30.0, 28.0, 16.0, 25.0, 14.0, 15.0, 14.0, 15.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.6953125, -7.47576904296875, -7.2562255859375, -7.03668212890625, -6.817138671875, -6.59759521484375, -6.3780517578125, -6.15850830078125, -5.93896484375, -5.71942138671875, -5.4998779296875, -5.28033447265625, -5.060791015625, -4.84124755859375, -4.6217041015625, -4.40216064453125, -4.1826171875, -3.96307373046875, -3.7435302734375, -3.52398681640625, -3.304443359375, -3.08489990234375, -2.8653564453125, -2.64581298828125, -2.42626953125, -2.20672607421875, -1.9871826171875, -1.76763916015625, -1.548095703125, -1.32855224609375, -1.1090087890625, -0.88946533203125, -0.669921875, -0.45037841796875, -0.2308349609375, -0.01129150390625, 0.208251953125, 0.42779541015625, 0.6473388671875, 0.86688232421875, 1.08642578125, 1.30596923828125, 1.5255126953125, 1.74505615234375, 1.964599609375, 2.18414306640625, 2.4036865234375, 2.62322998046875, 2.8427734375, 3.06231689453125, 3.2818603515625, 3.50140380859375, 3.720947265625, 3.94049072265625, 4.1600341796875, 4.37957763671875, 4.59912109375, 4.81866455078125, 5.0382080078125, 5.25775146484375, 5.477294921875, 5.69683837890625, 5.9163818359375, 6.13592529296875, 6.35546875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 14.0, 13.0, 26.0, 44.0, 67.0, 97.0, 150.0, 199.0, 293.0, 421.0, 620.0, 922.0, 1289.0, 1870.0, 2827.0, 4243.0, 6454.0, 10036.0, 15303.0, 24363.0, 38569.0, 63713.0, 112756.0, 280283.0, 225735.0, 100748.0, 57939.0, 35375.0, 22424.0, 14285.0, 9190.0, 5967.0, 4014.0, 2628.0, 1769.0, 1261.0, 822.0, 558.0, 412.0, 237.0, 187.0, 129.0, 90.0, 61.0, 49.0, 25.0, 19.0, 18.0, 10.0, 2.0, 6.0, 3.0, 3.0, 2.0, 3.0], "bins": [-1.39453125, -1.3521575927734375, -1.309783935546875, -1.2674102783203125, -1.22503662109375, -1.1826629638671875, -1.140289306640625, -1.0979156494140625, -1.0555419921875, -1.0131683349609375, -0.970794677734375, -0.9284210205078125, -0.88604736328125, -0.8436737060546875, -0.801300048828125, -0.7589263916015625, -0.716552734375, -0.6741790771484375, -0.631805419921875, -0.5894317626953125, -0.54705810546875, -0.5046844482421875, -0.462310791015625, -0.4199371337890625, -0.3775634765625, -0.3351898193359375, -0.292816162109375, -0.2504425048828125, -0.20806884765625, -0.1656951904296875, -0.123321533203125, -0.0809478759765625, -0.03857421875, 0.0037994384765625, 0.046173095703125, 0.0885467529296875, 0.13092041015625, 0.1732940673828125, 0.215667724609375, 0.2580413818359375, 0.3004150390625, 0.3427886962890625, 0.385162353515625, 0.4275360107421875, 0.46990966796875, 0.5122833251953125, 0.554656982421875, 0.5970306396484375, 0.639404296875, 0.6817779541015625, 0.724151611328125, 0.7665252685546875, 0.80889892578125, 0.8512725830078125, 0.893646240234375, 0.9360198974609375, 0.9783935546875, 1.0207672119140625, 1.063140869140625, 1.1055145263671875, 1.14788818359375, 1.1902618408203125, 1.232635498046875, 1.2750091552734375, 1.3173828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 10.0, 2.0, 8.0, 10.0, 5.0, 15.0, 10.0, 11.0, 17.0, 20.0, 17.0, 32.0, 18.0, 28.0, 23.0, 26.0, 46.0, 40.0, 33.0, 29.0, 34.0, 1076.0, 40.0, 45.0, 27.0, 48.0, 34.0, 36.0, 31.0, 39.0, 22.0, 28.0, 23.0, 20.0, 22.0, 18.0, 17.0, 15.0, 9.0, 10.0, 8.0, 4.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.92578125, -3.78997802734375, -3.6541748046875, -3.51837158203125, -3.382568359375, -3.24676513671875, -3.1109619140625, -2.97515869140625, -2.83935546875, -2.70355224609375, -2.5677490234375, -2.43194580078125, -2.296142578125, -2.16033935546875, -2.0245361328125, -1.88873291015625, -1.7529296875, -1.61712646484375, -1.4813232421875, -1.34552001953125, -1.209716796875, -1.07391357421875, -0.9381103515625, -0.80230712890625, -0.66650390625, -0.53070068359375, -0.3948974609375, -0.25909423828125, -0.123291015625, 0.01251220703125, 0.1483154296875, 0.28411865234375, 0.419921875, 0.55572509765625, 0.6915283203125, 0.82733154296875, 0.963134765625, 1.09893798828125, 1.2347412109375, 1.37054443359375, 1.50634765625, 1.64215087890625, 1.7779541015625, 1.91375732421875, 2.049560546875, 2.18536376953125, 2.3211669921875, 2.45697021484375, 2.5927734375, 2.72857666015625, 2.8643798828125, 3.00018310546875, 3.135986328125, 3.27178955078125, 3.4075927734375, 3.54339599609375, 3.67919921875, 3.81500244140625, 3.9508056640625, 4.08660888671875, 4.222412109375, 4.35821533203125, 4.4940185546875, 4.62982177734375, 4.765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 15.0, 17.0, 16.0, 28.0, 55.0, 77.0, 105.0, 173.0, 245.0, 380.0, 582.0, 871.0, 1328.0, 2029.0, 3168.0, 4934.0, 7639.0, 12348.0, 19414.0, 32114.0, 55818.0, 105097.0, 1340002.0, 271822.0, 101158.0, 53405.0, 31737.0, 19223.0, 11983.0, 7687.0, 4800.0, 3106.0, 1953.0, 1281.0, 844.0, 540.0, 347.0, 240.0, 181.0, 105.0, 76.0, 59.0, 39.0, 22.0, 27.0, 7.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0], "bins": [-1.6650390625, -1.617431640625, -1.56982421875, -1.522216796875, -1.474609375, -1.427001953125, -1.37939453125, -1.331787109375, -1.2841796875, -1.236572265625, -1.18896484375, -1.141357421875, -1.09375, -1.046142578125, -0.99853515625, -0.950927734375, -0.9033203125, -0.855712890625, -0.80810546875, -0.760498046875, -0.712890625, -0.665283203125, -0.61767578125, -0.570068359375, -0.5224609375, -0.474853515625, -0.42724609375, -0.379638671875, -0.33203125, -0.284423828125, -0.23681640625, -0.189208984375, -0.1416015625, -0.093994140625, -0.04638671875, 0.001220703125, 0.048828125, 0.096435546875, 0.14404296875, 0.191650390625, 0.2392578125, 0.286865234375, 0.33447265625, 0.382080078125, 0.4296875, 0.477294921875, 0.52490234375, 0.572509765625, 0.6201171875, 0.667724609375, 0.71533203125, 0.762939453125, 0.810546875, 0.858154296875, 0.90576171875, 0.953369140625, 1.0009765625, 1.048583984375, 1.09619140625, 1.143798828125, 1.19140625, 1.239013671875, 1.28662109375, 1.334228515625, 1.3818359375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 7.0, 16.0, 20.0, 14.0, 32.0, 32.0, 37.0, 46.0, 46.0, 46.0, 47.0, 55.0, 65.0, 66.0, 74.0, 60.0, 43.0, 38.0, 36.0, 37.0, 22.0, 30.0, 25.0, 17.0, 8.0, 7.0, 9.0, 6.0, 12.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008220672607421875, -0.0007936209440231323, -0.0007651746273040771, -0.000736728310585022, -0.0007082819938659668, -0.0006798356771469116, -0.0006513893604278564, -0.0006229430437088013, -0.0005944967269897461, -0.0005660504102706909, -0.0005376040935516357, -0.0005091577768325806, -0.0004807114601135254, -0.0004522651433944702, -0.00042381882667541504, -0.00039537250995635986, -0.0003669261932373047, -0.0003384798765182495, -0.00031003355979919434, -0.00028158724308013916, -0.000253140926361084, -0.0002246946096420288, -0.00019624829292297363, -0.00016780197620391846, -0.00013935565948486328, -0.0001109093427658081, -8.246302604675293e-05, -5.4016709327697754e-05, -2.5570392608642578e-05, 2.8759241104125977e-06, 3.1322240829467773e-05, 5.976855754852295e-05, 8.821487426757812e-05, 0.0001166611909866333, 0.00014510750770568848, 0.00017355382442474365, 0.00020200014114379883, 0.000230446457862854, 0.0002588927745819092, 0.00028733909130096436, 0.00031578540802001953, 0.0003442317247390747, 0.0003726780414581299, 0.00040112435817718506, 0.00042957067489624023, 0.0004580169916152954, 0.0004864633083343506, 0.0005149096250534058, 0.0005433559417724609, 0.0005718022584915161, 0.0006002485752105713, 0.0006286948919296265, 0.0006571412086486816, 0.0006855875253677368, 0.000714033842086792, 0.0007424801588058472, 0.0007709264755249023, 0.0007993727922439575, 0.0008278191089630127, 0.0008562654256820679, 0.000884711742401123, 0.0009131580591201782, 0.0009416043758392334, 0.0009700506925582886, 0.0009984970092773438]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 5.0, 9.0, 8.0, 10.0, 15.0, 19.0, 23.0, 28.0, 42.0, 31.0, 54.0, 71.0, 107.0, 153.0, 378.0, 1549.0, 1034899.0, 9947.0, 541.0, 181.0, 119.0, 84.0, 64.0, 38.0, 46.0, 19.0, 19.0, 23.0, 16.0, 10.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.025113821029663086, -0.024409770965576172, -0.023705720901489258, -0.023001670837402344, -0.02229762077331543, -0.021593570709228516, -0.0208895206451416, -0.020185470581054688, -0.019481420516967773, -0.01877737045288086, -0.018073320388793945, -0.01736927032470703, -0.016665220260620117, -0.015961170196533203, -0.015257120132446289, -0.014553070068359375, -0.013849020004272461, -0.013144969940185547, -0.012440919876098633, -0.011736869812011719, -0.011032819747924805, -0.01032876968383789, -0.009624719619750977, -0.008920669555664062, -0.008216619491577148, -0.007512569427490234, -0.00680851936340332, -0.006104469299316406, -0.005400419235229492, -0.004696369171142578, -0.003992319107055664, -0.00328826904296875, -0.002584218978881836, -0.0018801689147949219, -0.0011761188507080078, -0.00047206878662109375, 0.0002319812774658203, 0.0009360313415527344, 0.0016400814056396484, 0.0023441314697265625, 0.0030481815338134766, 0.0037522315979003906, 0.004456281661987305, 0.005160331726074219, 0.005864381790161133, 0.006568431854248047, 0.007272481918334961, 0.007976531982421875, 0.008680582046508789, 0.009384632110595703, 0.010088682174682617, 0.010792732238769531, 0.011496782302856445, 0.01220083236694336, 0.012904882431030273, 0.013608932495117188, 0.014312982559204102, 0.015017032623291016, 0.01572108268737793, 0.016425132751464844, 0.017129182815551758, 0.017833232879638672, 0.018537282943725586, 0.0192413330078125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 44.0, 113.0, 251.0, 251.0, 206.0, 89.0, 37.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005941957933828235, -0.0005617249989882112, -0.0005292542628012598, -0.0004967834684066474, -0.0004643127031158656, -0.00043184193782508373, -0.0003993711434304714, -0.00036690037813968956, -0.0003344296128489077, -0.00030195884755812585, -0.000269488082267344, -0.00023701728787273169, -0.00020454652258194983, -0.00017207575729116797, -0.0001396049774484709, -0.0001071341976057738, -7.466343231499195e-05, -4.219265974825248e-05, -9.721887181513011e-06, 2.274888538522646e-05, 5.521965795196593e-05, 8.769042324274778e-05, 0.00012016120308544487, 0.00015263198292814195, 0.0001851027482189238, 0.00021757351350970566, 0.0002500442788004875, 0.00028251507319509983, 0.0003149858384858817, 0.00034745660377666354, 0.00037992739817127585, 0.0004123981634620577, 0.00044486881233751774, 0.0004773395776282996, 0.0005098103429190814, 0.0005422811373136938, 0.0005747518735006452, 0.0006072226678952575, 0.0006396934622898698, 0.0006721642566844821, 0.0007046349928714335, 0.0007371057872660458, 0.0007695765234529972, 0.0008020473178476095, 0.0008345181122422218, 0.0008669888484291732, 0.0008994596428237855, 0.0009319303790107369, 0.0009644011734053493, 0.0009968719677999616, 0.0010293427621945739, 0.0010618134401738644, 0.0010942842345684767, 0.001126755028963089, 0.0011592258233577013, 0.0011916966177523136, 0.001224167412146926, 0.0012566382065415382, 0.0012891090009361506, 0.001321579678915441, 0.0013540504733100533, 0.0013865212677046657, 0.001418992062099278, 0.0014514628564938903, 0.0014839335344731808]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 6.0, 4.0, 8.0, 10.0, 8.0, 10.0, 10.0, 13.0, 20.0, 14.0, 18.0, 30.0, 29.0, 34.0, 41.0, 34.0, 41.0, 37.0, 39.0, 42.0, 43.0, 43.0, 46.0, 41.0, 37.0, 46.0, 38.0, 37.0, 23.0, 32.0, 28.0, 22.0, 24.0, 18.0, 18.0, 11.0, 5.0, 14.0, 9.0, 2.0, 9.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0005475282669067383, -0.0005324399098753929, -0.0005173515528440475, -0.0005022631958127022, -0.0004871748387813568, -0.00047208648175001144, -0.0004569981247186661, -0.0004419097676873207, -0.00042682141065597534, -0.00041173305362463, -0.0003966446965932846, -0.00038155633956193924, -0.00036646798253059387, -0.0003513796254992485, -0.00033629126846790314, -0.00032120291143655777, -0.0003061145544052124, -0.00029102619737386703, -0.00027593784034252167, -0.0002608494833111763, -0.00024576112627983093, -0.00023067276924848557, -0.0002155844122171402, -0.00020049605518579483, -0.00018540769815444946, -0.0001703193411231041, -0.00015523098409175873, -0.00014014262706041336, -0.000125054270029068, -0.00010996591299772263, -9.487755596637726e-05, -7.978919893503189e-05, -6.470084190368652e-05, -4.9612484872341156e-05, -3.452412784099579e-05, -1.943577080965042e-05, -4.347413778305054e-06, 1.0740943253040314e-05, 2.582930028438568e-05, 4.091765731573105e-05, 5.6006014347076416e-05, 7.109437137842178e-05, 8.618272840976715e-05, 0.00010127108544111252, 0.00011635944247245789, 0.00013144779950380325, 0.00014653615653514862, 0.000161624513566494, 0.00017671287059783936, 0.00019180122762918472, 0.0002068895846605301, 0.00022197794169187546, 0.00023706629872322083, 0.0002521546557545662, 0.00026724301278591156, 0.00028233136981725693, 0.0002974197268486023, 0.00031250808387994766, 0.00032759644091129303, 0.0003426847979426384, 0.00035777315497398376, 0.00037286151200532913, 0.0003879498690366745, 0.00040303822606801987, 0.00041812658309936523]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 8.0, 8.0, 23.0, 14.0, 21.0, 15.0, 16.0, 21.0, 24.0, 29.0, 24.0, 30.0, 38.0, 41.0, 41.0, 27.0, 42.0, 51.0, 40.0, 46.0, 39.0, 40.0, 44.0, 30.0, 31.0, 43.0, 30.0, 28.0, 16.0, 25.0, 14.0, 15.0, 14.0, 15.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.6953125, -7.47576904296875, -7.2562255859375, -7.03668212890625, -6.817138671875, -6.59759521484375, -6.3780517578125, -6.15850830078125, -5.93896484375, -5.71942138671875, -5.4998779296875, -5.28033447265625, -5.060791015625, -4.84124755859375, -4.6217041015625, -4.40216064453125, -4.1826171875, -3.96307373046875, -3.7435302734375, -3.52398681640625, -3.304443359375, -3.08489990234375, -2.8653564453125, -2.64581298828125, -2.42626953125, -2.20672607421875, -1.9871826171875, -1.76763916015625, -1.548095703125, -1.32855224609375, -1.1090087890625, -0.88946533203125, -0.669921875, -0.45037841796875, -0.2308349609375, -0.01129150390625, 0.208251953125, 0.42779541015625, 0.6473388671875, 0.86688232421875, 1.08642578125, 1.30596923828125, 1.5255126953125, 1.74505615234375, 1.964599609375, 2.18414306640625, 2.4036865234375, 2.62322998046875, 2.8427734375, 3.06231689453125, 3.2818603515625, 3.50140380859375, 3.720947265625, 3.94049072265625, 4.1600341796875, 4.37957763671875, 4.59912109375, 4.81866455078125, 5.0382080078125, 5.25775146484375, 5.477294921875, 5.69683837890625, 5.9163818359375, 6.13592529296875, 6.35546875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 11.0, 8.0, 18.0, 24.0, 25.0, 27.0, 42.0, 49.0, 81.0, 82.0, 117.0, 155.0, 258.0, 422.0, 721.0, 1456.0, 5651.0, 48172.0, 672551.0, 289357.0, 23094.0, 3307.0, 1061.0, 638.0, 362.0, 248.0, 163.0, 107.0, 86.0, 51.0, 46.0, 32.0, 32.0, 22.0, 17.0, 12.0, 11.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.1171875, -13.7120361328125, -13.306884765625, -12.9017333984375, -12.49658203125, -12.0914306640625, -11.686279296875, -11.2811279296875, -10.8759765625, -10.4708251953125, -10.065673828125, -9.6605224609375, -9.25537109375, -8.8502197265625, -8.445068359375, -8.0399169921875, -7.634765625, -7.2296142578125, -6.824462890625, -6.4193115234375, -6.01416015625, -5.6090087890625, -5.203857421875, -4.7987060546875, -4.3935546875, -3.9884033203125, -3.583251953125, -3.1781005859375, -2.77294921875, -2.3677978515625, -1.962646484375, -1.5574951171875, -1.15234375, -0.7471923828125, -0.342041015625, 0.0631103515625, 0.46826171875, 0.8734130859375, 1.278564453125, 1.6837158203125, 2.0888671875, 2.4940185546875, 2.899169921875, 3.3043212890625, 3.70947265625, 4.1146240234375, 4.519775390625, 4.9249267578125, 5.330078125, 5.7352294921875, 6.140380859375, 6.5455322265625, 6.95068359375, 7.3558349609375, 7.760986328125, 8.1661376953125, 8.5712890625, 8.9764404296875, 9.381591796875, 9.7867431640625, 10.19189453125, 10.5970458984375, 11.002197265625, 11.4073486328125, 11.8125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 6.0, 4.0, 5.0, 12.0, 13.0, 8.0, 16.0, 15.0, 26.0, 28.0, 38.0, 41.0, 43.0, 40.0, 46.0, 65.0, 58.0, 185.0, 1794.0, 150.0, 57.0, 52.0, 41.0, 42.0, 37.0, 32.0, 42.0, 31.0, 20.0, 17.0, 16.0, 15.0, 14.0, 5.0, 8.0, 4.0, 7.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-23.59375, -22.792236328125, -21.99072265625, -21.189208984375, -20.3876953125, -19.586181640625, -18.78466796875, -17.983154296875, -17.181640625, -16.380126953125, -15.57861328125, -14.777099609375, -13.9755859375, -13.174072265625, -12.37255859375, -11.571044921875, -10.76953125, -9.968017578125, -9.16650390625, -8.364990234375, -7.5634765625, -6.761962890625, -5.96044921875, -5.158935546875, -4.357421875, -3.555908203125, -2.75439453125, -1.952880859375, -1.1513671875, -0.349853515625, 0.45166015625, 1.253173828125, 2.0546875, 2.856201171875, 3.65771484375, 4.459228515625, 5.2607421875, 6.062255859375, 6.86376953125, 7.665283203125, 8.466796875, 9.268310546875, 10.06982421875, 10.871337890625, 11.6728515625, 12.474365234375, 13.27587890625, 14.077392578125, 14.87890625, 15.680419921875, 16.48193359375, 17.283447265625, 18.0849609375, 18.886474609375, 19.68798828125, 20.489501953125, 21.291015625, 22.092529296875, 22.89404296875, 23.695556640625, 24.4970703125, 25.298583984375, 26.10009765625, 26.901611328125, 27.703125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 1.0, 4.0, 5.0, 8.0, 5.0, 6.0, 11.0, 17.0, 11.0, 21.0, 13.0, 34.0, 45.0, 42.0, 57.0, 73.0, 123.0, 162.0, 342.0, 826.0, 38374.0, 3102439.0, 1837.0, 496.0, 251.0, 119.0, 78.0, 65.0, 61.0, 33.0, 30.0, 27.0, 18.0, 13.0, 12.0, 12.0, 8.0, 5.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-81.0625, -78.693359375, -76.32421875, -73.955078125, -71.5859375, -69.216796875, -66.84765625, -64.478515625, -62.109375, -59.740234375, -57.37109375, -55.001953125, -52.6328125, -50.263671875, -47.89453125, -45.525390625, -43.15625, -40.787109375, -38.41796875, -36.048828125, -33.6796875, -31.310546875, -28.94140625, -26.572265625, -24.203125, -21.833984375, -19.46484375, -17.095703125, -14.7265625, -12.357421875, -9.98828125, -7.619140625, -5.25, -2.880859375, -0.51171875, 1.857421875, 4.2265625, 6.595703125, 8.96484375, 11.333984375, 13.703125, 16.072265625, 18.44140625, 20.810546875, 23.1796875, 25.548828125, 27.91796875, 30.287109375, 32.65625, 35.025390625, 37.39453125, 39.763671875, 42.1328125, 44.501953125, 46.87109375, 49.240234375, 51.609375, 53.978515625, 56.34765625, 58.716796875, 61.0859375, 63.455078125, 65.82421875, 68.193359375, 70.5625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 37.0, 971.0, 12.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.89371109008789, -31.734853744506836, -24.57599639892578, -17.417139053344727, -10.258281707763672, -3.0994224548339844, 4.0594329833984375, 11.21828842163086, 18.377147674560547, 25.5360050201416, 32.694862365722656, 39.853721618652344, 47.012577056884766, 54.17143630981445, 61.330291748046875, 68.48915100097656, 75.64801025390625, 82.80686950683594, 89.96572875976562, 97.12458038330078, 104.28343963623047, 111.44229888916016, 118.60115051269531, 125.760009765625, 132.9188690185547, 140.07772827148438, 147.23658752441406, 154.39544677734375, 161.55429077148438, 168.71316528320312, 175.87200927734375, 183.03086853027344, 190.18972778320312, 197.3485870361328, 204.5074462890625, 211.6663055419922, 218.82516479492188, 225.9840087890625, 233.1428680419922, 240.30172729492188, 247.46058654785156, 254.61944580078125, 261.7782897949219, 268.9371643066406, 276.09600830078125, 283.2548828125, 290.4137268066406, 297.57257080078125, 304.7314453125, 311.8902893066406, 319.0491638183594, 326.2080078125, 333.36688232421875, 340.5257263183594, 347.6846008300781, 354.84344482421875, 362.0023193359375, 369.1611633300781, 376.3200378417969, 383.4788818359375, 390.63775634765625, 397.7966003417969, 404.9554748535156, 412.11431884765625, 419.2731628417969]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 5.0, 10.0, 9.0, 14.0, 17.0, 13.0, 16.0, 15.0, 15.0, 14.0, 26.0, 24.0, 23.0, 41.0, 27.0, 33.0, 48.0, 36.0, 41.0, 34.0, 44.0, 43.0, 34.0, 33.0, 38.0, 39.0, 33.0, 45.0, 25.0, 30.0, 13.0, 24.0, 27.0, 15.0, 14.0, 14.0, 12.0, 10.0, 9.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-66.64518737792969, -64.67286682128906, -62.70055389404297, -60.728233337402344, -58.755916595458984, -56.783599853515625, -54.811279296875, -52.83896255493164, -50.86664581298828, -48.89432907104492, -46.92201232910156, -44.94969177246094, -42.97737503051758, -41.00505828857422, -39.032737731933594, -37.060420989990234, -35.088104248046875, -33.115787506103516, -31.143468856811523, -29.17115020751953, -27.198833465576172, -25.226516723632812, -23.25419807434082, -21.281879425048828, -19.30956268310547, -17.33724594116211, -15.364927291870117, -13.392609596252441, -11.420291900634766, -9.44797420501709, -7.475656509399414, -5.503338813781738, -3.531024932861328, -1.5587072372436523, 0.41361045837402344, 2.385928153991699, 4.358245849609375, 6.330563545227051, 8.302881240844727, 10.275198936462402, 12.247516632080078, 14.219834327697754, 16.19215202331543, 18.164470672607422, 20.13678741455078, 22.10910415649414, 24.081422805786133, 26.053741455078125, 28.026058197021484, 29.998374938964844, 31.970693588256836, 33.94301223754883, 35.91532897949219, 37.88764572143555, 39.859962463378906, 41.83228302001953, 43.80459976196289, 45.77691650390625, 47.749237060546875, 49.721553802490234, 51.693870544433594, 53.66618728637695, 55.63850402832031, 57.61082458496094, 59.5831413269043]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 6.0, 9.0, 7.0, 8.0, 10.0, 8.0, 15.0, 15.0, 32.0, 15.0, 19.0, 30.0, 24.0, 35.0, 31.0, 39.0, 28.0, 51.0, 49.0, 33.0, 42.0, 38.0, 45.0, 36.0, 40.0, 35.0, 42.0, 37.0, 35.0, 29.0, 24.0, 15.0, 20.0, 20.0, 12.0, 12.0, 15.0, 5.0, 11.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.80078125, -7.5692138671875, -7.337646484375, -7.1060791015625, -6.87451171875, -6.6429443359375, -6.411376953125, -6.1798095703125, -5.9482421875, -5.7166748046875, -5.485107421875, -5.2535400390625, -5.02197265625, -4.7904052734375, -4.558837890625, -4.3272705078125, -4.095703125, -3.8641357421875, -3.632568359375, -3.4010009765625, -3.16943359375, -2.9378662109375, -2.706298828125, -2.4747314453125, -2.2431640625, -2.0115966796875, -1.780029296875, -1.5484619140625, -1.31689453125, -1.0853271484375, -0.853759765625, -0.6221923828125, -0.390625, -0.1590576171875, 0.072509765625, 0.3040771484375, 0.53564453125, 0.7672119140625, 0.998779296875, 1.2303466796875, 1.4619140625, 1.6934814453125, 1.925048828125, 2.1566162109375, 2.38818359375, 2.6197509765625, 2.851318359375, 3.0828857421875, 3.314453125, 3.5460205078125, 3.777587890625, 4.0091552734375, 4.24072265625, 4.4722900390625, 4.703857421875, 4.9354248046875, 5.1669921875, 5.3985595703125, 5.630126953125, 5.8616943359375, 6.09326171875, 6.3248291015625, 6.556396484375, 6.7879638671875, 7.01953125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 9.0, 9.0, 7.0, 9.0, 11.0, 20.0, 32.0, 44.0, 38.0, 44.0, 59.0, 79.0, 96.0, 159.0, 222.0, 324.0, 660.0, 1270.0, 2937.0, 8641.0, 35837.0, 198697.0, 854894.0, 1702450.0, 1047188.0, 270004.0, 51294.0, 11947.0, 3765.0, 1514.0, 701.0, 416.0, 252.0, 149.0, 131.0, 77.0, 63.0, 45.0, 51.0, 30.0, 28.0, 18.0, 17.0, 13.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.375, -9.095947265625, -8.81689453125, -8.537841796875, -8.2587890625, -7.979736328125, -7.70068359375, -7.421630859375, -7.142578125, -6.863525390625, -6.58447265625, -6.305419921875, -6.0263671875, -5.747314453125, -5.46826171875, -5.189208984375, -4.91015625, -4.631103515625, -4.35205078125, -4.072998046875, -3.7939453125, -3.514892578125, -3.23583984375, -2.956787109375, -2.677734375, -2.398681640625, -2.11962890625, -1.840576171875, -1.5615234375, -1.282470703125, -1.00341796875, -0.724365234375, -0.4453125, -0.166259765625, 0.11279296875, 0.391845703125, 0.6708984375, 0.949951171875, 1.22900390625, 1.508056640625, 1.787109375, 2.066162109375, 2.34521484375, 2.624267578125, 2.9033203125, 3.182373046875, 3.46142578125, 3.740478515625, 4.01953125, 4.298583984375, 4.57763671875, 4.856689453125, 5.1357421875, 5.414794921875, 5.69384765625, 5.972900390625, 6.251953125, 6.531005859375, 6.81005859375, 7.089111328125, 7.3681640625, 7.647216796875, 7.92626953125, 8.205322265625, 8.484375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 8.0, 4.0, 11.0, 22.0, 39.0, 48.0, 81.0, 129.0, 180.0, 252.0, 436.0, 614.0, 663.0, 505.0, 350.0, 249.0, 153.0, 116.0, 87.0, 42.0, 30.0, 17.0, 14.0, 14.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.3798828125, -18.759765625, -18.1396484375, -17.51953125, -16.8994140625, -16.279296875, -15.6591796875, -15.0390625, -14.4189453125, -13.798828125, -13.1787109375, -12.55859375, -11.9384765625, -11.318359375, -10.6982421875, -10.078125, -9.4580078125, -8.837890625, -8.2177734375, -7.59765625, -6.9775390625, -6.357421875, -5.7373046875, -5.1171875, -4.4970703125, -3.876953125, -3.2568359375, -2.63671875, -2.0166015625, -1.396484375, -0.7763671875, -0.15625, 0.4638671875, 1.083984375, 1.7041015625, 2.32421875, 2.9443359375, 3.564453125, 4.1845703125, 4.8046875, 5.4248046875, 6.044921875, 6.6650390625, 7.28515625, 7.9052734375, 8.525390625, 9.1455078125, 9.765625, 10.3857421875, 11.005859375, 11.6259765625, 12.24609375, 12.8662109375, 13.486328125, 14.1064453125, 14.7265625, 15.3466796875, 15.966796875, 16.5869140625, 17.20703125, 17.8271484375, 18.447265625, 19.0673828125, 19.6875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 13.0, 16.0, 17.0, 29.0, 31.0, 50.0, 75.0, 92.0, 115.0, 145.0, 188.0, 211.0, 290.0, 433.0, 912.0, 6690.0, 4085499.0, 96058.0, 1474.0, 526.0, 330.0, 251.0, 176.0, 163.0, 109.0, 88.0, 64.0, 70.0, 40.0, 35.0, 22.0, 17.0, 9.0, 10.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.25, -66.02734375, -63.8046875, -61.58203125, -59.359375, -57.13671875, -54.9140625, -52.69140625, -50.46875, -48.24609375, -46.0234375, -43.80078125, -41.578125, -39.35546875, -37.1328125, -34.91015625, -32.6875, -30.46484375, -28.2421875, -26.01953125, -23.796875, -21.57421875, -19.3515625, -17.12890625, -14.90625, -12.68359375, -10.4609375, -8.23828125, -6.015625, -3.79296875, -1.5703125, 0.65234375, 2.875, 5.09765625, 7.3203125, 9.54296875, 11.765625, 13.98828125, 16.2109375, 18.43359375, 20.65625, 22.87890625, 25.1015625, 27.32421875, 29.546875, 31.76953125, 33.9921875, 36.21484375, 38.4375, 40.66015625, 42.8828125, 45.10546875, 47.328125, 49.55078125, 51.7734375, 53.99609375, 56.21875, 58.44140625, 60.6640625, 62.88671875, 65.109375, 67.33203125, 69.5546875, 71.77734375, 74.0]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 11.0, 470.0, 512.0, 20.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.965850830078125, -29.18315315246582, -19.400455474853516, -9.617757797241211, 0.16493988037109375, 9.947639465332031, 19.730335235595703, 29.513031005859375, 39.29573059082031, 49.07843017578125, 58.86112594604492, 68.6438217163086, 78.42652130126953, 88.20922088623047, 97.99191284179688, 107.77461242675781, 117.55731201171875, 127.34001159667969, 137.12271118164062, 146.90541076660156, 156.6881103515625, 166.47079467773438, 176.2534942626953, 186.03619384765625, 195.8188934326172, 205.60159301757812, 215.38429260253906, 225.1669921875, 234.94967651367188, 244.73239135742188, 254.51507568359375, 264.29779052734375, 274.0804443359375, 283.8631286621094, 293.6458435058594, 303.42852783203125, 313.21124267578125, 322.9939270019531, 332.7766418457031, 342.559326171875, 352.342041015625, 362.1247253417969, 371.9074401855469, 381.69012451171875, 391.47283935546875, 401.2555236816406, 411.0382385253906, 420.8209228515625, 430.6036071777344, 440.38629150390625, 450.16900634765625, 459.9516906738281, 469.7344055175781, 479.51708984375, 489.2998046875, 499.0824890136719, 508.86517333984375, 518.6478881835938, 528.4305419921875, 538.2132568359375, 547.9959716796875, 557.7786865234375, 567.5613403320312, 577.3440551757812, 587.1267700195312]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 10.0, 11.0, 10.0, 16.0, 17.0, 17.0, 21.0, 29.0, 24.0, 19.0, 31.0, 32.0, 40.0, 42.0, 45.0, 51.0, 45.0, 42.0, 64.0, 48.0, 38.0, 39.0, 34.0, 40.0, 26.0, 33.0, 22.0, 21.0, 29.0, 17.0, 19.0, 11.0, 13.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.33057403564453, -46.683143615722656, -45.035709381103516, -43.38827896118164, -41.740848541259766, -40.093414306640625, -38.44598388671875, -36.798553466796875, -35.151119232177734, -33.50368881225586, -31.85625648498535, -30.208824157714844, -28.561391830444336, -26.913959503173828, -25.266529083251953, -23.619096755981445, -21.97166633605957, -20.324234008789062, -18.676803588867188, -17.02937126159668, -15.381938934326172, -13.73450756072998, -12.087076187133789, -10.439643859863281, -8.79221248626709, -7.14478063583374, -5.497348785400391, -3.849917411804199, -2.2024855613708496, -0.5550537109375, 1.0923776626586914, 2.739809989929199, 4.387241363525391, 6.03467321395874, 7.68210506439209, 9.329536437988281, 10.976968765258789, 12.62440013885498, 14.271831512451172, 15.91926383972168, 17.566696166992188, 19.214128494262695, 20.86155891418457, 22.508991241455078, 24.156423568725586, 25.803855895996094, 27.45128631591797, 29.098718643188477, 30.74614906311035, 32.39358139038086, 34.041011810302734, 35.688446044921875, 37.33587646484375, 38.983306884765625, 40.6307373046875, 42.27817153930664, 43.925601959228516, 45.57303237915039, 47.22046661376953, 48.867897033691406, 50.51532745361328, 52.16276168823242, 53.8101921081543, 55.45762634277344, 57.10505676269531]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 7.0, 13.0, 12.0, 11.0, 11.0, 22.0, 22.0, 20.0, 25.0, 25.0, 34.0, 38.0, 36.0, 50.0, 43.0, 51.0, 48.0, 47.0, 37.0, 37.0, 41.0, 52.0, 42.0, 44.0, 27.0, 35.0, 20.0, 29.0, 19.0, 19.0, 18.0, 10.0, 8.0, 10.0, 10.0, 6.0, 2.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.26953125, -7.0234375, -6.77734375, -6.53125, -6.28515625, -6.0390625, -5.79296875, -5.546875, -5.30078125, -5.0546875, -4.80859375, -4.5625, -4.31640625, -4.0703125, -3.82421875, -3.578125, -3.33203125, -3.0859375, -2.83984375, -2.59375, -2.34765625, -2.1015625, -1.85546875, -1.609375, -1.36328125, -1.1171875, -0.87109375, -0.625, -0.37890625, -0.1328125, 0.11328125, 0.359375, 0.60546875, 0.8515625, 1.09765625, 1.34375, 1.58984375, 1.8359375, 2.08203125, 2.328125, 2.57421875, 2.8203125, 3.06640625, 3.3125, 3.55859375, 3.8046875, 4.05078125, 4.296875, 4.54296875, 4.7890625, 5.03515625, 5.28125, 5.52734375, 5.7734375, 6.01953125, 6.265625, 6.51171875, 6.7578125, 7.00390625, 7.25, 7.49609375, 7.7421875, 7.98828125, 8.234375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 9.0, 19.0, 38.0, 49.0, 68.0, 92.0, 156.0, 230.0, 325.0, 509.0, 842.0, 1255.0, 1992.0, 3106.0, 5012.0, 7782.0, 12607.0, 20209.0, 33663.0, 59216.0, 112340.0, 284418.0, 256992.0, 107015.0, 56209.0, 32124.0, 19310.0, 12066.0, 7568.0, 4772.0, 3105.0, 1938.0, 1229.0, 810.0, 484.0, 357.0, 207.0, 147.0, 91.0, 61.0, 35.0, 31.0, 23.0, 14.0, 11.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.5712890625, -1.522125244140625, -1.47296142578125, -1.423797607421875, -1.3746337890625, -1.325469970703125, -1.27630615234375, -1.227142333984375, -1.177978515625, -1.128814697265625, -1.07965087890625, -1.030487060546875, -0.9813232421875, -0.932159423828125, -0.88299560546875, -0.833831787109375, -0.78466796875, -0.735504150390625, -0.68634033203125, -0.637176513671875, -0.5880126953125, -0.538848876953125, -0.48968505859375, -0.440521240234375, -0.391357421875, -0.342193603515625, -0.29302978515625, -0.243865966796875, -0.1947021484375, -0.145538330078125, -0.09637451171875, -0.047210693359375, 0.001953125, 0.051116943359375, 0.10028076171875, 0.149444580078125, 0.1986083984375, 0.247772216796875, 0.29693603515625, 0.346099853515625, 0.395263671875, 0.444427490234375, 0.49359130859375, 0.542755126953125, 0.5919189453125, 0.641082763671875, 0.69024658203125, 0.739410400390625, 0.78857421875, 0.837738037109375, 0.88690185546875, 0.936065673828125, 0.9852294921875, 1.034393310546875, 1.08355712890625, 1.132720947265625, 1.181884765625, 1.231048583984375, 1.28021240234375, 1.329376220703125, 1.3785400390625, 1.427703857421875, 1.47686767578125, 1.526031494140625, 1.5751953125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 5.0, 5.0, 13.0, 10.0, 7.0, 27.0, 14.0, 21.0, 29.0, 19.0, 25.0, 25.0, 22.0, 38.0, 41.0, 54.0, 35.0, 40.0, 50.0, 1063.0, 41.0, 35.0, 37.0, 29.0, 32.0, 34.0, 32.0, 23.0, 26.0, 28.0, 28.0, 27.0, 24.0, 16.0, 13.0, 11.0, 9.0, 5.0, 10.0, 7.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.2325439453125, -4.086181640625, -3.9398193359375, -3.79345703125, -3.6470947265625, -3.500732421875, -3.3543701171875, -3.2080078125, -3.0616455078125, -2.915283203125, -2.7689208984375, -2.62255859375, -2.4761962890625, -2.329833984375, -2.1834716796875, -2.037109375, -1.8907470703125, -1.744384765625, -1.5980224609375, -1.45166015625, -1.3052978515625, -1.158935546875, -1.0125732421875, -0.8662109375, -0.7198486328125, -0.573486328125, -0.4271240234375, -0.28076171875, -0.1343994140625, 0.011962890625, 0.1583251953125, 0.3046875, 0.4510498046875, 0.597412109375, 0.7437744140625, 0.89013671875, 1.0364990234375, 1.182861328125, 1.3292236328125, 1.4755859375, 1.6219482421875, 1.768310546875, 1.9146728515625, 2.06103515625, 2.2073974609375, 2.353759765625, 2.5001220703125, 2.646484375, 2.7928466796875, 2.939208984375, 3.0855712890625, 3.23193359375, 3.3782958984375, 3.524658203125, 3.6710205078125, 3.8173828125, 3.9637451171875, 4.110107421875, 4.2564697265625, 4.40283203125, 4.5491943359375, 4.695556640625, 4.8419189453125, 4.98828125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 20.0, 38.0, 44.0, 66.0, 99.0, 150.0, 255.0, 388.0, 559.0, 941.0, 1469.0, 2431.0, 3873.0, 6303.0, 10424.0, 17024.0, 27990.0, 47295.0, 87979.0, 201931.0, 1408104.0, 124568.0, 62966.0, 35923.0, 21903.0, 13347.0, 8039.0, 4942.0, 2941.0, 1859.0, 1190.0, 723.0, 439.0, 301.0, 200.0, 130.0, 77.0, 65.0, 35.0, 25.0, 19.0, 13.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.75, -1.6988983154296875, -1.647796630859375, -1.5966949462890625, -1.54559326171875, -1.4944915771484375, -1.443389892578125, -1.3922882080078125, -1.3411865234375, -1.2900848388671875, -1.238983154296875, -1.1878814697265625, -1.13677978515625, -1.0856781005859375, -1.034576416015625, -0.9834747314453125, -0.932373046875, -0.8812713623046875, -0.830169677734375, -0.7790679931640625, -0.72796630859375, -0.6768646240234375, -0.625762939453125, -0.5746612548828125, -0.5235595703125, -0.4724578857421875, -0.421356201171875, -0.3702545166015625, -0.31915283203125, -0.2680511474609375, -0.216949462890625, -0.1658477783203125, -0.11474609375, -0.0636444091796875, -0.012542724609375, 0.0385589599609375, 0.08966064453125, 0.1407623291015625, 0.191864013671875, 0.2429656982421875, 0.2940673828125, 0.3451690673828125, 0.396270751953125, 0.4473724365234375, 0.49847412109375, 0.5495758056640625, 0.600677490234375, 0.6517791748046875, 0.702880859375, 0.7539825439453125, 0.805084228515625, 0.8561859130859375, 0.90728759765625, 0.9583892822265625, 1.009490966796875, 1.0605926513671875, 1.1116943359375, 1.1627960205078125, 1.213897705078125, 1.2649993896484375, 1.31610107421875, 1.3672027587890625, 1.418304443359375, 1.4694061279296875, 1.5205078125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 11.0, 10.0, 22.0, 28.0, 24.0, 49.0, 61.0, 77.0, 85.0, 114.0, 108.0, 82.0, 85.0, 64.0, 46.0, 36.0, 20.0, 12.0, 10.0, 5.0, 5.0, 8.0, 3.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013675689697265625, -0.0013282299041748047, -0.0012888908386230469, -0.001249551773071289, -0.0012102127075195312, -0.0011708736419677734, -0.0011315345764160156, -0.0010921955108642578, -0.0010528564453125, -0.0010135173797607422, -0.0009741783142089844, -0.0009348392486572266, -0.0008955001831054688, -0.0008561611175537109, -0.0008168220520019531, -0.0007774829864501953, -0.0007381439208984375, -0.0006988048553466797, -0.0006594657897949219, -0.0006201267242431641, -0.0005807876586914062, -0.0005414485931396484, -0.0005021095275878906, -0.0004627704620361328, -0.000423431396484375, -0.0003840923309326172, -0.0003447532653808594, -0.00030541419982910156, -0.00026607513427734375, -0.00022673606872558594, -0.00018739700317382812, -0.0001480579376220703, -0.0001087188720703125, -6.937980651855469e-05, -3.0040740966796875e-05, 9.298324584960938e-06, 4.863739013671875e-05, 8.797645568847656e-05, 0.00012731552124023438, 0.0001666545867919922, 0.00020599365234375, 0.0002453327178955078, 0.0002846717834472656, 0.00032401084899902344, 0.00036334991455078125, 0.00040268898010253906, 0.0004420280456542969, 0.0004813671112060547, 0.0005207061767578125, 0.0005600452423095703, 0.0005993843078613281, 0.0006387233734130859, 0.0006780624389648438, 0.0007174015045166016, 0.0007567405700683594, 0.0007960796356201172, 0.000835418701171875, 0.0008747577667236328, 0.0009140968322753906, 0.0009534358978271484, 0.0009927749633789062, 0.001032114028930664, 0.0010714530944824219, 0.0011107921600341797, 0.0011501312255859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 3.0, 10.0, 5.0, 11.0, 23.0, 34.0, 62.0, 94.0, 157.0, 351.0, 1292.0, 1043025.0, 2624.0, 404.0, 166.0, 103.0, 53.0, 40.0, 24.0, 10.0, 16.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0289764404296875, -0.027963876724243164, -0.026951313018798828, -0.025938749313354492, -0.024926185607910156, -0.02391362190246582, -0.022901058197021484, -0.02188849449157715, -0.020875930786132812, -0.019863367080688477, -0.01885080337524414, -0.017838239669799805, -0.01682567596435547, -0.015813112258911133, -0.014800548553466797, -0.013787984848022461, -0.012775421142578125, -0.011762857437133789, -0.010750293731689453, -0.009737730026245117, -0.008725166320800781, -0.007712602615356445, -0.006700038909912109, -0.0056874752044677734, -0.0046749114990234375, -0.0036623477935791016, -0.0026497840881347656, -0.0016372203826904297, -0.0006246566772460938, 0.0003879070281982422, 0.0014004707336425781, 0.002413034439086914, 0.00342559814453125, 0.004438161849975586, 0.005450725555419922, 0.006463289260864258, 0.007475852966308594, 0.00848841667175293, 0.009500980377197266, 0.010513544082641602, 0.011526107788085938, 0.012538671493530273, 0.01355123519897461, 0.014563798904418945, 0.015576362609863281, 0.016588926315307617, 0.017601490020751953, 0.01861405372619629, 0.019626617431640625, 0.02063918113708496, 0.021651744842529297, 0.022664308547973633, 0.02367687225341797, 0.024689435958862305, 0.02570199966430664, 0.026714563369750977, 0.027727127075195312, 0.02873969078063965, 0.029752254486083984, 0.03076481819152832, 0.031777381896972656, 0.03278994560241699, 0.03380250930786133, 0.034815073013305664, 0.03582763671875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 41.0, 160.0, 304.0, 309.0, 144.0, 37.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001972215250134468, -0.001935682026669383, -0.0018991489196196198, -0.0018626156961545348, -0.0018260825891047716, -0.0017895493656396866, -0.0017530162585899234, -0.0017164830351248384, -0.0016799499280750751, -0.0016434167046099901, -0.001606883597560227, -0.0015703503740951419, -0.0015338172670453787, -0.0014972840435802937, -0.0014607509365305305, -0.0014242177130654454, -0.0013876844896003604, -0.0013511512661352754, -0.0013146181590855122, -0.0012780849356204271, -0.001241551828570664, -0.001205018605105579, -0.0011684854980558157, -0.0011319522745907307, -0.0010954190511256456, -0.0010588858276605606, -0.0010223527206107974, -0.0009858194971457124, -0.0009492863900959492, -0.0009127531666308641, -0.00087622000137344, -0.0008396868361160159, -0.0008031537872739136, -0.0007666206220164895, -0.0007300874567590654, -0.0006935542915016413, -0.0006570210680365562, -0.000620487960986793, -0.000583954737521708, -0.0005474215722642839, -0.0005108884070068598, -0.00047435524174943566, -0.00043782207649201155, -0.000401288882130757, -0.00036475571687333286, -0.00032822255161590874, -0.00029168935725465417, -0.00025515619199723005, -0.00021862302673980594, -0.00018208986148238182, -0.00014555668167304248, -0.00010902350913966075, -7.249033660627902e-05, -3.59571713488549e-05, 5.760084604844451e-07, 3.710918826982379e-05, 7.36423535272479e-05, 0.00011017552606062964, 0.00014670869859401137, 0.0001832418784033507, 0.00021977504366077483, 0.00025630820891819894, 0.0002928414032794535, 0.00032937456853687763, 0.00036590773379430175]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 3.0, 3.0, 6.0, 6.0, 6.0, 8.0, 10.0, 15.0, 12.0, 19.0, 23.0, 16.0, 24.0, 16.0, 25.0, 28.0, 32.0, 43.0, 32.0, 23.0, 43.0, 43.0, 36.0, 39.0, 37.0, 42.0, 44.0, 45.0, 26.0, 50.0, 25.0, 20.0, 23.0, 26.0, 24.0, 18.0, 13.0, 19.0, 19.0, 17.0, 11.0, 5.0, 8.0, 4.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0004375576972961426, -0.00042377132922410965, -0.0004099849611520767, -0.0003961985930800438, -0.00038241222500801086, -0.00036862585693597794, -0.000354839488863945, -0.0003410531207919121, -0.00032726675271987915, -0.0003134803846478462, -0.0002996940165758133, -0.00028590764850378036, -0.00027212128043174744, -0.0002583349123597145, -0.0002445485442876816, -0.00023076217621564865, -0.00021697580814361572, -0.0002031894400715828, -0.00018940307199954987, -0.00017561670392751694, -0.000161830335855484, -0.00014804396778345108, -0.00013425759971141815, -0.00012047123163938522, -0.0001066848635673523, -9.289849549531937e-05, -7.911212742328644e-05, -6.532575935125351e-05, -5.153939127922058e-05, -3.775302320718765e-05, -2.3966655135154724e-05, -1.0180287063121796e-05, 3.606081008911133e-06, 1.739244908094406e-05, 3.117881715297699e-05, 4.496518522500992e-05, 5.875155329704285e-05, 7.253792136907578e-05, 8.63242894411087e-05, 0.00010011065751314163, 0.00011389702558517456, 0.0001276833936572075, 0.00014146976172924042, 0.00015525612980127335, 0.00016904249787330627, 0.0001828288659453392, 0.00019661523401737213, 0.00021040160208940506, 0.000224187970161438, 0.00023797433823347092, 0.00025176070630550385, 0.0002655470743775368, 0.0002793334424495697, 0.00029311981052160263, 0.00030690617859363556, 0.0003206925466656685, 0.0003344789147377014, 0.00034826528280973434, 0.0003620516508817673, 0.0003758380189538002, 0.00038962438702583313, 0.00040341075509786606, 0.000417197123169899, 0.0004309834912419319, 0.00044476985931396484]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 7.0, 13.0, 12.0, 11.0, 11.0, 22.0, 22.0, 20.0, 25.0, 25.0, 34.0, 38.0, 36.0, 50.0, 43.0, 51.0, 48.0, 47.0, 37.0, 37.0, 41.0, 52.0, 42.0, 44.0, 27.0, 35.0, 20.0, 29.0, 19.0, 19.0, 18.0, 10.0, 8.0, 10.0, 10.0, 6.0, 2.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.26953125, -7.0234375, -6.77734375, -6.53125, -6.28515625, -6.0390625, -5.79296875, -5.546875, -5.30078125, -5.0546875, -4.80859375, -4.5625, -4.31640625, -4.0703125, -3.82421875, -3.578125, -3.33203125, -3.0859375, -2.83984375, -2.59375, -2.34765625, -2.1015625, -1.85546875, -1.609375, -1.36328125, -1.1171875, -0.87109375, -0.625, -0.37890625, -0.1328125, 0.11328125, 0.359375, 0.60546875, 0.8515625, 1.09765625, 1.34375, 1.58984375, 1.8359375, 2.08203125, 2.328125, 2.57421875, 2.8203125, 3.06640625, 3.3125, 3.55859375, 3.8046875, 4.05078125, 4.296875, 4.54296875, 4.7890625, 5.03515625, 5.28125, 5.52734375, 5.7734375, 6.01953125, 6.265625, 6.51171875, 6.7578125, 7.00390625, 7.25, 7.49609375, 7.7421875, 7.98828125, 8.234375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 12.0, 12.0, 9.0, 22.0, 27.0, 27.0, 36.0, 44.0, 75.0, 105.0, 213.0, 379.0, 815.0, 1755.0, 4341.0, 11200.0, 31559.0, 95046.0, 315649.0, 396761.0, 125999.0, 40735.0, 14155.0, 5327.0, 2152.0, 938.0, 465.0, 253.0, 131.0, 84.0, 62.0, 43.0, 24.0, 29.0, 15.0, 13.0, 13.0, 12.0, 5.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1640625, -5.95941162109375, -5.7547607421875, -5.55010986328125, -5.345458984375, -5.14080810546875, -4.9361572265625, -4.73150634765625, -4.52685546875, -4.32220458984375, -4.1175537109375, -3.91290283203125, -3.708251953125, -3.50360107421875, -3.2989501953125, -3.09429931640625, -2.8896484375, -2.68499755859375, -2.4803466796875, -2.27569580078125, -2.071044921875, -1.86639404296875, -1.6617431640625, -1.45709228515625, -1.25244140625, -1.04779052734375, -0.8431396484375, -0.63848876953125, -0.433837890625, -0.22918701171875, -0.0245361328125, 0.18011474609375, 0.384765625, 0.58941650390625, 0.7940673828125, 0.99871826171875, 1.203369140625, 1.40802001953125, 1.6126708984375, 1.81732177734375, 2.02197265625, 2.22662353515625, 2.4312744140625, 2.63592529296875, 2.840576171875, 3.04522705078125, 3.2498779296875, 3.45452880859375, 3.6591796875, 3.86383056640625, 4.0684814453125, 4.27313232421875, 4.477783203125, 4.68243408203125, 4.8870849609375, 5.09173583984375, 5.29638671875, 5.50103759765625, 5.7056884765625, 5.91033935546875, 6.114990234375, 6.31964111328125, 6.5242919921875, 6.72894287109375, 6.93359375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 14.0, 10.0, 11.0, 10.0, 19.0, 23.0, 30.0, 31.0, 32.0, 41.0, 40.0, 53.0, 45.0, 104.0, 360.0, 1628.0, 157.0, 56.0, 57.0, 49.0, 25.0, 34.0, 29.0, 38.0, 33.0, 28.0, 21.0, 12.0, 13.0, 8.0, 6.0, 3.0, 3.0, 9.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.1875, -27.339599609375, -26.49169921875, -25.643798828125, -24.7958984375, -23.947998046875, -23.10009765625, -22.252197265625, -21.404296875, -20.556396484375, -19.70849609375, -18.860595703125, -18.0126953125, -17.164794921875, -16.31689453125, -15.468994140625, -14.62109375, -13.773193359375, -12.92529296875, -12.077392578125, -11.2294921875, -10.381591796875, -9.53369140625, -8.685791015625, -7.837890625, -6.989990234375, -6.14208984375, -5.294189453125, -4.4462890625, -3.598388671875, -2.75048828125, -1.902587890625, -1.0546875, -0.206787109375, 0.64111328125, 1.489013671875, 2.3369140625, 3.184814453125, 4.03271484375, 4.880615234375, 5.728515625, 6.576416015625, 7.42431640625, 8.272216796875, 9.1201171875, 9.968017578125, 10.81591796875, 11.663818359375, 12.51171875, 13.359619140625, 14.20751953125, 15.055419921875, 15.9033203125, 16.751220703125, 17.59912109375, 18.447021484375, 19.294921875, 20.142822265625, 20.99072265625, 21.838623046875, 22.6865234375, 23.534423828125, 24.38232421875, 25.230224609375, 26.078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 10.0, 7.0, 10.0, 16.0, 25.0, 34.0, 36.0, 65.0, 77.0, 74.0, 129.0, 189.0, 319.0, 457.0, 1253.0, 34123.0, 3088345.0, 18152.0, 1009.0, 465.0, 262.0, 175.0, 102.0, 78.0, 77.0, 49.0, 35.0, 30.0, 20.0, 22.0, 12.0, 8.0, 8.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.8125, -40.43896484375, -39.0654296875, -37.69189453125, -36.318359375, -34.94482421875, -33.5712890625, -32.19775390625, -30.82421875, -29.45068359375, -28.0771484375, -26.70361328125, -25.330078125, -23.95654296875, -22.5830078125, -21.20947265625, -19.8359375, -18.46240234375, -17.0888671875, -15.71533203125, -14.341796875, -12.96826171875, -11.5947265625, -10.22119140625, -8.84765625, -7.47412109375, -6.1005859375, -4.72705078125, -3.353515625, -1.97998046875, -0.6064453125, 0.76708984375, 2.140625, 3.51416015625, 4.8876953125, 6.26123046875, 7.634765625, 9.00830078125, 10.3818359375, 11.75537109375, 13.12890625, 14.50244140625, 15.8759765625, 17.24951171875, 18.623046875, 19.99658203125, 21.3701171875, 22.74365234375, 24.1171875, 25.49072265625, 26.8642578125, 28.23779296875, 29.611328125, 30.98486328125, 32.3583984375, 33.73193359375, 35.10546875, 36.47900390625, 37.8525390625, 39.22607421875, 40.599609375, 41.97314453125, 43.3466796875, 44.72021484375, 46.09375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 85.0, 332.0, 470.0, 105.0, 16.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.350236892700195, -28.962888717651367, -26.575538635253906, -24.188190460205078, -21.80084228515625, -19.413494110107422, -17.026145935058594, -14.638795852661133, -12.251447677612305, -9.864099502563477, -7.476750373840332, -5.089401721954346, -2.7020530700683594, -0.31470489501953125, 2.0726442337036133, 4.459993362426758, 6.847341537475586, 9.234689712524414, 11.622038841247559, 14.009387969970703, 16.39673614501953, 18.78408432006836, 21.171432495117188, 23.55878257751465, 25.946130752563477, 28.333478927612305, 30.720829010009766, 33.108177185058594, 35.49552536010742, 37.88287353515625, 40.27022171020508, 42.657569885253906, 45.044921875, 47.43227005004883, 49.819618225097656, 52.206966400146484, 54.59431457519531, 56.981666564941406, 59.369014739990234, 61.75636291503906, 64.14370727539062, 66.53105926513672, 68.91840362548828, 71.30575561523438, 73.69309997558594, 76.08045196533203, 78.4677963256836, 80.85514831542969, 83.24250030517578, 85.62985229492188, 88.01719665527344, 90.40454864501953, 92.7918930053711, 95.17924499511719, 97.56658935546875, 99.95394134521484, 102.34129333496094, 104.72864532470703, 107.1159896850586, 109.50334167480469, 111.89068603515625, 114.27803802490234, 116.6653823852539, 119.052734375, 121.44007873535156]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 6.0, 4.0, 2.0, 10.0, 8.0, 8.0, 10.0, 14.0, 22.0, 15.0, 19.0, 24.0, 30.0, 27.0, 30.0, 32.0, 39.0, 51.0, 40.0, 32.0, 45.0, 45.0, 36.0, 40.0, 40.0, 47.0, 34.0, 36.0, 35.0, 46.0, 24.0, 21.0, 29.0, 17.0, 18.0, 13.0, 11.0, 8.0, 6.0, 1.0, 7.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.599449157714844, -54.77890396118164, -52.95835876464844, -51.137813568115234, -49.31726837158203, -47.49672317504883, -45.676177978515625, -43.85563278198242, -42.03508758544922, -40.214542388916016, -38.39399719238281, -36.57345199584961, -34.752906799316406, -32.9323616027832, -31.11181640625, -29.291271209716797, -27.47072410583496, -25.650178909301758, -23.829633712768555, -22.00908851623535, -20.18854331970215, -18.367996215820312, -16.54745101928711, -14.726906776428223, -12.90636157989502, -11.085816383361816, -9.265271186828613, -7.444725513458252, -5.624180316925049, -3.8036346435546875, -1.9830894470214844, -0.16254425048828125, 1.6580009460449219, 3.478546142578125, 5.299091339111328, 7.1196370124816895, 8.940181732177734, 10.760727882385254, 12.581273078918457, 14.40181827545166, 16.222362518310547, 18.04290771484375, 19.863452911376953, 21.683998107910156, 23.50454330444336, 25.325088500976562, 27.145633697509766, 28.96617889404297, 30.786725997924805, 32.60727310180664, 34.427818298339844, 36.24836349487305, 38.06890869140625, 39.88945388793945, 41.709999084472656, 43.53054428100586, 45.35108947753906, 47.171634674072266, 48.99217987060547, 50.81272506713867, 52.633270263671875, 54.45381546020508, 56.27436065673828, 58.094905853271484, 59.91545104980469]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 3.0, 5.0, 17.0, 13.0, 15.0, 22.0, 16.0, 32.0, 20.0, 33.0, 30.0, 33.0, 42.0, 42.0, 45.0, 43.0, 62.0, 50.0, 48.0, 33.0, 45.0, 41.0, 38.0, 41.0, 37.0, 38.0, 20.0, 20.0, 18.0, 12.0, 15.0, 14.0, 11.0, 11.0, 9.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51171875, -7.25592041015625, -7.0001220703125, -6.74432373046875, -6.488525390625, -6.23272705078125, -5.9769287109375, -5.72113037109375, -5.46533203125, -5.20953369140625, -4.9537353515625, -4.69793701171875, -4.442138671875, -4.18634033203125, -3.9305419921875, -3.67474365234375, -3.4189453125, -3.16314697265625, -2.9073486328125, -2.65155029296875, -2.395751953125, -2.13995361328125, -1.8841552734375, -1.62835693359375, -1.37255859375, -1.11676025390625, -0.8609619140625, -0.60516357421875, -0.349365234375, -0.09356689453125, 0.1622314453125, 0.41802978515625, 0.673828125, 0.92962646484375, 1.1854248046875, 1.44122314453125, 1.697021484375, 1.95281982421875, 2.2086181640625, 2.46441650390625, 2.72021484375, 2.97601318359375, 3.2318115234375, 3.48760986328125, 3.743408203125, 3.99920654296875, 4.2550048828125, 4.51080322265625, 4.7666015625, 5.02239990234375, 5.2781982421875, 5.53399658203125, 5.789794921875, 6.04559326171875, 6.3013916015625, 6.55718994140625, 6.81298828125, 7.06878662109375, 7.3245849609375, 7.58038330078125, 7.836181640625, 8.09197998046875, 8.3477783203125, 8.60357666015625, 8.859375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 6.0, 6.0, 5.0, 12.0, 12.0, 14.0, 11.0, 23.0, 28.0, 22.0, 39.0, 45.0, 70.0, 89.0, 142.0, 271.0, 867.0, 6264.0, 608779.0, 3528227.0, 46135.0, 2098.0, 437.0, 208.0, 124.0, 80.0, 55.0, 44.0, 37.0, 27.0, 19.0, 15.0, 21.0, 12.0, 6.0, 4.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.984375, -29.025390625, -28.06640625, -27.107421875, -26.1484375, -25.189453125, -24.23046875, -23.271484375, -22.3125, -21.353515625, -20.39453125, -19.435546875, -18.4765625, -17.517578125, -16.55859375, -15.599609375, -14.640625, -13.681640625, -12.72265625, -11.763671875, -10.8046875, -9.845703125, -8.88671875, -7.927734375, -6.96875, -6.009765625, -5.05078125, -4.091796875, -3.1328125, -2.173828125, -1.21484375, -0.255859375, 0.703125, 1.662109375, 2.62109375, 3.580078125, 4.5390625, 5.498046875, 6.45703125, 7.416015625, 8.375, 9.333984375, 10.29296875, 11.251953125, 12.2109375, 13.169921875, 14.12890625, 15.087890625, 16.046875, 17.005859375, 17.96484375, 18.923828125, 19.8828125, 20.841796875, 21.80078125, 22.759765625, 23.71875, 24.677734375, 25.63671875, 26.595703125, 27.5546875, 28.513671875, 29.47265625, 30.431640625, 31.390625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 1.0, 5.0, 6.0, 3.0, 18.0, 18.0, 15.0, 18.0, 40.0, 45.0, 52.0, 71.0, 82.0, 117.0, 148.0, 204.0, 301.0, 377.0, 435.0, 457.0, 425.0, 286.0, 220.0, 159.0, 151.0, 81.0, 62.0, 56.0, 53.0, 30.0, 32.0, 29.0, 26.0, 13.0, 10.0, 5.0, 4.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.5595703125, -10.197265625, -9.8349609375, -9.47265625, -9.1103515625, -8.748046875, -8.3857421875, -8.0234375, -7.6611328125, -7.298828125, -6.9365234375, -6.57421875, -6.2119140625, -5.849609375, -5.4873046875, -5.125, -4.7626953125, -4.400390625, -4.0380859375, -3.67578125, -3.3134765625, -2.951171875, -2.5888671875, -2.2265625, -1.8642578125, -1.501953125, -1.1396484375, -0.77734375, -0.4150390625, -0.052734375, 0.3095703125, 0.671875, 1.0341796875, 1.396484375, 1.7587890625, 2.12109375, 2.4833984375, 2.845703125, 3.2080078125, 3.5703125, 3.9326171875, 4.294921875, 4.6572265625, 5.01953125, 5.3818359375, 5.744140625, 6.1064453125, 6.46875, 6.8310546875, 7.193359375, 7.5556640625, 7.91796875, 8.2802734375, 8.642578125, 9.0048828125, 9.3671875, 9.7294921875, 10.091796875, 10.4541015625, 10.81640625, 11.1787109375, 11.541015625, 11.9033203125, 12.265625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 8.0, 7.0, 11.0, 6.0, 14.0, 26.0, 31.0, 34.0, 38.0, 41.0, 72.0, 79.0, 108.0, 103.0, 154.0, 220.0, 292.0, 513.0, 1676.0, 371815.0, 3812629.0, 4359.0, 680.0, 325.0, 230.0, 172.0, 143.0, 109.0, 79.0, 56.0, 50.0, 35.0, 29.0, 33.0, 23.0, 17.0, 12.0, 16.0, 10.0, 11.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.6875, -70.4951171875, -68.302734375, -66.1103515625, -63.91796875, -61.7255859375, -59.533203125, -57.3408203125, -55.1484375, -52.9560546875, -50.763671875, -48.5712890625, -46.37890625, -44.1865234375, -41.994140625, -39.8017578125, -37.609375, -35.4169921875, -33.224609375, -31.0322265625, -28.83984375, -26.6474609375, -24.455078125, -22.2626953125, -20.0703125, -17.8779296875, -15.685546875, -13.4931640625, -11.30078125, -9.1083984375, -6.916015625, -4.7236328125, -2.53125, -0.3388671875, 1.853515625, 4.0458984375, 6.23828125, 8.4306640625, 10.623046875, 12.8154296875, 15.0078125, 17.2001953125, 19.392578125, 21.5849609375, 23.77734375, 25.9697265625, 28.162109375, 30.3544921875, 32.546875, 34.7392578125, 36.931640625, 39.1240234375, 41.31640625, 43.5087890625, 45.701171875, 47.8935546875, 50.0859375, 52.2783203125, 54.470703125, 56.6630859375, 58.85546875, 61.0478515625, 63.240234375, 65.4326171875, 67.625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 53.0, 248.0, 469.0, 201.0, 35.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.4053192138672, -172.65817260742188, -167.91104125976562, -163.1638946533203, -158.416748046875, -153.66961669921875, -148.92247009277344, -144.17532348632812, -139.42819213867188, -134.68104553222656, -129.9339141845703, -125.186767578125, -120.43962860107422, -115.69248962402344, -110.94534301757812, -106.19820404052734, -101.45106506347656, -96.70392608642578, -91.956787109375, -87.20964050292969, -82.4625015258789, -77.71536254882812, -72.96821594238281, -68.22107696533203, -63.47393798828125, -58.72679901123047, -53.97965621948242, -49.232513427734375, -44.485374450683594, -39.73823547363281, -34.991092681884766, -30.24394989013672, -25.496803283691406, -20.749662399291992, -16.002521514892578, -11.255380630493164, -6.50823974609375, -1.761098861694336, 2.986042022705078, 7.733184814453125, 12.480323791503906, 17.22746467590332, 21.974605560302734, 26.72174644470215, 31.468887329101562, 36.216026306152344, 40.96316909790039, 45.71031188964844, 50.45745086669922, 55.20458984375, 59.95173263549805, 64.6988754272461, 69.44601440429688, 74.19315338134766, 78.94029235839844, 83.68743896484375, 88.43457794189453, 93.18171691894531, 97.92886352539062, 102.6760025024414, 107.42314147949219, 112.17028045654297, 116.91741943359375, 121.66456604003906, 126.41170501708984]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 8.0, 5.0, 13.0, 8.0, 8.0, 16.0, 14.0, 30.0, 26.0, 26.0, 30.0, 26.0, 38.0, 35.0, 43.0, 34.0, 35.0, 37.0, 39.0, 40.0, 29.0, 42.0, 38.0, 38.0, 47.0, 37.0, 32.0, 33.0, 26.0, 21.0, 27.0, 19.0, 23.0, 17.0, 8.0, 6.0, 11.0, 5.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.82942199707031, -37.46269989013672, -36.095977783203125, -34.729251861572266, -33.36252975463867, -31.995807647705078, -30.629085540771484, -29.262361526489258, -27.89563751220703, -26.528915405273438, -25.16219139099121, -23.795469284057617, -22.42874526977539, -21.062023162841797, -19.695301055908203, -18.328577041625977, -16.961854934692383, -15.595131874084473, -14.228408813476562, -12.861686706542969, -11.494962692260742, -10.128240585327148, -8.761517524719238, -7.394794464111328, -6.028071403503418, -4.661348342895508, -3.2946255207061768, -1.9279026985168457, -0.5611796379089355, 0.8055434226989746, 2.1722660064697266, 3.5389890670776367, 4.905712127685547, 6.272435188293457, 7.639158248901367, 9.005880355834961, 10.372604370117188, 11.739326477050781, 13.106049537658691, 14.472772598266602, 15.839495658874512, 17.206218719482422, 18.572940826416016, 19.939664840698242, 21.306386947631836, 22.673110961914062, 24.039833068847656, 25.40655517578125, 26.773279190063477, 28.14000129699707, 29.506725311279297, 30.87344741821289, 32.240169525146484, 33.606895446777344, 34.97361755371094, 36.34033966064453, 37.707061767578125, 39.07378387451172, 40.44050598144531, 41.80723190307617, 43.173954010009766, 44.54067611694336, 45.90739822387695, 47.27412414550781, 48.640846252441406]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 8.0, 5.0, 11.0, 4.0, 8.0, 6.0, 21.0, 28.0, 12.0, 32.0, 21.0, 22.0, 38.0, 45.0, 31.0, 31.0, 48.0, 48.0, 49.0, 51.0, 38.0, 47.0, 31.0, 32.0, 33.0, 40.0, 32.0, 29.0, 44.0, 23.0, 18.0, 16.0, 22.0, 12.0, 10.0, 8.0, 13.0, 13.0, 6.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.28125, -7.0531005859375, -6.824951171875, -6.5968017578125, -6.36865234375, -6.1405029296875, -5.912353515625, -5.6842041015625, -5.4560546875, -5.2279052734375, -4.999755859375, -4.7716064453125, -4.54345703125, -4.3153076171875, -4.087158203125, -3.8590087890625, -3.630859375, -3.4027099609375, -3.174560546875, -2.9464111328125, -2.71826171875, -2.4901123046875, -2.261962890625, -2.0338134765625, -1.8056640625, -1.5775146484375, -1.349365234375, -1.1212158203125, -0.89306640625, -0.6649169921875, -0.436767578125, -0.2086181640625, 0.01953125, 0.2476806640625, 0.475830078125, 0.7039794921875, 0.93212890625, 1.1602783203125, 1.388427734375, 1.6165771484375, 1.8447265625, 2.0728759765625, 2.301025390625, 2.5291748046875, 2.75732421875, 2.9854736328125, 3.213623046875, 3.4417724609375, 3.669921875, 3.8980712890625, 4.126220703125, 4.3543701171875, 4.58251953125, 4.8106689453125, 5.038818359375, 5.2669677734375, 5.4951171875, 5.7232666015625, 5.951416015625, 6.1795654296875, 6.40771484375, 6.6358642578125, 6.864013671875, 7.0921630859375, 7.3203125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 4.0, 9.0, 12.0, 22.0, 16.0, 32.0, 44.0, 47.0, 93.0, 100.0, 150.0, 230.0, 315.0, 422.0, 601.0, 844.0, 1214.0, 1695.0, 2423.0, 3643.0, 5186.0, 7696.0, 11722.0, 17630.0, 27165.0, 42485.0, 68527.0, 124143.0, 328488.0, 173264.0, 83853.0, 50858.0, 32248.0, 20919.0, 13559.0, 9068.0, 6082.0, 4300.0, 2835.0, 1855.0, 1384.0, 1021.0, 691.0, 437.0, 370.0, 238.0, 179.0, 137.0, 81.0, 64.0, 51.0, 24.0, 40.0, 10.0, 12.0, 14.0, 3.0, 7.0, 1.0, 2.0, 2.0], "bins": [-1.3564453125, -1.3136444091796875, -1.270843505859375, -1.2280426025390625, -1.18524169921875, -1.1424407958984375, -1.099639892578125, -1.0568389892578125, -1.0140380859375, -0.9712371826171875, -0.928436279296875, -0.8856353759765625, -0.84283447265625, -0.8000335693359375, -0.757232666015625, -0.7144317626953125, -0.671630859375, -0.6288299560546875, -0.586029052734375, -0.5432281494140625, -0.50042724609375, -0.4576263427734375, -0.414825439453125, -0.3720245361328125, -0.3292236328125, -0.2864227294921875, -0.243621826171875, -0.2008209228515625, -0.15802001953125, -0.1152191162109375, -0.072418212890625, -0.0296173095703125, 0.01318359375, 0.0559844970703125, 0.098785400390625, 0.1415863037109375, 0.18438720703125, 0.2271881103515625, 0.269989013671875, 0.3127899169921875, 0.3555908203125, 0.3983917236328125, 0.441192626953125, 0.4839935302734375, 0.52679443359375, 0.5695953369140625, 0.612396240234375, 0.6551971435546875, 0.697998046875, 0.7407989501953125, 0.783599853515625, 0.8264007568359375, 0.86920166015625, 0.9120025634765625, 0.954803466796875, 0.9976043701171875, 1.0404052734375, 1.0832061767578125, 1.126007080078125, 1.1688079833984375, 1.21160888671875, 1.2544097900390625, 1.297210693359375, 1.3400115966796875, 1.3828125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 10.0, 11.0, 13.0, 19.0, 24.0, 14.0, 28.0, 24.0, 25.0, 31.0, 22.0, 31.0, 40.0, 37.0, 35.0, 31.0, 33.0, 1057.0, 39.0, 39.0, 36.0, 33.0, 48.0, 37.0, 36.0, 28.0, 31.0, 23.0, 16.0, 23.0, 19.0, 18.0, 12.0, 13.0, 5.0, 15.0, 6.0, 4.0, 9.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.39453125, -4.25640869140625, -4.1182861328125, -3.98016357421875, -3.842041015625, -3.70391845703125, -3.5657958984375, -3.42767333984375, -3.28955078125, -3.15142822265625, -3.0133056640625, -2.87518310546875, -2.737060546875, -2.59893798828125, -2.4608154296875, -2.32269287109375, -2.1845703125, -2.04644775390625, -1.9083251953125, -1.77020263671875, -1.632080078125, -1.49395751953125, -1.3558349609375, -1.21771240234375, -1.07958984375, -0.94146728515625, -0.8033447265625, -0.66522216796875, -0.527099609375, -0.38897705078125, -0.2508544921875, -0.11273193359375, 0.025390625, 0.16351318359375, 0.3016357421875, 0.43975830078125, 0.577880859375, 0.71600341796875, 0.8541259765625, 0.99224853515625, 1.13037109375, 1.26849365234375, 1.4066162109375, 1.54473876953125, 1.682861328125, 1.82098388671875, 1.9591064453125, 2.09722900390625, 2.2353515625, 2.37347412109375, 2.5115966796875, 2.64971923828125, 2.787841796875, 2.92596435546875, 3.0640869140625, 3.20220947265625, 3.34033203125, 3.47845458984375, 3.6165771484375, 3.75469970703125, 3.892822265625, 4.03094482421875, 4.1690673828125, 4.30718994140625, 4.4453125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 17.0, 24.0, 31.0, 39.0, 51.0, 92.0, 130.0, 184.0, 278.0, 402.0, 605.0, 930.0, 1398.0, 2111.0, 3324.0, 5051.0, 7860.0, 12247.0, 19402.0, 31142.0, 52634.0, 97844.0, 235411.0, 1357159.0, 113851.0, 60608.0, 34647.0, 21339.0, 13588.0, 8570.0, 5515.0, 3616.0, 2371.0, 1569.0, 1038.0, 665.0, 448.0, 330.0, 180.0, 134.0, 84.0, 66.0, 39.0, 31.0, 19.0, 20.0, 12.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.5498046875, -1.5015411376953125, -1.453277587890625, -1.4050140380859375, -1.35675048828125, -1.3084869384765625, -1.260223388671875, -1.2119598388671875, -1.1636962890625, -1.1154327392578125, -1.067169189453125, -1.0189056396484375, -0.97064208984375, -0.9223785400390625, -0.874114990234375, -0.8258514404296875, -0.777587890625, -0.7293243408203125, -0.681060791015625, -0.6327972412109375, -0.58453369140625, -0.5362701416015625, -0.488006591796875, -0.4397430419921875, -0.3914794921875, -0.3432159423828125, -0.294952392578125, -0.2466888427734375, -0.19842529296875, -0.1501617431640625, -0.101898193359375, -0.0536346435546875, -0.00537109375, 0.0428924560546875, 0.091156005859375, 0.1394195556640625, 0.18768310546875, 0.2359466552734375, 0.284210205078125, 0.3324737548828125, 0.3807373046875, 0.4290008544921875, 0.477264404296875, 0.5255279541015625, 0.57379150390625, 0.6220550537109375, 0.670318603515625, 0.7185821533203125, 0.766845703125, 0.8151092529296875, 0.863372802734375, 0.9116363525390625, 0.95989990234375, 1.0081634521484375, 1.056427001953125, 1.1046905517578125, 1.1529541015625, 1.2012176513671875, 1.249481201171875, 1.2977447509765625, 1.34600830078125, 1.3942718505859375, 1.442535400390625, 1.4907989501953125, 1.5390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 12.0, 10.0, 16.0, 15.0, 15.0, 25.0, 27.0, 28.0, 20.0, 38.0, 47.0, 51.0, 45.0, 73.0, 56.0, 55.0, 66.0, 46.0, 39.0, 52.0, 37.0, 36.0, 27.0, 19.0, 16.0, 14.0, 18.0, 7.0, 12.0, 10.0, 10.0, 8.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008997917175292969, -0.0008718818426132202, -0.0008439719676971436, -0.0008160620927810669, -0.0007881522178649902, -0.0007602423429489136, -0.0007323324680328369, -0.0007044225931167603, -0.0006765127182006836, -0.0006486028432846069, -0.0006206929683685303, -0.0005927830934524536, -0.000564873218536377, -0.0005369633436203003, -0.0005090534687042236, -0.00048114359378814697, -0.0004532337188720703, -0.00042532384395599365, -0.000397413969039917, -0.00036950409412384033, -0.00034159421920776367, -0.000313684344291687, -0.00028577446937561035, -0.0002578645944595337, -0.00022995471954345703, -0.00020204484462738037, -0.0001741349697113037, -0.00014622509479522705, -0.00011831521987915039, -9.040534496307373e-05, -6.249547004699707e-05, -3.458559513092041e-05, -6.67572021484375e-06, 2.123415470123291e-05, 4.914402961730957e-05, 7.705390453338623e-05, 0.00010496377944946289, 0.00013287365436553955, 0.0001607835292816162, 0.00018869340419769287, 0.00021660327911376953, 0.0002445131540298462, 0.00027242302894592285, 0.0003003329038619995, 0.00032824277877807617, 0.00035615265369415283, 0.0003840625286102295, 0.00041197240352630615, 0.0004398822784423828, 0.00046779215335845947, 0.0004957020282745361, 0.0005236119031906128, 0.0005515217781066895, 0.0005794316530227661, 0.0006073415279388428, 0.0006352514028549194, 0.0006631612777709961, 0.0006910711526870728, 0.0007189810276031494, 0.0007468909025192261, 0.0007748007774353027, 0.0008027106523513794, 0.0008306205272674561, 0.0008585304021835327, 0.0008864402770996094]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 10.0, 13.0, 8.0, 14.0, 13.0, 24.0, 21.0, 27.0, 36.0, 58.0, 78.0, 91.0, 119.0, 275.0, 640.0, 4730.0, 1037670.0, 3244.0, 597.0, 260.0, 134.0, 84.0, 88.0, 62.0, 39.0, 39.0, 27.0, 14.0, 22.0, 12.0, 20.0, 14.0, 8.0, 9.0, 7.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.020294189453125, -0.019649267196655273, -0.019004344940185547, -0.01835942268371582, -0.017714500427246094, -0.017069578170776367, -0.01642465591430664, -0.015779733657836914, -0.015134811401367188, -0.014489889144897461, -0.013844966888427734, -0.013200044631958008, -0.012555122375488281, -0.011910200119018555, -0.011265277862548828, -0.010620355606079102, -0.009975433349609375, -0.009330511093139648, -0.008685588836669922, -0.008040666580200195, -0.007395744323730469, -0.006750822067260742, -0.006105899810791016, -0.005460977554321289, -0.0048160552978515625, -0.004171133041381836, -0.0035262107849121094, -0.002881288528442383, -0.0022363662719726562, -0.0015914440155029297, -0.0009465217590332031, -0.00030159950256347656, 0.00034332275390625, 0.0009882450103759766, 0.0016331672668457031, 0.0022780895233154297, 0.0029230117797851562, 0.003567934036254883, 0.004212856292724609, 0.004857778549194336, 0.0055027008056640625, 0.006147623062133789, 0.006792545318603516, 0.007437467575073242, 0.008082389831542969, 0.008727312088012695, 0.009372234344482422, 0.010017156600952148, 0.010662078857421875, 0.011307001113891602, 0.011951923370361328, 0.012596845626831055, 0.013241767883300781, 0.013886690139770508, 0.014531612396240234, 0.015176534652709961, 0.015821456909179688, 0.016466379165649414, 0.01711130142211914, 0.017756223678588867, 0.018401145935058594, 0.01904606819152832, 0.019690990447998047, 0.020335912704467773, 0.0209808349609375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 20.0, 60.0, 111.0, 216.0, 260.0, 185.0, 88.0, 42.0, 13.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011449595913290977, -0.0011178526328876615, -0.0010907455580309033, -0.001063638599589467, -0.001036531524732709, -0.0010094245662912726, -0.0009823176078498363, -0.0009552105912007391, -0.0009281035745516419, -0.0009009965579025447, -0.0008738895412534475, -0.0008467825828120112, -0.000819675566162914, -0.0007925685495138168, -0.0007654615910723805, -0.0007383545744232833, -0.0007112475577741861, -0.0006841405411250889, -0.0006570335244759917, -0.0006299265660345554, -0.0006028195493854582, -0.000575712532736361, -0.0005486055742949247, -0.0005214985576458275, -0.0004943915409967303, -0.0004672845243476331, -0.0004401775368023664, -0.00041307054925709963, -0.0003859635326080024, -0.0003588565159589052, -0.00033174952841363847, -0.0003046425408683717, -0.00027753558242693543, -0.00025042856577783823, -0.00022332157823257148, -0.0001962145761353895, -0.00016910757403820753, -0.00014200057194102556, -0.00011489356984384358, -8.77865677466616e-05, -6.067956564947963e-05, -3.357256355229765e-05, -6.465561455115676e-06, 2.06414406420663e-05, 4.7748442739248276e-05, 7.485544483643025e-05, 0.00010196244693361223, 0.0001290694490307942, 0.00015617645112797618, 0.00018328345322515815, 0.00021039045532234013, 0.0002374974574195221, 0.0002646044595167041, 0.0002917114761658013, 0.00031881846371106803, 0.0003459254512563348, 0.000373032467905432, 0.0004001394845545292, 0.00042724647209979594, 0.0004543534596450627, 0.0004814604762941599, 0.0005085674929432571, 0.0005356745095923543, 0.0005627814680337906, 0.0005898884846828878]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 10.0, 4.0, 11.0, 6.0, 8.0, 8.0, 18.0, 19.0, 14.0, 17.0, 23.0, 28.0, 27.0, 31.0, 27.0, 31.0, 25.0, 23.0, 37.0, 28.0, 43.0, 34.0, 34.0, 33.0, 41.0, 33.0, 29.0, 37.0, 26.0, 30.0, 27.0, 27.0, 19.0, 25.0, 25.0, 27.0, 19.0, 22.0, 15.0, 7.0, 11.0, 6.0, 9.0, 7.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0004203319549560547, -0.000406801700592041, -0.00039327144622802734, -0.00037974119186401367, -0.0003662109375, -0.00035268068313598633, -0.00033915042877197266, -0.000325620174407959, -0.0003120899200439453, -0.00029855966567993164, -0.00028502941131591797, -0.0002714991569519043, -0.0002579689025878906, -0.00024443864822387695, -0.00023090839385986328, -0.0002173781394958496, -0.00020384788513183594, -0.00019031763076782227, -0.0001767873764038086, -0.00016325712203979492, -0.00014972686767578125, -0.00013619661331176758, -0.0001226663589477539, -0.00010913610458374023, -9.560585021972656e-05, -8.207559585571289e-05, -6.854534149169922e-05, -5.501508712768555e-05, -4.1484832763671875e-05, -2.7954578399658203e-05, -1.4424324035644531e-05, -8.940696716308594e-07, 1.2636184692382812e-05, 2.6166439056396484e-05, 3.9696693420410156e-05, 5.322694778442383e-05, 6.67572021484375e-05, 8.028745651245117e-05, 9.381771087646484e-05, 0.00010734796524047852, 0.00012087821960449219, 0.00013440847396850586, 0.00014793872833251953, 0.0001614689826965332, 0.00017499923706054688, 0.00018852949142456055, 0.00020205974578857422, 0.0002155900001525879, 0.00022912025451660156, 0.00024265050888061523, 0.0002561807632446289, 0.0002697110176086426, 0.00028324127197265625, 0.0002967715263366699, 0.0003103017807006836, 0.00032383203506469727, 0.00033736228942871094, 0.0003508925437927246, 0.0003644227981567383, 0.00037795305252075195, 0.0003914833068847656, 0.0004050135612487793, 0.00041854381561279297, 0.00043207406997680664, 0.0004456043243408203]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 8.0, 5.0, 11.0, 4.0, 8.0, 6.0, 21.0, 28.0, 12.0, 32.0, 21.0, 22.0, 38.0, 45.0, 31.0, 31.0, 48.0, 48.0, 49.0, 51.0, 38.0, 47.0, 31.0, 32.0, 33.0, 40.0, 32.0, 29.0, 44.0, 23.0, 18.0, 16.0, 22.0, 12.0, 10.0, 8.0, 13.0, 13.0, 6.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.28125, -7.0531005859375, -6.824951171875, -6.5968017578125, -6.36865234375, -6.1405029296875, -5.912353515625, -5.6842041015625, -5.4560546875, -5.2279052734375, -4.999755859375, -4.7716064453125, -4.54345703125, -4.3153076171875, -4.087158203125, -3.8590087890625, -3.630859375, -3.4027099609375, -3.174560546875, -2.9464111328125, -2.71826171875, -2.4901123046875, -2.261962890625, -2.0338134765625, -1.8056640625, -1.5775146484375, -1.349365234375, -1.1212158203125, -0.89306640625, -0.6649169921875, -0.436767578125, -0.2086181640625, 0.01953125, 0.2476806640625, 0.475830078125, 0.7039794921875, 0.93212890625, 1.1602783203125, 1.388427734375, 1.6165771484375, 1.8447265625, 2.0728759765625, 2.301025390625, 2.5291748046875, 2.75732421875, 2.9854736328125, 3.213623046875, 3.4417724609375, 3.669921875, 3.8980712890625, 4.126220703125, 4.3543701171875, 4.58251953125, 4.8106689453125, 5.038818359375, 5.2669677734375, 5.4951171875, 5.7232666015625, 5.951416015625, 6.1795654296875, 6.40771484375, 6.6358642578125, 6.864013671875, 7.0921630859375, 7.3203125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 11.0, 10.0, 7.0, 12.0, 17.0, 22.0, 39.0, 29.0, 63.0, 52.0, 86.0, 116.0, 201.0, 295.0, 495.0, 1195.0, 4714.0, 37476.0, 562974.0, 406326.0, 28084.0, 3889.0, 1031.0, 452.0, 277.0, 186.0, 122.0, 98.0, 59.0, 49.0, 24.0, 39.0, 20.0, 11.0, 14.0, 12.0, 16.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.265625, -13.8189697265625, -13.372314453125, -12.9256591796875, -12.47900390625, -12.0323486328125, -11.585693359375, -11.1390380859375, -10.6923828125, -10.2457275390625, -9.799072265625, -9.3524169921875, -8.90576171875, -8.4591064453125, -8.012451171875, -7.5657958984375, -7.119140625, -6.6724853515625, -6.225830078125, -5.7791748046875, -5.33251953125, -4.8858642578125, -4.439208984375, -3.9925537109375, -3.5458984375, -3.0992431640625, -2.652587890625, -2.2059326171875, -1.75927734375, -1.3126220703125, -0.865966796875, -0.4193115234375, 0.02734375, 0.4739990234375, 0.920654296875, 1.3673095703125, 1.81396484375, 2.2606201171875, 2.707275390625, 3.1539306640625, 3.6005859375, 4.0472412109375, 4.493896484375, 4.9405517578125, 5.38720703125, 5.8338623046875, 6.280517578125, 6.7271728515625, 7.173828125, 7.6204833984375, 8.067138671875, 8.5137939453125, 8.96044921875, 9.4071044921875, 9.853759765625, 10.3004150390625, 10.7470703125, 11.1937255859375, 11.640380859375, 12.0870361328125, 12.53369140625, 12.9803466796875, 13.427001953125, 13.8736572265625, 14.3203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 11.0, 11.0, 13.0, 17.0, 16.0, 24.0, 27.0, 21.0, 31.0, 42.0, 50.0, 52.0, 76.0, 99.0, 416.0, 1563.0, 130.0, 73.0, 53.0, 45.0, 43.0, 42.0, 27.0, 30.0, 23.0, 22.0, 20.0, 17.0, 15.0, 8.0, 7.0, 8.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.65625, -26.820556640625, -25.98486328125, -25.149169921875, -24.3134765625, -23.477783203125, -22.64208984375, -21.806396484375, -20.970703125, -20.135009765625, -19.29931640625, -18.463623046875, -17.6279296875, -16.792236328125, -15.95654296875, -15.120849609375, -14.28515625, -13.449462890625, -12.61376953125, -11.778076171875, -10.9423828125, -10.106689453125, -9.27099609375, -8.435302734375, -7.599609375, -6.763916015625, -5.92822265625, -5.092529296875, -4.2568359375, -3.421142578125, -2.58544921875, -1.749755859375, -0.9140625, -0.078369140625, 0.75732421875, 1.593017578125, 2.4287109375, 3.264404296875, 4.10009765625, 4.935791015625, 5.771484375, 6.607177734375, 7.44287109375, 8.278564453125, 9.1142578125, 9.949951171875, 10.78564453125, 11.621337890625, 12.45703125, 13.292724609375, 14.12841796875, 14.964111328125, 15.7998046875, 16.635498046875, 17.47119140625, 18.306884765625, 19.142578125, 19.978271484375, 20.81396484375, 21.649658203125, 22.4853515625, 23.321044921875, 24.15673828125, 24.992431640625, 25.828125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 7.0, 8.0, 7.0, 8.0, 9.0, 26.0, 23.0, 27.0, 29.0, 35.0, 57.0, 69.0, 110.0, 147.0, 277.0, 786.0, 4611.0, 3043941.0, 92592.0, 1775.0, 476.0, 207.0, 144.0, 92.0, 50.0, 45.0, 28.0, 29.0, 21.0, 18.0, 15.0, 12.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.4375, -56.5400390625, -54.642578125, -52.7451171875, -50.84765625, -48.9501953125, -47.052734375, -45.1552734375, -43.2578125, -41.3603515625, -39.462890625, -37.5654296875, -35.66796875, -33.7705078125, -31.873046875, -29.9755859375, -28.078125, -26.1806640625, -24.283203125, -22.3857421875, -20.48828125, -18.5908203125, -16.693359375, -14.7958984375, -12.8984375, -11.0009765625, -9.103515625, -7.2060546875, -5.30859375, -3.4111328125, -1.513671875, 0.3837890625, 2.28125, 4.1787109375, 6.076171875, 7.9736328125, 9.87109375, 11.7685546875, 13.666015625, 15.5634765625, 17.4609375, 19.3583984375, 21.255859375, 23.1533203125, 25.05078125, 26.9482421875, 28.845703125, 30.7431640625, 32.640625, 34.5380859375, 36.435546875, 38.3330078125, 40.23046875, 42.1279296875, 44.025390625, 45.9228515625, 47.8203125, 49.7177734375, 51.615234375, 53.5126953125, 55.41015625, 57.3076171875, 59.205078125, 61.1025390625, 63.0]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 82.0, 919.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-532.5193481445312, -522.8936767578125, -513.2680053710938, -503.642333984375, -494.01666259765625, -484.3909912109375, -474.76531982421875, -465.1396179199219, -455.5139465332031, -445.8882751464844, -436.2626037597656, -426.6369323730469, -417.0112609863281, -407.38555908203125, -397.7598876953125, -388.13421630859375, -378.508544921875, -368.88287353515625, -359.2572021484375, -349.63153076171875, -340.005859375, -330.38018798828125, -320.7545166015625, -311.1288146972656, -301.503173828125, -291.87750244140625, -282.2518310546875, -272.62615966796875, -263.00048828125, -253.3748016357422, -243.74913024902344, -234.12344360351562, -224.49778747558594, -214.8721160888672, -205.24644470214844, -195.62075805664062, -185.99508666992188, -176.36941528320312, -166.74374389648438, -157.11807250976562, -147.49240112304688, -137.86672973632812, -128.24105834960938, -118.6153793334961, -108.98970031738281, -99.36402893066406, -89.73835754394531, -80.11267852783203, -70.48699951171875, -60.861324310302734, -51.23564910888672, -41.60997772216797, -31.984302520751953, -22.358627319335938, -12.732955932617188, -3.1072769165039062, 6.518394470214844, 16.14406967163086, 25.769742965698242, 35.395416259765625, 45.02109146118164, 54.646766662597656, 64.2724380493164, 73.89811706542969, 83.52378845214844]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 7.0, 1.0, 4.0, 7.0, 8.0, 7.0, 10.0, 8.0, 12.0, 16.0, 17.0, 22.0, 22.0, 27.0, 24.0, 39.0, 36.0, 39.0, 31.0, 43.0, 36.0, 35.0, 44.0, 31.0, 45.0, 47.0, 32.0, 34.0, 33.0, 32.0, 29.0, 25.0, 24.0, 25.0, 22.0, 21.0, 20.0, 13.0, 12.0, 16.0, 16.0, 4.0, 7.0, 6.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0], "bins": [-61.86175537109375, -60.15438461303711, -58.44701385498047, -56.73964309692383, -55.03227233886719, -53.32490158081055, -51.617530822753906, -49.91015625, -48.202789306640625, -46.495418548583984, -44.788047790527344, -43.0806770324707, -41.37330627441406, -39.66593551635742, -37.95856475830078, -36.251190185546875, -34.543819427490234, -32.836448669433594, -31.129077911376953, -29.421707153320312, -27.714336395263672, -26.00696563720703, -24.299592971801758, -22.592222213745117, -20.884851455688477, -19.177480697631836, -17.470109939575195, -15.762738227844238, -14.055367469787598, -12.347996711730957, -10.640625, -8.93325424194336, -7.225879669189453, -5.5185089111328125, -3.8111376762390137, -2.103766441345215, -0.3963956832885742, 1.3109750747680664, 3.0183467864990234, 4.725717544555664, 6.433088302612305, 8.140459060668945, 9.847829818725586, 11.555201530456543, 13.262572288513184, 14.969943046569824, 16.67731475830078, 18.384685516357422, 20.092056274414062, 21.799427032470703, 23.506797790527344, 25.214168548583984, 26.921539306640625, 28.628910064697266, 30.33628273010254, 32.04365539550781, 33.75102233886719, 35.45839309692383, 37.16576385498047, 38.87313461303711, 40.58050537109375, 42.28787612915039, 43.99524688720703, 45.70262145996094, 47.40999221801758]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 8.0, 12.0, 16.0, 18.0, 19.0, 23.0, 21.0, 27.0, 26.0, 34.0, 38.0, 46.0, 53.0, 42.0, 47.0, 40.0, 41.0, 47.0, 51.0, 28.0, 33.0, 38.0, 35.0, 31.0, 26.0, 31.0, 26.0, 26.0, 16.0, 15.0, 16.0, 10.0, 7.0, 5.0, 2.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.66796875, -7.42266845703125, -7.1773681640625, -6.93206787109375, -6.686767578125, -6.44146728515625, -6.1961669921875, -5.95086669921875, -5.70556640625, -5.46026611328125, -5.2149658203125, -4.96966552734375, -4.724365234375, -4.47906494140625, -4.2337646484375, -3.98846435546875, -3.7431640625, -3.49786376953125, -3.2525634765625, -3.00726318359375, -2.761962890625, -2.51666259765625, -2.2713623046875, -2.02606201171875, -1.78076171875, -1.53546142578125, -1.2901611328125, -1.04486083984375, -0.799560546875, -0.55426025390625, -0.3089599609375, -0.06365966796875, 0.181640625, 0.42694091796875, 0.6722412109375, 0.91754150390625, 1.162841796875, 1.40814208984375, 1.6534423828125, 1.89874267578125, 2.14404296875, 2.38934326171875, 2.6346435546875, 2.87994384765625, 3.125244140625, 3.37054443359375, 3.6158447265625, 3.86114501953125, 4.1064453125, 4.35174560546875, 4.5970458984375, 4.84234619140625, 5.087646484375, 5.33294677734375, 5.5782470703125, 5.82354736328125, 6.06884765625, 6.31414794921875, 6.5594482421875, 6.80474853515625, 7.050048828125, 7.29534912109375, 7.5406494140625, 7.78594970703125, 8.03125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 9.0, 11.0, 10.0, 17.0, 15.0, 16.0, 27.0, 28.0, 43.0, 46.0, 82.0, 133.0, 193.0, 317.0, 636.0, 2643.0, 30588.0, 1420687.0, 2652894.0, 79566.0, 4385.0, 862.0, 337.0, 196.0, 145.0, 83.0, 64.0, 47.0, 36.0, 37.0, 20.0, 18.0, 13.0, 17.0, 4.0, 7.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.25, -23.51806640625, -22.7861328125, -22.05419921875, -21.322265625, -20.59033203125, -19.8583984375, -19.12646484375, -18.39453125, -17.66259765625, -16.9306640625, -16.19873046875, -15.466796875, -14.73486328125, -14.0029296875, -13.27099609375, -12.5390625, -11.80712890625, -11.0751953125, -10.34326171875, -9.611328125, -8.87939453125, -8.1474609375, -7.41552734375, -6.68359375, -5.95166015625, -5.2197265625, -4.48779296875, -3.755859375, -3.02392578125, -2.2919921875, -1.56005859375, -0.828125, -0.09619140625, 0.6357421875, 1.36767578125, 2.099609375, 2.83154296875, 3.5634765625, 4.29541015625, 5.02734375, 5.75927734375, 6.4912109375, 7.22314453125, 7.955078125, 8.68701171875, 9.4189453125, 10.15087890625, 10.8828125, 11.61474609375, 12.3466796875, 13.07861328125, 13.810546875, 14.54248046875, 15.2744140625, 16.00634765625, 16.73828125, 17.47021484375, 18.2021484375, 18.93408203125, 19.666015625, 20.39794921875, 21.1298828125, 21.86181640625, 22.59375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 17.0, 21.0, 26.0, 53.0, 70.0, 88.0, 176.0, 213.0, 312.0, 510.0, 671.0, 605.0, 462.0, 301.0, 211.0, 99.0, 82.0, 58.0, 32.0, 17.0, 13.0, 10.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.15625, -16.599609375, -16.04296875, -15.486328125, -14.9296875, -14.373046875, -13.81640625, -13.259765625, -12.703125, -12.146484375, -11.58984375, -11.033203125, -10.4765625, -9.919921875, -9.36328125, -8.806640625, -8.25, -7.693359375, -7.13671875, -6.580078125, -6.0234375, -5.466796875, -4.91015625, -4.353515625, -3.796875, -3.240234375, -2.68359375, -2.126953125, -1.5703125, -1.013671875, -0.45703125, 0.099609375, 0.65625, 1.212890625, 1.76953125, 2.326171875, 2.8828125, 3.439453125, 3.99609375, 4.552734375, 5.109375, 5.666015625, 6.22265625, 6.779296875, 7.3359375, 7.892578125, 8.44921875, 9.005859375, 9.5625, 10.119140625, 10.67578125, 11.232421875, 11.7890625, 12.345703125, 12.90234375, 13.458984375, 14.015625, 14.572265625, 15.12890625, 15.685546875, 16.2421875, 16.798828125, 17.35546875, 17.912109375, 18.46875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 1.0, 4.0, 6.0, 10.0, 12.0, 22.0, 16.0, 28.0, 38.0, 40.0, 58.0, 73.0, 86.0, 148.0, 189.0, 265.0, 563.0, 1671.0, 29753.0, 4116447.0, 41320.0, 1839.0, 604.0, 289.0, 203.0, 134.0, 101.0, 72.0, 57.0, 68.0, 41.0, 27.0, 15.0, 17.0, 13.0, 17.0, 7.0, 4.0, 3.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.4375, -57.4248046875, -55.412109375, -53.3994140625, -51.38671875, -49.3740234375, -47.361328125, -45.3486328125, -43.3359375, -41.3232421875, -39.310546875, -37.2978515625, -35.28515625, -33.2724609375, -31.259765625, -29.2470703125, -27.234375, -25.2216796875, -23.208984375, -21.1962890625, -19.18359375, -17.1708984375, -15.158203125, -13.1455078125, -11.1328125, -9.1201171875, -7.107421875, -5.0947265625, -3.08203125, -1.0693359375, 0.943359375, 2.9560546875, 4.96875, 6.9814453125, 8.994140625, 11.0068359375, 13.01953125, 15.0322265625, 17.044921875, 19.0576171875, 21.0703125, 23.0830078125, 25.095703125, 27.1083984375, 29.12109375, 31.1337890625, 33.146484375, 35.1591796875, 37.171875, 39.1845703125, 41.197265625, 43.2099609375, 45.22265625, 47.2353515625, 49.248046875, 51.2607421875, 53.2734375, 55.2861328125, 57.298828125, 59.3115234375, 61.32421875, 63.3369140625, 65.349609375, 67.3623046875, 69.375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 36.0, 166.0, 423.0, 301.0, 70.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.69789123535156, -157.4183349609375, -153.13877868652344, -148.85922241210938, -144.57965087890625, -140.3000946044922, -136.02053833007812, -131.74098205566406, -127.46142578125, -123.18186950683594, -118.90230560302734, -114.62274932861328, -110.34319305419922, -106.06362915039062, -101.78407287597656, -97.5045166015625, -93.2249526977539, -88.94539642333984, -84.66583251953125, -80.38627624511719, -76.10671997070312, -71.82716369628906, -67.54759979248047, -63.268043518066406, -58.98848342895508, -54.70892333984375, -50.42936706542969, -46.14980697631836, -41.87024688720703, -37.59069061279297, -33.31113052368164, -29.031572341918945, -24.75200653076172, -20.472448348999023, -16.192890167236328, -11.913330078125, -7.633771896362305, -3.3542137145996094, 0.9253463745117188, 5.204904556274414, 9.48446273803711, 13.764020919799805, 18.0435791015625, 22.323139190673828, 26.602697372436523, 30.88225555419922, 35.16181564331055, 39.441375732421875, 43.72093200683594, 48.000492095947266, 52.28004837036133, 56.559608459472656, 60.83916473388672, 65.11872863769531, 69.39828491210938, 73.67784118652344, 77.9573974609375, 82.23695373535156, 86.51651763916016, 90.79607391357422, 95.07563018798828, 99.35519409179688, 103.63475036621094, 107.914306640625, 112.1938705444336]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 7.0, 13.0, 10.0, 6.0, 8.0, 19.0, 18.0, 17.0, 26.0, 28.0, 27.0, 27.0, 25.0, 33.0, 30.0, 39.0, 40.0, 53.0, 36.0, 32.0, 36.0, 46.0, 36.0, 34.0, 33.0, 35.0, 31.0, 34.0, 28.0, 22.0, 30.0, 21.0, 17.0, 14.0, 17.0, 7.0, 14.0, 11.0, 9.0, 3.0, 6.0, 4.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.12879180908203, -39.9195442199707, -38.710296630859375, -37.50104904174805, -36.29180145263672, -35.08255386352539, -33.87330627441406, -32.664058685302734, -31.454811096191406, -30.245563507080078, -29.03631591796875, -27.827068328857422, -26.617820739746094, -25.408573150634766, -24.199325561523438, -22.99007797241211, -21.780832290649414, -20.571584701538086, -19.362337112426758, -18.15308952331543, -16.9438419342041, -15.734594345092773, -14.525347709655762, -13.316100120544434, -12.106852531433105, -10.897604942321777, -9.68835735321045, -8.479110717773438, -7.269862651824951, -6.060615062713623, -4.851367950439453, -3.642120361328125, -2.432872772216797, -1.2236253023147583, -0.014377832412719727, 1.1948695182800293, 2.4041171073913574, 3.6133646965026855, 4.8226118087768555, 6.031859397888184, 7.241106986999512, 8.45035457611084, 9.659602165222168, 10.86884880065918, 12.078096389770508, 13.287343978881836, 14.496591567993164, 15.705839157104492, 16.91508674621582, 18.12433433532715, 19.333581924438477, 20.542829513549805, 21.752077102661133, 22.96132469177246, 24.170570373535156, 25.379817962646484, 26.589065551757812, 27.79831314086914, 29.00756072998047, 30.216808319091797, 31.426055908203125, 32.63530349731445, 33.84455108642578, 35.05379867553711, 36.26304626464844]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 9.0, 14.0, 13.0, 27.0, 18.0, 24.0, 25.0, 34.0, 28.0, 28.0, 38.0, 41.0, 39.0, 53.0, 53.0, 38.0, 42.0, 52.0, 49.0, 52.0, 23.0, 36.0, 29.0, 33.0, 32.0, 20.0, 27.0, 15.0, 18.0, 12.0, 12.0, 10.0, 14.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.1729736328125, -7.916259765625, -7.6595458984375, -7.40283203125, -7.1461181640625, -6.889404296875, -6.6326904296875, -6.3759765625, -6.1192626953125, -5.862548828125, -5.6058349609375, -5.34912109375, -5.0924072265625, -4.835693359375, -4.5789794921875, -4.322265625, -4.0655517578125, -3.808837890625, -3.5521240234375, -3.29541015625, -3.0386962890625, -2.781982421875, -2.5252685546875, -2.2685546875, -2.0118408203125, -1.755126953125, -1.4984130859375, -1.24169921875, -0.9849853515625, -0.728271484375, -0.4715576171875, -0.21484375, 0.0418701171875, 0.298583984375, 0.5552978515625, 0.81201171875, 1.0687255859375, 1.325439453125, 1.5821533203125, 1.8388671875, 2.0955810546875, 2.352294921875, 2.6090087890625, 2.86572265625, 3.1224365234375, 3.379150390625, 3.6358642578125, 3.892578125, 4.1492919921875, 4.406005859375, 4.6627197265625, 4.91943359375, 5.1761474609375, 5.432861328125, 5.6895751953125, 5.9462890625, 6.2030029296875, 6.459716796875, 6.7164306640625, 6.97314453125, 7.2298583984375, 7.486572265625, 7.7432861328125, 8.0]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 16.0, 24.0, 39.0, 37.0, 85.0, 114.0, 186.0, 311.0, 491.0, 876.0, 1403.0, 2521.0, 4182.0, 7160.0, 12544.0, 22205.0, 40110.0, 76583.0, 175814.0, 402589.0, 149032.0, 68376.0, 36314.0, 20071.0, 11330.0, 6620.0, 3913.0, 2268.0, 1380.0, 765.0, 458.0, 275.0, 172.0, 91.0, 64.0, 48.0, 31.0, 17.0, 14.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.837066650390625, -1.77667236328125, -1.716278076171875, -1.6558837890625, -1.595489501953125, -1.53509521484375, -1.474700927734375, -1.414306640625, -1.353912353515625, -1.29351806640625, -1.233123779296875, -1.1727294921875, -1.112335205078125, -1.05194091796875, -0.991546630859375, -0.93115234375, -0.870758056640625, -0.81036376953125, -0.749969482421875, -0.6895751953125, -0.629180908203125, -0.56878662109375, -0.508392333984375, -0.447998046875, -0.387603759765625, -0.32720947265625, -0.266815185546875, -0.2064208984375, -0.146026611328125, -0.08563232421875, -0.025238037109375, 0.03515625, 0.095550537109375, 0.15594482421875, 0.216339111328125, 0.2767333984375, 0.337127685546875, 0.39752197265625, 0.457916259765625, 0.518310546875, 0.578704833984375, 0.63909912109375, 0.699493408203125, 0.7598876953125, 0.820281982421875, 0.88067626953125, 0.941070556640625, 1.00146484375, 1.061859130859375, 1.12225341796875, 1.182647705078125, 1.2430419921875, 1.303436279296875, 1.36383056640625, 1.424224853515625, 1.484619140625, 1.545013427734375, 1.60540771484375, 1.665802001953125, 1.7261962890625, 1.786590576171875, 1.84698486328125, 1.907379150390625, 1.9677734375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 8.0, 19.0, 11.0, 22.0, 16.0, 32.0, 23.0, 35.0, 27.0, 40.0, 30.0, 34.0, 31.0, 56.0, 45.0, 45.0, 1074.0, 48.0, 34.0, 36.0, 47.0, 35.0, 40.0, 32.0, 27.0, 25.0, 21.0, 26.0, 23.0, 18.0, 10.0, 12.0, 7.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.73828125, -5.576904296875, -5.41552734375, -5.254150390625, -5.0927734375, -4.931396484375, -4.77001953125, -4.608642578125, -4.447265625, -4.285888671875, -4.12451171875, -3.963134765625, -3.8017578125, -3.640380859375, -3.47900390625, -3.317626953125, -3.15625, -2.994873046875, -2.83349609375, -2.672119140625, -2.5107421875, -2.349365234375, -2.18798828125, -2.026611328125, -1.865234375, -1.703857421875, -1.54248046875, -1.381103515625, -1.2197265625, -1.058349609375, -0.89697265625, -0.735595703125, -0.57421875, -0.412841796875, -0.25146484375, -0.090087890625, 0.0712890625, 0.232666015625, 0.39404296875, 0.555419921875, 0.716796875, 0.878173828125, 1.03955078125, 1.200927734375, 1.3623046875, 1.523681640625, 1.68505859375, 1.846435546875, 2.0078125, 2.169189453125, 2.33056640625, 2.491943359375, 2.6533203125, 2.814697265625, 2.97607421875, 3.137451171875, 3.298828125, 3.460205078125, 3.62158203125, 3.782958984375, 3.9443359375, 4.105712890625, 4.26708984375, 4.428466796875, 4.58984375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 11.0, 10.0, 20.0, 22.0, 34.0, 42.0, 79.0, 120.0, 177.0, 243.0, 389.0, 592.0, 921.0, 1525.0, 2545.0, 4343.0, 7502.0, 12884.0, 22423.0, 38489.0, 70456.0, 154921.0, 1455264.0, 158021.0, 72633.0, 39015.0, 22553.0, 13253.0, 7500.0, 4397.0, 2601.0, 1528.0, 945.0, 583.0, 374.0, 251.0, 143.0, 112.0, 59.0, 43.0, 32.0, 24.0, 13.0, 11.0, 12.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.60546875, -1.549163818359375, -1.49285888671875, -1.436553955078125, -1.3802490234375, -1.323944091796875, -1.26763916015625, -1.211334228515625, -1.155029296875, -1.098724365234375, -1.04241943359375, -0.986114501953125, -0.9298095703125, -0.873504638671875, -0.81719970703125, -0.760894775390625, -0.70458984375, -0.648284912109375, -0.59197998046875, -0.535675048828125, -0.4793701171875, -0.423065185546875, -0.36676025390625, -0.310455322265625, -0.254150390625, -0.197845458984375, -0.14154052734375, -0.085235595703125, -0.0289306640625, 0.027374267578125, 0.08367919921875, 0.139984130859375, 0.1962890625, 0.252593994140625, 0.30889892578125, 0.365203857421875, 0.4215087890625, 0.477813720703125, 0.53411865234375, 0.590423583984375, 0.646728515625, 0.703033447265625, 0.75933837890625, 0.815643310546875, 0.8719482421875, 0.928253173828125, 0.98455810546875, 1.040863037109375, 1.09716796875, 1.153472900390625, 1.20977783203125, 1.266082763671875, 1.3223876953125, 1.378692626953125, 1.43499755859375, 1.491302490234375, 1.547607421875, 1.603912353515625, 1.66021728515625, 1.716522216796875, 1.7728271484375, 1.829132080078125, 1.88543701171875, 1.941741943359375, 1.998046875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 8.0, 3.0, 8.0, 8.0, 12.0, 11.0, 12.0, 12.0, 25.0, 32.0, 20.0, 44.0, 54.0, 64.0, 81.0, 87.0, 96.0, 84.0, 63.0, 65.0, 39.0, 41.0, 23.0, 34.0, 14.0, 8.0, 13.0, 8.0, 5.0, 4.0, 3.0, 7.0, 7.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011377334594726562, -0.0011000186204910278, -0.0010623037815093994, -0.001024588942527771, -0.0009868741035461426, -0.0009491592645645142, -0.0009114444255828857, -0.0008737295866012573, -0.0008360147476196289, -0.0007982999086380005, -0.0007605850696563721, -0.0007228702306747437, -0.0006851553916931152, -0.0006474405527114868, -0.0006097257137298584, -0.00057201087474823, -0.0005342960357666016, -0.0004965811967849731, -0.0004588663578033447, -0.0004211515188217163, -0.0003834366798400879, -0.00034572184085845947, -0.00030800700187683105, -0.00027029216289520264, -0.00023257732391357422, -0.0001948624849319458, -0.00015714764595031738, -0.00011943280696868896, -8.171796798706055e-05, -4.400312900543213e-05, -6.288290023803711e-06, 3.142654895782471e-05, 6.914138793945312e-05, 0.00010685622692108154, 0.00014457106590270996, 0.00018228590488433838, 0.0002200007438659668, 0.0002577155828475952, 0.00029543042182922363, 0.00033314526081085205, 0.00037086009979248047, 0.0004085749387741089, 0.0004462897777557373, 0.0004840046167373657, 0.0005217194557189941, 0.0005594342947006226, 0.000597149133682251, 0.0006348639726638794, 0.0006725788116455078, 0.0007102936506271362, 0.0007480084896087646, 0.0007857233285903931, 0.0008234381675720215, 0.0008611530065536499, 0.0008988678455352783, 0.0009365826845169067, 0.0009742975234985352, 0.0010120123624801636, 0.001049727201461792, 0.0010874420404434204, 0.0011251568794250488, 0.0011628717184066772, 0.0012005865573883057, 0.001238301396369934, 0.0012760162353515625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 8.0, 7.0, 6.0, 10.0, 8.0, 15.0, 15.0, 29.0, 28.0, 48.0, 71.0, 96.0, 167.0, 292.0, 746.0, 74621.0, 970306.0, 1112.0, 367.0, 199.0, 103.0, 77.0, 47.0, 36.0, 34.0, 23.0, 18.0, 17.0, 15.0, 4.0, 5.0, 6.0, 6.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291290283203125, -0.028275728225708008, -0.027422428131103516, -0.026569128036499023, -0.02571582794189453, -0.02486252784729004, -0.024009227752685547, -0.023155927658081055, -0.022302627563476562, -0.02144932746887207, -0.020596027374267578, -0.019742727279663086, -0.018889427185058594, -0.0180361270904541, -0.01718282699584961, -0.016329526901245117, -0.015476226806640625, -0.014622926712036133, -0.01376962661743164, -0.012916326522827148, -0.012063026428222656, -0.011209726333618164, -0.010356426239013672, -0.00950312614440918, -0.008649826049804688, -0.007796525955200195, -0.006943225860595703, -0.006089925765991211, -0.005236625671386719, -0.0043833255767822266, -0.0035300254821777344, -0.002676725387573242, -0.00182342529296875, -0.0009701251983642578, -0.00011682510375976562, 0.0007364749908447266, 0.0015897750854492188, 0.002443075180053711, 0.003296375274658203, 0.004149675369262695, 0.0050029754638671875, 0.00585627555847168, 0.006709575653076172, 0.007562875747680664, 0.008416175842285156, 0.009269475936889648, 0.01012277603149414, 0.010976076126098633, 0.011829376220703125, 0.012682676315307617, 0.01353597640991211, 0.014389276504516602, 0.015242576599121094, 0.016095876693725586, 0.016949176788330078, 0.01780247688293457, 0.018655776977539062, 0.019509077072143555, 0.020362377166748047, 0.02121567726135254, 0.02206897735595703, 0.022922277450561523, 0.023775577545166016, 0.024628877639770508, 0.025482177734375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 30.0, 133.0, 365.0, 338.0, 105.0, 32.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018662384245544672, -0.0018170290859416127, -0.00176781986374408, -0.0017186105251312256, -0.001669401302933693, -0.0016201919643208385, -0.001570982625707984, -0.0015217734035104513, -0.0014725640648975968, -0.0014233547262847424, -0.0013741455040872097, -0.0013249361654743552, -0.0012757268268615007, -0.001226517604663968, -0.0011773082660511136, -0.0011280989274382591, -0.0010788897052407265, -0.001029680366627872, -0.0009804711444303393, -0.0009312618058174849, -0.0008820525254122913, -0.0008328432450070977, -0.0007836339063942432, -0.0007344246259890497, -0.0006852153455838561, -0.0006360060651786625, -0.000586796784773469, -0.0005375874461606145, -0.0004883781657554209, -0.00043916888535022736, -0.00038995957584120333, -0.0003407502663321793, -0.00029154098592698574, -0.00024233169096987695, -0.00019312239601276815, -0.00014391310105565935, -9.470380609855056e-05, -4.549452569335699e-05, 3.714783815667033e-06, 5.292409332469106e-05, 0.00010213337372988462, 0.00015134266868699342, 0.00020055196364410222, 0.00024976127315312624, 0.0002989705535583198, 0.0003481798339635134, 0.0003973891434725374, 0.0004465984529815614, 0.000495807733386755, 0.0005450170137919486, 0.0005942262941971421, 0.0006434356328099966, 0.0006926449132151902, 0.0007418541936203837, 0.0007910635322332382, 0.0008402728126384318, 0.0008894820930436254, 0.0009386913734488189, 0.0009879006538540125, 0.001037109992466867, 0.0010863193310797215, 0.001135528553277254, 0.0011847378918901086, 0.001233947230502963, 0.0012831564527004957]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 10.0, 17.0, 22.0, 17.0, 20.0, 44.0, 31.0, 46.0, 35.0, 46.0, 42.0, 50.0, 39.0, 45.0, 46.0, 37.0, 35.0, 39.0, 45.0, 40.0, 28.0, 36.0, 31.0, 30.0, 20.0, 20.0, 19.0, 14.0, 14.0, 11.0, 5.0, 6.0, 7.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005988478660583496, -0.000580761581659317, -0.0005626752972602844, -0.0005445890128612518, -0.0005265027284622192, -0.0005084164440631866, -0.000490330159664154, -0.00047224387526512146, -0.00045415759086608887, -0.0004360713064670563, -0.0004179850220680237, -0.0003998987376689911, -0.0003818124532699585, -0.0003637261688709259, -0.0003456398844718933, -0.0003275536000728607, -0.0003094673156738281, -0.00029138103127479553, -0.00027329474687576294, -0.00025520846247673035, -0.00023712217807769775, -0.00021903589367866516, -0.00020094960927963257, -0.00018286332488059998, -0.00016477704048156738, -0.0001466907560825348, -0.0001286044716835022, -0.0001105181872844696, -9.243190288543701e-05, -7.434561848640442e-05, -5.6259334087371826e-05, -3.8173049688339233e-05, -2.008676528930664e-05, -2.000480890274048e-06, 1.6085803508758545e-05, 3.417208790779114e-05, 5.225837230682373e-05, 7.034465670585632e-05, 8.843094110488892e-05, 0.00010651722550392151, 0.0001246035099029541, 0.0001426897943019867, 0.0001607760787010193, 0.00017886236310005188, 0.00019694864749908447, 0.00021503493189811707, 0.00023312121629714966, 0.00025120750069618225, 0.00026929378509521484, 0.00028738006949424744, 0.00030546635389328003, 0.0003235526382923126, 0.0003416389226913452, 0.0003597252070903778, 0.0003778114914894104, 0.000395897775888443, 0.0004139840602874756, 0.0004320703446865082, 0.00045015662908554077, 0.00046824291348457336, 0.00048632919788360596, 0.0005044154822826385, 0.0005225017666816711, 0.0005405880510807037, 0.0005586743354797363]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 9.0, 14.0, 13.0, 27.0, 18.0, 24.0, 25.0, 34.0, 28.0, 28.0, 38.0, 41.0, 39.0, 53.0, 53.0, 38.0, 42.0, 52.0, 49.0, 52.0, 23.0, 36.0, 29.0, 33.0, 32.0, 20.0, 27.0, 15.0, 18.0, 12.0, 12.0, 10.0, 14.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.1729736328125, -7.916259765625, -7.6595458984375, -7.40283203125, -7.1461181640625, -6.889404296875, -6.6326904296875, -6.3759765625, -6.1192626953125, -5.862548828125, -5.6058349609375, -5.34912109375, -5.0924072265625, -4.835693359375, -4.5789794921875, -4.322265625, -4.0655517578125, -3.808837890625, -3.5521240234375, -3.29541015625, -3.0386962890625, -2.781982421875, -2.5252685546875, -2.2685546875, -2.0118408203125, -1.755126953125, -1.4984130859375, -1.24169921875, -0.9849853515625, -0.728271484375, -0.4715576171875, -0.21484375, 0.0418701171875, 0.298583984375, 0.5552978515625, 0.81201171875, 1.0687255859375, 1.325439453125, 1.5821533203125, 1.8388671875, 2.0955810546875, 2.352294921875, 2.6090087890625, 2.86572265625, 3.1224365234375, 3.379150390625, 3.6358642578125, 3.892578125, 4.1492919921875, 4.406005859375, 4.6627197265625, 4.91943359375, 5.1761474609375, 5.432861328125, 5.6895751953125, 5.9462890625, 6.2030029296875, 6.459716796875, 6.7164306640625, 6.97314453125, 7.2298583984375, 7.486572265625, 7.7432861328125, 8.0]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 6.0, 10.0, 11.0, 16.0, 18.0, 33.0, 39.0, 58.0, 62.0, 99.0, 128.0, 182.0, 213.0, 322.0, 451.0, 655.0, 997.0, 2984.0, 24936.0, 799044.0, 202558.0, 10981.0, 1851.0, 822.0, 575.0, 416.0, 283.0, 222.0, 150.0, 101.0, 79.0, 50.0, 43.0, 33.0, 32.0, 26.0, 23.0, 10.0, 13.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.34375, -20.693603515625, -20.04345703125, -19.393310546875, -18.7431640625, -18.093017578125, -17.44287109375, -16.792724609375, -16.142578125, -15.492431640625, -14.84228515625, -14.192138671875, -13.5419921875, -12.891845703125, -12.24169921875, -11.591552734375, -10.94140625, -10.291259765625, -9.64111328125, -8.990966796875, -8.3408203125, -7.690673828125, -7.04052734375, -6.390380859375, -5.740234375, -5.090087890625, -4.43994140625, -3.789794921875, -3.1396484375, -2.489501953125, -1.83935546875, -1.189208984375, -0.5390625, 0.111083984375, 0.76123046875, 1.411376953125, 2.0615234375, 2.711669921875, 3.36181640625, 4.011962890625, 4.662109375, 5.312255859375, 5.96240234375, 6.612548828125, 7.2626953125, 7.912841796875, 8.56298828125, 9.213134765625, 9.86328125, 10.513427734375, 11.16357421875, 11.813720703125, 12.4638671875, 13.114013671875, 13.76416015625, 14.414306640625, 15.064453125, 15.714599609375, 16.36474609375, 17.014892578125, 17.6650390625, 18.315185546875, 18.96533203125, 19.615478515625, 20.265625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 6.0, 9.0, 8.0, 11.0, 11.0, 15.0, 13.0, 11.0, 21.0, 25.0, 31.0, 35.0, 46.0, 35.0, 34.0, 55.0, 77.0, 86.0, 404.0, 1592.0, 88.0, 55.0, 47.0, 45.0, 39.0, 37.0, 26.0, 30.0, 24.0, 22.0, 16.0, 16.0, 22.0, 10.0, 11.0, 8.0, 5.0, 4.0, 8.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.813720703125, -21.11181640625, -20.409912109375, -19.7080078125, -19.006103515625, -18.30419921875, -17.602294921875, -16.900390625, -16.198486328125, -15.49658203125, -14.794677734375, -14.0927734375, -13.390869140625, -12.68896484375, -11.987060546875, -11.28515625, -10.583251953125, -9.88134765625, -9.179443359375, -8.4775390625, -7.775634765625, -7.07373046875, -6.371826171875, -5.669921875, -4.968017578125, -4.26611328125, -3.564208984375, -2.8623046875, -2.160400390625, -1.45849609375, -0.756591796875, -0.0546875, 0.647216796875, 1.34912109375, 2.051025390625, 2.7529296875, 3.454833984375, 4.15673828125, 4.858642578125, 5.560546875, 6.262451171875, 6.96435546875, 7.666259765625, 8.3681640625, 9.070068359375, 9.77197265625, 10.473876953125, 11.17578125, 11.877685546875, 12.57958984375, 13.281494140625, 13.9833984375, 14.685302734375, 15.38720703125, 16.089111328125, 16.791015625, 17.492919921875, 18.19482421875, 18.896728515625, 19.5986328125, 20.300537109375, 21.00244140625, 21.704345703125, 22.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 7.0, 2.0, 6.0, 9.0, 5.0, 14.0, 8.0, 28.0, 16.0, 19.0, 19.0, 33.0, 33.0, 35.0, 56.0, 76.0, 119.0, 226.0, 554.0, 2342.0, 3083604.0, 56374.0, 1120.0, 372.0, 168.0, 103.0, 75.0, 58.0, 42.0, 33.0, 28.0, 19.0, 14.0, 16.0, 15.0, 12.0, 11.0, 13.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-62.28125, -60.322265625, -58.36328125, -56.404296875, -54.4453125, -52.486328125, -50.52734375, -48.568359375, -46.609375, -44.650390625, -42.69140625, -40.732421875, -38.7734375, -36.814453125, -34.85546875, -32.896484375, -30.9375, -28.978515625, -27.01953125, -25.060546875, -23.1015625, -21.142578125, -19.18359375, -17.224609375, -15.265625, -13.306640625, -11.34765625, -9.388671875, -7.4296875, -5.470703125, -3.51171875, -1.552734375, 0.40625, 2.365234375, 4.32421875, 6.283203125, 8.2421875, 10.201171875, 12.16015625, 14.119140625, 16.078125, 18.037109375, 19.99609375, 21.955078125, 23.9140625, 25.873046875, 27.83203125, 29.791015625, 31.75, 33.708984375, 35.66796875, 37.626953125, 39.5859375, 41.544921875, 43.50390625, 45.462890625, 47.421875, 49.380859375, 51.33984375, 53.298828125, 55.2578125, 57.216796875, 59.17578125, 61.134765625, 63.09375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 27.0, 82.0, 168.0, 239.0, 261.0, 131.0, 72.0, 22.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.62895393371582, -16.690160751342773, -15.75136661529541, -14.812572479248047, -13.873779296875, -12.934985160827637, -11.996191024780273, -11.057397842407227, -10.118603706359863, -9.1798095703125, -8.241016387939453, -7.30222225189209, -6.363428592681885, -5.42463493347168, -4.485840797424316, -3.5470471382141113, -2.6082534790039062, -1.6694597005844116, -0.730665922164917, 0.2081279754638672, 1.1469216346740723, 2.0857152938842773, 3.0245094299316406, 3.9633030891418457, 4.902096748352051, 5.840890407562256, 6.779684066772461, 7.718478202819824, 8.657272338867188, 9.596065521240234, 10.534859657287598, 11.473653793334961, 12.412445068359375, 13.351239204406738, 14.290032386779785, 15.228826522827148, 16.167619705200195, 17.106414794921875, 18.045207977294922, 18.98400115966797, 19.922794342041016, 20.861587524414062, 21.800382614135742, 22.73917579650879, 23.677968978881836, 24.616764068603516, 25.555557250976562, 26.49435043334961, 27.43314552307129, 28.371938705444336, 29.310733795166016, 30.249526977539062, 31.18832015991211, 32.127113342285156, 33.06591033935547, 34.004703521728516, 34.94349670410156, 35.88228988647461, 36.821083068847656, 37.75988006591797, 38.698673248291016, 39.63746643066406, 40.57625961303711, 41.515052795410156, 42.4538459777832]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 6.0, 1.0, 10.0, 11.0, 6.0, 15.0, 13.0, 17.0, 22.0, 21.0, 22.0, 32.0, 29.0, 36.0, 28.0, 31.0, 35.0, 39.0, 47.0, 51.0, 52.0, 28.0, 51.0, 44.0, 31.0, 40.0, 28.0, 34.0, 27.0, 26.0, 24.0, 26.0, 24.0, 9.0, 13.0, 12.0, 8.0, 12.0, 3.0, 5.0, 5.0, 8.0, 5.0, 8.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-51.18046951293945, -49.59893035888672, -48.01738739013672, -46.435848236083984, -44.85430908203125, -43.272769927978516, -41.69123077392578, -40.10968780517578, -38.52814865112305, -36.94660949707031, -35.36506652832031, -33.78352737426758, -32.201988220214844, -30.62044906616211, -29.038908004760742, -27.457366943359375, -25.87582778930664, -24.294288635253906, -22.71274757385254, -21.131206512451172, -19.549667358398438, -17.968128204345703, -16.386587142944336, -14.805047035217285, -13.223506927490234, -11.641966819763184, -10.060426712036133, -8.478886604309082, -6.897346496582031, -5.3158063888549805, -3.7342662811279297, -2.152726173400879, -0.5711898803710938, 1.010350227355957, 2.591890335083008, 4.173430442810059, 5.754970550537109, 7.33651065826416, 8.918050765991211, 10.499590873718262, 12.081130981445312, 13.662671089172363, 15.244211196899414, 16.82575225830078, 18.407291412353516, 19.98883056640625, 21.570371627807617, 23.151912689208984, 24.73345184326172, 26.314990997314453, 27.89653205871582, 29.478073120117188, 31.059612274169922, 32.641151428222656, 34.222694396972656, 35.80423355102539, 37.385772705078125, 38.96731185913086, 40.548851013183594, 42.130393981933594, 43.71193313598633, 45.29347229003906, 46.87501525878906, 48.4565544128418, 50.03809356689453]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 10.0, 11.0, 12.0, 19.0, 14.0, 26.0, 22.0, 28.0, 31.0, 24.0, 37.0, 43.0, 28.0, 35.0, 45.0, 55.0, 39.0, 41.0, 62.0, 54.0, 44.0, 30.0, 29.0, 40.0, 33.0, 35.0, 25.0, 21.0, 12.0, 16.0, 11.0, 16.0, 11.0, 10.0, 10.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.341064453125, -8.08056640625, -7.820068359375, -7.5595703125, -7.299072265625, -7.03857421875, -6.778076171875, -6.517578125, -6.257080078125, -5.99658203125, -5.736083984375, -5.4755859375, -5.215087890625, -4.95458984375, -4.694091796875, -4.43359375, -4.173095703125, -3.91259765625, -3.652099609375, -3.3916015625, -3.131103515625, -2.87060546875, -2.610107421875, -2.349609375, -2.089111328125, -1.82861328125, -1.568115234375, -1.3076171875, -1.047119140625, -0.78662109375, -0.526123046875, -0.265625, -0.005126953125, 0.25537109375, 0.515869140625, 0.7763671875, 1.036865234375, 1.29736328125, 1.557861328125, 1.818359375, 2.078857421875, 2.33935546875, 2.599853515625, 2.8603515625, 3.120849609375, 3.38134765625, 3.641845703125, 3.90234375, 4.162841796875, 4.42333984375, 4.683837890625, 4.9443359375, 5.204833984375, 5.46533203125, 5.725830078125, 5.986328125, 6.246826171875, 6.50732421875, 6.767822265625, 7.0283203125, 7.288818359375, 7.54931640625, 7.809814453125, 8.0703125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 14.0, 4.0, 6.0, 11.0, 11.0, 15.0, 22.0, 25.0, 36.0, 38.0, 61.0, 81.0, 82.0, 127.0, 128.0, 178.0, 275.0, 338.0, 575.0, 1215.0, 3521.0, 17352.0, 260494.0, 2648224.0, 1188993.0, 60176.0, 7521.0, 2104.0, 891.0, 484.0, 285.0, 219.0, 158.0, 152.0, 106.0, 75.0, 62.0, 49.0, 31.0, 38.0, 23.0, 14.0, 17.0, 15.0, 10.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.765625, -17.206298828125, -16.64697265625, -16.087646484375, -15.5283203125, -14.968994140625, -14.40966796875, -13.850341796875, -13.291015625, -12.731689453125, -12.17236328125, -11.613037109375, -11.0537109375, -10.494384765625, -9.93505859375, -9.375732421875, -8.81640625, -8.257080078125, -7.69775390625, -7.138427734375, -6.5791015625, -6.019775390625, -5.46044921875, -4.901123046875, -4.341796875, -3.782470703125, -3.22314453125, -2.663818359375, -2.1044921875, -1.545166015625, -0.98583984375, -0.426513671875, 0.1328125, 0.692138671875, 1.25146484375, 1.810791015625, 2.3701171875, 2.929443359375, 3.48876953125, 4.048095703125, 4.607421875, 5.166748046875, 5.72607421875, 6.285400390625, 6.8447265625, 7.404052734375, 7.96337890625, 8.522705078125, 9.08203125, 9.641357421875, 10.20068359375, 10.760009765625, 11.3193359375, 11.878662109375, 12.43798828125, 12.997314453125, 13.556640625, 14.115966796875, 14.67529296875, 15.234619140625, 15.7939453125, 16.353271484375, 16.91259765625, 17.471923828125, 18.03125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 9.0, 8.0, 11.0, 9.0, 22.0, 28.0, 40.0, 52.0, 94.0, 109.0, 159.0, 230.0, 280.0, 435.0, 514.0, 523.0, 413.0, 323.0, 208.0, 175.0, 129.0, 92.0, 49.0, 53.0, 33.0, 23.0, 12.0, 14.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21875, -13.8028564453125, -13.386962890625, -12.9710693359375, -12.55517578125, -12.1392822265625, -11.723388671875, -11.3074951171875, -10.8916015625, -10.4757080078125, -10.059814453125, -9.6439208984375, -9.22802734375, -8.8121337890625, -8.396240234375, -7.9803466796875, -7.564453125, -7.1485595703125, -6.732666015625, -6.3167724609375, -5.90087890625, -5.4849853515625, -5.069091796875, -4.6531982421875, -4.2373046875, -3.8214111328125, -3.405517578125, -2.9896240234375, -2.57373046875, -2.1578369140625, -1.741943359375, -1.3260498046875, -0.91015625, -0.4942626953125, -0.078369140625, 0.3375244140625, 0.75341796875, 1.1693115234375, 1.585205078125, 2.0010986328125, 2.4169921875, 2.8328857421875, 3.248779296875, 3.6646728515625, 4.08056640625, 4.4964599609375, 4.912353515625, 5.3282470703125, 5.744140625, 6.1600341796875, 6.575927734375, 6.9918212890625, 7.40771484375, 7.8236083984375, 8.239501953125, 8.6553955078125, 9.0712890625, 9.4871826171875, 9.903076171875, 10.3189697265625, 10.73486328125, 11.1507568359375, 11.566650390625, 11.9825439453125, 12.3984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 9.0, 17.0, 15.0, 31.0, 49.0, 86.0, 144.0, 255.0, 484.0, 1882.0, 308927.0, 3877249.0, 3699.0, 683.0, 292.0, 187.0, 87.0, 60.0, 38.0, 30.0, 15.0, 22.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.53125, -60.66162109375, -57.7919921875, -54.92236328125, -52.052734375, -49.18310546875, -46.3134765625, -43.44384765625, -40.57421875, -37.70458984375, -34.8349609375, -31.96533203125, -29.095703125, -26.22607421875, -23.3564453125, -20.48681640625, -17.6171875, -14.74755859375, -11.8779296875, -9.00830078125, -6.138671875, -3.26904296875, -0.3994140625, 2.47021484375, 5.33984375, 8.20947265625, 11.0791015625, 13.94873046875, 16.818359375, 19.68798828125, 22.5576171875, 25.42724609375, 28.296875, 31.16650390625, 34.0361328125, 36.90576171875, 39.775390625, 42.64501953125, 45.5146484375, 48.38427734375, 51.25390625, 54.12353515625, 56.9931640625, 59.86279296875, 62.732421875, 65.60205078125, 68.4716796875, 71.34130859375, 74.2109375, 77.08056640625, 79.9501953125, 82.81982421875, 85.689453125, 88.55908203125, 91.4287109375, 94.29833984375, 97.16796875, 100.03759765625, 102.9072265625, 105.77685546875, 108.646484375, 111.51611328125, 114.3857421875, 117.25537109375, 120.125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 587.0, 411.0, 10.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.61090087890625, -254.84072875976562, -242.070556640625, -229.30038452148438, -216.5302276611328, -203.7600555419922, -190.98988342285156, -178.2197265625, -165.44955444335938, -152.67938232421875, -139.90921020507812, -127.13904571533203, -114.36888122558594, -101.59870910644531, -88.82853698730469, -76.0583724975586, -63.28819274902344, -50.51802444458008, -37.74785614013672, -24.977684020996094, -12.207515716552734, 0.562652587890625, 13.33282470703125, 26.102989196777344, 38.87316131591797, 51.64332962036133, 64.41349792480469, 77.18367004394531, 89.95384216308594, 102.72400665283203, 115.49417877197266, 128.26434326171875, 141.03451538085938, 153.8046875, 166.57485961914062, 179.34503173828125, 192.1151885986328, 204.88536071777344, 217.65553283691406, 230.42568969726562, 243.19586181640625, 255.96603393554688, 268.7362060546875, 281.5063781738281, 294.27655029296875, 307.04669189453125, 319.81689453125, 332.5870361328125, 345.35723876953125, 358.1274108886719, 370.8975830078125, 383.6677551269531, 396.43792724609375, 409.20806884765625, 421.978271484375, 434.7484130859375, 447.5185852050781, 460.28875732421875, 473.0589294433594, 485.8291015625, 498.5992736816406, 511.36944580078125, 524.1395874023438, 536.9097900390625, 549.679931640625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 9.0, 11.0, 8.0, 21.0, 14.0, 25.0, 22.0, 25.0, 30.0, 30.0, 35.0, 30.0, 44.0, 37.0, 30.0, 44.0, 41.0, 38.0, 39.0, 50.0, 40.0, 39.0, 29.0, 42.0, 29.0, 35.0, 21.0, 22.0, 25.0, 20.0, 21.0, 14.0, 9.0, 11.0, 10.0, 5.0, 8.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-46.94541931152344, -45.48090744018555, -44.016395568847656, -42.55188751220703, -41.08737564086914, -39.62286376953125, -38.158355712890625, -36.693843841552734, -35.229331970214844, -33.76482009887695, -32.30030822753906, -30.835800170898438, -29.371288299560547, -27.906776428222656, -26.4422664642334, -24.97775650024414, -23.51324462890625, -22.04873275756836, -20.5842227935791, -19.119712829589844, -17.655200958251953, -16.190689086914062, -14.726179122924805, -13.26166820526123, -11.797157287597656, -10.332646369934082, -8.868135452270508, -7.403624534606934, -5.939113616943359, -4.474602699279785, -3.010091781616211, -1.5455808639526367, -0.0810699462890625, 1.3834409713745117, 2.847951889038086, 4.31246280670166, 5.776973724365234, 7.241484642028809, 8.705995559692383, 10.170506477355957, 11.635017395019531, 13.099528312683105, 14.56403923034668, 16.028549194335938, 17.493061065673828, 18.95757293701172, 20.422082901000977, 21.886592864990234, 23.351104736328125, 24.815616607666016, 26.280126571655273, 27.74463653564453, 29.209148406982422, 30.673660278320312, 32.13816833496094, 33.60268020629883, 35.06719207763672, 36.53170394897461, 37.9962158203125, 39.460723876953125, 40.925235748291016, 42.389747619628906, 43.85425567626953, 45.31876754760742, 46.78327941894531]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 8.0, 3.0, 5.0, 7.0, 6.0, 14.0, 16.0, 20.0, 29.0, 22.0, 20.0, 27.0, 27.0, 31.0, 32.0, 50.0, 47.0, 60.0, 54.0, 44.0, 58.0, 57.0, 48.0, 44.0, 32.0, 44.0, 28.0, 22.0, 25.0, 28.0, 27.0, 22.0, 5.0, 12.0, 11.0, 6.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.3939208984375, -8.100341796875, -7.8067626953125, -7.51318359375, -7.2196044921875, -6.926025390625, -6.6324462890625, -6.3388671875, -6.0452880859375, -5.751708984375, -5.4581298828125, -5.16455078125, -4.8709716796875, -4.577392578125, -4.2838134765625, -3.990234375, -3.6966552734375, -3.403076171875, -3.1094970703125, -2.81591796875, -2.5223388671875, -2.228759765625, -1.9351806640625, -1.6416015625, -1.3480224609375, -1.054443359375, -0.7608642578125, -0.46728515625, -0.1737060546875, 0.119873046875, 0.4134521484375, 0.70703125, 1.0006103515625, 1.294189453125, 1.5877685546875, 1.88134765625, 2.1749267578125, 2.468505859375, 2.7620849609375, 3.0556640625, 3.3492431640625, 3.642822265625, 3.9364013671875, 4.22998046875, 4.5235595703125, 4.817138671875, 5.1107177734375, 5.404296875, 5.6978759765625, 5.991455078125, 6.2850341796875, 6.57861328125, 6.8721923828125, 7.165771484375, 7.4593505859375, 7.7529296875, 8.0465087890625, 8.340087890625, 8.6336669921875, 8.92724609375, 9.2208251953125, 9.514404296875, 9.8079833984375, 10.1015625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 8.0, 14.0, 20.0, 26.0, 42.0, 84.0, 101.0, 177.0, 258.0, 432.0, 641.0, 979.0, 1530.0, 2333.0, 3679.0, 6002.0, 9136.0, 14754.0, 24653.0, 40435.0, 73085.0, 159116.0, 390638.0, 148537.0, 70276.0, 38879.0, 23785.0, 14100.0, 9049.0, 5773.0, 3486.0, 2315.0, 1460.0, 964.0, 642.0, 403.0, 281.0, 162.0, 103.0, 53.0, 56.0, 24.0, 16.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.837890625, -1.781280517578125, -1.72467041015625, -1.668060302734375, -1.6114501953125, -1.554840087890625, -1.49822998046875, -1.441619873046875, -1.385009765625, -1.328399658203125, -1.27178955078125, -1.215179443359375, -1.1585693359375, -1.101959228515625, -1.04534912109375, -0.988739013671875, -0.93212890625, -0.875518798828125, -0.81890869140625, -0.762298583984375, -0.7056884765625, -0.649078369140625, -0.59246826171875, -0.535858154296875, -0.479248046875, -0.422637939453125, -0.36602783203125, -0.309417724609375, -0.2528076171875, -0.196197509765625, -0.13958740234375, -0.082977294921875, -0.0263671875, 0.030242919921875, 0.08685302734375, 0.143463134765625, 0.2000732421875, 0.256683349609375, 0.31329345703125, 0.369903564453125, 0.426513671875, 0.483123779296875, 0.53973388671875, 0.596343994140625, 0.6529541015625, 0.709564208984375, 0.76617431640625, 0.822784423828125, 0.87939453125, 0.936004638671875, 0.99261474609375, 1.049224853515625, 1.1058349609375, 1.162445068359375, 1.21905517578125, 1.275665283203125, 1.332275390625, 1.388885498046875, 1.44549560546875, 1.502105712890625, 1.5587158203125, 1.615325927734375, 1.67193603515625, 1.728546142578125, 1.78515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 11.0, 7.0, 16.0, 12.0, 15.0, 19.0, 25.0, 24.0, 31.0, 31.0, 32.0, 33.0, 30.0, 43.0, 42.0, 44.0, 44.0, 28.0, 1070.0, 32.0, 44.0, 51.0, 49.0, 35.0, 36.0, 31.0, 33.0, 11.0, 27.0, 13.0, 22.0, 25.0, 12.0, 12.0, 10.0, 13.0, 6.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.84515380859375, -4.6746826171875, -4.50421142578125, -4.333740234375, -4.16326904296875, -3.9927978515625, -3.82232666015625, -3.65185546875, -3.48138427734375, -3.3109130859375, -3.14044189453125, -2.969970703125, -2.79949951171875, -2.6290283203125, -2.45855712890625, -2.2880859375, -2.11761474609375, -1.9471435546875, -1.77667236328125, -1.606201171875, -1.43572998046875, -1.2652587890625, -1.09478759765625, -0.92431640625, -0.75384521484375, -0.5833740234375, -0.41290283203125, -0.242431640625, -0.07196044921875, 0.0985107421875, 0.26898193359375, 0.439453125, 0.60992431640625, 0.7803955078125, 0.95086669921875, 1.121337890625, 1.29180908203125, 1.4622802734375, 1.63275146484375, 1.80322265625, 1.97369384765625, 2.1441650390625, 2.31463623046875, 2.485107421875, 2.65557861328125, 2.8260498046875, 2.99652099609375, 3.1669921875, 3.33746337890625, 3.5079345703125, 3.67840576171875, 3.848876953125, 4.01934814453125, 4.1898193359375, 4.36029052734375, 4.53076171875, 4.70123291015625, 4.8717041015625, 5.04217529296875, 5.212646484375, 5.38311767578125, 5.5535888671875, 5.72406005859375, 5.89453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 10.0, 21.0, 28.0, 40.0, 52.0, 80.0, 151.0, 242.0, 356.0, 530.0, 869.0, 1530.0, 2584.0, 4402.0, 7772.0, 12898.0, 21834.0, 37019.0, 67713.0, 145402.0, 1432655.0, 179492.0, 79994.0, 41877.0, 24331.0, 14366.0, 8497.0, 4964.0, 2926.0, 1750.0, 1058.0, 599.0, 406.0, 247.0, 161.0, 83.0, 56.0, 38.0, 39.0, 14.0, 13.0, 8.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.064453125, -2.0048065185546875, -1.945159912109375, -1.8855133056640625, -1.82586669921875, -1.7662200927734375, -1.706573486328125, -1.6469268798828125, -1.5872802734375, -1.5276336669921875, -1.467987060546875, -1.4083404541015625, -1.34869384765625, -1.2890472412109375, -1.229400634765625, -1.1697540283203125, -1.110107421875, -1.0504608154296875, -0.990814208984375, -0.9311676025390625, -0.87152099609375, -0.8118743896484375, -0.752227783203125, -0.6925811767578125, -0.6329345703125, -0.5732879638671875, -0.513641357421875, -0.4539947509765625, -0.39434814453125, -0.3347015380859375, -0.275054931640625, -0.2154083251953125, -0.15576171875, -0.0961151123046875, -0.036468505859375, 0.0231781005859375, 0.08282470703125, 0.1424713134765625, 0.202117919921875, 0.2617645263671875, 0.3214111328125, 0.3810577392578125, 0.440704345703125, 0.5003509521484375, 0.55999755859375, 0.6196441650390625, 0.679290771484375, 0.7389373779296875, 0.798583984375, 0.8582305908203125, 0.917877197265625, 0.9775238037109375, 1.03717041015625, 1.0968170166015625, 1.156463623046875, 1.2161102294921875, 1.2757568359375, 1.3354034423828125, 1.395050048828125, 1.4546966552734375, 1.51434326171875, 1.5739898681640625, 1.633636474609375, 1.6932830810546875, 1.7529296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 9.0, 1.0, 10.0, 8.0, 17.0, 12.0, 22.0, 34.0, 27.0, 31.0, 62.0, 93.0, 82.0, 59.0, 81.0, 89.0, 72.0, 58.0, 49.0, 33.0, 26.0, 21.0, 25.0, 19.0, 5.0, 11.0, 7.0, 6.0, 3.0, 4.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010738372802734375, -0.0010395050048828125, -0.0010051727294921875, -0.0009708404541015625, -0.0009365081787109375, -0.0009021759033203125, -0.0008678436279296875, -0.0008335113525390625, -0.0007991790771484375, -0.0007648468017578125, -0.0007305145263671875, -0.0006961822509765625, -0.0006618499755859375, -0.0006275177001953125, -0.0005931854248046875, -0.0005588531494140625, -0.0005245208740234375, -0.0004901885986328125, -0.0004558563232421875, -0.0004215240478515625, -0.0003871917724609375, -0.0003528594970703125, -0.0003185272216796875, -0.0002841949462890625, -0.0002498626708984375, -0.0002155303955078125, -0.0001811981201171875, -0.0001468658447265625, -0.0001125335693359375, -7.82012939453125e-05, -4.38690185546875e-05, -9.5367431640625e-06, 2.47955322265625e-05, 5.91278076171875e-05, 9.34600830078125e-05, 0.0001277923583984375, 0.0001621246337890625, 0.0001964569091796875, 0.0002307891845703125, 0.0002651214599609375, 0.0002994537353515625, 0.0003337860107421875, 0.0003681182861328125, 0.0004024505615234375, 0.0004367828369140625, 0.0004711151123046875, 0.0005054473876953125, 0.0005397796630859375, 0.0005741119384765625, 0.0006084442138671875, 0.0006427764892578125, 0.0006771087646484375, 0.0007114410400390625, 0.0007457733154296875, 0.0007801055908203125, 0.0008144378662109375, 0.0008487701416015625, 0.0008831024169921875, 0.0009174346923828125, 0.0009517669677734375, 0.0009860992431640625, 0.0010204315185546875, 0.0010547637939453125, 0.0010890960693359375, 0.0011234283447265625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 7.0, 10.0, 11.0, 6.0, 9.0, 14.0, 21.0, 32.0, 40.0, 46.0, 84.0, 104.0, 201.0, 436.0, 1709.0, 1034110.0, 10305.0, 643.0, 292.0, 140.0, 94.0, 50.0, 38.0, 33.0, 33.0, 19.0, 14.0, 12.0, 10.0, 9.0, 2.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025848388671875, -0.02503228187561035, -0.024216175079345703, -0.023400068283081055, -0.022583961486816406, -0.021767854690551758, -0.02095174789428711, -0.02013564109802246, -0.019319534301757812, -0.018503427505493164, -0.017687320709228516, -0.016871213912963867, -0.01605510711669922, -0.01523900032043457, -0.014422893524169922, -0.013606786727905273, -0.012790679931640625, -0.011974573135375977, -0.011158466339111328, -0.01034235954284668, -0.009526252746582031, -0.008710145950317383, -0.007894039154052734, -0.007077932357788086, -0.0062618255615234375, -0.005445718765258789, -0.004629611968994141, -0.003813505172729492, -0.0029973983764648438, -0.0021812915802001953, -0.0013651847839355469, -0.0005490779876708984, 0.00026702880859375, 0.0010831356048583984, 0.0018992424011230469, 0.0027153491973876953, 0.0035314559936523438, 0.004347562789916992, 0.005163669586181641, 0.005979776382446289, 0.0067958831787109375, 0.007611989974975586, 0.008428096771240234, 0.009244203567504883, 0.010060310363769531, 0.01087641716003418, 0.011692523956298828, 0.012508630752563477, 0.013324737548828125, 0.014140844345092773, 0.014956951141357422, 0.01577305793762207, 0.01658916473388672, 0.017405271530151367, 0.018221378326416016, 0.019037485122680664, 0.019853591918945312, 0.02066969871520996, 0.02148580551147461, 0.022301912307739258, 0.023118019104003906, 0.023934125900268555, 0.024750232696533203, 0.02556633949279785, 0.0263824462890625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 11.0, 21.0, 45.0, 54.0, 112.0, 178.0, 202.0, 129.0, 137.0, 69.0, 24.0, 14.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006128998356871307, -0.0005889044259674847, -0.0005649090744554996, -0.0005409136647358537, -0.0005169183132238686, -0.0004929229035042226, -0.0004689275228884071, -0.0004449321422725916, -0.00042093676165677607, -0.00039694138104096055, -0.00037294600042514503, -0.0003489506198093295, -0.00032495521008968353, -0.00030095985857769847, -0.0002769644488580525, -0.00025296906824223697, -0.00022897368762642145, -0.00020497830701060593, -0.0001809829263947904, -0.00015698753122705966, -0.00013299215061124414, -0.00010899676999542862, -8.500137482769787e-05, -6.100599421188235e-05, -3.701061359606683e-05, -1.3015229342272505e-05, 1.0980154911521822e-05, 3.497554280329496e-05, 5.897092341911048e-05, 8.2966304034926e-05, 0.00010696169920265675, 0.00013095707981847227, 0.0001549524604342878, 0.0001789478410501033, 0.00020294322166591883, 0.00022693861683364958, 0.00025093398289754987, 0.00027492939261719584, 0.00029892477323301136, 0.0003229201538488269, 0.0003469155344646424, 0.0003709109150804579, 0.00039490629569627345, 0.00041890167631208897, 0.00044289708603173494, 0.00046689243754372, 0.000490887847263366, 0.000514883198775351, 0.000538878608494997, 0.000562874018214643, 0.0005868693697266281, 0.000610864779446274, 0.0006348601309582591, 0.0006588555406779051, 0.0006828509503975511, 0.0007068463019095361, 0.0007308416534215212, 0.0007548370631411672, 0.0007788324146531522, 0.0008028278243727982, 0.0008268231758847833, 0.0008508185856044292, 0.0008748139953240752, 0.0008988093468360603, 0.0009228047565557063]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 7.0, 6.0, 11.0, 16.0, 14.0, 21.0, 18.0, 19.0, 31.0, 30.0, 25.0, 37.0, 43.0, 38.0, 51.0, 51.0, 52.0, 56.0, 34.0, 37.0, 46.0, 34.0, 37.0, 33.0, 29.0, 38.0, 27.0, 22.0, 18.0, 14.0, 11.0, 22.0, 12.0, 10.0, 8.0, 6.0, 7.0, 6.0, 5.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005236268043518066, -0.0005076481029391289, -0.0004916694015264511, -0.00047569070011377335, -0.0004597119987010956, -0.0004437332972884178, -0.00042775459587574005, -0.0004117758944630623, -0.0003957971930503845, -0.00037981849163770676, -0.000363839790225029, -0.0003478610888123512, -0.00033188238739967346, -0.0003159036859869957, -0.00029992498457431793, -0.00028394628316164017, -0.0002679675817489624, -0.00025198888033628464, -0.00023601017892360687, -0.0002200314775109291, -0.00020405277609825134, -0.00018807407468557358, -0.0001720953732728958, -0.00015611667186021805, -0.00014013797044754028, -0.00012415926903486252, -0.00010818056762218475, -9.220186620950699e-05, -7.622316479682922e-05, -6.024446338415146e-05, -4.4265761971473694e-05, -2.828706055879593e-05, -1.2308359146118164e-05, 3.670342266559601e-06, 1.9649043679237366e-05, 3.562774509191513e-05, 5.1606446504592896e-05, 6.758514791727066e-05, 8.356384932994843e-05, 9.954255074262619e-05, 0.00011552125215530396, 0.00013149995356798172, 0.00014747865498065948, 0.00016345735639333725, 0.00017943605780601501, 0.00019541475921869278, 0.00021139346063137054, 0.0002273721620440483, 0.00024335086345672607, 0.00025932956486940384, 0.0002753082662820816, 0.00029128696769475937, 0.00030726566910743713, 0.0003232443705201149, 0.00033922307193279266, 0.00035520177334547043, 0.0003711804747581482, 0.00038715917617082596, 0.0004031378775835037, 0.0004191165789961815, 0.00043509528040885925, 0.000451073981821537, 0.0004670526832342148, 0.00048303138464689255, 0.0004990100860595703]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 8.0, 3.0, 5.0, 7.0, 6.0, 14.0, 16.0, 20.0, 29.0, 22.0, 20.0, 27.0, 27.0, 31.0, 32.0, 50.0, 47.0, 60.0, 54.0, 44.0, 58.0, 57.0, 48.0, 44.0, 32.0, 44.0, 28.0, 22.0, 25.0, 28.0, 27.0, 22.0, 5.0, 12.0, 11.0, 6.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.3939208984375, -8.100341796875, -7.8067626953125, -7.51318359375, -7.2196044921875, -6.926025390625, -6.6324462890625, -6.3388671875, -6.0452880859375, -5.751708984375, -5.4581298828125, -5.16455078125, -4.8709716796875, -4.577392578125, -4.2838134765625, -3.990234375, -3.6966552734375, -3.403076171875, -3.1094970703125, -2.81591796875, -2.5223388671875, -2.228759765625, -1.9351806640625, -1.6416015625, -1.3480224609375, -1.054443359375, -0.7608642578125, -0.46728515625, -0.1737060546875, 0.119873046875, 0.4134521484375, 0.70703125, 1.0006103515625, 1.294189453125, 1.5877685546875, 1.88134765625, 2.1749267578125, 2.468505859375, 2.7620849609375, 3.0556640625, 3.3492431640625, 3.642822265625, 3.9364013671875, 4.22998046875, 4.5235595703125, 4.817138671875, 5.1107177734375, 5.404296875, 5.6978759765625, 5.991455078125, 6.2850341796875, 6.57861328125, 6.8721923828125, 7.165771484375, 7.4593505859375, 7.7529296875, 8.0465087890625, 8.340087890625, 8.6336669921875, 8.92724609375, 9.2208251953125, 9.514404296875, 9.8079833984375, 10.1015625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 13.0, 18.0, 25.0, 33.0, 42.0, 73.0, 79.0, 117.0, 165.0, 243.0, 424.0, 1008.0, 2547.0, 7585.0, 27367.0, 122531.0, 555519.0, 259004.0, 51191.0, 13405.0, 4027.0, 1498.0, 655.0, 290.0, 203.0, 147.0, 82.0, 60.0, 58.0, 32.0, 30.0, 22.0, 17.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.8865966796875, -10.507568359375, -10.1285400390625, -9.74951171875, -9.3704833984375, -8.991455078125, -8.6124267578125, -8.2333984375, -7.8543701171875, -7.475341796875, -7.0963134765625, -6.71728515625, -6.3382568359375, -5.959228515625, -5.5802001953125, -5.201171875, -4.8221435546875, -4.443115234375, -4.0640869140625, -3.68505859375, -3.3060302734375, -2.927001953125, -2.5479736328125, -2.1689453125, -1.7899169921875, -1.410888671875, -1.0318603515625, -0.65283203125, -0.2738037109375, 0.105224609375, 0.4842529296875, 0.86328125, 1.2423095703125, 1.621337890625, 2.0003662109375, 2.37939453125, 2.7584228515625, 3.137451171875, 3.5164794921875, 3.8955078125, 4.2745361328125, 4.653564453125, 5.0325927734375, 5.41162109375, 5.7906494140625, 6.169677734375, 6.5487060546875, 6.927734375, 7.3067626953125, 7.685791015625, 8.0648193359375, 8.44384765625, 8.8228759765625, 9.201904296875, 9.5809326171875, 9.9599609375, 10.3389892578125, 10.718017578125, 11.0970458984375, 11.47607421875, 11.8551025390625, 12.234130859375, 12.6131591796875, 12.9921875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 21.0, 24.0, 21.0, 27.0, 35.0, 34.0, 34.0, 30.0, 45.0, 56.0, 70.0, 118.0, 320.0, 1517.0, 179.0, 80.0, 60.0, 46.0, 34.0, 32.0, 39.0, 27.0, 26.0, 23.0, 21.0, 24.0, 13.0, 4.0, 3.0, 11.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.82275390625, -21.0986328125, -20.37451171875, -19.650390625, -18.92626953125, -18.2021484375, -17.47802734375, -16.75390625, -16.02978515625, -15.3056640625, -14.58154296875, -13.857421875, -13.13330078125, -12.4091796875, -11.68505859375, -10.9609375, -10.23681640625, -9.5126953125, -8.78857421875, -8.064453125, -7.34033203125, -6.6162109375, -5.89208984375, -5.16796875, -4.44384765625, -3.7197265625, -2.99560546875, -2.271484375, -1.54736328125, -0.8232421875, -0.09912109375, 0.625, 1.34912109375, 2.0732421875, 2.79736328125, 3.521484375, 4.24560546875, 4.9697265625, 5.69384765625, 6.41796875, 7.14208984375, 7.8662109375, 8.59033203125, 9.314453125, 10.03857421875, 10.7626953125, 11.48681640625, 12.2109375, 12.93505859375, 13.6591796875, 14.38330078125, 15.107421875, 15.83154296875, 16.5556640625, 17.27978515625, 18.00390625, 18.72802734375, 19.4521484375, 20.17626953125, 20.900390625, 21.62451171875, 22.3486328125, 23.07275390625, 23.796875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 4.0, 5.0, 8.0, 9.0, 7.0, 17.0, 15.0, 22.0, 29.0, 27.0, 52.0, 67.0, 71.0, 110.0, 143.0, 199.0, 265.0, 492.0, 1206.0, 7762.0, 164931.0, 2868800.0, 93425.0, 5500.0, 1007.0, 418.0, 278.0, 191.0, 155.0, 106.0, 70.0, 75.0, 56.0, 45.0, 29.0, 20.0, 15.0, 18.0, 5.0, 4.0, 12.0, 6.0, 5.0, 1.0, 4.0, 3.0, 6.0, 2.0, 2.0, 4.0], "bins": [-30.703125, -29.83642578125, -28.9697265625, -28.10302734375, -27.236328125, -26.36962890625, -25.5029296875, -24.63623046875, -23.76953125, -22.90283203125, -22.0361328125, -21.16943359375, -20.302734375, -19.43603515625, -18.5693359375, -17.70263671875, -16.8359375, -15.96923828125, -15.1025390625, -14.23583984375, -13.369140625, -12.50244140625, -11.6357421875, -10.76904296875, -9.90234375, -9.03564453125, -8.1689453125, -7.30224609375, -6.435546875, -5.56884765625, -4.7021484375, -3.83544921875, -2.96875, -2.10205078125, -1.2353515625, -0.36865234375, 0.498046875, 1.36474609375, 2.2314453125, 3.09814453125, 3.96484375, 4.83154296875, 5.6982421875, 6.56494140625, 7.431640625, 8.29833984375, 9.1650390625, 10.03173828125, 10.8984375, 11.76513671875, 12.6318359375, 13.49853515625, 14.365234375, 15.23193359375, 16.0986328125, 16.96533203125, 17.83203125, 18.69873046875, 19.5654296875, 20.43212890625, 21.298828125, 22.16552734375, 23.0322265625, 23.89892578125, 24.765625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 18.0, 116.0, 477.0, 342.0, 58.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.6524658203125, -114.457763671875, -111.2630615234375, -108.068359375, -104.8736572265625, -101.678955078125, -98.4842529296875, -95.28955078125, -92.0948486328125, -88.900146484375, -85.7054443359375, -82.5107421875, -79.3160400390625, -76.121337890625, -72.9266357421875, -69.73193359375, -66.53722381591797, -63.34252166748047, -60.14781951904297, -56.95311737060547, -53.75841522216797, -50.56371307373047, -47.3690071105957, -44.1743049621582, -40.9796028137207, -37.7849006652832, -34.5901985168457, -31.39549446105957, -28.20079231262207, -25.00609016418457, -21.811386108398438, -18.616683959960938, -15.421981811523438, -12.227279663085938, -9.032576560974121, -5.837873458862305, -2.6431713104248047, 0.5515308380126953, 3.746234893798828, 6.940937042236328, 10.135639190673828, 13.330341339111328, 16.525043487548828, 19.71974754333496, 22.91444969177246, 26.10915184020996, 29.303855895996094, 32.498558044433594, 35.693260192871094, 38.887962341308594, 42.082664489746094, 45.277366638183594, 48.472068786621094, 51.666770935058594, 54.86147689819336, 58.05617904663086, 61.25088119506836, 64.44558715820312, 67.64028930664062, 70.83499145507812, 74.02969360351562, 77.22439575195312, 80.41909790039062, 83.61380004882812, 86.80850219726562]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 4.0, 11.0, 11.0, 14.0, 12.0, 15.0, 15.0, 24.0, 26.0, 28.0, 28.0, 39.0, 36.0, 42.0, 39.0, 43.0, 44.0, 44.0, 36.0, 46.0, 42.0, 40.0, 38.0, 41.0, 41.0, 33.0, 31.0, 24.0, 25.0, 26.0, 22.0, 9.0, 11.0, 10.0, 7.0, 4.0, 10.0, 5.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.74542999267578, -47.202842712402344, -45.66025924682617, -44.117671966552734, -42.57508850097656, -41.032501220703125, -39.48991394042969, -37.947330474853516, -36.404747009277344, -34.862159729003906, -33.319576263427734, -31.776988983154297, -30.234405517578125, -28.691818237304688, -27.149232864379883, -25.606647491455078, -24.06406021118164, -22.521474838256836, -20.97888946533203, -19.436302185058594, -17.893718719482422, -16.351131439208984, -14.80854606628418, -13.265960693359375, -11.72337532043457, -10.180789947509766, -8.638204574584961, -7.09561824798584, -5.553032875061035, -4.0104475021362305, -2.4678611755371094, -0.9252758026123047, 0.6173057556152344, 2.159891366958618, 3.702476978302002, 5.245062828063965, 6.7876482009887695, 8.330233573913574, 9.872819900512695, 11.4154052734375, 12.957990646362305, 14.50057601928711, 16.043161392211914, 17.58574676513672, 19.128334045410156, 20.670917510986328, 22.213504791259766, 23.75609016418457, 25.298675537109375, 26.84126091003418, 28.383846282958984, 29.926433563232422, 31.469017028808594, 33.01160430908203, 34.55419158935547, 36.09677505493164, 37.63935852050781, 39.18194580078125, 40.72452926635742, 42.26711654663086, 43.80970001220703, 45.35228729248047, 46.894874572753906, 48.43745803833008, 49.980045318603516]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 14.0, 11.0, 14.0, 16.0, 17.0, 21.0, 20.0, 23.0, 26.0, 30.0, 22.0, 35.0, 39.0, 70.0, 50.0, 52.0, 65.0, 53.0, 49.0, 39.0, 43.0, 36.0, 40.0, 37.0, 29.0, 26.0, 30.0, 21.0, 10.0, 13.0, 10.0, 4.0, 16.0, 6.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.1497802734375, -7.854248046875, -7.5587158203125, -7.26318359375, -6.9676513671875, -6.672119140625, -6.3765869140625, -6.0810546875, -5.7855224609375, -5.489990234375, -5.1944580078125, -4.89892578125, -4.6033935546875, -4.307861328125, -4.0123291015625, -3.716796875, -3.4212646484375, -3.125732421875, -2.8302001953125, -2.53466796875, -2.2391357421875, -1.943603515625, -1.6480712890625, -1.3525390625, -1.0570068359375, -0.761474609375, -0.4659423828125, -0.17041015625, 0.1251220703125, 0.420654296875, 0.7161865234375, 1.01171875, 1.3072509765625, 1.602783203125, 1.8983154296875, 2.19384765625, 2.4893798828125, 2.784912109375, 3.0804443359375, 3.3759765625, 3.6715087890625, 3.967041015625, 4.2625732421875, 4.55810546875, 4.8536376953125, 5.149169921875, 5.4447021484375, 5.740234375, 6.0357666015625, 6.331298828125, 6.6268310546875, 6.92236328125, 7.2178955078125, 7.513427734375, 7.8089599609375, 8.1044921875, 8.4000244140625, 8.695556640625, 8.9910888671875, 9.28662109375, 9.5821533203125, 9.877685546875, 10.1732177734375, 10.46875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 0.0, 6.0, 2.0, 5.0, 8.0, 13.0, 12.0, 15.0, 18.0, 20.0, 29.0, 32.0, 28.0, 34.0, 42.0, 56.0, 107.0, 214.0, 661.0, 2807.0, 32717.0, 2202899.0, 1923576.0, 27224.0, 2501.0, 603.0, 210.0, 104.0, 56.0, 48.0, 35.0, 38.0, 24.0, 20.0, 15.0, 21.0, 10.0, 17.0, 15.0, 5.0, 6.0, 9.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53125, -28.577880859375, -27.62451171875, -26.671142578125, -25.7177734375, -24.764404296875, -23.81103515625, -22.857666015625, -21.904296875, -20.950927734375, -19.99755859375, -19.044189453125, -18.0908203125, -17.137451171875, -16.18408203125, -15.230712890625, -14.27734375, -13.323974609375, -12.37060546875, -11.417236328125, -10.4638671875, -9.510498046875, -8.55712890625, -7.603759765625, -6.650390625, -5.697021484375, -4.74365234375, -3.790283203125, -2.8369140625, -1.883544921875, -0.93017578125, 0.023193359375, 0.9765625, 1.929931640625, 2.88330078125, 3.836669921875, 4.7900390625, 5.743408203125, 6.69677734375, 7.650146484375, 8.603515625, 9.556884765625, 10.51025390625, 11.463623046875, 12.4169921875, 13.370361328125, 14.32373046875, 15.277099609375, 16.23046875, 17.183837890625, 18.13720703125, 19.090576171875, 20.0439453125, 20.997314453125, 21.95068359375, 22.904052734375, 23.857421875, 24.810791015625, 25.76416015625, 26.717529296875, 27.6708984375, 28.624267578125, 29.57763671875, 30.531005859375, 31.484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 5.0, 6.0, 18.0, 19.0, 21.0, 35.0, 42.0, 66.0, 102.0, 152.0, 232.0, 293.0, 467.0, 531.0, 547.0, 407.0, 320.0, 235.0, 151.0, 111.0, 71.0, 58.0, 39.0, 36.0, 24.0, 18.0, 13.0, 13.0, 10.0, 7.0, 1.0, 5.0, 4.0, 1.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.453125, -11.05908203125, -10.6650390625, -10.27099609375, -9.876953125, -9.48291015625, -9.0888671875, -8.69482421875, -8.30078125, -7.90673828125, -7.5126953125, -7.11865234375, -6.724609375, -6.33056640625, -5.9365234375, -5.54248046875, -5.1484375, -4.75439453125, -4.3603515625, -3.96630859375, -3.572265625, -3.17822265625, -2.7841796875, -2.39013671875, -1.99609375, -1.60205078125, -1.2080078125, -0.81396484375, -0.419921875, -0.02587890625, 0.3681640625, 0.76220703125, 1.15625, 1.55029296875, 1.9443359375, 2.33837890625, 2.732421875, 3.12646484375, 3.5205078125, 3.91455078125, 4.30859375, 4.70263671875, 5.0966796875, 5.49072265625, 5.884765625, 6.27880859375, 6.6728515625, 7.06689453125, 7.4609375, 7.85498046875, 8.2490234375, 8.64306640625, 9.037109375, 9.43115234375, 9.8251953125, 10.21923828125, 10.61328125, 11.00732421875, 11.4013671875, 11.79541015625, 12.189453125, 12.58349609375, 12.9775390625, 13.37158203125, 13.765625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 8.0, 8.0, 7.0, 13.0, 18.0, 25.0, 29.0, 37.0, 77.0, 95.0, 196.0, 376.0, 1090.0, 4855.0, 52550.0, 3339771.0, 770376.0, 20542.0, 2821.0, 758.0, 257.0, 141.0, 74.0, 39.0, 35.0, 20.0, 11.0, 9.0, 10.0, 3.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.66064453125, -35.5087890625, -34.35693359375, -33.205078125, -32.05322265625, -30.9013671875, -29.74951171875, -28.59765625, -27.44580078125, -26.2939453125, -25.14208984375, -23.990234375, -22.83837890625, -21.6865234375, -20.53466796875, -19.3828125, -18.23095703125, -17.0791015625, -15.92724609375, -14.775390625, -13.62353515625, -12.4716796875, -11.31982421875, -10.16796875, -9.01611328125, -7.8642578125, -6.71240234375, -5.560546875, -4.40869140625, -3.2568359375, -2.10498046875, -0.953125, 0.19873046875, 1.3505859375, 2.50244140625, 3.654296875, 4.80615234375, 5.9580078125, 7.10986328125, 8.26171875, 9.41357421875, 10.5654296875, 11.71728515625, 12.869140625, 14.02099609375, 15.1728515625, 16.32470703125, 17.4765625, 18.62841796875, 19.7802734375, 20.93212890625, 22.083984375, 23.23583984375, 24.3876953125, 25.53955078125, 26.69140625, 27.84326171875, 28.9951171875, 30.14697265625, 31.298828125, 32.45068359375, 33.6025390625, 34.75439453125, 35.90625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 51.0, 179.0, 349.0, 307.0, 89.0, 20.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.93477249145508, -55.85452651977539, -51.77428436279297, -47.69403839111328, -43.613792419433594, -39.533546447753906, -35.45330047607422, -31.373058319091797, -27.29281234741211, -23.212566375732422, -19.132322311401367, -15.052077293395996, -10.971832275390625, -6.8915863037109375, -2.811342239379883, 1.2689018249511719, 5.349147796630859, 9.42939281463623, 13.509637832641602, 17.589881896972656, 21.670127868652344, 25.75037384033203, 29.830617904663086, 33.91086196899414, 37.99110794067383, 42.071353912353516, 46.15159606933594, 50.231842041015625, 54.31208801269531, 58.392333984375, 62.47257995605469, 66.55282592773438, 70.63307189941406, 74.71331787109375, 78.79356384277344, 82.87380981445312, 86.95405578613281, 91.0343017578125, 95.11454010009766, 99.19478607177734, 103.27503204345703, 107.35527801513672, 111.4355239868164, 115.5157699584961, 119.59600830078125, 123.67625427246094, 127.75650024414062, 131.8367462158203, 135.9169921875, 139.9972381591797, 144.07748413085938, 148.15773010253906, 152.23797607421875, 156.31822204589844, 160.39846801757812, 164.47869873046875, 168.5589599609375, 172.6392059326172, 176.71945190429688, 180.79969787597656, 184.87994384765625, 188.96018981933594, 193.04043579101562, 197.12066650390625, 201.20091247558594]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 2.0, 9.0, 6.0, 6.0, 8.0, 11.0, 14.0, 17.0, 18.0, 22.0, 21.0, 23.0, 28.0, 29.0, 33.0, 37.0, 32.0, 44.0, 34.0, 49.0, 43.0, 31.0, 34.0, 43.0, 50.0, 37.0, 33.0, 25.0, 35.0, 28.0, 27.0, 22.0, 24.0, 27.0, 7.0, 13.0, 12.0, 10.0, 5.0, 8.0, 7.0, 1.0, 5.0, 9.0, 1.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.311622619628906, -37.13053512573242, -35.94944381713867, -34.76835632324219, -33.58726501464844, -32.40617752075195, -31.225086212158203, -30.04399871826172, -28.86290740966797, -27.68181800842285, -26.500728607177734, -25.319639205932617, -24.1385498046875, -22.957460403442383, -21.776371002197266, -20.59528350830078, -19.414194107055664, -18.233104705810547, -17.05201530456543, -15.870925903320312, -14.689836502075195, -13.508747100830078, -12.327658653259277, -11.14656925201416, -9.965479850769043, -8.784390449523926, -7.603301048278809, -6.42221212387085, -5.241122722625732, -4.060033321380615, -2.8789443969726562, -1.697854995727539, -0.5167655944824219, 0.6643236875534058, 1.8454129695892334, 3.0265021324157715, 4.207591533660889, 5.388680934906006, 6.569769859313965, 7.750859260559082, 8.9319486618042, 10.113038063049316, 11.294127464294434, 12.475215911865234, 13.656305313110352, 14.837394714355469, 16.018484115600586, 17.199573516845703, 18.38066291809082, 19.561752319335938, 20.742841720581055, 21.923931121826172, 23.10502052307129, 24.286109924316406, 25.46719741821289, 26.64828872680664, 27.829376220703125, 29.010465621948242, 30.19155502319336, 31.372644424438477, 32.553733825683594, 33.73482131958008, 34.91591262817383, 36.09700012207031, 37.27809143066406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 7.0, 8.0, 9.0, 13.0, 16.0, 24.0, 21.0, 16.0, 30.0, 38.0, 42.0, 36.0, 44.0, 32.0, 38.0, 53.0, 31.0, 48.0, 49.0, 49.0, 48.0, 44.0, 35.0, 36.0, 37.0, 34.0, 40.0, 18.0, 12.0, 12.0, 13.0, 12.0, 8.0, 15.0, 9.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.35333251953125, -7.0621337890625, -6.77093505859375, -6.479736328125, -6.18853759765625, -5.8973388671875, -5.60614013671875, -5.31494140625, -5.02374267578125, -4.7325439453125, -4.44134521484375, -4.150146484375, -3.85894775390625, -3.5677490234375, -3.27655029296875, -2.9853515625, -2.69415283203125, -2.4029541015625, -2.11175537109375, -1.820556640625, -1.52935791015625, -1.2381591796875, -0.94696044921875, -0.65576171875, -0.36456298828125, -0.0733642578125, 0.21783447265625, 0.509033203125, 0.80023193359375, 1.0914306640625, 1.38262939453125, 1.673828125, 1.96502685546875, 2.2562255859375, 2.54742431640625, 2.838623046875, 3.12982177734375, 3.4210205078125, 3.71221923828125, 4.00341796875, 4.29461669921875, 4.5858154296875, 4.87701416015625, 5.168212890625, 5.45941162109375, 5.7506103515625, 6.04180908203125, 6.3330078125, 6.62420654296875, 6.9154052734375, 7.20660400390625, 7.497802734375, 7.78900146484375, 8.0802001953125, 8.37139892578125, 8.66259765625, 8.95379638671875, 9.2449951171875, 9.53619384765625, 9.827392578125, 10.11859130859375, 10.4097900390625, 10.70098876953125, 10.9921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 11.0, 6.0, 17.0, 28.0, 45.0, 47.0, 83.0, 158.0, 211.0, 357.0, 589.0, 1005.0, 1561.0, 2881.0, 4743.0, 8181.0, 14104.0, 25738.0, 47520.0, 92112.0, 224265.0, 362467.0, 125298.0, 61543.0, 32884.0, 17940.0, 10300.0, 5774.0, 3536.0, 2022.0, 1255.0, 695.0, 450.0, 285.0, 153.0, 117.0, 59.0, 47.0, 14.0, 22.0, 14.0, 8.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.0682373046875, -1.999755859375, -1.9312744140625, -1.86279296875, -1.7943115234375, -1.725830078125, -1.6573486328125, -1.5888671875, -1.5203857421875, -1.451904296875, -1.3834228515625, -1.31494140625, -1.2464599609375, -1.177978515625, -1.1094970703125, -1.041015625, -0.9725341796875, -0.904052734375, -0.8355712890625, -0.76708984375, -0.6986083984375, -0.630126953125, -0.5616455078125, -0.4931640625, -0.4246826171875, -0.356201171875, -0.2877197265625, -0.21923828125, -0.1507568359375, -0.082275390625, -0.0137939453125, 0.0546875, 0.1231689453125, 0.191650390625, 0.2601318359375, 0.32861328125, 0.3970947265625, 0.465576171875, 0.5340576171875, 0.6025390625, 0.6710205078125, 0.739501953125, 0.8079833984375, 0.87646484375, 0.9449462890625, 1.013427734375, 1.0819091796875, 1.150390625, 1.2188720703125, 1.287353515625, 1.3558349609375, 1.42431640625, 1.4927978515625, 1.561279296875, 1.6297607421875, 1.6982421875, 1.7667236328125, 1.835205078125, 1.9036865234375, 1.97216796875, 2.0406494140625, 2.109130859375, 2.1776123046875, 2.24609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 10.0, 15.0, 12.0, 11.0, 12.0, 18.0, 16.0, 21.0, 17.0, 31.0, 24.0, 34.0, 30.0, 30.0, 32.0, 25.0, 34.0, 44.0, 46.0, 35.0, 1051.0, 35.0, 37.0, 32.0, 29.0, 44.0, 31.0, 20.0, 24.0, 31.0, 24.0, 13.0, 22.0, 10.0, 19.0, 14.0, 16.0, 16.0, 9.0, 10.0, 5.0, 7.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-4.984375, -4.8299560546875, -4.675537109375, -4.5211181640625, -4.36669921875, -4.2122802734375, -4.057861328125, -3.9034423828125, -3.7490234375, -3.5946044921875, -3.440185546875, -3.2857666015625, -3.13134765625, -2.9769287109375, -2.822509765625, -2.6680908203125, -2.513671875, -2.3592529296875, -2.204833984375, -2.0504150390625, -1.89599609375, -1.7415771484375, -1.587158203125, -1.4327392578125, -1.2783203125, -1.1239013671875, -0.969482421875, -0.8150634765625, -0.66064453125, -0.5062255859375, -0.351806640625, -0.1973876953125, -0.04296875, 0.1114501953125, 0.265869140625, 0.4202880859375, 0.57470703125, 0.7291259765625, 0.883544921875, 1.0379638671875, 1.1923828125, 1.3468017578125, 1.501220703125, 1.6556396484375, 1.81005859375, 1.9644775390625, 2.118896484375, 2.2733154296875, 2.427734375, 2.5821533203125, 2.736572265625, 2.8909912109375, 3.04541015625, 3.1998291015625, 3.354248046875, 3.5086669921875, 3.6630859375, 3.8175048828125, 3.971923828125, 4.1263427734375, 4.28076171875, 4.4351806640625, 4.589599609375, 4.7440185546875, 4.8984375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 8.0, 8.0, 21.0, 23.0, 27.0, 36.0, 45.0, 84.0, 104.0, 178.0, 258.0, 363.0, 549.0, 848.0, 1224.0, 1936.0, 2996.0, 4570.0, 7153.0, 10808.0, 16783.0, 26469.0, 42157.0, 71442.0, 143986.0, 1400293.0, 162738.0, 78154.0, 45311.0, 27698.0, 17650.0, 11482.0, 7590.0, 4812.0, 3165.0, 2085.0, 1396.0, 869.0, 592.0, 393.0, 289.0, 187.0, 106.0, 73.0, 50.0, 50.0, 18.0, 23.0, 15.0, 12.0, 6.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.7138671875, -1.659576416015625, -1.60528564453125, -1.550994873046875, -1.4967041015625, -1.442413330078125, -1.38812255859375, -1.333831787109375, -1.279541015625, -1.225250244140625, -1.17095947265625, -1.116668701171875, -1.0623779296875, -1.008087158203125, -0.95379638671875, -0.899505615234375, -0.84521484375, -0.790924072265625, -0.73663330078125, -0.682342529296875, -0.6280517578125, -0.573760986328125, -0.51947021484375, -0.465179443359375, -0.410888671875, -0.356597900390625, -0.30230712890625, -0.248016357421875, -0.1937255859375, -0.139434814453125, -0.08514404296875, -0.030853271484375, 0.0234375, 0.077728271484375, 0.13201904296875, 0.186309814453125, 0.2406005859375, 0.294891357421875, 0.34918212890625, 0.403472900390625, 0.457763671875, 0.512054443359375, 0.56634521484375, 0.620635986328125, 0.6749267578125, 0.729217529296875, 0.78350830078125, 0.837799072265625, 0.89208984375, 0.946380615234375, 1.00067138671875, 1.054962158203125, 1.1092529296875, 1.163543701171875, 1.21783447265625, 1.272125244140625, 1.326416015625, 1.380706787109375, 1.43499755859375, 1.489288330078125, 1.5435791015625, 1.597869873046875, 1.65216064453125, 1.706451416015625, 1.7607421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 4.0, 9.0, 11.0, 7.0, 13.0, 19.0, 30.0, 26.0, 28.0, 37.0, 24.0, 52.0, 51.0, 56.0, 70.0, 69.0, 50.0, 74.0, 49.0, 49.0, 44.0, 40.0, 26.0, 22.0, 27.0, 17.0, 10.0, 12.0, 7.0, 9.0, 6.0, 5.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001087188720703125, -0.001052752137184143, -0.0010183155536651611, -0.0009838789701461792, -0.0009494423866271973, -0.0009150058031082153, -0.0008805692195892334, -0.0008461326360702515, -0.0008116960525512695, -0.0007772594690322876, -0.0007428228855133057, -0.0007083863019943237, -0.0006739497184753418, -0.0006395131349563599, -0.0006050765514373779, -0.000570639967918396, -0.0005362033843994141, -0.0005017668008804321, -0.0004673302173614502, -0.00043289363384246826, -0.00039845705032348633, -0.0003640204668045044, -0.00032958388328552246, -0.00029514729976654053, -0.0002607107162475586, -0.00022627413272857666, -0.00019183754920959473, -0.0001574009656906128, -0.00012296438217163086, -8.852779865264893e-05, -5.409121513366699e-05, -1.965463161468506e-05, 1.4781951904296875e-05, 4.921853542327881e-05, 8.365511894226074e-05, 0.00011809170246124268, 0.0001525282859802246, 0.00018696486949920654, 0.00022140145301818848, 0.0002558380365371704, 0.00029027462005615234, 0.0003247112035751343, 0.0003591477870941162, 0.00039358437061309814, 0.0004280209541320801, 0.000462457537651062, 0.0004968941211700439, 0.0005313307046890259, 0.0005657672882080078, 0.0006002038717269897, 0.0006346404552459717, 0.0006690770387649536, 0.0007035136222839355, 0.0007379502058029175, 0.0007723867893218994, 0.0008068233728408813, 0.0008412599563598633, 0.0008756965398788452, 0.0009101331233978271, 0.0009445697069168091, 0.000979006290435791, 0.001013442873954773, 0.0010478794574737549, 0.0010823160409927368, 0.0011167526245117188]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 9.0, 12.0, 17.0, 19.0, 23.0, 21.0, 43.0, 48.0, 55.0, 92.0, 121.0, 177.0, 276.0, 485.0, 1205.0, 242347.0, 800370.0, 1617.0, 555.0, 293.0, 200.0, 132.0, 75.0, 72.0, 51.0, 36.0, 29.0, 30.0, 22.0, 20.0, 13.0, 16.0, 11.0, 7.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0224151611328125, -0.02171635627746582, -0.02101755142211914, -0.02031874656677246, -0.01961994171142578, -0.0189211368560791, -0.018222332000732422, -0.017523527145385742, -0.016824722290039062, -0.016125917434692383, -0.015427112579345703, -0.014728307723999023, -0.014029502868652344, -0.013330698013305664, -0.012631893157958984, -0.011933088302612305, -0.011234283447265625, -0.010535478591918945, -0.009836673736572266, -0.009137868881225586, -0.008439064025878906, -0.0077402591705322266, -0.007041454315185547, -0.006342649459838867, -0.0056438446044921875, -0.004945039749145508, -0.004246234893798828, -0.0035474300384521484, -0.0028486251831054688, -0.002149820327758789, -0.0014510154724121094, -0.0007522106170654297, -5.340576171875e-05, 0.0006453990936279297, 0.0013442039489746094, 0.002043008804321289, 0.0027418136596679688, 0.0034406185150146484, 0.004139423370361328, 0.004838228225708008, 0.0055370330810546875, 0.006235837936401367, 0.006934642791748047, 0.0076334476470947266, 0.008332252502441406, 0.009031057357788086, 0.009729862213134766, 0.010428667068481445, 0.011127471923828125, 0.011826276779174805, 0.012525081634521484, 0.013223886489868164, 0.013922691345214844, 0.014621496200561523, 0.015320301055908203, 0.016019105911254883, 0.016717910766601562, 0.017416715621948242, 0.018115520477294922, 0.0188143253326416, 0.01951313018798828, 0.02021193504333496, 0.02091073989868164, 0.02160954475402832, 0.022308349609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 11.0, 347.0, 625.0, 31.0, 3.0, 0.0, 1.0], "bins": [-0.008169516921043396, -0.008031362667679787, -0.007893209345638752, -0.007755055092275143, -0.007616900838911533, -0.007478747051209211, -0.007340593263506889, -0.00720243901014328, -0.007064285222440958, -0.006926131434738636, -0.006787977181375027, -0.006649823393672705, -0.006511669140309095, -0.006373515352606773, -0.006235361099243164, -0.006097207311540842, -0.00595905352383852, -0.005820899736136198, -0.005682745482772589, -0.005544591695070267, -0.005406437441706657, -0.005268283654004335, -0.005130129866302013, -0.004991975612938404, -0.004853821359574795, -0.004715667571872473, -0.0045775133185088634, -0.0044393595308065414, -0.004301205277442932, -0.00416305148974061, -0.004024897702038288, -0.003886743448674679, -0.003748589660972357, -0.003610435640439391, -0.0034722816199064255, -0.0033341278322041035, -0.003195973811671138, -0.003057819791138172, -0.0029196657706052065, -0.002781511750072241, -0.002643357962369919, -0.002505203941836953, -0.0023670499213039875, -0.0022288961336016655, -0.0020907421130687, -0.0019525880925357342, -0.0018144340720027685, -0.0016762800514698029, -0.0015381260309368372, -0.0013999720104038715, -0.0012618181062862277, -0.001123664085753262, -0.0009855101816356182, -0.0008473561611026525, -0.0007092021405696869, -0.0005710481782443821, -0.0004328942741267383, -0.00029474031180143356, -0.00015658632037229836, -1.8432328943163157e-05, 0.00011972163338214159, 0.00025787559570744634, 0.000396029616240412, 0.0005341835785657167, 0.0006723375408910215]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 8.0, 7.0, 10.0, 13.0, 8.0, 16.0, 22.0, 27.0, 29.0, 29.0, 36.0, 25.0, 25.0, 42.0, 29.0, 40.0, 41.0, 29.0, 41.0, 32.0, 41.0, 36.0, 36.0, 33.0, 39.0, 39.0, 26.0, 25.0, 22.0, 18.0, 28.0, 29.0, 14.0, 19.0, 10.0, 22.0, 10.0, 7.0, 11.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005451440811157227, -0.0005279043689370155, -0.0005106646567583084, -0.0004934249445796013, -0.00047618523240089417, -0.00045894552022218704, -0.0004417058080434799, -0.0004244660958647728, -0.0004072263836860657, -0.00038998667150735855, -0.00037274695932865143, -0.0003555072471499443, -0.0003382675349712372, -0.00032102782279253006, -0.00030378811061382294, -0.0002865483984351158, -0.0002693086862564087, -0.00025206897407770157, -0.00023482926189899445, -0.00021758954972028732, -0.0002003498375415802, -0.00018311012536287308, -0.00016587041318416595, -0.00014863070100545883, -0.0001313909888267517, -0.00011415127664804459, -9.691156446933746e-05, -7.967185229063034e-05, -6.243214011192322e-05, -4.5192427933216095e-05, -2.7952715754508972e-05, -1.071300357580185e-05, 6.5267086029052734e-06, 2.3766420781612396e-05, 4.100613296031952e-05, 5.824584513902664e-05, 7.548555731773376e-05, 9.272526949644089e-05, 0.00010996498167514801, 0.00012720469385385513, 0.00014444440603256226, 0.00016168411821126938, 0.0001789238303899765, 0.00019616354256868362, 0.00021340325474739075, 0.00023064296692609787, 0.000247882679104805, 0.0002651223912835121, 0.00028236210346221924, 0.00029960181564092636, 0.0003168415278196335, 0.0003340812399983406, 0.00035132095217704773, 0.00036856066435575485, 0.000385800376534462, 0.0004030400887131691, 0.0004202798008918762, 0.00043751951307058334, 0.00045475922524929047, 0.0004719989374279976, 0.0004892386496067047, 0.0005064783617854118, 0.000523718073964119, 0.0005409577861428261, 0.0005581974983215332]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 7.0, 8.0, 9.0, 13.0, 16.0, 24.0, 21.0, 16.0, 30.0, 38.0, 42.0, 36.0, 44.0, 32.0, 38.0, 53.0, 31.0, 48.0, 49.0, 49.0, 48.0, 44.0, 35.0, 36.0, 37.0, 34.0, 40.0, 18.0, 12.0, 12.0, 13.0, 12.0, 8.0, 15.0, 9.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.35333251953125, -7.0621337890625, -6.77093505859375, -6.479736328125, -6.18853759765625, -5.8973388671875, -5.60614013671875, -5.31494140625, -5.02374267578125, -4.7325439453125, -4.44134521484375, -4.150146484375, -3.85894775390625, -3.5677490234375, -3.27655029296875, -2.9853515625, -2.69415283203125, -2.4029541015625, -2.11175537109375, -1.820556640625, -1.52935791015625, -1.2381591796875, -0.94696044921875, -0.65576171875, -0.36456298828125, -0.0733642578125, 0.21783447265625, 0.509033203125, 0.80023193359375, 1.0914306640625, 1.38262939453125, 1.673828125, 1.96502685546875, 2.2562255859375, 2.54742431640625, 2.838623046875, 3.12982177734375, 3.4210205078125, 3.71221923828125, 4.00341796875, 4.29461669921875, 4.5858154296875, 4.87701416015625, 5.168212890625, 5.45941162109375, 5.7506103515625, 6.04180908203125, 6.3330078125, 6.62420654296875, 6.9154052734375, 7.20660400390625, 7.497802734375, 7.78900146484375, 8.0802001953125, 8.37139892578125, 8.66259765625, 8.95379638671875, 9.2449951171875, 9.53619384765625, 9.827392578125, 10.11859130859375, 10.4097900390625, 10.70098876953125, 10.9921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 15.0, 17.0, 29.0, 35.0, 53.0, 70.0, 82.0, 114.0, 201.0, 260.0, 401.0, 599.0, 1089.0, 2020.0, 4496.0, 13788.0, 56619.0, 263600.0, 498478.0, 156471.0, 33581.0, 8994.0, 3354.0, 1576.0, 914.0, 526.0, 338.0, 249.0, 166.0, 121.0, 88.0, 60.0, 48.0, 22.0, 17.0, 14.0, 10.0, 9.0, 10.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9296875, -11.5821533203125, -11.234619140625, -10.8870849609375, -10.53955078125, -10.1920166015625, -9.844482421875, -9.4969482421875, -9.1494140625, -8.8018798828125, -8.454345703125, -8.1068115234375, -7.75927734375, -7.4117431640625, -7.064208984375, -6.7166748046875, -6.369140625, -6.0216064453125, -5.674072265625, -5.3265380859375, -4.97900390625, -4.6314697265625, -4.283935546875, -3.9364013671875, -3.5888671875, -3.2413330078125, -2.893798828125, -2.5462646484375, -2.19873046875, -1.8511962890625, -1.503662109375, -1.1561279296875, -0.80859375, -0.4610595703125, -0.113525390625, 0.2340087890625, 0.58154296875, 0.9290771484375, 1.276611328125, 1.6241455078125, 1.9716796875, 2.3192138671875, 2.666748046875, 3.0142822265625, 3.36181640625, 3.7093505859375, 4.056884765625, 4.4044189453125, 4.751953125, 5.0994873046875, 5.447021484375, 5.7945556640625, 6.14208984375, 6.4896240234375, 6.837158203125, 7.1846923828125, 7.5322265625, 7.8797607421875, 8.227294921875, 8.5748291015625, 8.92236328125, 9.2698974609375, 9.617431640625, 9.9649658203125, 10.3125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 10.0, 13.0, 21.0, 14.0, 31.0, 29.0, 40.0, 44.0, 42.0, 52.0, 71.0, 101.0, 131.0, 322.0, 1452.0, 169.0, 80.0, 78.0, 48.0, 56.0, 41.0, 27.0, 24.0, 24.0, 28.0, 16.0, 11.0, 9.0, 17.0, 11.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.125, -24.342041015625, -23.55908203125, -22.776123046875, -21.9931640625, -21.210205078125, -20.42724609375, -19.644287109375, -18.861328125, -18.078369140625, -17.29541015625, -16.512451171875, -15.7294921875, -14.946533203125, -14.16357421875, -13.380615234375, -12.59765625, -11.814697265625, -11.03173828125, -10.248779296875, -9.4658203125, -8.682861328125, -7.89990234375, -7.116943359375, -6.333984375, -5.551025390625, -4.76806640625, -3.985107421875, -3.2021484375, -2.419189453125, -1.63623046875, -0.853271484375, -0.0703125, 0.712646484375, 1.49560546875, 2.278564453125, 3.0615234375, 3.844482421875, 4.62744140625, 5.410400390625, 6.193359375, 6.976318359375, 7.75927734375, 8.542236328125, 9.3251953125, 10.108154296875, 10.89111328125, 11.674072265625, 12.45703125, 13.239990234375, 14.02294921875, 14.805908203125, 15.5888671875, 16.371826171875, 17.15478515625, 17.937744140625, 18.720703125, 19.503662109375, 20.28662109375, 21.069580078125, 21.8525390625, 22.635498046875, 23.41845703125, 24.201416015625, 24.984375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 6.0, 15.0, 15.0, 22.0, 32.0, 36.0, 48.0, 61.0, 107.0, 159.0, 233.0, 436.0, 850.0, 3712.0, 231686.0, 2893689.0, 11734.0, 1389.0, 564.0, 283.0, 190.0, 147.0, 81.0, 48.0, 44.0, 31.0, 23.0, 20.0, 11.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.5625, -48.06982421875, -46.5771484375, -45.08447265625, -43.591796875, -42.09912109375, -40.6064453125, -39.11376953125, -37.62109375, -36.12841796875, -34.6357421875, -33.14306640625, -31.650390625, -30.15771484375, -28.6650390625, -27.17236328125, -25.6796875, -24.18701171875, -22.6943359375, -21.20166015625, -19.708984375, -18.21630859375, -16.7236328125, -15.23095703125, -13.73828125, -12.24560546875, -10.7529296875, -9.26025390625, -7.767578125, -6.27490234375, -4.7822265625, -3.28955078125, -1.796875, -0.30419921875, 1.1884765625, 2.68115234375, 4.173828125, 5.66650390625, 7.1591796875, 8.65185546875, 10.14453125, 11.63720703125, 13.1298828125, 14.62255859375, 16.115234375, 17.60791015625, 19.1005859375, 20.59326171875, 22.0859375, 23.57861328125, 25.0712890625, 26.56396484375, 28.056640625, 29.54931640625, 31.0419921875, 32.53466796875, 34.02734375, 35.52001953125, 37.0126953125, 38.50537109375, 39.998046875, 41.49072265625, 42.9833984375, 44.47607421875, 45.96875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 390.0, 596.0, 23.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-224.96949768066406, -218.3721466064453, -211.77479553222656, -205.1774444580078, -198.58009338378906, -191.9827423095703, -185.38540649414062, -178.78805541992188, -172.19070434570312, -165.59335327148438, -158.99600219726562, -152.39865112304688, -145.80130004882812, -139.20394897460938, -132.60659790039062, -126.0092544555664, -119.41189575195312, -112.81454467773438, -106.21719360351562, -99.61984252929688, -93.02249145507812, -86.42514038085938, -79.82779693603516, -73.2304458618164, -66.63309478759766, -60.035743713378906, -53.438392639160156, -46.84104537963867, -40.24369430541992, -33.64634323120117, -27.048995971679688, -20.451644897460938, -13.854293823242188, -7.256943702697754, -0.6595935821533203, 5.937755584716797, 12.535106658935547, 19.132457733154297, 25.72980499267578, 32.32715606689453, 38.92450714111328, 45.52185821533203, 52.11920928955078, 58.716556549072266, 65.31390380859375, 71.9112548828125, 78.50860595703125, 85.10595703125, 91.70330810546875, 98.3006591796875, 104.89801025390625, 111.495361328125, 118.09271240234375, 124.6900634765625, 131.28741455078125, 137.884765625, 144.48211669921875, 151.0794677734375, 157.67681884765625, 164.274169921875, 170.87152099609375, 177.4688720703125, 184.06622314453125, 190.66357421875, 197.2609100341797]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 8.0, 13.0, 11.0, 14.0, 10.0, 12.0, 11.0, 18.0, 26.0, 23.0, 30.0, 30.0, 38.0, 30.0, 33.0, 39.0, 32.0, 35.0, 49.0, 35.0, 40.0, 47.0, 47.0, 49.0, 39.0, 39.0, 31.0, 30.0, 32.0, 15.0, 24.0, 17.0, 14.0, 11.0, 15.0, 12.0, 4.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-45.344757080078125, -43.911895751953125, -42.47903823852539, -41.04617691040039, -39.613319396972656, -38.180458068847656, -36.747596740722656, -35.314735412597656, -33.88187789916992, -32.44901657104492, -31.016159057617188, -29.583297729492188, -28.15043830871582, -26.717578887939453, -25.284717559814453, -23.851858139038086, -22.41899871826172, -20.98613929748535, -19.553279876708984, -18.120418548583984, -16.687559127807617, -15.25469970703125, -13.821839332580566, -12.388978958129883, -10.956119537353516, -9.523260116577148, -8.090399742126465, -6.6575398445129395, -5.224679946899414, -3.7918200492858887, -2.3589601516723633, -0.9260997772216797, 0.5067558288574219, 1.9396157264709473, 3.3724756240844727, 4.805335521697998, 6.238195419311523, 7.671055316925049, 9.103915214538574, 10.536775588989258, 11.969635009765625, 13.402494430541992, 14.835354804992676, 16.26821517944336, 17.701074600219727, 19.133934020996094, 20.566795349121094, 21.99965476989746, 23.432514190673828, 24.865373611450195, 26.298233032226562, 27.731094360351562, 29.16395378112793, 30.596813201904297, 32.0296745300293, 33.46253204345703, 34.89539337158203, 36.32825469970703, 37.761112213134766, 39.193973541259766, 40.6268310546875, 42.0596923828125, 43.4925537109375, 44.9254150390625, 46.358272552490234]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 5.0, 10.0, 15.0, 18.0, 11.0, 22.0, 19.0, 17.0, 32.0, 32.0, 39.0, 33.0, 38.0, 42.0, 40.0, 49.0, 44.0, 44.0, 58.0, 40.0, 44.0, 39.0, 38.0, 40.0, 33.0, 35.0, 30.0, 15.0, 24.0, 13.0, 10.0, 15.0, 9.0, 7.0, 9.0, 2.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.39453125, -7.10137939453125, -6.8082275390625, -6.51507568359375, -6.221923828125, -5.92877197265625, -5.6356201171875, -5.34246826171875, -5.04931640625, -4.75616455078125, -4.4630126953125, -4.16986083984375, -3.876708984375, -3.58355712890625, -3.2904052734375, -2.99725341796875, -2.7041015625, -2.41094970703125, -2.1177978515625, -1.82464599609375, -1.531494140625, -1.23834228515625, -0.9451904296875, -0.65203857421875, -0.35888671875, -0.06573486328125, 0.2274169921875, 0.52056884765625, 0.813720703125, 1.10687255859375, 1.4000244140625, 1.69317626953125, 1.986328125, 2.27947998046875, 2.5726318359375, 2.86578369140625, 3.158935546875, 3.45208740234375, 3.7452392578125, 4.03839111328125, 4.33154296875, 4.62469482421875, 4.9178466796875, 5.21099853515625, 5.504150390625, 5.79730224609375, 6.0904541015625, 6.38360595703125, 6.6767578125, 6.96990966796875, 7.2630615234375, 7.55621337890625, 7.849365234375, 8.14251708984375, 8.4356689453125, 8.72882080078125, 9.02197265625, 9.31512451171875, 9.6082763671875, 9.90142822265625, 10.194580078125, 10.48773193359375, 10.7808837890625, 11.07403564453125, 11.3671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 0.0, 5.0, 3.0, 5.0, 11.0, 12.0, 20.0, 19.0, 21.0, 22.0, 44.0, 44.0, 69.0, 63.0, 99.0, 119.0, 186.0, 242.0, 339.0, 360.0, 590.0, 340963.0, 3848649.0, 644.0, 393.0, 304.0, 256.0, 197.0, 137.0, 104.0, 73.0, 64.0, 43.0, 34.0, 32.0, 18.0, 25.0, 13.0, 13.0, 12.0, 6.0, 9.0, 7.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-248.625, -240.619140625, -232.61328125, -224.607421875, -216.6015625, -208.595703125, -200.58984375, -192.583984375, -184.578125, -176.572265625, -168.56640625, -160.560546875, -152.5546875, -144.548828125, -136.54296875, -128.537109375, -120.53125, -112.525390625, -104.51953125, -96.513671875, -88.5078125, -80.501953125, -72.49609375, -64.490234375, -56.484375, -48.478515625, -40.47265625, -32.466796875, -24.4609375, -16.455078125, -8.44921875, -0.443359375, 7.5625, 15.568359375, 23.57421875, 31.580078125, 39.5859375, 47.591796875, 55.59765625, 63.603515625, 71.609375, 79.615234375, 87.62109375, 95.626953125, 103.6328125, 111.638671875, 119.64453125, 127.650390625, 135.65625, 143.662109375, 151.66796875, 159.673828125, 167.6796875, 175.685546875, 183.69140625, 191.697265625, 199.703125, 207.708984375, 215.71484375, 223.720703125, 231.7265625, 239.732421875, 247.73828125, 255.744140625, 263.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 12.0, 17.0, 23.0, 37.0, 50.0, 76.0, 91.0, 168.0, 261.0, 483.0, 744.0, 771.0, 529.0, 273.0, 164.0, 117.0, 84.0, 53.0, 35.0, 20.0, 18.0, 13.0, 10.0, 5.0, 7.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.009765625, -16.42578125, -15.841796875, -15.2578125, -14.673828125, -14.08984375, -13.505859375, -12.921875, -12.337890625, -11.75390625, -11.169921875, -10.5859375, -10.001953125, -9.41796875, -8.833984375, -8.25, -7.666015625, -7.08203125, -6.498046875, -5.9140625, -5.330078125, -4.74609375, -4.162109375, -3.578125, -2.994140625, -2.41015625, -1.826171875, -1.2421875, -0.658203125, -0.07421875, 0.509765625, 1.09375, 1.677734375, 2.26171875, 2.845703125, 3.4296875, 4.013671875, 4.59765625, 5.181640625, 5.765625, 6.349609375, 6.93359375, 7.517578125, 8.1015625, 8.685546875, 9.26953125, 9.853515625, 10.4375, 11.021484375, 11.60546875, 12.189453125, 12.7734375, 13.357421875, 13.94140625, 14.525390625, 15.109375, 15.693359375, 16.27734375, 16.861328125, 17.4453125, 18.029296875, 18.61328125, 19.197265625, 19.78125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 12.0, 10.0, 12.0, 15.0, 21.0, 24.0, 25.0, 35.0, 38.0, 48.0, 56.0, 81.0, 120.0, 392.0, 40930.0, 4150447.0, 1355.0, 213.0, 79.0, 69.0, 64.0, 42.0, 34.0, 24.0, 24.0, 23.0, 17.0, 9.0, 8.0, 4.0, 5.0, 6.0, 3.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-165.375, -160.8125, -156.25, -151.6875, -147.125, -142.5625, -138.0, -133.4375, -128.875, -124.3125, -119.75, -115.1875, -110.625, -106.0625, -101.5, -96.9375, -92.375, -87.8125, -83.25, -78.6875, -74.125, -69.5625, -65.0, -60.4375, -55.875, -51.3125, -46.75, -42.1875, -37.625, -33.0625, -28.5, -23.9375, -19.375, -14.8125, -10.25, -5.6875, -1.125, 3.4375, 8.0, 12.5625, 17.125, 21.6875, 26.25, 30.8125, 35.375, 39.9375, 44.5, 49.0625, 53.625, 58.1875, 62.75, 67.3125, 71.875, 76.4375, 81.0, 85.5625, 90.125, 94.6875, 99.25, 103.8125, 108.375, 112.9375, 117.5, 122.0625, 126.625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 79.0, 567.0, 340.0, 23.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.81360626220703, -108.9644775390625, -101.11534881591797, -93.26622009277344, -85.41709899902344, -77.5679702758789, -69.71884155273438, -61.86971664428711, -54.02058792114258, -46.17145919799805, -38.32233428955078, -30.47320556640625, -22.62407875061035, -14.774951934814453, -6.925823211669922, 0.9233016967773438, 8.772430419921875, 16.621557235717773, 24.470684051513672, 32.3198127746582, 40.16893768310547, 48.01806640625, 55.86719512939453, 63.7163200378418, 71.56544494628906, 79.4145736694336, 87.26370239257812, 95.11282348632812, 102.96195220947266, 110.81108093261719, 118.66020965576172, 126.50933837890625, 134.3584747314453, 142.2075958251953, 150.05673217773438, 157.90585327148438, 165.75498962402344, 173.60411071777344, 181.4532470703125, 189.3023681640625, 197.1514892578125, 205.0006103515625, 212.84974670410156, 220.69886779785156, 228.54800415039062, 236.39712524414062, 244.24624633789062, 252.0953826904297, 259.94451904296875, 267.79364013671875, 275.64276123046875, 283.4919128417969, 291.3410339355469, 299.1901550292969, 307.0392761230469, 314.8883972167969, 322.7375183105469, 330.5866394042969, 338.4357604980469, 346.284912109375, 354.134033203125, 361.983154296875, 369.832275390625, 377.681396484375, 385.5305480957031]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 8.0, 15.0, 13.0, 26.0, 22.0, 19.0, 22.0, 21.0, 27.0, 28.0, 42.0, 49.0, 34.0, 59.0, 46.0, 40.0, 43.0, 38.0, 43.0, 40.0, 32.0, 37.0, 29.0, 32.0, 21.0, 26.0, 25.0, 21.0, 16.0, 16.0, 14.0, 9.0, 16.0, 13.0, 3.0, 11.0, 3.0, 11.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.214332580566406, -43.81508255004883, -42.41583251953125, -41.01658630371094, -39.61733627319336, -38.21808624267578, -36.8188362121582, -35.419586181640625, -34.02033996582031, -32.621089935302734, -31.22184181213379, -29.82259178161621, -28.423343658447266, -27.024093627929688, -25.62484359741211, -24.225595474243164, -22.826345443725586, -21.427095413208008, -20.027847290039062, -18.628597259521484, -17.22934913635254, -15.830099105834961, -14.4308500289917, -13.031600952148438, -11.632351875305176, -10.233102798461914, -8.833853721618652, -7.434604167938232, -6.035355091094971, -4.636106014251709, -3.236856460571289, -1.8376073837280273, -0.4383583068847656, 0.9608908891677856, 2.360140085220337, 3.7593894004821777, 5.1586384773254395, 6.557887554168701, 7.957137107849121, 9.356386184692383, 10.755635261535645, 12.154884338378906, 13.554133415222168, 14.95338249206543, 16.352632522583008, 17.751880645751953, 19.15113067626953, 20.55038070678711, 21.949628829956055, 23.348878860473633, 24.748126983642578, 26.147377014160156, 27.5466251373291, 28.94587516784668, 30.345123291015625, 31.744373321533203, 33.14362335205078, 34.54287338256836, 35.94212341308594, 37.34136962890625, 38.74061965942383, 40.139869689941406, 41.539119720458984, 42.93836975097656, 44.337615966796875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 11.0, 17.0, 7.0, 10.0, 9.0, 12.0, 22.0, 19.0, 21.0, 28.0, 35.0, 24.0, 42.0, 30.0, 37.0, 43.0, 36.0, 47.0, 38.0, 47.0, 46.0, 38.0, 36.0, 32.0, 22.0, 29.0, 30.0, 21.0, 22.0, 22.0, 22.0, 24.0, 17.0, 16.0, 10.0, 13.0, 10.0, 9.0, 9.0, 8.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.24609375, -6.99932861328125, -6.7525634765625, -6.50579833984375, -6.259033203125, -6.01226806640625, -5.7655029296875, -5.51873779296875, -5.27197265625, -5.02520751953125, -4.7784423828125, -4.53167724609375, -4.284912109375, -4.03814697265625, -3.7913818359375, -3.54461669921875, -3.2978515625, -3.05108642578125, -2.8043212890625, -2.55755615234375, -2.310791015625, -2.06402587890625, -1.8172607421875, -1.57049560546875, -1.32373046875, -1.07696533203125, -0.8302001953125, -0.58343505859375, -0.336669921875, -0.08990478515625, 0.1568603515625, 0.40362548828125, 0.650390625, 0.89715576171875, 1.1439208984375, 1.39068603515625, 1.637451171875, 1.88421630859375, 2.1309814453125, 2.37774658203125, 2.62451171875, 2.87127685546875, 3.1180419921875, 3.36480712890625, 3.611572265625, 3.85833740234375, 4.1051025390625, 4.35186767578125, 4.5986328125, 4.84539794921875, 5.0921630859375, 5.33892822265625, 5.585693359375, 5.83245849609375, 6.0792236328125, 6.32598876953125, 6.57275390625, 6.81951904296875, 7.0662841796875, 7.31304931640625, 7.559814453125, 7.80657958984375, 8.0533447265625, 8.30010986328125, 8.546875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 13.0, 10.0, 22.0, 23.0, 44.0, 51.0, 90.0, 121.0, 164.0, 243.0, 329.0, 523.0, 710.0, 1033.0, 1468.0, 1981.0, 2921.0, 4272.0, 6037.0, 8779.0, 12640.0, 17930.0, 27191.0, 40400.0, 62148.0, 102820.0, 249500.0, 225498.0, 97977.0, 59669.0, 39148.0, 26565.0, 18015.0, 12186.0, 8610.0, 5934.0, 4084.0, 2874.0, 1974.0, 1463.0, 953.0, 698.0, 445.0, 326.0, 231.0, 151.0, 94.0, 61.0, 47.0, 33.0, 22.0, 13.0, 8.0, 6.0, 6.0, 1.0, 2.0], "bins": [-1.5810546875, -1.5345001220703125, -1.487945556640625, -1.4413909912109375, -1.39483642578125, -1.3482818603515625, -1.301727294921875, -1.2551727294921875, -1.2086181640625, -1.1620635986328125, -1.115509033203125, -1.0689544677734375, -1.02239990234375, -0.9758453369140625, -0.929290771484375, -0.8827362060546875, -0.836181640625, -0.7896270751953125, -0.743072509765625, -0.6965179443359375, -0.64996337890625, -0.6034088134765625, -0.556854248046875, -0.5102996826171875, -0.4637451171875, -0.4171905517578125, -0.370635986328125, -0.3240814208984375, -0.27752685546875, -0.2309722900390625, -0.184417724609375, -0.1378631591796875, -0.09130859375, -0.0447540283203125, 0.001800537109375, 0.0483551025390625, 0.09490966796875, 0.1414642333984375, 0.188018798828125, 0.2345733642578125, 0.2811279296875, 0.3276824951171875, 0.374237060546875, 0.4207916259765625, 0.46734619140625, 0.5139007568359375, 0.560455322265625, 0.6070098876953125, 0.653564453125, 0.7001190185546875, 0.746673583984375, 0.7932281494140625, 0.83978271484375, 0.8863372802734375, 0.932891845703125, 0.9794464111328125, 1.0260009765625, 1.0725555419921875, 1.119110107421875, 1.1656646728515625, 1.21221923828125, 1.2587738037109375, 1.305328369140625, 1.3518829345703125, 1.3984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 1.0, 10.0, 7.0, 11.0, 5.0, 11.0, 12.0, 20.0, 19.0, 31.0, 34.0, 33.0, 34.0, 24.0, 31.0, 32.0, 34.0, 27.0, 32.0, 43.0, 1058.0, 44.0, 50.0, 35.0, 45.0, 32.0, 36.0, 34.0, 38.0, 24.0, 23.0, 18.0, 19.0, 19.0, 21.0, 7.0, 9.0, 8.0, 10.0, 3.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.01953125, -4.85333251953125, -4.6871337890625, -4.52093505859375, -4.354736328125, -4.18853759765625, -4.0223388671875, -3.85614013671875, -3.68994140625, -3.52374267578125, -3.3575439453125, -3.19134521484375, -3.025146484375, -2.85894775390625, -2.6927490234375, -2.52655029296875, -2.3603515625, -2.19415283203125, -2.0279541015625, -1.86175537109375, -1.695556640625, -1.52935791015625, -1.3631591796875, -1.19696044921875, -1.03076171875, -0.86456298828125, -0.6983642578125, -0.53216552734375, -0.365966796875, -0.19976806640625, -0.0335693359375, 0.13262939453125, 0.298828125, 0.46502685546875, 0.6312255859375, 0.79742431640625, 0.963623046875, 1.12982177734375, 1.2960205078125, 1.46221923828125, 1.62841796875, 1.79461669921875, 1.9608154296875, 2.12701416015625, 2.293212890625, 2.45941162109375, 2.6256103515625, 2.79180908203125, 2.9580078125, 3.12420654296875, 3.2904052734375, 3.45660400390625, 3.622802734375, 3.78900146484375, 3.9552001953125, 4.12139892578125, 4.28759765625, 4.45379638671875, 4.6199951171875, 4.78619384765625, 4.952392578125, 5.11859130859375, 5.2847900390625, 5.45098876953125, 5.6171875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 14.0, 15.0, 18.0, 29.0, 30.0, 63.0, 80.0, 132.0, 201.0, 271.0, 441.0, 582.0, 984.0, 1447.0, 2180.0, 3374.0, 5253.0, 8317.0, 13217.0, 21915.0, 36736.0, 63465.0, 122962.0, 1398236.0, 203572.0, 88958.0, 48814.0, 28880.0, 17185.0, 10500.0, 6737.0, 4285.0, 2810.0, 1842.0, 1162.0, 775.0, 548.0, 327.0, 237.0, 171.0, 108.0, 80.0, 56.0, 25.0, 33.0, 18.0, 15.0, 11.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.9677734375, -1.9095001220703125, -1.851226806640625, -1.7929534912109375, -1.73468017578125, -1.6764068603515625, -1.618133544921875, -1.5598602294921875, -1.5015869140625, -1.4433135986328125, -1.385040283203125, -1.3267669677734375, -1.26849365234375, -1.2102203369140625, -1.151947021484375, -1.0936737060546875, -1.035400390625, -0.9771270751953125, -0.918853759765625, -0.8605804443359375, -0.80230712890625, -0.7440338134765625, -0.685760498046875, -0.6274871826171875, -0.5692138671875, -0.5109405517578125, -0.452667236328125, -0.3943939208984375, -0.33612060546875, -0.2778472900390625, -0.219573974609375, -0.1613006591796875, -0.10302734375, -0.0447540283203125, 0.013519287109375, 0.0717926025390625, 0.13006591796875, 0.1883392333984375, 0.246612548828125, 0.3048858642578125, 0.3631591796875, 0.4214324951171875, 0.479705810546875, 0.5379791259765625, 0.59625244140625, 0.6545257568359375, 0.712799072265625, 0.7710723876953125, 0.829345703125, 0.8876190185546875, 0.945892333984375, 1.0041656494140625, 1.06243896484375, 1.1207122802734375, 1.178985595703125, 1.2372589111328125, 1.2955322265625, 1.3538055419921875, 1.412078857421875, 1.4703521728515625, 1.52862548828125, 1.5868988037109375, 1.645172119140625, 1.7034454345703125, 1.76171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 12.0, 18.0, 28.0, 28.0, 40.0, 57.0, 53.0, 64.0, 92.0, 91.0, 80.0, 90.0, 80.0, 65.0, 42.0, 38.0, 22.0, 16.0, 14.0, 15.0, 5.0, 9.0, 8.0, 4.0, 3.0, 0.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012693405151367188, -0.0012283921241760254, -0.001187443733215332, -0.0011464953422546387, -0.0011055469512939453, -0.001064598560333252, -0.0010236501693725586, -0.0009827017784118652, -0.0009417533874511719, -0.0009008049964904785, -0.0008598566055297852, -0.0008189082145690918, -0.0007779598236083984, -0.0007370114326477051, -0.0006960630416870117, -0.0006551146507263184, -0.000614166259765625, -0.0005732178688049316, -0.0005322694778442383, -0.0004913210868835449, -0.00045037269592285156, -0.0004094243049621582, -0.00036847591400146484, -0.0003275275230407715, -0.0002865791320800781, -0.00024563074111938477, -0.0002046823501586914, -0.00016373395919799805, -0.0001227855682373047, -8.183717727661133e-05, -4.088878631591797e-05, 5.960464477539063e-08, 4.100799560546875e-05, 8.195638656616211e-05, 0.00012290477752685547, 0.00016385316848754883, 0.0002048015594482422, 0.00024574995040893555, 0.0002866983413696289, 0.00032764673233032227, 0.0003685951232910156, 0.000409543514251709, 0.00045049190521240234, 0.0004914402961730957, 0.0005323886871337891, 0.0005733370780944824, 0.0006142854690551758, 0.0006552338600158691, 0.0006961822509765625, 0.0007371306419372559, 0.0007780790328979492, 0.0008190274238586426, 0.0008599758148193359, 0.0009009242057800293, 0.0009418725967407227, 0.000982820987701416, 0.0010237693786621094, 0.0010647177696228027, 0.001105666160583496, 0.0011466145515441895, 0.0011875629425048828, 0.0012285113334655762, 0.0012694597244262695, 0.0013104081153869629, 0.0013513565063476562]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 8.0, 9.0, 13.0, 25.0, 25.0, 33.0, 38.0, 66.0, 75.0, 105.0, 173.0, 276.0, 458.0, 1033.0, 108636.0, 934541.0, 1461.0, 603.0, 319.0, 177.0, 125.0, 94.0, 85.0, 39.0, 39.0, 29.0, 23.0, 9.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025360107421875, -0.024594783782958984, -0.02382946014404297, -0.023064136505126953, -0.022298812866210938, -0.021533489227294922, -0.020768165588378906, -0.02000284194946289, -0.019237518310546875, -0.01847219467163086, -0.017706871032714844, -0.016941547393798828, -0.016176223754882812, -0.015410900115966797, -0.014645576477050781, -0.013880252838134766, -0.01311492919921875, -0.012349605560302734, -0.011584281921386719, -0.010818958282470703, -0.010053634643554688, -0.009288311004638672, -0.008522987365722656, -0.007757663726806641, -0.006992340087890625, -0.006227016448974609, -0.005461692810058594, -0.004696369171142578, -0.0039310455322265625, -0.003165721893310547, -0.0024003982543945312, -0.0016350746154785156, -0.0008697509765625, -0.00010442733764648438, 0.0006608963012695312, 0.0014262199401855469, 0.0021915435791015625, 0.002956867218017578, 0.0037221908569335938, 0.004487514495849609, 0.005252838134765625, 0.006018161773681641, 0.006783485412597656, 0.007548809051513672, 0.008314132690429688, 0.009079456329345703, 0.009844779968261719, 0.010610103607177734, 0.01137542724609375, 0.012140750885009766, 0.012906074523925781, 0.013671398162841797, 0.014436721801757812, 0.015202045440673828, 0.015967369079589844, 0.01673269271850586, 0.017498016357421875, 0.01826333999633789, 0.019028663635253906, 0.019793987274169922, 0.020559310913085938, 0.021324634552001953, 0.02208995819091797, 0.022855281829833984, 0.02362060546875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 82.0, 398.0, 435.0, 84.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024392285849899054, -0.002360579324886203, -0.002281930297613144, -0.0022032810375094414, -0.002124631777405739, -0.0020459825173020363, -0.0019673334900289774, -0.0018886842299252748, -0.0018100350862368941, -0.0017313859425485134, -0.0016527366824448109, -0.0015740875387564301, -0.0014954383950680494, -0.0014167891349643469, -0.0013381399912759662, -0.0012594908475875854, -0.001180841587483883, -0.0011021924437955022, -0.0010235431836917996, -0.0009448940400034189, -0.0008662448381073773, -0.0007875956362113357, -0.0007089464925229549, -0.0006302972906269133, -0.0005516480887308717, -0.00047299888683483005, -0.00039434971404261887, -0.0003157005412504077, -0.00023705133935436606, -0.00015840213745832443, -7.975296466611326e-05, -1.1037918739020824e-06, 7.75451771914959e-05, 0.0001561943645356223, 0.0002348435518797487, 0.0003134927246719599, 0.0003921419265680015, 0.00047079112846404314, 0.0005494402721524239, 0.0006280894740484655, 0.0007067386759445071, 0.0007853878778405488, 0.0008640370797365904, 0.0009426862234249711, 0.0010213353671133518, 0.0010999846272170544, 0.001178633770905435, 0.0012572829145938158, 0.0013359321746975183, 0.001414581318385899, 0.0014932305784896016, 0.0015718797221779823, 0.0016505289822816849, 0.0017291781259700656, 0.0018078272696584463, 0.0018864765297621489, 0.0019651255570352077, 0.0020437748171389103, 0.002122423844411969, 0.0022010731045156717, 0.0022797223646193743, 0.002358371391892433, 0.0024370206519961357, 0.0025156699120998383, 0.002594319172203541]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 8.0, 11.0, 11.0, 15.0, 16.0, 12.0, 10.0, 16.0, 22.0, 31.0, 36.0, 22.0, 32.0, 39.0, 33.0, 33.0, 32.0, 40.0, 44.0, 50.0, 46.0, 37.0, 51.0, 44.0, 30.0, 27.0, 25.0, 35.0, 36.0, 22.0, 21.0, 21.0, 14.0, 12.0, 7.0, 16.0, 4.0, 7.0, 5.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00046628713607788086, -0.0004509780555963516, -0.0004356689751148224, -0.00042035989463329315, -0.0004050508141517639, -0.0003897417336702347, -0.00037443265318870544, -0.0003591235727071762, -0.00034381449222564697, -0.00032850541174411774, -0.0003131963312625885, -0.00029788725078105927, -0.00028257817029953003, -0.0002672690898180008, -0.00025196000933647156, -0.00023665092885494232, -0.00022134184837341309, -0.00020603276789188385, -0.00019072368741035461, -0.00017541460692882538, -0.00016010552644729614, -0.0001447964459657669, -0.00012948736548423767, -0.00011417828500270844, -9.88692045211792e-05, -8.356012403964996e-05, -6.825104355812073e-05, -5.294196307659149e-05, -3.7632882595062256e-05, -2.232380211353302e-05, -7.014721632003784e-06, 8.294358849525452e-06, 2.3603439331054688e-05, 3.891251981258392e-05, 5.422160029411316e-05, 6.95306807756424e-05, 8.483976125717163e-05, 0.00010014884173870087, 0.0001154579222202301, 0.00013076700270175934, 0.00014607608318328857, 0.0001613851636648178, 0.00017669424414634705, 0.00019200332462787628, 0.00020731240510940552, 0.00022262148559093475, 0.000237930566072464, 0.0002532396465539932, 0.00026854872703552246, 0.0002838578075170517, 0.00029916688799858093, 0.00031447596848011017, 0.0003297850489616394, 0.00034509412944316864, 0.0003604032099246979, 0.0003757122904062271, 0.00039102137088775635, 0.0004063304513692856, 0.0004216395318508148, 0.00043694861233234406, 0.0004522576928138733, 0.0004675667732954025, 0.00048287585377693176, 0.000498184934258461, 0.0005134940147399902]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 11.0, 17.0, 7.0, 10.0, 9.0, 12.0, 22.0, 19.0, 21.0, 28.0, 35.0, 24.0, 42.0, 30.0, 37.0, 43.0, 36.0, 47.0, 38.0, 47.0, 46.0, 38.0, 36.0, 32.0, 22.0, 29.0, 30.0, 21.0, 22.0, 22.0, 22.0, 24.0, 17.0, 16.0, 10.0, 13.0, 10.0, 9.0, 9.0, 8.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.24609375, -6.99932861328125, -6.7525634765625, -6.50579833984375, -6.259033203125, -6.01226806640625, -5.7655029296875, -5.51873779296875, -5.27197265625, -5.02520751953125, -4.7784423828125, -4.53167724609375, -4.284912109375, -4.03814697265625, -3.7913818359375, -3.54461669921875, -3.2978515625, -3.05108642578125, -2.8043212890625, -2.55755615234375, -2.310791015625, -2.06402587890625, -1.8172607421875, -1.57049560546875, -1.32373046875, -1.07696533203125, -0.8302001953125, -0.58343505859375, -0.336669921875, -0.08990478515625, 0.1568603515625, 0.40362548828125, 0.650390625, 0.89715576171875, 1.1439208984375, 1.39068603515625, 1.637451171875, 1.88421630859375, 2.1309814453125, 2.37774658203125, 2.62451171875, 2.87127685546875, 3.1180419921875, 3.36480712890625, 3.611572265625, 3.85833740234375, 4.1051025390625, 4.35186767578125, 4.5986328125, 4.84539794921875, 5.0921630859375, 5.33892822265625, 5.585693359375, 5.83245849609375, 6.0792236328125, 6.32598876953125, 6.57275390625, 6.81951904296875, 7.0662841796875, 7.31304931640625, 7.559814453125, 7.80657958984375, 8.0533447265625, 8.30010986328125, 8.546875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 13.0, 15.0, 16.0, 32.0, 38.0, 67.0, 67.0, 100.0, 114.0, 156.0, 228.0, 241.0, 338.0, 417.0, 531.0, 661.0, 867.0, 1168.0, 1713.0, 3618.0, 15081.0, 89284.0, 458709.0, 384059.0, 69367.0, 11858.0, 3298.0, 1629.0, 1116.0, 780.0, 664.0, 518.0, 410.0, 334.0, 241.0, 186.0, 155.0, 123.0, 72.0, 73.0, 56.0, 41.0, 27.0, 16.0, 21.0, 12.0, 5.0, 9.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.609375, -12.2144775390625, -11.819580078125, -11.4246826171875, -11.02978515625, -10.6348876953125, -10.239990234375, -9.8450927734375, -9.4501953125, -9.0552978515625, -8.660400390625, -8.2655029296875, -7.87060546875, -7.4757080078125, -7.080810546875, -6.6859130859375, -6.291015625, -5.8961181640625, -5.501220703125, -5.1063232421875, -4.71142578125, -4.3165283203125, -3.921630859375, -3.5267333984375, -3.1318359375, -2.7369384765625, -2.342041015625, -1.9471435546875, -1.55224609375, -1.1573486328125, -0.762451171875, -0.3675537109375, 0.02734375, 0.4222412109375, 0.817138671875, 1.2120361328125, 1.60693359375, 2.0018310546875, 2.396728515625, 2.7916259765625, 3.1865234375, 3.5814208984375, 3.976318359375, 4.3712158203125, 4.76611328125, 5.1610107421875, 5.555908203125, 5.9508056640625, 6.345703125, 6.7406005859375, 7.135498046875, 7.5303955078125, 7.92529296875, 8.3201904296875, 8.715087890625, 9.1099853515625, 9.5048828125, 9.8997802734375, 10.294677734375, 10.6895751953125, 11.08447265625, 11.4793701171875, 11.874267578125, 12.2691650390625, 12.6640625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 11.0, 21.0, 22.0, 22.0, 26.0, 48.0, 38.0, 46.0, 58.0, 71.0, 98.0, 254.0, 1621.0, 194.0, 96.0, 67.0, 55.0, 51.0, 45.0, 39.0, 28.0, 24.0, 18.0, 19.0, 14.0, 7.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.046875, -20.250732421875, -19.45458984375, -18.658447265625, -17.8623046875, -17.066162109375, -16.27001953125, -15.473876953125, -14.677734375, -13.881591796875, -13.08544921875, -12.289306640625, -11.4931640625, -10.697021484375, -9.90087890625, -9.104736328125, -8.30859375, -7.512451171875, -6.71630859375, -5.920166015625, -5.1240234375, -4.327880859375, -3.53173828125, -2.735595703125, -1.939453125, -1.143310546875, -0.34716796875, 0.448974609375, 1.2451171875, 2.041259765625, 2.83740234375, 3.633544921875, 4.4296875, 5.225830078125, 6.02197265625, 6.818115234375, 7.6142578125, 8.410400390625, 9.20654296875, 10.002685546875, 10.798828125, 11.594970703125, 12.39111328125, 13.187255859375, 13.9833984375, 14.779541015625, 15.57568359375, 16.371826171875, 17.16796875, 17.964111328125, 18.76025390625, 19.556396484375, 20.3525390625, 21.148681640625, 21.94482421875, 22.740966796875, 23.537109375, 24.333251953125, 25.12939453125, 25.925537109375, 26.7216796875, 27.517822265625, 28.31396484375, 29.110107421875, 29.90625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 4.0, 8.0, 7.0, 3.0, 13.0, 18.0, 18.0, 29.0, 32.0, 49.0, 83.0, 99.0, 179.0, 302.0, 604.0, 1903.0, 2823678.0, 315869.0, 1470.0, 542.0, 253.0, 166.0, 105.0, 63.0, 55.0, 41.0, 28.0, 13.0, 21.0, 16.0, 5.0, 8.0, 5.0, 1.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.6875, -88.0146484375, -85.341796875, -82.6689453125, -79.99609375, -77.3232421875, -74.650390625, -71.9775390625, -69.3046875, -66.6318359375, -63.958984375, -61.2861328125, -58.61328125, -55.9404296875, -53.267578125, -50.5947265625, -47.921875, -45.2490234375, -42.576171875, -39.9033203125, -37.23046875, -34.5576171875, -31.884765625, -29.2119140625, -26.5390625, -23.8662109375, -21.193359375, -18.5205078125, -15.84765625, -13.1748046875, -10.501953125, -7.8291015625, -5.15625, -2.4833984375, 0.189453125, 2.8623046875, 5.53515625, 8.2080078125, 10.880859375, 13.5537109375, 16.2265625, 18.8994140625, 21.572265625, 24.2451171875, 26.91796875, 29.5908203125, 32.263671875, 34.9365234375, 37.609375, 40.2822265625, 42.955078125, 45.6279296875, 48.30078125, 50.9736328125, 53.646484375, 56.3193359375, 58.9921875, 61.6650390625, 64.337890625, 67.0107421875, 69.68359375, 72.3564453125, 75.029296875, 77.7021484375, 80.375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 376.0, 601.0, 31.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.7456359863281, -267.726318359375, -260.70697021484375, -253.68765258789062, -246.6683349609375, -239.6490020751953, -232.6296844482422, -225.6103515625, -218.59103393554688, -211.5717010498047, -204.55238342285156, -197.53305053710938, -190.51373291015625, -183.49440002441406, -176.47508239746094, -169.45574951171875, -162.43643188476562, -155.41709899902344, -148.3977813720703, -141.37844848632812, -134.359130859375, -127.33979797363281, -120.32048034667969, -113.3011474609375, -106.28181457519531, -99.26248931884766, -92.2431640625, -85.22383880615234, -78.20451354980469, -71.1851806640625, -64.16586303710938, -57.14653396606445, -50.12721252441406, -43.107887268066406, -36.08856201171875, -29.06923484802246, -22.049909591674805, -15.030582427978516, -8.01125717163086, -0.9919319152832031, 6.027393341064453, 13.04671859741211, 20.066043853759766, 27.085371017456055, 34.104698181152344, 41.1240234375, 48.143348693847656, 55.16267395019531, 62.18199920654297, 69.20132446289062, 76.22064971923828, 83.23997497558594, 90.2593002319336, 97.27862548828125, 104.29795837402344, 111.31727600097656, 118.33660888671875, 125.3559341430664, 132.37525939941406, 139.39459228515625, 146.41390991210938, 153.43324279785156, 160.4525604248047, 167.47189331054688, 174.4912109375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 1.0, 4.0, 9.0, 12.0, 7.0, 10.0, 15.0, 21.0, 19.0, 16.0, 9.0, 28.0, 27.0, 29.0, 22.0, 16.0, 36.0, 25.0, 28.0, 36.0, 37.0, 40.0, 37.0, 37.0, 37.0, 32.0, 26.0, 38.0, 43.0, 24.0, 27.0, 32.0, 18.0, 23.0, 26.0, 27.0, 13.0, 17.0, 10.0, 5.0, 12.0, 14.0, 8.0, 9.0, 3.0, 4.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0], "bins": [-53.24000549316406, -51.717350006103516, -50.1946907043457, -48.672035217285156, -47.149375915527344, -45.6267204284668, -44.10406494140625, -42.58140563964844, -41.05875015258789, -39.536094665527344, -38.01343536376953, -36.490779876708984, -34.96812438964844, -33.445465087890625, -31.922809600830078, -30.4001522064209, -28.87749481201172, -27.35483741760254, -25.83218002319336, -24.309524536132812, -22.786867141723633, -21.264209747314453, -19.741554260253906, -18.218896865844727, -16.696239471435547, -15.173582077026367, -13.650925636291504, -12.12826919555664, -10.605611801147461, -9.082954406738281, -7.560297966003418, -6.037641525268555, -4.514984130859375, -2.9923272132873535, -1.469670295715332, 0.05298662185668945, 1.575643539428711, 3.0983004570007324, 4.620957374572754, 6.143613815307617, 7.666271209716797, 9.188928604125977, 10.71158504486084, 12.234241485595703, 13.756898880004883, 15.279556274414062, 16.80221176147461, 18.32486915588379, 19.84752655029297, 21.37018394470215, 22.892841339111328, 24.415496826171875, 25.938154220581055, 27.460811614990234, 28.98346710205078, 30.50612449645996, 32.02878189086914, 33.55143737792969, 35.0740966796875, 36.59675216674805, 38.119407653808594, 39.642066955566406, 41.16472244262695, 42.6873779296875, 44.21003723144531]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 3.0, 3.0, 8.0, 5.0, 9.0, 6.0, 13.0, 23.0, 12.0, 27.0, 21.0, 24.0, 20.0, 22.0, 24.0, 22.0, 46.0, 35.0, 36.0, 39.0, 40.0, 46.0, 30.0, 39.0, 42.0, 38.0, 30.0, 35.0, 36.0, 24.0, 28.0, 22.0, 19.0, 20.0, 17.0, 16.0, 22.0, 16.0, 14.0, 11.0, 6.0, 10.0, 13.0, 5.0, 2.0, 4.0, 3.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.0223388671875, -6.779052734375, -6.5357666015625, -6.29248046875, -6.0491943359375, -5.805908203125, -5.5626220703125, -5.3193359375, -5.0760498046875, -4.832763671875, -4.5894775390625, -4.34619140625, -4.1029052734375, -3.859619140625, -3.6163330078125, -3.373046875, -3.1297607421875, -2.886474609375, -2.6431884765625, -2.39990234375, -2.1566162109375, -1.913330078125, -1.6700439453125, -1.4267578125, -1.1834716796875, -0.940185546875, -0.6968994140625, -0.45361328125, -0.2103271484375, 0.032958984375, 0.2762451171875, 0.51953125, 0.7628173828125, 1.006103515625, 1.2493896484375, 1.49267578125, 1.7359619140625, 1.979248046875, 2.2225341796875, 2.4658203125, 2.7091064453125, 2.952392578125, 3.1956787109375, 3.43896484375, 3.6822509765625, 3.925537109375, 4.1688232421875, 4.412109375, 4.6553955078125, 4.898681640625, 5.1419677734375, 5.38525390625, 5.6285400390625, 5.871826171875, 6.1151123046875, 6.3583984375, 6.6016845703125, 6.844970703125, 7.0882568359375, 7.33154296875, 7.5748291015625, 7.818115234375, 8.0614013671875, 8.3046875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 8.0, 13.0, 10.0, 18.0, 22.0, 16.0, 27.0, 37.0, 48.0, 56.0, 71.0, 93.0, 114.0, 140.0, 218.0, 414.0, 1017.0, 3567.0, 30330.0, 1254446.0, 2807491.0, 86768.0, 6370.0, 1405.0, 516.0, 261.0, 180.0, 138.0, 107.0, 92.0, 60.0, 53.0, 44.0, 33.0, 25.0, 18.0, 14.0, 13.0, 8.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.71875, -31.760986328125, -30.80322265625, -29.845458984375, -28.8876953125, -27.929931640625, -26.97216796875, -26.014404296875, -25.056640625, -24.098876953125, -23.14111328125, -22.183349609375, -21.2255859375, -20.267822265625, -19.31005859375, -18.352294921875, -17.39453125, -16.436767578125, -15.47900390625, -14.521240234375, -13.5634765625, -12.605712890625, -11.64794921875, -10.690185546875, -9.732421875, -8.774658203125, -7.81689453125, -6.859130859375, -5.9013671875, -4.943603515625, -3.98583984375, -3.028076171875, -2.0703125, -1.112548828125, -0.15478515625, 0.802978515625, 1.7607421875, 2.718505859375, 3.67626953125, 4.634033203125, 5.591796875, 6.549560546875, 7.50732421875, 8.465087890625, 9.4228515625, 10.380615234375, 11.33837890625, 12.296142578125, 13.25390625, 14.211669921875, 15.16943359375, 16.127197265625, 17.0849609375, 18.042724609375, 19.00048828125, 19.958251953125, 20.916015625, 21.873779296875, 22.83154296875, 23.789306640625, 24.7470703125, 25.704833984375, 26.66259765625, 27.620361328125, 28.578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 13.0, 16.0, 18.0, 21.0, 49.0, 52.0, 83.0, 95.0, 161.0, 232.0, 370.0, 591.0, 635.0, 532.0, 351.0, 247.0, 171.0, 129.0, 101.0, 56.0, 37.0, 34.0, 23.0, 24.0, 11.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-18.265625, -17.6650390625, -17.064453125, -16.4638671875, -15.86328125, -15.2626953125, -14.662109375, -14.0615234375, -13.4609375, -12.8603515625, -12.259765625, -11.6591796875, -11.05859375, -10.4580078125, -9.857421875, -9.2568359375, -8.65625, -8.0556640625, -7.455078125, -6.8544921875, -6.25390625, -5.6533203125, -5.052734375, -4.4521484375, -3.8515625, -3.2509765625, -2.650390625, -2.0498046875, -1.44921875, -0.8486328125, -0.248046875, 0.3525390625, 0.953125, 1.5537109375, 2.154296875, 2.7548828125, 3.35546875, 3.9560546875, 4.556640625, 5.1572265625, 5.7578125, 6.3583984375, 6.958984375, 7.5595703125, 8.16015625, 8.7607421875, 9.361328125, 9.9619140625, 10.5625, 11.1630859375, 11.763671875, 12.3642578125, 12.96484375, 13.5654296875, 14.166015625, 14.7666015625, 15.3671875, 15.9677734375, 16.568359375, 17.1689453125, 17.76953125, 18.3701171875, 18.970703125, 19.5712890625, 20.171875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 6.0, 5.0, 8.0, 16.0, 13.0, 26.0, 32.0, 67.0, 74.0, 139.0, 235.0, 480.0, 1382.0, 6184.0, 405580.0, 3755407.0, 20797.0, 2380.0, 742.0, 275.0, 141.0, 81.0, 62.0, 41.0, 33.0, 18.0, 18.0, 11.0, 11.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.84375, -58.0947265625, -56.345703125, -54.5966796875, -52.84765625, -51.0986328125, -49.349609375, -47.6005859375, -45.8515625, -44.1025390625, -42.353515625, -40.6044921875, -38.85546875, -37.1064453125, -35.357421875, -33.6083984375, -31.859375, -30.1103515625, -28.361328125, -26.6123046875, -24.86328125, -23.1142578125, -21.365234375, -19.6162109375, -17.8671875, -16.1181640625, -14.369140625, -12.6201171875, -10.87109375, -9.1220703125, -7.373046875, -5.6240234375, -3.875, -2.1259765625, -0.376953125, 1.3720703125, 3.12109375, 4.8701171875, 6.619140625, 8.3681640625, 10.1171875, 11.8662109375, 13.615234375, 15.3642578125, 17.11328125, 18.8623046875, 20.611328125, 22.3603515625, 24.109375, 25.8583984375, 27.607421875, 29.3564453125, 31.10546875, 32.8544921875, 34.603515625, 36.3525390625, 38.1015625, 39.8505859375, 41.599609375, 43.3486328125, 45.09765625, 46.8466796875, 48.595703125, 50.3447265625, 52.09375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 445.0, 570.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1061.6839599609375, -1025.0833740234375, -988.4827270507812, -951.882080078125, -915.281494140625, -878.6808471679688, -842.0802001953125, -805.4796142578125, -768.8789672851562, -732.2783203125, -695.677734375, -659.0770874023438, -622.4764404296875, -585.8758544921875, -549.2752075195312, -512.674560546875, -476.073974609375, -439.4733581542969, -402.87274169921875, -366.2720947265625, -329.6714782714844, -293.07086181640625, -256.47021484375, -219.86959838867188, -183.26898193359375, -146.66836547851562, -110.06773376464844, -73.46710968017578, -36.866485595703125, -0.265869140625, 36.33476257324219, 72.93539428710938, 109.535888671875, 146.13650512695312, 182.7371368408203, 219.3377685546875, 255.93838500976562, 292.53900146484375, 329.1396484375, 365.7402648925781, 402.34088134765625, 438.9414978027344, 475.5421142578125, 512.1427612304688, 548.743408203125, 585.343994140625, 621.9446411132812, 658.5452880859375, 695.1458740234375, 731.7465209960938, 768.3471069335938, 804.94775390625, 841.54833984375, 878.1489868164062, 914.7496337890625, 951.3502197265625, 987.9508666992188, 1024.551513671875, 1061.152099609375, 1097.752685546875, 1134.3533935546875, 1170.9539794921875, 1207.5545654296875, 1244.1552734375, 1280.755859375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 2.0, 10.0, 10.0, 11.0, 13.0, 13.0, 15.0, 12.0, 25.0, 21.0, 24.0, 27.0, 35.0, 36.0, 47.0, 39.0, 35.0, 34.0, 50.0, 44.0, 38.0, 38.0, 38.0, 35.0, 33.0, 44.0, 42.0, 29.0, 38.0, 28.0, 17.0, 17.0, 14.0, 15.0, 9.0, 6.0, 10.0, 11.0, 7.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-66.79718017578125, -64.73069763183594, -62.66421890258789, -60.597740173339844, -58.5312614440918, -56.46478271484375, -54.39830017089844, -52.33182144165039, -50.265342712402344, -48.1988639831543, -46.132381439208984, -44.06590270996094, -41.99942398071289, -39.932945251464844, -37.86646270751953, -35.799983978271484, -33.73350143432617, -31.667020797729492, -29.600542068481445, -27.534061431884766, -25.46758270263672, -23.40110206604004, -21.33462142944336, -19.268142700195312, -17.201662063598633, -15.13518238067627, -13.068702697753906, -11.002222061157227, -8.935742378234863, -6.8692626953125, -4.80278205871582, -2.736302375793457, -0.6698226928710938, 1.3966572284698486, 3.463137149810791, 5.5296173095703125, 7.596096992492676, 9.662576675415039, 11.729057312011719, 13.795536994934082, 15.862016677856445, 17.928497314453125, 19.994976043701172, 22.06145668029785, 24.12793731689453, 26.194416046142578, 28.260896682739258, 30.327377319335938, 32.393856048583984, 34.46033477783203, 36.526817321777344, 38.59329605102539, 40.65977478027344, 42.72625732421875, 44.7927360534668, 46.859214782714844, 48.925697326660156, 50.9921760559082, 53.058658599853516, 55.12513732910156, 57.19161605834961, 59.258094787597656, 61.32457733154297, 63.391056060791016, 65.45753479003906]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 9.0, 11.0, 9.0, 7.0, 9.0, 13.0, 22.0, 24.0, 19.0, 39.0, 24.0, 30.0, 31.0, 27.0, 33.0, 31.0, 34.0, 34.0, 28.0, 47.0, 42.0, 48.0, 32.0, 43.0, 29.0, 27.0, 31.0, 17.0, 32.0, 32.0, 22.0, 17.0, 26.0, 11.0, 15.0, 12.0, 18.0, 12.0, 11.0, 10.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.8125, -5.6168212890625, -5.421142578125, -5.2254638671875, -5.02978515625, -4.8341064453125, -4.638427734375, -4.4427490234375, -4.2470703125, -4.0513916015625, -3.855712890625, -3.6600341796875, -3.46435546875, -3.2686767578125, -3.072998046875, -2.8773193359375, -2.681640625, -2.4859619140625, -2.290283203125, -2.0946044921875, -1.89892578125, -1.7032470703125, -1.507568359375, -1.3118896484375, -1.1162109375, -0.9205322265625, -0.724853515625, -0.5291748046875, -0.33349609375, -0.1378173828125, 0.057861328125, 0.2535400390625, 0.44921875, 0.6448974609375, 0.840576171875, 1.0362548828125, 1.23193359375, 1.4276123046875, 1.623291015625, 1.8189697265625, 2.0146484375, 2.2103271484375, 2.406005859375, 2.6016845703125, 2.79736328125, 2.9930419921875, 3.188720703125, 3.3843994140625, 3.580078125, 3.7757568359375, 3.971435546875, 4.1671142578125, 4.36279296875, 4.5584716796875, 4.754150390625, 4.9498291015625, 5.1455078125, 5.3411865234375, 5.536865234375, 5.7325439453125, 5.92822265625, 6.1239013671875, 6.319580078125, 6.5152587890625, 6.7109375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 9.0, 17.0, 17.0, 24.0, 24.0, 54.0, 60.0, 87.0, 139.0, 177.0, 257.0, 339.0, 495.0, 694.0, 1070.0, 1529.0, 2181.0, 3101.0, 4471.0, 6406.0, 9680.0, 14168.0, 21110.0, 31259.0, 48057.0, 76197.0, 134176.0, 300805.0, 152921.0, 82277.0, 51641.0, 33846.0, 22764.0, 15068.0, 10407.0, 7171.0, 4873.0, 3383.0, 2327.0, 1640.0, 1086.0, 777.0, 545.0, 378.0, 285.0, 192.0, 117.0, 93.0, 65.0, 27.0, 26.0, 14.0, 10.0, 11.0, 5.0, 8.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.1328125, -1.0945281982421875, -1.056243896484375, -1.0179595947265625, -0.97967529296875, -0.9413909912109375, -0.903106689453125, -0.8648223876953125, -0.8265380859375, -0.7882537841796875, -0.749969482421875, -0.7116851806640625, -0.67340087890625, -0.6351165771484375, -0.596832275390625, -0.5585479736328125, -0.520263671875, -0.4819793701171875, -0.443695068359375, -0.4054107666015625, -0.36712646484375, -0.3288421630859375, -0.290557861328125, -0.2522735595703125, -0.2139892578125, -0.1757049560546875, -0.137420654296875, -0.0991363525390625, -0.06085205078125, -0.0225677490234375, 0.015716552734375, 0.0540008544921875, 0.09228515625, 0.1305694580078125, 0.168853759765625, 0.2071380615234375, 0.24542236328125, 0.2837066650390625, 0.321990966796875, 0.3602752685546875, 0.3985595703125, 0.4368438720703125, 0.475128173828125, 0.5134124755859375, 0.55169677734375, 0.5899810791015625, 0.628265380859375, 0.6665496826171875, 0.704833984375, 0.7431182861328125, 0.781402587890625, 0.8196868896484375, 0.85797119140625, 0.8962554931640625, 0.934539794921875, 0.9728240966796875, 1.0111083984375, 1.0493927001953125, 1.087677001953125, 1.1259613037109375, 1.16424560546875, 1.2025299072265625, 1.240814208984375, 1.2790985107421875, 1.3173828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 11.0, 11.0, 16.0, 18.0, 21.0, 22.0, 26.0, 31.0, 27.0, 29.0, 36.0, 41.0, 44.0, 54.0, 44.0, 53.0, 1073.0, 33.0, 41.0, 44.0, 29.0, 48.0, 35.0, 33.0, 29.0, 20.0, 23.0, 18.0, 20.0, 12.0, 12.0, 11.0, 15.0, 8.0, 5.0, 7.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.69921875, -4.55328369140625, -4.4073486328125, -4.26141357421875, -4.115478515625, -3.96954345703125, -3.8236083984375, -3.67767333984375, -3.53173828125, -3.38580322265625, -3.2398681640625, -3.09393310546875, -2.947998046875, -2.80206298828125, -2.6561279296875, -2.51019287109375, -2.3642578125, -2.21832275390625, -2.0723876953125, -1.92645263671875, -1.780517578125, -1.63458251953125, -1.4886474609375, -1.34271240234375, -1.19677734375, -1.05084228515625, -0.9049072265625, -0.75897216796875, -0.613037109375, -0.46710205078125, -0.3211669921875, -0.17523193359375, -0.029296875, 0.11663818359375, 0.2625732421875, 0.40850830078125, 0.554443359375, 0.70037841796875, 0.8463134765625, 0.99224853515625, 1.13818359375, 1.28411865234375, 1.4300537109375, 1.57598876953125, 1.721923828125, 1.86785888671875, 2.0137939453125, 2.15972900390625, 2.3056640625, 2.45159912109375, 2.5975341796875, 2.74346923828125, 2.889404296875, 3.03533935546875, 3.1812744140625, 3.32720947265625, 3.47314453125, 3.61907958984375, 3.7650146484375, 3.91094970703125, 4.056884765625, 4.20281982421875, 4.3487548828125, 4.49468994140625, 4.640625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 13.0, 8.0, 18.0, 26.0, 38.0, 70.0, 83.0, 154.0, 216.0, 365.0, 532.0, 886.0, 1350.0, 2339.0, 3839.0, 6497.0, 10731.0, 18019.0, 30928.0, 55825.0, 114079.0, 1409883.0, 238386.0, 90775.0, 46812.0, 26341.0, 15475.0, 9185.0, 5546.0, 3352.0, 2022.0, 1235.0, 755.0, 481.0, 297.0, 192.0, 128.0, 84.0, 59.0, 30.0, 24.0, 17.0, 11.0, 7.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.62109375, -1.5702056884765625, -1.519317626953125, -1.4684295654296875, -1.41754150390625, -1.3666534423828125, -1.315765380859375, -1.2648773193359375, -1.2139892578125, -1.1631011962890625, -1.112213134765625, -1.0613250732421875, -1.01043701171875, -0.9595489501953125, -0.908660888671875, -0.8577728271484375, -0.806884765625, -0.7559967041015625, -0.705108642578125, -0.6542205810546875, -0.60333251953125, -0.5524444580078125, -0.501556396484375, -0.4506683349609375, -0.3997802734375, -0.3488922119140625, -0.298004150390625, -0.2471160888671875, -0.19622802734375, -0.1453399658203125, -0.094451904296875, -0.0435638427734375, 0.00732421875, 0.0582122802734375, 0.109100341796875, 0.1599884033203125, 0.21087646484375, 0.2617645263671875, 0.312652587890625, 0.3635406494140625, 0.4144287109375, 0.4653167724609375, 0.516204833984375, 0.5670928955078125, 0.61798095703125, 0.6688690185546875, 0.719757080078125, 0.7706451416015625, 0.821533203125, 0.8724212646484375, 0.923309326171875, 0.9741973876953125, 1.02508544921875, 1.0759735107421875, 1.126861572265625, 1.1777496337890625, 1.2286376953125, 1.2795257568359375, 1.330413818359375, 1.3813018798828125, 1.43218994140625, 1.4830780029296875, 1.533966064453125, 1.5848541259765625, 1.6357421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 6.0, 5.0, 7.0, 6.0, 9.0, 15.0, 13.0, 20.0, 27.0, 20.0, 34.0, 41.0, 35.0, 52.0, 63.0, 65.0, 70.0, 73.0, 52.0, 69.0, 53.0, 41.0, 43.0, 30.0, 25.0, 20.0, 16.0, 21.0, 11.0, 9.0, 5.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.000850677490234375, -0.0008240938186645508, -0.0007975101470947266, -0.0007709264755249023, -0.0007443428039550781, -0.0007177591323852539, -0.0006911754608154297, -0.0006645917892456055, -0.0006380081176757812, -0.000611424446105957, -0.0005848407745361328, -0.0005582571029663086, -0.0005316734313964844, -0.0005050897598266602, -0.00047850608825683594, -0.0004519224166870117, -0.0004253387451171875, -0.0003987550735473633, -0.00037217140197753906, -0.00034558773040771484, -0.0003190040588378906, -0.0002924203872680664, -0.0002658367156982422, -0.00023925304412841797, -0.00021266937255859375, -0.00018608570098876953, -0.0001595020294189453, -0.0001329183578491211, -0.00010633468627929688, -7.975101470947266e-05, -5.316734313964844e-05, -2.658367156982422e-05, 0.0, 2.658367156982422e-05, 5.316734313964844e-05, 7.975101470947266e-05, 0.00010633468627929688, 0.0001329183578491211, 0.0001595020294189453, 0.00018608570098876953, 0.00021266937255859375, 0.00023925304412841797, 0.0002658367156982422, 0.0002924203872680664, 0.0003190040588378906, 0.00034558773040771484, 0.00037217140197753906, 0.0003987550735473633, 0.0004253387451171875, 0.0004519224166870117, 0.00047850608825683594, 0.0005050897598266602, 0.0005316734313964844, 0.0005582571029663086, 0.0005848407745361328, 0.000611424446105957, 0.0006380081176757812, 0.0006645917892456055, 0.0006911754608154297, 0.0007177591323852539, 0.0007443428039550781, 0.0007709264755249023, 0.0007975101470947266, 0.0008240938186645508, 0.000850677490234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 7.0, 7.0, 12.0, 16.0, 19.0, 28.0, 29.0, 68.0, 55.0, 75.0, 132.0, 151.0, 279.0, 473.0, 820.0, 10825.0, 1026966.0, 6341.0, 849.0, 401.0, 281.0, 165.0, 132.0, 92.0, 75.0, 34.0, 47.0, 30.0, 25.0, 16.0, 17.0, 11.0, 13.0, 5.0, 12.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0181884765625, -0.01766061782836914, -0.01713275909423828, -0.016604900360107422, -0.016077041625976562, -0.015549182891845703, -0.015021324157714844, -0.014493465423583984, -0.013965606689453125, -0.013437747955322266, -0.012909889221191406, -0.012382030487060547, -0.011854171752929688, -0.011326313018798828, -0.010798454284667969, -0.01027059555053711, -0.00974273681640625, -0.00921487808227539, -0.008687019348144531, -0.008159160614013672, -0.0076313018798828125, -0.007103443145751953, -0.006575584411621094, -0.006047725677490234, -0.005519866943359375, -0.004992008209228516, -0.004464149475097656, -0.003936290740966797, -0.0034084320068359375, -0.002880573272705078, -0.0023527145385742188, -0.0018248558044433594, -0.0012969970703125, -0.0007691383361816406, -0.00024127960205078125, 0.0002865791320800781, 0.0008144378662109375, 0.0013422966003417969, 0.0018701553344726562, 0.0023980140686035156, 0.002925872802734375, 0.0034537315368652344, 0.003981590270996094, 0.004509449005126953, 0.0050373077392578125, 0.005565166473388672, 0.006093025207519531, 0.006620883941650391, 0.00714874267578125, 0.007676601409912109, 0.008204460144042969, 0.008732318878173828, 0.009260177612304688, 0.009788036346435547, 0.010315895080566406, 0.010843753814697266, 0.011371612548828125, 0.011899471282958984, 0.012427330017089844, 0.012955188751220703, 0.013483047485351562, 0.014010906219482422, 0.014538764953613281, 0.01506662368774414, 0.015594482421875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 12.0, 36.0, 125.0, 308.0, 291.0, 165.0, 52.0, 14.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001707988209091127, -0.0016709232004359365, -0.001633858191780746, -0.0015967931831255555, -0.0015597282908856869, -0.0015226632822304964, -0.001485598273575306, -0.0014485332649201155, -0.001411468256264925, -0.0013744032476097345, -0.001337338238954544, -0.0013002732302993536, -0.0012632082216441631, -0.0012261433294042945, -0.001189078320749104, -0.0011520133120939136, -0.001114948303438723, -0.0010778832947835326, -0.0010408182861283422, -0.0010037532774731517, -0.0009666883270256221, -0.0009296233183704317, -0.0008925583679229021, -0.0008554933592677116, -0.0008184283506125212, -0.0007813633419573307, -0.0007442983333021402, -0.0007072333828546107, -0.0006701683741994202, -0.0006331033655442297, -0.0005960384150967002, -0.0005589734064415097, -0.0005219083395786583, -0.0004848433309234679, -0.00044777835137210786, -0.00041071337182074785, -0.0003736483631655574, -0.0003365833545103669, -0.0002995183749590069, -0.0002624533954076469, -0.00022538838675245643, -0.0001883233926491812, -0.00015125839854590595, -0.00011419340444263071, -7.712841033935547e-05, -4.006341623608023e-05, -2.99842213280499e-06, 3.406655741855502e-05, 7.113156607374549e-05, 0.00010819656017702073, 0.00014526155428029597, 0.0001823265483835712, 0.00021939154248684645, 0.0002564565511420369, 0.0002935215306933969, 0.00033058651024475694, 0.0003676515188999474, 0.00040471652755513787, 0.0004417815071064979, 0.0004788464866578579, 0.0005159114953130484, 0.0005529765039682388, 0.0005900415126234293, 0.0006271064630709589, 0.0006641714717261493]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 10.0, 8.0, 10.0, 10.0, 20.0, 28.0, 24.0, 21.0, 31.0, 30.0, 24.0, 30.0, 48.0, 40.0, 33.0, 37.0, 41.0, 38.0, 32.0, 48.0, 41.0, 40.0, 37.0, 37.0, 28.0, 20.0, 38.0, 21.0, 21.0, 18.0, 22.0, 14.0, 19.0, 12.0, 11.0, 12.0, 8.0, 9.0, 4.0, 6.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004425644874572754, -0.00042877718806266785, -0.0004149898886680603, -0.00040120258927345276, -0.0003874152898788452, -0.00037362799048423767, -0.0003598406910896301, -0.0003460533916950226, -0.00033226609230041504, -0.0003184787929058075, -0.00030469149351119995, -0.0002909041941165924, -0.00027711689472198486, -0.0002633295953273773, -0.0002495422959327698, -0.00023575499653816223, -0.0002219676971435547, -0.00020818039774894714, -0.0001943930983543396, -0.00018060579895973206, -0.0001668184995651245, -0.00015303120017051697, -0.00013924390077590942, -0.00012545660138130188, -0.00011166930198669434, -9.788200259208679e-05, -8.409470319747925e-05, -7.03074038028717e-05, -5.652010440826416e-05, -4.2732805013656616e-05, -2.8945505619049072e-05, -1.5158206224441528e-05, -1.3709068298339844e-06, 1.241639256477356e-05, 2.6203691959381104e-05, 3.999099135398865e-05, 5.377829074859619e-05, 6.756559014320374e-05, 8.135288953781128e-05, 9.514018893241882e-05, 0.00010892748832702637, 0.0001227147877216339, 0.00013650208711624146, 0.000150289386510849, 0.00016407668590545654, 0.0001778639853000641, 0.00019165128469467163, 0.00020543858408927917, 0.00021922588348388672, 0.00023301318287849426, 0.0002468004822731018, 0.00026058778166770935, 0.0002743750810623169, 0.00028816238045692444, 0.000301949679851532, 0.0003157369792461395, 0.00032952427864074707, 0.0003433115780353546, 0.00035709887742996216, 0.0003708861768245697, 0.00038467347621917725, 0.0003984607756137848, 0.00041224807500839233, 0.0004260353744029999, 0.0004398226737976074]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 9.0, 11.0, 9.0, 7.0, 9.0, 13.0, 22.0, 24.0, 19.0, 38.0, 25.0, 30.0, 31.0, 27.0, 32.0, 32.0, 34.0, 34.0, 28.0, 47.0, 42.0, 48.0, 32.0, 43.0, 29.0, 27.0, 31.0, 17.0, 32.0, 32.0, 22.0, 17.0, 26.0, 11.0, 15.0, 12.0, 18.0, 12.0, 11.0, 10.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.8125, -5.6168212890625, -5.421142578125, -5.2254638671875, -5.02978515625, -4.8341064453125, -4.638427734375, -4.4427490234375, -4.2470703125, -4.0513916015625, -3.855712890625, -3.6600341796875, -3.46435546875, -3.2686767578125, -3.072998046875, -2.8773193359375, -2.681640625, -2.4859619140625, -2.290283203125, -2.0946044921875, -1.89892578125, -1.7032470703125, -1.507568359375, -1.3118896484375, -1.1162109375, -0.9205322265625, -0.724853515625, -0.5291748046875, -0.33349609375, -0.1378173828125, 0.057861328125, 0.2535400390625, 0.44921875, 0.6448974609375, 0.840576171875, 1.0362548828125, 1.23193359375, 1.4276123046875, 1.623291015625, 1.8189697265625, 2.0146484375, 2.2103271484375, 2.406005859375, 2.6016845703125, 2.79736328125, 2.9930419921875, 3.188720703125, 3.3843994140625, 3.580078125, 3.7757568359375, 3.971435546875, 4.1671142578125, 4.36279296875, 4.5584716796875, 4.754150390625, 4.9498291015625, 5.1455078125, 5.3411865234375, 5.536865234375, 5.7325439453125, 5.92822265625, 6.1239013671875, 6.319580078125, 6.5152587890625, 6.7109375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 5.0, 16.0, 16.0, 22.0, 42.0, 47.0, 46.0, 70.0, 94.0, 153.0, 205.0, 314.0, 403.0, 596.0, 822.0, 1190.0, 1857.0, 3127.0, 7395.0, 32220.0, 276055.0, 621697.0, 77593.0, 13105.0, 4250.0, 2354.0, 1446.0, 1027.0, 692.0, 522.0, 317.0, 235.0, 176.0, 137.0, 87.0, 55.0, 47.0, 33.0, 16.0, 13.0, 14.0, 6.0, 10.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.9375, -17.413330078125, -16.88916015625, -16.364990234375, -15.8408203125, -15.316650390625, -14.79248046875, -14.268310546875, -13.744140625, -13.219970703125, -12.69580078125, -12.171630859375, -11.6474609375, -11.123291015625, -10.59912109375, -10.074951171875, -9.55078125, -9.026611328125, -8.50244140625, -7.978271484375, -7.4541015625, -6.929931640625, -6.40576171875, -5.881591796875, -5.357421875, -4.833251953125, -4.30908203125, -3.784912109375, -3.2607421875, -2.736572265625, -2.21240234375, -1.688232421875, -1.1640625, -0.639892578125, -0.11572265625, 0.408447265625, 0.9326171875, 1.456787109375, 1.98095703125, 2.505126953125, 3.029296875, 3.553466796875, 4.07763671875, 4.601806640625, 5.1259765625, 5.650146484375, 6.17431640625, 6.698486328125, 7.22265625, 7.746826171875, 8.27099609375, 8.795166015625, 9.3193359375, 9.843505859375, 10.36767578125, 10.891845703125, 11.416015625, 11.940185546875, 12.46435546875, 12.988525390625, 13.5126953125, 14.036865234375, 14.56103515625, 15.085205078125, 15.609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 6.0, 8.0, 5.0, 14.0, 21.0, 20.0, 24.0, 26.0, 31.0, 38.0, 41.0, 41.0, 50.0, 60.0, 88.0, 260.0, 1593.0, 240.0, 86.0, 52.0, 46.0, 39.0, 40.0, 38.0, 22.0, 23.0, 28.0, 17.0, 9.0, 11.0, 8.0, 10.0, 10.0, 6.0, 7.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.875, -19.28076171875, -18.6865234375, -18.09228515625, -17.498046875, -16.90380859375, -16.3095703125, -15.71533203125, -15.12109375, -14.52685546875, -13.9326171875, -13.33837890625, -12.744140625, -12.14990234375, -11.5556640625, -10.96142578125, -10.3671875, -9.77294921875, -9.1787109375, -8.58447265625, -7.990234375, -7.39599609375, -6.8017578125, -6.20751953125, -5.61328125, -5.01904296875, -4.4248046875, -3.83056640625, -3.236328125, -2.64208984375, -2.0478515625, -1.45361328125, -0.859375, -0.26513671875, 0.3291015625, 0.92333984375, 1.517578125, 2.11181640625, 2.7060546875, 3.30029296875, 3.89453125, 4.48876953125, 5.0830078125, 5.67724609375, 6.271484375, 6.86572265625, 7.4599609375, 8.05419921875, 8.6484375, 9.24267578125, 9.8369140625, 10.43115234375, 11.025390625, 11.61962890625, 12.2138671875, 12.80810546875, 13.40234375, 13.99658203125, 14.5908203125, 15.18505859375, 15.779296875, 16.37353515625, 16.9677734375, 17.56201171875, 18.15625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 6.0, 6.0, 10.0, 11.0, 14.0, 22.0, 27.0, 30.0, 35.0, 69.0, 78.0, 82.0, 98.0, 178.0, 276.0, 617.0, 1464.0, 39071.0, 3097336.0, 4120.0, 896.0, 424.0, 224.0, 142.0, 98.0, 73.0, 56.0, 49.0, 51.0, 31.0, 27.0, 19.0, 11.0, 15.0, 4.0, 5.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.34375, -47.599609375, -45.85546875, -44.111328125, -42.3671875, -40.623046875, -38.87890625, -37.134765625, -35.390625, -33.646484375, -31.90234375, -30.158203125, -28.4140625, -26.669921875, -24.92578125, -23.181640625, -21.4375, -19.693359375, -17.94921875, -16.205078125, -14.4609375, -12.716796875, -10.97265625, -9.228515625, -7.484375, -5.740234375, -3.99609375, -2.251953125, -0.5078125, 1.236328125, 2.98046875, 4.724609375, 6.46875, 8.212890625, 9.95703125, 11.701171875, 13.4453125, 15.189453125, 16.93359375, 18.677734375, 20.421875, 22.166015625, 23.91015625, 25.654296875, 27.3984375, 29.142578125, 30.88671875, 32.630859375, 34.375, 36.119140625, 37.86328125, 39.607421875, 41.3515625, 43.095703125, 44.83984375, 46.583984375, 48.328125, 50.072265625, 51.81640625, 53.560546875, 55.3046875, 57.048828125, 58.79296875, 60.537109375, 62.28125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 15.0, 48.0, 168.0, 303.0, 294.0, 141.0, 31.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.7821044921875, -74.28544616699219, -71.78878784179688, -69.2921371459961, -66.79547882080078, -64.29882049560547, -61.802162170410156, -59.305503845214844, -56.8088493347168, -54.312191009521484, -51.81553649902344, -49.318878173828125, -46.82221984863281, -44.325565338134766, -41.82890701293945, -39.332252502441406, -36.835594177246094, -34.33893585205078, -31.842281341552734, -29.345623016357422, -26.848966598510742, -24.352310180664062, -21.85565185546875, -19.35899543762207, -16.86233901977539, -14.365682601928711, -11.869025230407715, -9.372367858886719, -6.875711441040039, -4.379055023193359, -1.8823976516723633, 0.6142597198486328, 3.1109161376953125, 5.60757303237915, 8.104229927062988, 10.600887298583984, 13.097543716430664, 15.594200134277344, 18.090858459472656, 20.587514877319336, 23.084171295166016, 25.580827713012695, 28.077484130859375, 30.574142456054688, 33.07080078125, 35.56745529174805, 38.06411361694336, 40.560768127441406, 43.05742645263672, 45.55408477783203, 48.05073928833008, 50.54739761352539, 53.04405212402344, 55.54071044921875, 58.03736877441406, 60.534027099609375, 63.03068161010742, 65.52733612060547, 68.02399444580078, 70.5206527709961, 73.0173110961914, 75.51396179199219, 78.0106201171875, 80.50727844238281, 83.00393676757812]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 11.0, 5.0, 13.0, 8.0, 10.0, 14.0, 18.0, 22.0, 23.0, 20.0, 39.0, 46.0, 33.0, 49.0, 50.0, 48.0, 46.0, 45.0, 41.0, 51.0, 44.0, 46.0, 40.0, 36.0, 39.0, 31.0, 29.0, 27.0, 21.0, 22.0, 16.0, 17.0, 14.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-62.88018798828125, -60.99924850463867, -59.118309020996094, -57.237369537353516, -55.35643005371094, -53.47549057006836, -51.59455108642578, -49.71360778808594, -47.832672119140625, -45.95173263549805, -44.07079315185547, -42.18985366821289, -40.30891418457031, -38.427974700927734, -36.547035217285156, -34.66609191894531, -32.785152435302734, -30.904212951660156, -29.023273468017578, -27.142333984375, -25.261394500732422, -23.380455017089844, -21.499513626098633, -19.618574142456055, -17.737634658813477, -15.856695175170898, -13.97575569152832, -12.094815254211426, -10.213875770568848, -8.33293628692627, -6.451995849609375, -4.571056365966797, -2.6901168823242188, -0.8091771602630615, 1.0717625617980957, 2.952702522277832, 4.83364200592041, 6.714581489562988, 8.595521926879883, 10.476461410522461, 12.357400894165039, 14.238340377807617, 16.119279861450195, 18.000221252441406, 19.881160736083984, 21.762100219726562, 23.64303970336914, 25.52397918701172, 27.404918670654297, 29.285858154296875, 31.166797637939453, 33.04773712158203, 34.92867660522461, 36.80961608886719, 38.69055938720703, 40.571495056152344, 42.45243835449219, 44.333377838134766, 46.214317321777344, 48.09525680541992, 49.9761962890625, 51.85713577270508, 53.738075256347656, 55.6190185546875, 57.49995422363281]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 7.0, 9.0, 6.0, 17.0, 11.0, 17.0, 22.0, 17.0, 20.0, 30.0, 25.0, 28.0, 29.0, 38.0, 45.0, 48.0, 40.0, 41.0, 42.0, 52.0, 49.0, 41.0, 39.0, 38.0, 27.0, 30.0, 25.0, 35.0, 25.0, 21.0, 21.0, 13.0, 14.0, 11.0, 16.0, 10.0, 10.0, 9.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.81640625, -7.58770751953125, -7.3590087890625, -7.13031005859375, -6.901611328125, -6.67291259765625, -6.4442138671875, -6.21551513671875, -5.98681640625, -5.75811767578125, -5.5294189453125, -5.30072021484375, -5.072021484375, -4.84332275390625, -4.6146240234375, -4.38592529296875, -4.1572265625, -3.92852783203125, -3.6998291015625, -3.47113037109375, -3.242431640625, -3.01373291015625, -2.7850341796875, -2.55633544921875, -2.32763671875, -2.09893798828125, -1.8702392578125, -1.64154052734375, -1.412841796875, -1.18414306640625, -0.9554443359375, -0.72674560546875, -0.498046875, -0.26934814453125, -0.0406494140625, 0.18804931640625, 0.416748046875, 0.64544677734375, 0.8741455078125, 1.10284423828125, 1.33154296875, 1.56024169921875, 1.7889404296875, 2.01763916015625, 2.246337890625, 2.47503662109375, 2.7037353515625, 2.93243408203125, 3.1611328125, 3.38983154296875, 3.6185302734375, 3.84722900390625, 4.075927734375, 4.30462646484375, 4.5333251953125, 4.76202392578125, 4.99072265625, 5.21942138671875, 5.4481201171875, 5.67681884765625, 5.905517578125, 6.13421630859375, 6.3629150390625, 6.59161376953125, 6.8203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 6.0, 3.0, 8.0, 6.0, 12.0, 13.0, 26.0, 26.0, 47.0, 50.0, 73.0, 106.0, 171.0, 241.0, 361.0, 644.0, 1064.0, 1813.0, 3479.0, 7402.0, 19005.0, 69784.0, 399608.0, 1601297.0, 1602391.0, 385395.0, 66511.0, 19188.0, 7509.0, 3336.0, 1876.0, 987.0, 636.0, 400.0, 244.0, 167.0, 118.0, 79.0, 64.0, 45.0, 30.0, 20.0, 15.0, 10.0, 5.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.453125, -10.1046142578125, -9.756103515625, -9.4075927734375, -9.05908203125, -8.7105712890625, -8.362060546875, -8.0135498046875, -7.6650390625, -7.3165283203125, -6.968017578125, -6.6195068359375, -6.27099609375, -5.9224853515625, -5.573974609375, -5.2254638671875, -4.876953125, -4.5284423828125, -4.179931640625, -3.8314208984375, -3.48291015625, -3.1343994140625, -2.785888671875, -2.4373779296875, -2.0888671875, -1.7403564453125, -1.391845703125, -1.0433349609375, -0.69482421875, -0.3463134765625, 0.002197265625, 0.3507080078125, 0.69921875, 1.0477294921875, 1.396240234375, 1.7447509765625, 2.09326171875, 2.4417724609375, 2.790283203125, 3.1387939453125, 3.4873046875, 3.8358154296875, 4.184326171875, 4.5328369140625, 4.88134765625, 5.2298583984375, 5.578369140625, 5.9268798828125, 6.275390625, 6.6239013671875, 6.972412109375, 7.3209228515625, 7.66943359375, 8.0179443359375, 8.366455078125, 8.7149658203125, 9.0634765625, 9.4119873046875, 9.760498046875, 10.1090087890625, 10.45751953125, 10.8060302734375, 11.154541015625, 11.5030517578125, 11.8515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 8.0, 7.0, 10.0, 11.0, 15.0, 21.0, 26.0, 45.0, 62.0, 74.0, 115.0, 153.0, 184.0, 225.0, 326.0, 383.0, 524.0, 474.0, 375.0, 257.0, 196.0, 164.0, 114.0, 71.0, 55.0, 43.0, 32.0, 20.0, 15.0, 10.0, 6.0, 10.0, 11.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8671875, -12.474609375, -12.08203125, -11.689453125, -11.296875, -10.904296875, -10.51171875, -10.119140625, -9.7265625, -9.333984375, -8.94140625, -8.548828125, -8.15625, -7.763671875, -7.37109375, -6.978515625, -6.5859375, -6.193359375, -5.80078125, -5.408203125, -5.015625, -4.623046875, -4.23046875, -3.837890625, -3.4453125, -3.052734375, -2.66015625, -2.267578125, -1.875, -1.482421875, -1.08984375, -0.697265625, -0.3046875, 0.087890625, 0.48046875, 0.873046875, 1.265625, 1.658203125, 2.05078125, 2.443359375, 2.8359375, 3.228515625, 3.62109375, 4.013671875, 4.40625, 4.798828125, 5.19140625, 5.583984375, 5.9765625, 6.369140625, 6.76171875, 7.154296875, 7.546875, 7.939453125, 8.33203125, 8.724609375, 9.1171875, 9.509765625, 9.90234375, 10.294921875, 10.6875, 11.080078125, 11.47265625, 11.865234375, 12.2578125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 8.0, 14.0, 26.0, 35.0, 60.0, 110.0, 203.0, 411.0, 1072.0, 3637.0, 618256.0, 3562157.0, 5751.0, 1330.0, 540.0, 245.0, 156.0, 93.0, 55.0, 27.0, 27.0, 15.0, 7.0, 8.0, 7.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.8125, -54.07421875, -52.3359375, -50.59765625, -48.859375, -47.12109375, -45.3828125, -43.64453125, -41.90625, -40.16796875, -38.4296875, -36.69140625, -34.953125, -33.21484375, -31.4765625, -29.73828125, -28.0, -26.26171875, -24.5234375, -22.78515625, -21.046875, -19.30859375, -17.5703125, -15.83203125, -14.09375, -12.35546875, -10.6171875, -8.87890625, -7.140625, -5.40234375, -3.6640625, -1.92578125, -0.1875, 1.55078125, 3.2890625, 5.02734375, 6.765625, 8.50390625, 10.2421875, 11.98046875, 13.71875, 15.45703125, 17.1953125, 18.93359375, 20.671875, 22.41015625, 24.1484375, 25.88671875, 27.625, 29.36328125, 31.1015625, 32.83984375, 34.578125, 36.31640625, 38.0546875, 39.79296875, 41.53125, 43.26953125, 45.0078125, 46.74609375, 48.484375, 50.22265625, 51.9609375, 53.69921875, 55.4375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 48.0, 580.0, 365.0, 21.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-392.1648254394531, -383.2280578613281, -374.291259765625, -365.3544921875, -356.4176940917969, -347.4809265136719, -338.54412841796875, -329.60736083984375, -320.6705627441406, -311.7337951660156, -302.7969970703125, -293.8602294921875, -284.9234313964844, -275.9866638183594, -267.04986572265625, -258.11309814453125, -249.1763153076172, -240.23953247070312, -231.30274963378906, -222.365966796875, -213.42918395996094, -204.49240112304688, -195.55563354492188, -186.61883544921875, -177.68206787109375, -168.7452850341797, -159.80850219726562, -150.87171936035156, -141.9349365234375, -132.99815368652344, -124.0613784790039, -115.12459564208984, -106.18780517578125, -97.25102233886719, -88.31423950195312, -79.37745666503906, -70.440673828125, -61.5038948059082, -52.567115783691406, -43.630332946777344, -34.69355010986328, -25.75676727294922, -16.81998634338379, -7.883205413818359, 1.0535774230957031, 9.990360260009766, 18.927139282226562, 27.863922119140625, 36.80070495605469, 45.73748779296875, 54.67427062988281, 63.61104965209961, 72.54783630371094, 81.484619140625, 90.42139434814453, 99.3581771850586, 108.29496002197266, 117.23174285888672, 126.16852569580078, 135.1053009033203, 144.04208374023438, 152.97886657714844, 161.9156494140625, 170.85243225097656, 179.78921508789062]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 10.0, 23.0, 16.0, 29.0, 26.0, 33.0, 29.0, 31.0, 27.0, 40.0, 48.0, 36.0, 42.0, 51.0, 37.0, 31.0, 31.0, 38.0, 44.0, 42.0, 51.0, 35.0, 33.0, 20.0, 32.0, 18.0, 18.0, 19.0, 15.0, 11.0, 11.0, 7.0, 7.0, 5.0, 2.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0], "bins": [-60.3609619140625, -58.730247497558594, -57.09953308105469, -55.468814849853516, -53.83810043334961, -52.2073860168457, -50.57666778564453, -48.945953369140625, -47.31523895263672, -45.68452453613281, -44.053810119628906, -42.423091888427734, -40.79237747192383, -39.16166305541992, -37.53094482421875, -35.900230407714844, -34.26951599121094, -32.63880157470703, -31.008085250854492, -29.377368927001953, -27.746654510498047, -26.11594009399414, -24.4852237701416, -22.854507446289062, -21.223793029785156, -19.59307861328125, -17.96236228942871, -16.331645965576172, -14.700931549072266, -13.070216178894043, -11.43950080871582, -9.808785438537598, -8.178070068359375, -6.547354698181152, -4.91663932800293, -3.285923957824707, -1.6552085876464844, -0.02449321746826172, 1.606222152709961, 3.2369375228881836, 4.867652893066406, 6.498368263244629, 8.129083633422852, 9.759799003601074, 11.390514373779297, 13.02122974395752, 14.651945114135742, 16.28266143798828, 17.913375854492188, 19.544090270996094, 21.174806594848633, 22.805522918701172, 24.436237335205078, 26.066951751708984, 27.697668075561523, 29.328384399414062, 30.95909881591797, 32.589813232421875, 34.22052764892578, 35.85124588012695, 37.48196029663086, 39.112674713134766, 40.74339294433594, 42.374107360839844, 44.00482177734375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 6.0, 10.0, 12.0, 16.0, 16.0, 17.0, 5.0, 19.0, 25.0, 24.0, 24.0, 28.0, 31.0, 33.0, 27.0, 31.0, 29.0, 31.0, 43.0, 33.0, 36.0, 44.0, 30.0, 30.0, 42.0, 20.0, 37.0, 38.0, 35.0, 28.0, 20.0, 16.0, 22.0, 20.0, 18.0, 16.0, 15.0, 11.0, 11.0, 13.0, 5.0, 12.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.0736083984375, -4.905029296875, -4.7364501953125, -4.56787109375, -4.3992919921875, -4.230712890625, -4.0621337890625, -3.8935546875, -3.7249755859375, -3.556396484375, -3.3878173828125, -3.21923828125, -3.0506591796875, -2.882080078125, -2.7135009765625, -2.544921875, -2.3763427734375, -2.207763671875, -2.0391845703125, -1.87060546875, -1.7020263671875, -1.533447265625, -1.3648681640625, -1.1962890625, -1.0277099609375, -0.859130859375, -0.6905517578125, -0.52197265625, -0.3533935546875, -0.184814453125, -0.0162353515625, 0.15234375, 0.3209228515625, 0.489501953125, 0.6580810546875, 0.82666015625, 0.9952392578125, 1.163818359375, 1.3323974609375, 1.5009765625, 1.6695556640625, 1.838134765625, 2.0067138671875, 2.17529296875, 2.3438720703125, 2.512451171875, 2.6810302734375, 2.849609375, 3.0181884765625, 3.186767578125, 3.3553466796875, 3.52392578125, 3.6925048828125, 3.861083984375, 4.0296630859375, 4.1982421875, 4.3668212890625, 4.535400390625, 4.7039794921875, 4.87255859375, 5.0411376953125, 5.209716796875, 5.3782958984375, 5.546875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 14.0, 9.0, 20.0, 25.0, 48.0, 88.0, 99.0, 129.0, 222.0, 402.0, 699.0, 1164.0, 1850.0, 3158.0, 5471.0, 8917.0, 14231.0, 22751.0, 37245.0, 62490.0, 110281.0, 272992.0, 247825.0, 104746.0, 60561.0, 35991.0, 21871.0, 13779.0, 8552.0, 5137.0, 3109.0, 1895.0, 1082.0, 658.0, 375.0, 224.0, 159.0, 97.0, 56.0, 45.0, 27.0, 8.0, 21.0, 12.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.2559356689453125, -1.214019775390625, -1.1721038818359375, -1.13018798828125, -1.0882720947265625, -1.046356201171875, -1.0044403076171875, -0.9625244140625, -0.9206085205078125, -0.878692626953125, -0.8367767333984375, -0.79486083984375, -0.7529449462890625, -0.711029052734375, -0.6691131591796875, -0.627197265625, -0.5852813720703125, -0.543365478515625, -0.5014495849609375, -0.45953369140625, -0.4176177978515625, -0.375701904296875, -0.3337860107421875, -0.2918701171875, -0.2499542236328125, -0.208038330078125, -0.1661224365234375, -0.12420654296875, -0.0822906494140625, -0.040374755859375, 0.0015411376953125, 0.04345703125, 0.0853729248046875, 0.127288818359375, 0.1692047119140625, 0.21112060546875, 0.2530364990234375, 0.294952392578125, 0.3368682861328125, 0.3787841796875, 0.4207000732421875, 0.462615966796875, 0.5045318603515625, 0.54644775390625, 0.5883636474609375, 0.630279541015625, 0.6721954345703125, 0.714111328125, 0.7560272216796875, 0.797943115234375, 0.8398590087890625, 0.88177490234375, 0.9236907958984375, 0.965606689453125, 1.0075225830078125, 1.0494384765625, 1.0913543701171875, 1.133270263671875, 1.1751861572265625, 1.21710205078125, 1.2590179443359375, 1.300933837890625, 1.3428497314453125, 1.384765625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 16.0, 10.0, 16.0, 8.0, 10.0, 21.0, 27.0, 20.0, 25.0, 31.0, 33.0, 46.0, 39.0, 41.0, 52.0, 34.0, 45.0, 1082.0, 44.0, 41.0, 35.0, 40.0, 37.0, 42.0, 29.0, 29.0, 22.0, 27.0, 21.0, 18.0, 20.0, 12.0, 14.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-4.61328125, -4.48046875, -4.34765625, -4.21484375, -4.08203125, -3.94921875, -3.81640625, -3.68359375, -3.55078125, -3.41796875, -3.28515625, -3.15234375, -3.01953125, -2.88671875, -2.75390625, -2.62109375, -2.48828125, -2.35546875, -2.22265625, -2.08984375, -1.95703125, -1.82421875, -1.69140625, -1.55859375, -1.42578125, -1.29296875, -1.16015625, -1.02734375, -0.89453125, -0.76171875, -0.62890625, -0.49609375, -0.36328125, -0.23046875, -0.09765625, 0.03515625, 0.16796875, 0.30078125, 0.43359375, 0.56640625, 0.69921875, 0.83203125, 0.96484375, 1.09765625, 1.23046875, 1.36328125, 1.49609375, 1.62890625, 1.76171875, 1.89453125, 2.02734375, 2.16015625, 2.29296875, 2.42578125, 2.55859375, 2.69140625, 2.82421875, 2.95703125, 3.08984375, 3.22265625, 3.35546875, 3.48828125, 3.62109375, 3.75390625, 3.88671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 8.0, 11.0, 10.0, 22.0, 20.0, 32.0, 45.0, 71.0, 114.0, 193.0, 310.0, 430.0, 720.0, 1151.0, 1898.0, 3116.0, 5148.0, 8736.0, 14900.0, 25491.0, 45541.0, 88155.0, 215563.0, 1428308.0, 120484.0, 58859.0, 32223.0, 18481.0, 10785.0, 6482.0, 3749.0, 2300.0, 1382.0, 821.0, 541.0, 359.0, 230.0, 160.0, 93.0, 56.0, 52.0, 33.0, 21.0, 13.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.357421875, -1.310943603515625, -1.26446533203125, -1.217987060546875, -1.1715087890625, -1.125030517578125, -1.07855224609375, -1.032073974609375, -0.985595703125, -0.939117431640625, -0.89263916015625, -0.846160888671875, -0.7996826171875, -0.753204345703125, -0.70672607421875, -0.660247802734375, -0.61376953125, -0.567291259765625, -0.52081298828125, -0.474334716796875, -0.4278564453125, -0.381378173828125, -0.33489990234375, -0.288421630859375, -0.241943359375, -0.195465087890625, -0.14898681640625, -0.102508544921875, -0.0560302734375, -0.009552001953125, 0.03692626953125, 0.083404541015625, 0.1298828125, 0.176361083984375, 0.22283935546875, 0.269317626953125, 0.3157958984375, 0.362274169921875, 0.40875244140625, 0.455230712890625, 0.501708984375, 0.548187255859375, 0.59466552734375, 0.641143798828125, 0.6876220703125, 0.734100341796875, 0.78057861328125, 0.827056884765625, 0.87353515625, 0.920013427734375, 0.96649169921875, 1.012969970703125, 1.0594482421875, 1.105926513671875, 1.15240478515625, 1.198883056640625, 1.245361328125, 1.291839599609375, 1.33831787109375, 1.384796142578125, 1.4312744140625, 1.477752685546875, 1.52423095703125, 1.570709228515625, 1.6171875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 12.0, 14.0, 15.0, 27.0, 17.0, 38.0, 33.0, 56.0, 60.0, 66.0, 74.0, 102.0, 68.0, 84.0, 61.0, 51.0, 36.0, 34.0, 30.0, 14.0, 21.0, 17.0, 9.0, 11.0, 7.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009160041809082031, -0.0008887127041816711, -0.0008614212274551392, -0.0008341297507286072, -0.0008068382740020752, -0.0007795467972755432, -0.0007522553205490112, -0.0007249638438224792, -0.0006976723670959473, -0.0006703808903694153, -0.0006430894136428833, -0.0006157979369163513, -0.0005885064601898193, -0.0005612149834632874, -0.0005339235067367554, -0.0005066320300102234, -0.0004793405532836914, -0.0004520490765571594, -0.00042475759983062744, -0.00039746612310409546, -0.0003701746463775635, -0.0003428831696510315, -0.0003155916929244995, -0.00028830021619796753, -0.00026100873947143555, -0.00023371726274490356, -0.00020642578601837158, -0.0001791343092918396, -0.00015184283256530762, -0.00012455135583877563, -9.725987911224365e-05, -6.996840238571167e-05, -4.267692565917969e-05, -1.5385448932647705e-05, 1.1906027793884277e-05, 3.919750452041626e-05, 6.648898124694824e-05, 9.378045797348022e-05, 0.00012107193470001221, 0.0001483634114265442, 0.00017565488815307617, 0.00020294636487960815, 0.00023023784160614014, 0.0002575293183326721, 0.0002848207950592041, 0.0003121122717857361, 0.00033940374851226807, 0.00036669522523880005, 0.00039398670196533203, 0.000421278178691864, 0.000448569655418396, 0.000475861132144928, 0.00050315260887146, 0.0005304440855979919, 0.0005577355623245239, 0.0005850270390510559, 0.0006123185157775879, 0.0006396099925041199, 0.0006669014692306519, 0.0006941929459571838, 0.0007214844226837158, 0.0007487758994102478, 0.0007760673761367798, 0.0008033588528633118, 0.0008306503295898438]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 8.0, 4.0, 11.0, 7.0, 11.0, 17.0, 27.0, 36.0, 48.0, 63.0, 90.0, 125.0, 158.0, 267.0, 415.0, 777.0, 4075.0, 1037218.0, 3067.0, 774.0, 460.0, 252.0, 193.0, 100.0, 60.0, 69.0, 57.0, 33.0, 25.0, 22.0, 13.0, 19.0, 10.0, 8.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0180511474609375, -0.017495393753051758, -0.016939640045166016, -0.016383886337280273, -0.01582813262939453, -0.015272378921508789, -0.014716625213623047, -0.014160871505737305, -0.013605117797851562, -0.01304936408996582, -0.012493610382080078, -0.011937856674194336, -0.011382102966308594, -0.010826349258422852, -0.01027059555053711, -0.009714841842651367, -0.009159088134765625, -0.008603334426879883, -0.00804758071899414, -0.0074918270111083984, -0.006936073303222656, -0.006380319595336914, -0.005824565887451172, -0.00526881217956543, -0.0047130584716796875, -0.004157304763793945, -0.003601551055908203, -0.003045797348022461, -0.0024900436401367188, -0.0019342899322509766, -0.0013785362243652344, -0.0008227825164794922, -0.00026702880859375, 0.0002887248992919922, 0.0008444786071777344, 0.0014002323150634766, 0.0019559860229492188, 0.002511739730834961, 0.003067493438720703, 0.0036232471466064453, 0.0041790008544921875, 0.00473475456237793, 0.005290508270263672, 0.005846261978149414, 0.006402015686035156, 0.0069577693939208984, 0.007513523101806641, 0.008069276809692383, 0.008625030517578125, 0.009180784225463867, 0.00973653793334961, 0.010292291641235352, 0.010848045349121094, 0.011403799057006836, 0.011959552764892578, 0.01251530647277832, 0.013071060180664062, 0.013626813888549805, 0.014182567596435547, 0.014738321304321289, 0.015294075012207031, 0.015849828720092773, 0.016405582427978516, 0.016961336135864258, 0.01751708984375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 22.0, 59.0, 124.0, 238.0, 271.0, 174.0, 77.0, 28.0, 8.0, 2.0, 2.0, 1.0], "bins": [-0.0013548614224418998, -0.0013307540211826563, -0.0013066466199234128, -0.0012825392186641693, -0.0012584318174049258, -0.0012343242997303605, -0.001210216898471117, -0.0011861094972118735, -0.00116200209595263, -0.0011378946946933866, -0.001113787293434143, -0.0010896798921748996, -0.001065572490915656, -0.0010414649732410908, -0.0010173575719818473, -0.0009932501707226038, -0.0009691427694633603, -0.0009450353682041168, -0.0009209279669448733, -0.0008968205074779689, -0.0008727131062187254, -0.000848605704959482, -0.0008244983037002385, -0.0008003908442333341, -0.0007762835011817515, -0.000752176099922508, -0.0007280686986632645, -0.0007039612391963601, -0.0006798538379371166, -0.0006557464366778731, -0.0006316390354186296, -0.0006075316341593862, -0.0005834242329001427, -0.0005593168316408992, -0.0005352094303816557, -0.0005111019709147513, -0.0004869945696555078, -0.0004628871683962643, -0.0004387797671370208, -0.0004146723367739469, -0.00039056490641087294, -0.00036645750515162945, -0.0003423500747885555, -0.000318242673529312, -0.00029413524316623807, -0.0002700278419069946, -0.0002459204406477511, -0.00022181301028467715, -0.00019770559447351843, -0.00017359817866235971, -0.000149490762851201, -0.00012538334704004228, -0.00010127593850484118, -7.716852269368246e-05, -5.306111415848136e-05, -2.8953698347322643e-05, -4.846282536163926e-06, 1.9261131456005387e-05, 4.33685454481747e-05, 6.747595762135461e-05, 9.158337343251333e-05, 0.00011569078924367204, 0.00013979819777887315, 0.00016390561359003186, 0.00018801302940119058]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 4.0, 7.0, 15.0, 14.0, 12.0, 19.0, 16.0, 27.0, 17.0, 19.0, 21.0, 20.0, 37.0, 30.0, 33.0, 38.0, 56.0, 37.0, 38.0, 47.0, 41.0, 37.0, 34.0, 38.0, 26.0, 45.0, 36.0, 35.0, 21.0, 25.0, 23.0, 13.0, 11.0, 12.0, 12.0, 20.0, 13.0, 12.0, 10.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0003533363342285156, -0.0003420161083340645, -0.00033069588243961334, -0.0003193756565451622, -0.00030805543065071106, -0.0002967352047562599, -0.0002854149788618088, -0.00027409475296735764, -0.0002627745270729065, -0.00025145430117845535, -0.0002401340752840042, -0.00022881384938955307, -0.00021749362349510193, -0.0002061733976006508, -0.00019485317170619965, -0.0001835329458117485, -0.00017221271991729736, -0.00016089249402284622, -0.00014957226812839508, -0.00013825204223394394, -0.0001269318163394928, -0.00011561159044504166, -0.00010429136455059052, -9.297113865613937e-05, -8.165091276168823e-05, -7.033068686723709e-05, -5.901046097278595e-05, -4.769023507833481e-05, -3.637000918388367e-05, -2.5049783289432526e-05, -1.3729557394981384e-05, -2.409331500530243e-06, 8.910894393920898e-06, 2.023112028837204e-05, 3.155134618282318e-05, 4.287157207727432e-05, 5.4191797971725464e-05, 6.55120238661766e-05, 7.683224976062775e-05, 8.815247565507889e-05, 9.947270154953003e-05, 0.00011079292744398117, 0.0001221131533384323, 0.00013343337923288345, 0.0001447536051273346, 0.00015607383102178574, 0.00016739405691623688, 0.00017871428281068802, 0.00019003450870513916, 0.0002013547345995903, 0.00021267496049404144, 0.00022399518638849258, 0.00023531541228294373, 0.00024663563817739487, 0.000257955864071846, 0.00026927608996629715, 0.0002805963158607483, 0.00029191654175519943, 0.0003032367676496506, 0.0003145569935441017, 0.00032587721943855286, 0.000337197445333004, 0.00034851767122745514, 0.0003598378971219063, 0.0003711581230163574]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 6.0, 10.0, 12.0, 16.0, 16.0, 17.0, 5.0, 19.0, 25.0, 24.0, 24.0, 28.0, 31.0, 33.0, 27.0, 31.0, 29.0, 31.0, 43.0, 33.0, 36.0, 44.0, 30.0, 30.0, 42.0, 20.0, 37.0, 38.0, 35.0, 28.0, 20.0, 16.0, 22.0, 20.0, 18.0, 16.0, 15.0, 11.0, 11.0, 13.0, 5.0, 12.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.0736083984375, -4.905029296875, -4.7364501953125, -4.56787109375, -4.3992919921875, -4.230712890625, -4.0621337890625, -3.8935546875, -3.7249755859375, -3.556396484375, -3.3878173828125, -3.21923828125, -3.0506591796875, -2.882080078125, -2.7135009765625, -2.544921875, -2.3763427734375, -2.207763671875, -2.0391845703125, -1.87060546875, -1.7020263671875, -1.533447265625, -1.3648681640625, -1.1962890625, -1.0277099609375, -0.859130859375, -0.6905517578125, -0.52197265625, -0.3533935546875, -0.184814453125, -0.0162353515625, 0.15234375, 0.3209228515625, 0.489501953125, 0.6580810546875, 0.82666015625, 0.9952392578125, 1.163818359375, 1.3323974609375, 1.5009765625, 1.6695556640625, 1.838134765625, 2.0067138671875, 2.17529296875, 2.3438720703125, 2.512451171875, 2.6810302734375, 2.849609375, 3.0181884765625, 3.186767578125, 3.3553466796875, 3.52392578125, 3.6925048828125, 3.861083984375, 4.0296630859375, 4.1982421875, 4.3668212890625, 4.535400390625, 4.7039794921875, 4.87255859375, 5.0411376953125, 5.209716796875, 5.3782958984375, 5.546875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 10.0, 10.0, 27.0, 24.0, 30.0, 56.0, 56.0, 90.0, 97.0, 145.0, 233.0, 304.0, 424.0, 641.0, 1016.0, 1707.0, 3446.0, 8364.0, 22493.0, 75271.0, 369375.0, 435490.0, 86417.0, 24739.0, 9079.0, 3873.0, 1866.0, 1052.0, 691.0, 453.0, 285.0, 197.0, 155.0, 85.0, 74.0, 62.0, 51.0, 38.0, 29.0, 20.0, 19.0, 13.0, 12.0, 6.0, 8.0, 7.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-10.203125, -9.884765625, -9.56640625, -9.248046875, -8.9296875, -8.611328125, -8.29296875, -7.974609375, -7.65625, -7.337890625, -7.01953125, -6.701171875, -6.3828125, -6.064453125, -5.74609375, -5.427734375, -5.109375, -4.791015625, -4.47265625, -4.154296875, -3.8359375, -3.517578125, -3.19921875, -2.880859375, -2.5625, -2.244140625, -1.92578125, -1.607421875, -1.2890625, -0.970703125, -0.65234375, -0.333984375, -0.015625, 0.302734375, 0.62109375, 0.939453125, 1.2578125, 1.576171875, 1.89453125, 2.212890625, 2.53125, 2.849609375, 3.16796875, 3.486328125, 3.8046875, 4.123046875, 4.44140625, 4.759765625, 5.078125, 5.396484375, 5.71484375, 6.033203125, 6.3515625, 6.669921875, 6.98828125, 7.306640625, 7.625, 7.943359375, 8.26171875, 8.580078125, 8.8984375, 9.216796875, 9.53515625, 9.853515625, 10.171875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 10.0, 9.0, 9.0, 10.0, 11.0, 22.0, 20.0, 26.0, 30.0, 40.0, 59.0, 44.0, 56.0, 100.0, 371.0, 1728.0, 119.0, 76.0, 43.0, 48.0, 36.0, 40.0, 23.0, 26.0, 18.0, 22.0, 11.0, 9.0, 6.0, 3.0, 5.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-25.328125, -24.681640625, -24.03515625, -23.388671875, -22.7421875, -22.095703125, -21.44921875, -20.802734375, -20.15625, -19.509765625, -18.86328125, -18.216796875, -17.5703125, -16.923828125, -16.27734375, -15.630859375, -14.984375, -14.337890625, -13.69140625, -13.044921875, -12.3984375, -11.751953125, -11.10546875, -10.458984375, -9.8125, -9.166015625, -8.51953125, -7.873046875, -7.2265625, -6.580078125, -5.93359375, -5.287109375, -4.640625, -3.994140625, -3.34765625, -2.701171875, -2.0546875, -1.408203125, -0.76171875, -0.115234375, 0.53125, 1.177734375, 1.82421875, 2.470703125, 3.1171875, 3.763671875, 4.41015625, 5.056640625, 5.703125, 6.349609375, 6.99609375, 7.642578125, 8.2890625, 8.935546875, 9.58203125, 10.228515625, 10.875, 11.521484375, 12.16796875, 12.814453125, 13.4609375, 14.107421875, 14.75390625, 15.400390625, 16.046875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 11.0, 13.0, 13.0, 18.0, 28.0, 33.0, 59.0, 90.0, 141.0, 350.0, 710.0, 4811.0, 3134015.0, 3937.0, 698.0, 293.0, 163.0, 95.0, 65.0, 44.0, 25.0, 16.0, 15.0, 13.0, 5.0, 7.0, 7.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.75, -46.7578125, -44.765625, -42.7734375, -40.78125, -38.7890625, -36.796875, -34.8046875, -32.8125, -30.8203125, -28.828125, -26.8359375, -24.84375, -22.8515625, -20.859375, -18.8671875, -16.875, -14.8828125, -12.890625, -10.8984375, -8.90625, -6.9140625, -4.921875, -2.9296875, -0.9375, 1.0546875, 3.046875, 5.0390625, 7.03125, 9.0234375, 11.015625, 13.0078125, 15.0, 16.9921875, 18.984375, 20.9765625, 22.96875, 24.9609375, 26.953125, 28.9453125, 30.9375, 32.9296875, 34.921875, 36.9140625, 38.90625, 40.8984375, 42.890625, 44.8828125, 46.875, 48.8671875, 50.859375, 52.8515625, 54.84375, 56.8359375, 58.828125, 60.8203125, 62.8125, 64.8046875, 66.796875, 68.7890625, 70.78125, 72.7734375, 74.765625, 76.7578125, 78.75]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 23.0, 380.0, 543.0, 65.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.07620620727539, -32.20527267456055, -29.334339141845703, -26.46340560913086, -23.592472076416016, -20.721538543701172, -17.850603103637695, -14.979669570922852, -12.108736038208008, -9.237802505493164, -6.366868495941162, -3.49593448638916, -0.6250009536743164, 2.2459325790405273, 5.1168670654296875, 7.987800598144531, 10.858734130859375, 13.729667663574219, 16.600601196289062, 19.471534729003906, 22.34246826171875, 25.213401794433594, 28.08433723449707, 30.955270767211914, 33.826202392578125, 36.69713592529297, 39.56806945800781, 42.439002990722656, 45.3099365234375, 48.180870056152344, 51.05180358886719, 53.92273712158203, 56.793678283691406, 59.66461181640625, 62.535545349121094, 65.40647888183594, 68.27741241455078, 71.14834594726562, 74.01927947998047, 76.89021301269531, 79.76114654541016, 82.632080078125, 85.50301361083984, 88.37394714355469, 91.24488067626953, 94.11581420898438, 96.98674774169922, 99.85768127441406, 102.72862243652344, 105.59955596923828, 108.47048950195312, 111.34142303466797, 114.21235656738281, 117.08329010009766, 119.9542236328125, 122.82515716552734, 125.69609069824219, 128.56703186035156, 131.43795776367188, 134.30889892578125, 137.17982482910156, 140.05076599121094, 142.92169189453125, 145.79263305664062, 148.66355895996094]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 11.0, 13.0, 6.0, 15.0, 13.0, 19.0, 28.0, 27.0, 29.0, 28.0, 45.0, 52.0, 44.0, 49.0, 53.0, 67.0, 54.0, 48.0, 53.0, 51.0, 35.0, 38.0, 33.0, 26.0, 28.0, 27.0, 12.0, 19.0, 15.0, 12.0, 14.0, 7.0, 9.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09817123413086, -31.74242401123047, -30.386676788330078, -29.030929565429688, -27.675182342529297, -26.319435119628906, -24.963687896728516, -23.607940673828125, -22.252193450927734, -20.896446228027344, -19.540699005126953, -18.184951782226562, -16.829204559326172, -15.473457336425781, -14.117709159851074, -12.761961936950684, -11.406213760375977, -10.050466537475586, -8.694719314575195, -7.3389716148376465, -5.983224391937256, -4.627477169036865, -3.2717294692993164, -1.9159822463989258, -0.5602350234985352, 0.795512318611145, 2.151259660720825, 3.507007122039795, 4.8627543449401855, 6.218501567840576, 7.574249267578125, 8.929996490478516, 10.285743713378906, 11.641490936279297, 12.997238159179688, 14.352985382080078, 15.708732604980469, 17.06447982788086, 18.42022705078125, 19.77597427368164, 21.13172149658203, 22.487468719482422, 23.843215942382812, 25.198963165283203, 26.554710388183594, 27.910457611083984, 29.266204833984375, 30.621952056884766, 31.97770118713379, 33.33345031738281, 34.6891975402832, 36.044944763183594, 37.400691986083984, 38.756439208984375, 40.112186431884766, 41.467933654785156, 42.82368087768555, 44.17942810058594, 45.53517532348633, 46.89092254638672, 48.24666976928711, 49.6024169921875, 50.95816421508789, 52.31391143798828, 53.66965866088867]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 7.0, 8.0, 9.0, 13.0, 15.0, 22.0, 20.0, 17.0, 17.0, 19.0, 26.0, 18.0, 34.0, 41.0, 37.0, 30.0, 44.0, 48.0, 34.0, 32.0, 37.0, 48.0, 25.0, 39.0, 35.0, 34.0, 31.0, 30.0, 27.0, 28.0, 21.0, 20.0, 16.0, 15.0, 14.0, 15.0, 15.0, 12.0, 6.0, 6.0, 6.0, 6.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.23199462890625, -5.0225830078125, -4.81317138671875, -4.603759765625, -4.39434814453125, -4.1849365234375, -3.97552490234375, -3.76611328125, -3.55670166015625, -3.3472900390625, -3.13787841796875, -2.928466796875, -2.71905517578125, -2.5096435546875, -2.30023193359375, -2.0908203125, -1.88140869140625, -1.6719970703125, -1.46258544921875, -1.253173828125, -1.04376220703125, -0.8343505859375, -0.62493896484375, -0.41552734375, -0.20611572265625, 0.0032958984375, 0.21270751953125, 0.422119140625, 0.63153076171875, 0.8409423828125, 1.05035400390625, 1.259765625, 1.46917724609375, 1.6785888671875, 1.88800048828125, 2.097412109375, 2.30682373046875, 2.5162353515625, 2.72564697265625, 2.93505859375, 3.14447021484375, 3.3538818359375, 3.56329345703125, 3.772705078125, 3.98211669921875, 4.1915283203125, 4.40093994140625, 4.6103515625, 4.81976318359375, 5.0291748046875, 5.23858642578125, 5.447998046875, 5.65740966796875, 5.8668212890625, 6.07623291015625, 6.28564453125, 6.49505615234375, 6.7044677734375, 6.91387939453125, 7.123291015625, 7.33270263671875, 7.5421142578125, 7.75152587890625, 7.9609375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 5.0, 10.0, 20.0, 22.0, 30.0, 34.0, 36.0, 46.0, 53.0, 56.0, 81.0, 105.0, 134.0, 225.0, 329.0, 453.0, 771.0, 1815.0, 9388.0, 2302874.0, 1865452.0, 8224.0, 1686.0, 730.0, 497.0, 320.0, 219.0, 148.0, 99.0, 78.0, 57.0, 54.0, 40.0, 37.0, 40.0, 27.0, 20.0, 13.0, 10.0, 12.0, 6.0, 6.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.125, -45.552734375, -43.98046875, -42.408203125, -40.8359375, -39.263671875, -37.69140625, -36.119140625, -34.546875, -32.974609375, -31.40234375, -29.830078125, -28.2578125, -26.685546875, -25.11328125, -23.541015625, -21.96875, -20.396484375, -18.82421875, -17.251953125, -15.6796875, -14.107421875, -12.53515625, -10.962890625, -9.390625, -7.818359375, -6.24609375, -4.673828125, -3.1015625, -1.529296875, 0.04296875, 1.615234375, 3.1875, 4.759765625, 6.33203125, 7.904296875, 9.4765625, 11.048828125, 12.62109375, 14.193359375, 15.765625, 17.337890625, 18.91015625, 20.482421875, 22.0546875, 23.626953125, 25.19921875, 26.771484375, 28.34375, 29.916015625, 31.48828125, 33.060546875, 34.6328125, 36.205078125, 37.77734375, 39.349609375, 40.921875, 42.494140625, 44.06640625, 45.638671875, 47.2109375, 48.783203125, 50.35546875, 51.927734375, 53.5]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 8.0, 15.0, 27.0, 55.0, 124.0, 256.0, 517.0, 886.0, 928.0, 630.0, 318.0, 136.0, 75.0, 45.0, 18.0, 16.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.65625, -11.95458984375, -11.2529296875, -10.55126953125, -9.849609375, -9.14794921875, -8.4462890625, -7.74462890625, -7.04296875, -6.34130859375, -5.6396484375, -4.93798828125, -4.236328125, -3.53466796875, -2.8330078125, -2.13134765625, -1.4296875, -0.72802734375, -0.0263671875, 0.67529296875, 1.376953125, 2.07861328125, 2.7802734375, 3.48193359375, 4.18359375, 4.88525390625, 5.5869140625, 6.28857421875, 6.990234375, 7.69189453125, 8.3935546875, 9.09521484375, 9.796875, 10.49853515625, 11.2001953125, 11.90185546875, 12.603515625, 13.30517578125, 14.0068359375, 14.70849609375, 15.41015625, 16.11181640625, 16.8134765625, 17.51513671875, 18.216796875, 18.91845703125, 19.6201171875, 20.32177734375, 21.0234375, 21.72509765625, 22.4267578125, 23.12841796875, 23.830078125, 24.53173828125, 25.2333984375, 25.93505859375, 26.63671875, 27.33837890625, 28.0400390625, 28.74169921875, 29.443359375, 30.14501953125, 30.8466796875, 31.54833984375, 32.25]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 18.0, 31.0, 59.0, 144.0, 335.0, 1434.0, 18773.0, 3831306.0, 336667.0, 4400.0, 679.0, 239.0, 93.0, 48.0, 24.0, 9.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.71875, -35.4423828125, -34.166015625, -32.8896484375, -31.61328125, -30.3369140625, -29.060546875, -27.7841796875, -26.5078125, -25.2314453125, -23.955078125, -22.6787109375, -21.40234375, -20.1259765625, -18.849609375, -17.5732421875, -16.296875, -15.0205078125, -13.744140625, -12.4677734375, -11.19140625, -9.9150390625, -8.638671875, -7.3623046875, -6.0859375, -4.8095703125, -3.533203125, -2.2568359375, -0.98046875, 0.2958984375, 1.572265625, 2.8486328125, 4.125, 5.4013671875, 6.677734375, 7.9541015625, 9.23046875, 10.5068359375, 11.783203125, 13.0595703125, 14.3359375, 15.6123046875, 16.888671875, 18.1650390625, 19.44140625, 20.7177734375, 21.994140625, 23.2705078125, 24.546875, 25.8232421875, 27.099609375, 28.3759765625, 29.65234375, 30.9287109375, 32.205078125, 33.4814453125, 34.7578125, 36.0341796875, 37.310546875, 38.5869140625, 39.86328125, 41.1396484375, 42.416015625, 43.6923828125, 44.96875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 10.0, 29.0, 94.0, 163.0, 240.0, 235.0, 134.0, 67.0, 24.0, 10.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.14614868164062, -82.07158660888672, -75.99702453613281, -69.92245483398438, -63.84789276123047, -57.77333068847656, -51.69876480102539, -45.62419891357422, -39.54963684082031, -33.475074768066406, -27.400508880615234, -21.325944900512695, -15.251380920410156, -9.176816940307617, -3.102252960205078, 2.9723129272460938, 9.046875, 15.121438980102539, 21.196002960205078, 27.270566940307617, 33.345130920410156, 39.41969299316406, 45.494258880615234, 51.568824768066406, 57.64338684082031, 63.71794891357422, 69.79251098632812, 75.86708068847656, 81.94164276123047, 88.01620483398438, 94.09077453613281, 100.16533660888672, 106.23989868164062, 112.31446075439453, 118.38902282714844, 124.46359252929688, 130.53814697265625, 136.6127166748047, 142.68728637695312, 148.7618408203125, 154.83641052246094, 160.91098022460938, 166.98553466796875, 173.0601043701172, 179.13467407226562, 185.209228515625, 191.28379821777344, 197.35836791992188, 203.43292236328125, 209.5074920654297, 215.58204650878906, 221.6566162109375, 227.73117065429688, 233.8057403564453, 239.88031005859375, 245.95486450195312, 252.02943420410156, 258.10400390625, 264.1785583496094, 270.25311279296875, 276.32769775390625, 282.4022521972656, 288.476806640625, 294.5513916015625, 300.6259460449219]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 8.0, 3.0, 13.0, 15.0, 22.0, 12.0, 17.0, 36.0, 37.0, 31.0, 42.0, 44.0, 43.0, 45.0, 48.0, 53.0, 46.0, 42.0, 59.0, 43.0, 39.0, 39.0, 42.0, 34.0, 32.0, 30.0, 26.0, 25.0, 16.0, 17.0, 12.0, 3.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.53618621826172, -50.936256408691406, -49.336326599121094, -47.73639678955078, -46.136470794677734, -44.53654098510742, -42.93661117553711, -41.3366813659668, -39.736751556396484, -38.13682174682617, -36.53689193725586, -34.93696594238281, -33.3370361328125, -31.737106323242188, -30.137176513671875, -28.537246704101562, -26.937318801879883, -25.33738899230957, -23.73746109008789, -22.137531280517578, -20.537601470947266, -18.937671661376953, -17.337743759155273, -15.737813949584961, -14.137885093688965, -12.537956237792969, -10.938026428222656, -9.33809757232666, -7.738168239593506, -6.138238906860352, -4.5383100509643555, -2.938380241394043, -1.3384513854980469, 0.26147782802581787, 1.8614070415496826, 3.461336135864258, 5.061265468597412, 6.661194801330566, 8.261123657226562, 9.861053466796875, 11.460982322692871, 13.060911178588867, 14.66084098815918, 16.26076889038086, 17.860698699951172, 19.460628509521484, 21.060558319091797, 22.66048812866211, 24.26041603088379, 25.8603458404541, 27.46027374267578, 29.060203552246094, 30.660133361816406, 32.26006317138672, 33.85999298095703, 35.459922790527344, 37.05984878540039, 38.6597785949707, 40.259708404541016, 41.85963439941406, 43.459564208984375, 45.05949401855469, 46.659423828125, 48.25935363769531, 49.859283447265625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 5.0, 5.0, 10.0, 6.0, 9.0, 8.0, 12.0, 10.0, 11.0, 23.0, 23.0, 31.0, 31.0, 23.0, 32.0, 29.0, 38.0, 42.0, 43.0, 41.0, 36.0, 35.0, 36.0, 45.0, 50.0, 34.0, 35.0, 22.0, 40.0, 32.0, 34.0, 22.0, 26.0, 20.0, 20.0, 9.0, 17.0, 14.0, 8.0, 6.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-62.375, -60.41552734375, -58.4560546875, -56.49658203125, -54.537109375, -52.57763671875, -50.6181640625, -48.65869140625, -46.69921875, -44.73974609375, -42.7802734375, -40.82080078125, -38.861328125, -36.90185546875, -34.9423828125, -32.98291015625, -31.0234375, -29.06396484375, -27.1044921875, -25.14501953125, -23.185546875, -21.22607421875, -19.2666015625, -17.30712890625, -15.34765625, -13.38818359375, -11.4287109375, -9.46923828125, -7.509765625, -5.55029296875, -3.5908203125, -1.63134765625, 0.328125, 2.28759765625, 4.2470703125, 6.20654296875, 8.166015625, 10.12548828125, 12.0849609375, 14.04443359375, 16.00390625, 17.96337890625, 19.9228515625, 21.88232421875, 23.841796875, 25.80126953125, 27.7607421875, 29.72021484375, 31.6796875, 33.63916015625, 35.5986328125, 37.55810546875, 39.517578125, 41.47705078125, 43.4365234375, 45.39599609375, 47.35546875, 49.31494140625, 51.2744140625, 53.23388671875, 55.193359375, 57.15283203125, 59.1123046875, 61.07177734375, 63.03125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 12.0, 15.0, 7.0, 19.0, 30.0, 39.0, 70.0, 96.0, 115.0, 185.0, 257.0, 352.0, 567.0, 745.0, 1131.0, 1607.0, 2430.0, 3470.0, 5156.0, 7634.0, 11405.0, 17648.0, 27072.0, 42296.0, 67621.0, 119101.0, 278329.0, 202017.0, 96403.0, 57268.0, 36015.0, 23468.0, 15190.0, 9852.0, 6561.0, 4556.0, 3089.0, 2089.0, 1457.0, 964.0, 677.0, 481.0, 335.0, 204.0, 157.0, 110.0, 92.0, 46.0, 32.0, 25.0, 19.0, 19.0, 8.0, 4.0, 6.0, 5.0, 2.0, 0.0, 3.0], "bins": [-11.515625, -11.15380859375, -10.7919921875, -10.43017578125, -10.068359375, -9.70654296875, -9.3447265625, -8.98291015625, -8.62109375, -8.25927734375, -7.8974609375, -7.53564453125, -7.173828125, -6.81201171875, -6.4501953125, -6.08837890625, -5.7265625, -5.36474609375, -5.0029296875, -4.64111328125, -4.279296875, -3.91748046875, -3.5556640625, -3.19384765625, -2.83203125, -2.47021484375, -2.1083984375, -1.74658203125, -1.384765625, -1.02294921875, -0.6611328125, -0.29931640625, 0.0625, 0.42431640625, 0.7861328125, 1.14794921875, 1.509765625, 1.87158203125, 2.2333984375, 2.59521484375, 2.95703125, 3.31884765625, 3.6806640625, 4.04248046875, 4.404296875, 4.76611328125, 5.1279296875, 5.48974609375, 5.8515625, 6.21337890625, 6.5751953125, 6.93701171875, 7.298828125, 7.66064453125, 8.0224609375, 8.38427734375, 8.74609375, 9.10791015625, 9.4697265625, 9.83154296875, 10.193359375, 10.55517578125, 10.9169921875, 11.27880859375, 11.640625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 10.0, 9.0, 13.0, 19.0, 16.0, 18.0, 20.0, 20.0, 22.0, 27.0, 34.0, 26.0, 40.0, 37.0, 39.0, 42.0, 37.0, 36.0, 34.0, 1062.0, 28.0, 30.0, 34.0, 29.0, 41.0, 26.0, 29.0, 20.0, 29.0, 22.0, 19.0, 17.0, 11.0, 18.0, 10.0, 21.0, 6.0, 10.0, 14.0, 12.0, 11.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.90625, -34.755859375, -33.60546875, -32.455078125, -31.3046875, -30.154296875, -29.00390625, -27.853515625, -26.703125, -25.552734375, -24.40234375, -23.251953125, -22.1015625, -20.951171875, -19.80078125, -18.650390625, -17.5, -16.349609375, -15.19921875, -14.048828125, -12.8984375, -11.748046875, -10.59765625, -9.447265625, -8.296875, -7.146484375, -5.99609375, -4.845703125, -3.6953125, -2.544921875, -1.39453125, -0.244140625, 0.90625, 2.056640625, 3.20703125, 4.357421875, 5.5078125, 6.658203125, 7.80859375, 8.958984375, 10.109375, 11.259765625, 12.41015625, 13.560546875, 14.7109375, 15.861328125, 17.01171875, 18.162109375, 19.3125, 20.462890625, 21.61328125, 22.763671875, 23.9140625, 25.064453125, 26.21484375, 27.365234375, 28.515625, 29.666015625, 30.81640625, 31.966796875, 33.1171875, 34.267578125, 35.41796875, 36.568359375, 37.71875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 11.0, 18.0, 20.0, 34.0, 48.0, 56.0, 89.0, 161.0, 200.0, 330.0, 447.0, 700.0, 1062.0, 1736.0, 2572.0, 4109.0, 6498.0, 9981.0, 15303.0, 23990.0, 39027.0, 66563.0, 127970.0, 1385542.0, 191572.0, 88038.0, 48842.0, 29281.0, 18639.0, 11893.0, 7883.0, 5061.0, 3308.0, 2139.0, 1385.0, 886.0, 577.0, 396.0, 262.0, 165.0, 117.0, 57.0, 47.0, 39.0, 24.0, 22.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-13.2109375, -12.8072509765625, -12.403564453125, -11.9998779296875, -11.59619140625, -11.1925048828125, -10.788818359375, -10.3851318359375, -9.9814453125, -9.5777587890625, -9.174072265625, -8.7703857421875, -8.36669921875, -7.9630126953125, -7.559326171875, -7.1556396484375, -6.751953125, -6.3482666015625, -5.944580078125, -5.5408935546875, -5.13720703125, -4.7335205078125, -4.329833984375, -3.9261474609375, -3.5224609375, -3.1187744140625, -2.715087890625, -2.3114013671875, -1.90771484375, -1.5040283203125, -1.100341796875, -0.6966552734375, -0.29296875, 0.1107177734375, 0.514404296875, 0.9180908203125, 1.32177734375, 1.7254638671875, 2.129150390625, 2.5328369140625, 2.9365234375, 3.3402099609375, 3.743896484375, 4.1475830078125, 4.55126953125, 4.9549560546875, 5.358642578125, 5.7623291015625, 6.166015625, 6.5697021484375, 6.973388671875, 7.3770751953125, 7.78076171875, 8.1844482421875, 8.588134765625, 8.9918212890625, 9.3955078125, 9.7991943359375, 10.202880859375, 10.6065673828125, 11.01025390625, 11.4139404296875, 11.817626953125, 12.2213134765625, 12.625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 6.0, 9.0, 10.0, 21.0, 22.0, 17.0, 29.0, 44.0, 33.0, 43.0, 52.0, 47.0, 65.0, 83.0, 76.0, 68.0, 57.0, 55.0, 39.0, 36.0, 41.0, 23.0, 23.0, 26.0, 13.0, 17.0, 6.0, 3.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00865936279296875, -0.008375883102416992, -0.008092403411865234, -0.0078089237213134766, -0.007525444030761719, -0.007241964340209961, -0.006958484649658203, -0.006675004959106445, -0.0063915252685546875, -0.00610804557800293, -0.005824565887451172, -0.005541086196899414, -0.005257606506347656, -0.0049741268157958984, -0.004690647125244141, -0.004407167434692383, -0.004123687744140625, -0.003840208053588867, -0.0035567283630371094, -0.0032732486724853516, -0.0029897689819335938, -0.002706289291381836, -0.002422809600830078, -0.0021393299102783203, -0.0018558502197265625, -0.0015723705291748047, -0.0012888908386230469, -0.001005411148071289, -0.0007219314575195312, -0.00043845176696777344, -0.00015497207641601562, 0.0001285076141357422, 0.0004119873046875, 0.0006954669952392578, 0.0009789466857910156, 0.0012624263763427734, 0.0015459060668945312, 0.001829385757446289, 0.002112865447998047, 0.0023963451385498047, 0.0026798248291015625, 0.0029633045196533203, 0.003246784210205078, 0.003530263900756836, 0.0038137435913085938, 0.0040972232818603516, 0.004380702972412109, 0.004664182662963867, 0.004947662353515625, 0.005231142044067383, 0.005514621734619141, 0.0057981014251708984, 0.006081581115722656, 0.006365060806274414, 0.006648540496826172, 0.00693202018737793, 0.0072154998779296875, 0.007498979568481445, 0.007782459259033203, 0.008065938949584961, 0.008349418640136719, 0.008632898330688477, 0.008916378021240234, 0.009199857711791992, 0.00948333740234375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 12.0, 14.0, 11.0, 16.0, 25.0, 34.0, 47.0, 45.0, 96.0, 118.0, 158.0, 258.0, 413.0, 701.0, 1438.0, 4373.0, 17962.0, 94959.0, 510334.0, 342472.0, 57351.0, 11942.0, 3074.0, 1117.0, 532.0, 352.0, 191.0, 134.0, 102.0, 68.0, 52.0, 35.0, 33.0, 29.0, 12.0, 18.0, 12.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.07464599609375, -0.07256412506103516, -0.07048225402832031, -0.06840038299560547, -0.06631851196289062, -0.06423664093017578, -0.06215476989746094, -0.060072898864746094, -0.05799102783203125, -0.055909156799316406, -0.05382728576660156, -0.05174541473388672, -0.049663543701171875, -0.04758167266845703, -0.04549980163574219, -0.043417930603027344, -0.0413360595703125, -0.039254188537597656, -0.03717231750488281, -0.03509044647216797, -0.033008575439453125, -0.03092670440673828, -0.028844833374023438, -0.026762962341308594, -0.02468109130859375, -0.022599220275878906, -0.020517349243164062, -0.01843547821044922, -0.016353607177734375, -0.014271736145019531, -0.012189865112304688, -0.010107994079589844, -0.008026123046875, -0.005944252014160156, -0.0038623809814453125, -0.0017805099487304688, 0.000301361083984375, 0.0023832321166992188, 0.0044651031494140625, 0.006546974182128906, 0.00862884521484375, 0.010710716247558594, 0.012792587280273438, 0.014874458312988281, 0.016956329345703125, 0.01903820037841797, 0.021120071411132812, 0.023201942443847656, 0.0252838134765625, 0.027365684509277344, 0.029447555541992188, 0.03152942657470703, 0.033611297607421875, 0.03569316864013672, 0.03777503967285156, 0.039856910705566406, 0.04193878173828125, 0.044020652770996094, 0.04610252380371094, 0.04818439483642578, 0.050266265869140625, 0.05234813690185547, 0.05443000793457031, 0.056511878967285156, 0.05859375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 9.0, 8.0, 28.0, 35.0, 73.0, 97.0, 118.0, 157.0, 123.0, 133.0, 85.0, 70.0, 35.0, 18.0, 10.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004514477681368589, -0.004135251976549625, -0.0037560262717306614, -0.0033768003340810537, -0.0029975746292620897, -0.0026183489244431257, -0.002239122986793518, -0.001859897281974554, -0.00148067157715559, -0.001101445872336626, -0.0007222200511023402, -0.0003429942298680544, 3.6231474950909615e-05, 0.0004154571797698736, 0.0007946831174194813, 0.0011739088222384453, 0.0015531345270574093, 0.0019323602318763733, 0.0023115859366953373, 0.002690811874344945, 0.003070037579163909, 0.003449263283982873, 0.0038284892216324806, 0.004207714926451445, 0.004586940631270409, 0.004966166336089373, 0.005345392040908337, 0.005724618211388588, 0.006103843450546265, 0.006483069621026516, 0.00686229532584548, 0.007241521030664444, 0.007620746269822121, 0.007999972440302372, 0.008379197679460049, 0.0087584238499403, 0.009137649089097977, 0.009516875259578228, 0.00989610143005848, 0.010275326669216156, 0.010654551908373833, 0.011033778078854084, 0.01141300331801176, 0.011792229488492012, 0.012171454727649689, 0.01255068089812994, 0.012929907068610191, 0.013309132307767868, 0.01368835847824812, 0.01406758464872837, 0.014446809887886047, 0.014826036058366299, 0.015205261297523975, 0.015584487468004227, 0.015963712707161903, 0.01634293794631958, 0.016722165048122406, 0.017101390287280083, 0.01748061738908291, 0.017859842628240585, 0.018239067867398262, 0.01861829310655594, 0.018997520208358765, 0.01937674544751644, 0.019755970686674118]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 4.0, 5.0, 13.0, 3.0, 8.0, 10.0, 20.0, 20.0, 21.0, 28.0, 19.0, 28.0, 39.0, 34.0, 35.0, 48.0, 35.0, 40.0, 33.0, 37.0, 38.0, 37.0, 29.0, 37.0, 31.0, 24.0, 29.0, 41.0, 30.0, 25.0, 28.0, 20.0, 17.0, 21.0, 12.0, 15.0, 16.0, 7.0, 13.0, 12.0, 3.0, 9.0, 6.0, 1.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.004232347011566162, -0.00410831905901432, -0.003984291106462479, -0.003860263153910637, -0.003736235201358795, -0.0036122072488069534, -0.0034881792962551117, -0.00336415134370327, -0.0032401233911514282, -0.0031160954385995865, -0.0029920674860477448, -0.002868039533495903, -0.0027440115809440613, -0.0026199836283922195, -0.002495955675840378, -0.002371927723288536, -0.0022478997707366943, -0.0021238718181848526, -0.001999843865633011, -0.0018758159130811691, -0.0017517879605293274, -0.0016277600079774857, -0.001503732055425644, -0.0013797041028738022, -0.0012556761503219604, -0.0011316481977701187, -0.001007620245218277, -0.0008835922926664352, -0.0007595643401145935, -0.0006355363875627518, -0.00051150843501091, -0.0003874804824590683, -0.00026345252990722656, -0.00013942457735538483, -1.539662480354309e-05, 0.00010863132774829865, 0.00023265928030014038, 0.0003566872328519821, 0.00048071518540382385, 0.0006047431379556656, 0.0007287710905075073, 0.0008527990430593491, 0.0009768269956111908, 0.0011008549481630325, 0.0012248829007148743, 0.001348910853266716, 0.0014729388058185577, 0.0015969667583703995, 0.0017209947109222412, 0.001845022663474083, 0.0019690506160259247, 0.0020930785685777664, 0.002217106521129608, 0.00234113447368145, 0.0024651624262332916, 0.0025891903787851334, 0.002713218331336975, 0.002837246283888817, 0.0029612742364406586, 0.0030853021889925003, 0.003209330141544342, 0.0033333580940961838, 0.0034573860466480255, 0.0035814139991998672, 0.003705441951751709]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 5.0, 5.0, 10.0, 6.0, 9.0, 8.0, 13.0, 11.0, 9.0, 23.0, 24.0, 30.0, 32.0, 22.0, 32.0, 29.0, 38.0, 43.0, 42.0, 42.0, 38.0, 32.0, 36.0, 45.0, 52.0, 33.0, 34.0, 22.0, 40.0, 32.0, 34.0, 23.0, 25.0, 21.0, 19.0, 9.0, 17.0, 14.0, 8.0, 6.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-62.3125, -60.35400390625, -58.3955078125, -56.43701171875, -54.478515625, -52.52001953125, -50.5615234375, -48.60302734375, -46.64453125, -44.68603515625, -42.7275390625, -40.76904296875, -38.810546875, -36.85205078125, -34.8935546875, -32.93505859375, -30.9765625, -29.01806640625, -27.0595703125, -25.10107421875, -23.142578125, -21.18408203125, -19.2255859375, -17.26708984375, -15.30859375, -13.35009765625, -11.3916015625, -9.43310546875, -7.474609375, -5.51611328125, -3.5576171875, -1.59912109375, 0.359375, 2.31787109375, 4.2763671875, 6.23486328125, 8.193359375, 10.15185546875, 12.1103515625, 14.06884765625, 16.02734375, 17.98583984375, 19.9443359375, 21.90283203125, 23.861328125, 25.81982421875, 27.7783203125, 29.73681640625, 31.6953125, 33.65380859375, 35.6123046875, 37.57080078125, 39.529296875, 41.48779296875, 43.4462890625, 45.40478515625, 47.36328125, 49.32177734375, 51.2802734375, 53.23876953125, 55.197265625, 57.15576171875, 59.1142578125, 61.07275390625, 63.03125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 15.0, 13.0, 14.0, 13.0, 57.0, 46.0, 68.0, 121.0, 151.0, 310.0, 448.0, 866.0, 1765.0, 3944.0, 10112.0, 38130.0, 270881.0, 604310.0, 88575.0, 17303.0, 5944.0, 2623.0, 1221.0, 632.0, 353.0, 204.0, 143.0, 89.0, 67.0, 40.0, 20.0, 20.0, 13.0, 13.0, 8.0, 3.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.671875, -20.99951171875, -20.3271484375, -19.65478515625, -18.982421875, -18.31005859375, -17.6376953125, -16.96533203125, -16.29296875, -15.62060546875, -14.9482421875, -14.27587890625, -13.603515625, -12.93115234375, -12.2587890625, -11.58642578125, -10.9140625, -10.24169921875, -9.5693359375, -8.89697265625, -8.224609375, -7.55224609375, -6.8798828125, -6.20751953125, -5.53515625, -4.86279296875, -4.1904296875, -3.51806640625, -2.845703125, -2.17333984375, -1.5009765625, -0.82861328125, -0.15625, 0.51611328125, 1.1884765625, 1.86083984375, 2.533203125, 3.20556640625, 3.8779296875, 4.55029296875, 5.22265625, 5.89501953125, 6.5673828125, 7.23974609375, 7.912109375, 8.58447265625, 9.2568359375, 9.92919921875, 10.6015625, 11.27392578125, 11.9462890625, 12.61865234375, 13.291015625, 13.96337890625, 14.6357421875, 15.30810546875, 15.98046875, 16.65283203125, 17.3251953125, 17.99755859375, 18.669921875, 19.34228515625, 20.0146484375, 20.68701171875, 21.359375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 13.0, 23.0, 32.0, 61.0, 63.0, 103.0, 94.0, 2142.0, 112.0, 105.0, 93.0, 73.0, 35.0, 41.0, 18.0, 12.0, 13.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.125, -163.744140625, -157.36328125, -150.982421875, -144.6015625, -138.220703125, -131.83984375, -125.458984375, -119.078125, -112.697265625, -106.31640625, -99.935546875, -93.5546875, -87.173828125, -80.79296875, -74.412109375, -68.03125, -61.650390625, -55.26953125, -48.888671875, -42.5078125, -36.126953125, -29.74609375, -23.365234375, -16.984375, -10.603515625, -4.22265625, 2.158203125, 8.5390625, 14.919921875, 21.30078125, 27.681640625, 34.0625, 40.443359375, 46.82421875, 53.205078125, 59.5859375, 65.966796875, 72.34765625, 78.728515625, 85.109375, 91.490234375, 97.87109375, 104.251953125, 110.6328125, 117.013671875, 123.39453125, 129.775390625, 136.15625, 142.537109375, 148.91796875, 155.298828125, 161.6796875, 168.060546875, 174.44140625, 180.822265625, 187.203125, 193.583984375, 199.96484375, 206.345703125, 212.7265625, 219.107421875, 225.48828125, 231.869140625, 238.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 9.0, 20.0, 27.0, 36.0, 53.0, 93.0, 149.0, 240.0, 446.0, 966.0, 2917.0, 30347.0, 2953128.0, 148564.0, 5946.0, 1346.0, 598.0, 313.0, 182.0, 111.0, 81.0, 35.0, 30.0, 12.0, 15.0, 10.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.46875, -45.236328125, -44.00390625, -42.771484375, -41.5390625, -40.306640625, -39.07421875, -37.841796875, -36.609375, -35.376953125, -34.14453125, -32.912109375, -31.6796875, -30.447265625, -29.21484375, -27.982421875, -26.75, -25.517578125, -24.28515625, -23.052734375, -21.8203125, -20.587890625, -19.35546875, -18.123046875, -16.890625, -15.658203125, -14.42578125, -13.193359375, -11.9609375, -10.728515625, -9.49609375, -8.263671875, -7.03125, -5.798828125, -4.56640625, -3.333984375, -2.1015625, -0.869140625, 0.36328125, 1.595703125, 2.828125, 4.060546875, 5.29296875, 6.525390625, 7.7578125, 8.990234375, 10.22265625, 11.455078125, 12.6875, 13.919921875, 15.15234375, 16.384765625, 17.6171875, 18.849609375, 20.08203125, 21.314453125, 22.546875, 23.779296875, 25.01171875, 26.244140625, 27.4765625, 28.708984375, 29.94140625, 31.173828125, 32.40625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 15.0, 90.0, 471.0, 329.0, 61.0, 21.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.57868957519531, -84.30937194824219, -67.04005432128906, -49.77073669433594, -32.50141906738281, -15.232101440429688, 2.0372161865234375, 19.306533813476562, 36.57585144042969, 53.84516906738281, 71.11448669433594, 88.38380432128906, 105.65312194824219, 122.92243957519531, 140.19175720214844, 157.46107482910156, 174.7303924560547, 191.9997100830078, 209.26902770996094, 226.53834533691406, 243.8076629638672, 261.07696533203125, 278.3463134765625, 295.6156005859375, 312.88494873046875, 330.1542663574219, 347.423583984375, 364.6929016113281, 381.96221923828125, 399.2315368652344, 416.5008544921875, 433.7701721191406, 451.03948974609375, 468.3088073730469, 485.578125, 502.8474426269531, 520.1167602539062, 537.3861083984375, 554.6553955078125, 571.9246826171875, 589.1940307617188, 606.46337890625, 623.732666015625, 641.001953125, 658.2713012695312, 675.5406494140625, 692.8099365234375, 710.0792236328125, 727.3485717773438, 744.617919921875, 761.88720703125, 779.156494140625, 796.4258422851562, 813.6951904296875, 830.9644775390625, 848.2337646484375, 865.5031127929688, 882.7724609375, 900.041748046875, 917.31103515625, 934.5803833007812, 951.8497314453125, 969.1190185546875, 986.3883056640625, 1003.6576538085938]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 8.0, 7.0, 5.0, 12.0, 11.0, 7.0, 16.0, 12.0, 11.0, 18.0, 21.0, 25.0, 35.0, 35.0, 39.0, 35.0, 27.0, 34.0, 40.0, 45.0, 42.0, 49.0, 45.0, 34.0, 37.0, 51.0, 28.0, 41.0, 30.0, 19.0, 33.0, 19.0, 21.0, 16.0, 12.0, 16.0, 16.0, 12.0, 11.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.2690200805664, -104.6438980102539, -101.0187759399414, -97.3936538696289, -93.7685317993164, -90.1434097290039, -86.51829528808594, -82.89317321777344, -79.26805114746094, -75.64292907714844, -72.01780700683594, -68.39268493652344, -64.76756286621094, -61.14244079589844, -57.5173225402832, -53.8922004699707, -50.26707458496094, -46.64195251464844, -43.01683044433594, -39.39170837402344, -35.76658630371094, -32.14146423339844, -28.516345977783203, -24.891223907470703, -21.266101837158203, -17.640979766845703, -14.01585865020752, -10.390737533569336, -6.765615463256836, -3.140493392944336, 0.48462677001953125, 4.109748840332031, 7.7348785400390625, 11.360000610351562, 14.985121726989746, 18.61024284362793, 22.23536491394043, 25.86048698425293, 29.485607147216797, 33.1107292175293, 36.7358512878418, 40.3609733581543, 43.9860954284668, 47.61121368408203, 51.23633575439453, 54.86145782470703, 58.48657989501953, 62.11170196533203, 65.73682403564453, 69.36194610595703, 72.98706817626953, 76.61219024658203, 80.23731231689453, 83.86243438720703, 87.487548828125, 91.1126708984375, 94.73779296875, 98.3629150390625, 101.988037109375, 105.6131591796875, 109.23828125, 112.8634033203125, 116.488525390625, 120.1136474609375, 123.73876953125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 7.0, 14.0, 24.0, 32.0, 46.0, 53.0, 56.0, 109.0, 140.0, 171.0, 211.0, 248.0, 348.0, 430.0, 578.0, 830.0, 1245.0, 1040567.0, 873.0, 591.0, 472.0, 360.0, 243.0, 234.0, 163.0, 126.0, 90.0, 75.0, 59.0, 47.0, 20.0, 26.0, 11.0, 12.0, 9.0, 4.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-44.7052116394043, -43.309852600097656, -41.914493560791016, -40.519134521484375, -39.123779296875, -37.72842025756836, -36.33306121826172, -34.93770217895508, -33.54234313964844, -32.1469841003418, -30.75162696838379, -29.35626792907715, -27.960908889770508, -26.5655517578125, -25.17019271850586, -23.77483367919922, -22.37947654724121, -20.98411750793457, -19.588760375976562, -18.193401336669922, -16.79804229736328, -15.402684211730957, -14.007326126098633, -12.611967086791992, -11.216609001159668, -9.821250915527344, -8.425891876220703, -7.030533790588379, -5.6351752281188965, -4.239816665649414, -2.84445858001709, -1.4490995407104492, -0.053741455078125, 1.3416169881820679, 2.7369754314422607, 4.132333755493164, 5.5276923179626465, 6.923050880432129, 8.318408966064453, 9.713768005371094, 11.109126091003418, 12.504484176635742, 13.899843215942383, 15.295201301574707, 16.69055938720703, 18.085918426513672, 19.481277465820312, 20.876636505126953, 22.27199363708496, 23.6673526763916, 25.06270980834961, 26.45806884765625, 27.85342788696289, 29.24878692626953, 30.64414405822754, 32.03950500488281, 33.43486022949219, 34.83021926879883, 36.22557830810547, 37.620933532714844, 39.016292572021484, 40.411651611328125, 41.807010650634766, 43.202369689941406, 44.59772872924805]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 11.0, 12.0, 19.0, 14.0, 38.0, 141.0, 51462624.0, 158.0, 45.0, 23.0, 9.0, 5.0, 3.0, 11.0, 9.0, 14.0, 3.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9344.880859375, -8912.078125, -8479.275390625, -8046.47216796875, -7613.66943359375, -7180.86669921875, -6748.0634765625, -6315.2607421875, -5882.4580078125, -5449.6552734375, -5016.8525390625, -4584.04931640625, -4151.24658203125, -3718.44384765625, -3285.640869140625, -2852.837890625, -2420.03515625, -1987.2322998046875, -1554.429443359375, -1121.6265869140625, -688.82373046875, -256.02099609375, 176.781982421875, 609.5849609375, 1042.3876953125, 1475.1905517578125, 1907.993408203125, 2340.79638671875, 2773.59912109375, 3206.40185546875, 3639.204833984375, 4072.0078125, 4504.810546875, 4937.61328125, 5370.416015625, 5803.21923828125, 6236.02197265625, 6668.82470703125, 7101.6279296875, 7534.4306640625, 7967.2333984375, 8400.0361328125, 8832.8388671875, 9265.6416015625, 9698.4453125, 10131.248046875, 10564.05078125, 10996.853515625, 11429.65625, 11862.458984375, 12295.26171875, 12728.064453125, 13160.8671875, 13593.669921875, 14026.4736328125, 14459.2763671875, 14892.0791015625, 15324.8818359375, 15757.6845703125, 16190.4873046875, 16623.291015625, 17056.09375, 17488.896484375, 17921.69921875, 18354.501953125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 3.0, 7.0, 14.0, 14.0, 32.0, 38.0, 56.0, 84.0, 140.0, 195.0, 268.0, 441.0, 672.0, 1080.0, 1741.0, 2793.0, 4954.0, 8321.0, 14639.0, 25744.0, 46103.0, 84229.0, 160594.0, 332398.0, 3490297.0, 1480104.0, 306231.0, 149652.0, 79415.0, 43393.0, 24205.0, 13864.0, 7908.0, 4554.0, 2711.0, 1692.0, 998.0, 657.0, 387.0, 256.0, 162.0, 134.0, 80.0, 48.0, 41.0, 25.0, 23.0, 13.0, 9.0, 3.0, 3.0, 5.0, 1.0, 3.0], "bins": [-8.65625, -8.4085693359375, -8.160888671875, -7.9132080078125, -7.66552734375, -7.4178466796875, -7.170166015625, -6.9224853515625, -6.6748046875, -6.4271240234375, -6.179443359375, -5.9317626953125, -5.68408203125, -5.4364013671875, -5.188720703125, -4.9410400390625, -4.693359375, -4.4456787109375, -4.197998046875, -3.9503173828125, -3.70263671875, -3.4549560546875, -3.207275390625, -2.9595947265625, -2.7119140625, -2.4642333984375, -2.216552734375, -1.9688720703125, -1.72119140625, -1.4735107421875, -1.225830078125, -0.9781494140625, -0.73046875, -0.4827880859375, -0.235107421875, 0.0125732421875, 0.26025390625, 0.5079345703125, 0.755615234375, 1.0032958984375, 1.2509765625, 1.4986572265625, 1.746337890625, 1.9940185546875, 2.24169921875, 2.4893798828125, 2.737060546875, 2.9847412109375, 3.232421875, 3.4801025390625, 3.727783203125, 3.9754638671875, 4.22314453125, 4.4708251953125, 4.718505859375, 4.9661865234375, 5.2138671875, 5.4615478515625, 5.709228515625, 5.9569091796875, 6.20458984375, 6.4522705078125, 6.699951171875, 6.9476318359375, 7.1953125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 12.0, 6.0, 15.0, 20.0, 18.0, 12.0, 25.0, 22.0, 32.0, 31.0, 28.0, 24.0, 43.0, 43.0, 37.0, 55.0, 131.0, 617.0, 323.0, 83.0, 55.0, 50.0, 29.0, 33.0, 30.0, 34.0, 25.0, 24.0, 28.0, 23.0, 18.0, 17.0, 11.0, 13.0, 7.0, 10.0, 9.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5, -12.05126953125, -11.6025390625, -11.15380859375, -10.705078125, -10.25634765625, -9.8076171875, -9.35888671875, -8.91015625, -8.46142578125, -8.0126953125, -7.56396484375, -7.115234375, -6.66650390625, -6.2177734375, -5.76904296875, -5.3203125, -4.87158203125, -4.4228515625, -3.97412109375, -3.525390625, -3.07666015625, -2.6279296875, -2.17919921875, -1.73046875, -1.28173828125, -0.8330078125, -0.38427734375, 0.064453125, 0.51318359375, 0.9619140625, 1.41064453125, 1.859375, 2.30810546875, 2.7568359375, 3.20556640625, 3.654296875, 4.10302734375, 4.5517578125, 5.00048828125, 5.44921875, 5.89794921875, 6.3466796875, 6.79541015625, 7.244140625, 7.69287109375, 8.1416015625, 8.59033203125, 9.0390625, 9.48779296875, 9.9365234375, 10.38525390625, 10.833984375, 11.28271484375, 11.7314453125, 12.18017578125, 12.62890625, 13.07763671875, 13.5263671875, 13.97509765625, 14.423828125, 14.87255859375, 15.3212890625, 15.77001953125, 16.21875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 9.0, 5.0, 15.0, 15.0, 31.0, 30.0, 65.0, 123.0, 209.0, 258.0, 434.0, 722.0, 1215.0, 1920.0, 3399.0, 6278.0, 11397.0, 20393.0, 38028.0, 74100.0, 150878.0, 358177.0, 4105310.0, 1013461.0, 259188.0, 118634.0, 58658.0, 30803.0, 16455.0, 8981.0, 5074.0, 2930.0, 1676.0, 888.0, 612.0, 368.0, 219.0, 133.0, 131.0, 82.0, 44.0, 28.0, 9.0, 9.0, 8.0, 13.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0], "bins": [-8.546875, -8.2603759765625, -7.973876953125, -7.6873779296875, -7.40087890625, -7.1143798828125, -6.827880859375, -6.5413818359375, -6.2548828125, -5.9683837890625, -5.681884765625, -5.3953857421875, -5.10888671875, -4.8223876953125, -4.535888671875, -4.2493896484375, -3.962890625, -3.6763916015625, -3.389892578125, -3.1033935546875, -2.81689453125, -2.5303955078125, -2.243896484375, -1.9573974609375, -1.6708984375, -1.3843994140625, -1.097900390625, -0.8114013671875, -0.52490234375, -0.2384033203125, 0.048095703125, 0.3345947265625, 0.62109375, 0.9075927734375, 1.194091796875, 1.4805908203125, 1.76708984375, 2.0535888671875, 2.340087890625, 2.6265869140625, 2.9130859375, 3.1995849609375, 3.486083984375, 3.7725830078125, 4.05908203125, 4.3455810546875, 4.632080078125, 4.9185791015625, 5.205078125, 5.4915771484375, 5.778076171875, 6.0645751953125, 6.35107421875, 6.6375732421875, 6.924072265625, 7.2105712890625, 7.4970703125, 7.7835693359375, 8.070068359375, 8.3565673828125, 8.64306640625, 8.9295654296875, 9.216064453125, 9.5025634765625, 9.7890625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 17.0, 16.0, 16.0, 15.0, 17.0, 25.0, 29.0, 29.0, 42.0, 38.0, 37.0, 58.0, 57.0, 130.0, 376.0, 539.0, 119.0, 70.0, 61.0, 41.0, 45.0, 29.0, 28.0, 27.0, 23.0, 27.0, 21.0, 11.0, 7.0, 15.0, 10.0, 7.0, 8.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.390625, -10.0450439453125, -9.699462890625, -9.3538818359375, -9.00830078125, -8.6627197265625, -8.317138671875, -7.9715576171875, -7.6259765625, -7.2803955078125, -6.934814453125, -6.5892333984375, -6.24365234375, -5.8980712890625, -5.552490234375, -5.2069091796875, -4.861328125, -4.5157470703125, -4.170166015625, -3.8245849609375, -3.47900390625, -3.1334228515625, -2.787841796875, -2.4422607421875, -2.0966796875, -1.7510986328125, -1.405517578125, -1.0599365234375, -0.71435546875, -0.3687744140625, -0.023193359375, 0.3223876953125, 0.66796875, 1.0135498046875, 1.359130859375, 1.7047119140625, 2.05029296875, 2.3958740234375, 2.741455078125, 3.0870361328125, 3.4326171875, 3.7781982421875, 4.123779296875, 4.4693603515625, 4.81494140625, 5.1605224609375, 5.506103515625, 5.8516845703125, 6.197265625, 6.5428466796875, 6.888427734375, 7.2340087890625, 7.57958984375, 7.9251708984375, 8.270751953125, 8.6163330078125, 8.9619140625, 9.3074951171875, 9.653076171875, 9.9986572265625, 10.34423828125, 10.6898193359375, 11.035400390625, 11.3809814453125, 11.7265625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 11.0, 10.0, 2.0, 13.0, 41.0, 27.0, 53.0, 62.0, 77.0, 137.0, 141.0, 287.0, 386.0, 637.0, 885.0, 1435.0, 2513.0, 4808.0, 11439.0, 33902.0, 221455.0, 5927881.0, 54969.0, 15792.0, 6472.0, 3022.0, 1787.0, 1079.0, 639.0, 466.0, 285.0, 211.0, 165.0, 108.0, 70.0, 43.0, 32.0, 17.0, 26.0, 15.0, 23.0, 9.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-26.453125, -25.576416015625, -24.69970703125, -23.822998046875, -22.9462890625, -22.069580078125, -21.19287109375, -20.316162109375, -19.439453125, -18.562744140625, -17.68603515625, -16.809326171875, -15.9326171875, -15.055908203125, -14.17919921875, -13.302490234375, -12.42578125, -11.549072265625, -10.67236328125, -9.795654296875, -8.9189453125, -8.042236328125, -7.16552734375, -6.288818359375, -5.412109375, -4.535400390625, -3.65869140625, -2.781982421875, -1.9052734375, -1.028564453125, -0.15185546875, 0.724853515625, 1.6015625, 2.478271484375, 3.35498046875, 4.231689453125, 5.1083984375, 5.985107421875, 6.86181640625, 7.738525390625, 8.615234375, 9.491943359375, 10.36865234375, 11.245361328125, 12.1220703125, 12.998779296875, 13.87548828125, 14.752197265625, 15.62890625, 16.505615234375, 17.38232421875, 18.259033203125, 19.1357421875, 20.012451171875, 20.88916015625, 21.765869140625, 22.642578125, 23.519287109375, 24.39599609375, 25.272705078125, 26.1494140625, 27.026123046875, 27.90283203125, 28.779541015625, 29.65625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 10.0, 11.0, 9.0, 8.0, 20.0, 30.0, 26.0, 31.0, 37.0, 43.0, 47.0, 47.0, 82.0, 127.0, 269.0, 555.0, 190.0, 106.0, 65.0, 53.0, 45.0, 29.0, 35.0, 27.0, 21.0, 24.0, 17.0, 17.0, 6.0, 11.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.31640625, -7.03765869140625, -6.7589111328125, -6.48016357421875, -6.201416015625, -5.92266845703125, -5.6439208984375, -5.36517333984375, -5.08642578125, -4.80767822265625, -4.5289306640625, -4.25018310546875, -3.971435546875, -3.69268798828125, -3.4139404296875, -3.13519287109375, -2.8564453125, -2.57769775390625, -2.2989501953125, -2.02020263671875, -1.741455078125, -1.46270751953125, -1.1839599609375, -0.90521240234375, -0.62646484375, -0.34771728515625, -0.0689697265625, 0.20977783203125, 0.488525390625, 0.76727294921875, 1.0460205078125, 1.32476806640625, 1.603515625, 1.88226318359375, 2.1610107421875, 2.43975830078125, 2.718505859375, 2.99725341796875, 3.2760009765625, 3.55474853515625, 3.83349609375, 4.11224365234375, 4.3909912109375, 4.66973876953125, 4.948486328125, 5.22723388671875, 5.5059814453125, 5.78472900390625, 6.0634765625, 6.34222412109375, 6.6209716796875, 6.89971923828125, 7.178466796875, 7.45721435546875, 7.7359619140625, 8.01470947265625, 8.29345703125, 8.57220458984375, 8.8509521484375, 9.12969970703125, 9.408447265625, 9.68719482421875, 9.9659423828125, 10.24468994140625, 10.5234375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 14.0, 13.0, 16.0, 22.0, 42.0, 64.0, 111.0, 339.0, 176.0, 78.0, 48.0, 25.0, 16.0, 10.0, 8.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.07371711730957, -17.342132568359375, -16.610549926757812, -15.878965377807617, -15.147382736206055, -14.41579818725586, -13.68421459197998, -12.952630996704102, -12.221047401428223, -11.489463806152344, -10.757880210876465, -10.026296615600586, -9.29471206665039, -8.563129425048828, -7.831544876098633, -7.099961280822754, -6.368377685546875, -5.636794090270996, -4.905210494995117, -4.17362642288208, -3.442042827606201, -2.7104592323303223, -1.9788751602172852, -1.2472915649414062, -0.5157079696655273, 0.2158757448196411, 0.9474594593048096, 1.6790432929992676, 2.4106268882751465, 3.1422104835510254, 3.8737945556640625, 4.605378150939941, 5.336963653564453, 6.068547248840332, 6.800130844116211, 7.531714916229248, 8.263298034667969, 8.994882583618164, 9.726466178894043, 10.458049774169922, 11.1896333694458, 11.92121696472168, 12.652800559997559, 13.384384155273438, 14.115968704223633, 14.847551345825195, 15.57913589477539, 16.310718536376953, 17.04230308532715, 17.773887634277344, 18.505470275878906, 19.2370548248291, 19.968637466430664, 20.70022201538086, 21.431804656982422, 22.163389205932617, 22.894973754882812, 23.626558303833008, 24.35814094543457, 25.089725494384766, 25.821308135986328, 26.552892684936523, 27.28447723388672, 28.01605987548828, 28.747642517089844]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 7.0, 6.0, 11.0, 14.0, 11.0, 19.0, 15.0, 27.0, 24.0, 16.0, 33.0, 16.0, 30.0, 31.0, 21.0, 33.0, 39.0, 45.0, 32.0, 41.0, 53.0, 47.0, 36.0, 41.0, 23.0, 41.0, 33.0, 30.0, 22.0, 31.0, 30.0, 22.0, 19.0, 21.0, 19.0, 13.0, 8.0, 7.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.302553176879883, -9.99184513092041, -9.681138038635254, -9.370429992675781, -9.059721946716309, -8.749013900756836, -8.43830680847168, -8.127598762512207, -7.816891193389893, -7.506183624267578, -7.1954755783081055, -6.884768009185791, -6.574060440063477, -6.263352394104004, -5.9526448249816895, -5.641937255859375, -5.331229209899902, -5.020521640777588, -4.709813594818115, -4.399106025695801, -4.088397979736328, -3.7776904106140137, -3.466982841491699, -3.1562750339508057, -2.845567226409912, -2.5348594188690186, -2.224151611328125, -1.9134440422058105, -1.602736234664917, -1.2920284271240234, -0.9813207387924194, -0.6706130504608154, -0.3599061965942383, -0.0491984486579895, 0.2615092992782593, 0.5722170472145081, 0.8829247951507568, 1.1936326026916504, 1.5043402910232544, 1.8150479793548584, 2.125755786895752, 2.4364635944366455, 2.747171401977539, 3.0578789710998535, 3.368586778640747, 3.6792945861816406, 3.990002155303955, 4.3007097244262695, 4.611417770385742, 4.922125339508057, 5.232833385467529, 5.543540954589844, 5.854249000549316, 6.164956569671631, 6.475664138793945, 6.786372184753418, 7.097079753875732, 7.407787322998047, 7.7184953689575195, 8.029203414916992, 8.339910507202148, 8.650618553161621, 8.961326599121094, 9.27203369140625, 9.582741737365723]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 24.0, 18.0, 26.0, 40.0, 59.0, 70.0, 93.0, 98.0, 169.0, 229.0, 287.0, 400.0, 558.0, 806.0, 1240.0, 1803.0, 2841.0, 4867.0, 9073.0, 18967.0, 54657.0, 3973262.0, 80600.0, 21594.0, 9439.0, 4910.0, 2712.0, 1694.0, 1098.0, 746.0, 495.0, 394.0, 268.0, 191.0, 139.0, 92.0, 85.0, 53.0, 38.0, 32.0, 23.0, 15.0, 21.0, 7.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0], "bins": [-0.025726318359375, -0.024937868118286133, -0.024149417877197266, -0.0233609676361084, -0.02257251739501953, -0.021784067153930664, -0.020995616912841797, -0.02020716667175293, -0.019418716430664062, -0.018630266189575195, -0.017841815948486328, -0.01705336570739746, -0.016264915466308594, -0.015476465225219727, -0.01468801498413086, -0.013899564743041992, -0.013111114501953125, -0.012322664260864258, -0.01153421401977539, -0.010745763778686523, -0.009957313537597656, -0.009168863296508789, -0.008380413055419922, -0.007591962814331055, -0.0068035125732421875, -0.00601506233215332, -0.005226612091064453, -0.004438161849975586, -0.0036497116088867188, -0.0028612613677978516, -0.0020728111267089844, -0.0012843608856201172, -0.00049591064453125, 0.0002925395965576172, 0.0010809898376464844, 0.0018694400787353516, 0.0026578903198242188, 0.003446340560913086, 0.004234790802001953, 0.00502324104309082, 0.0058116912841796875, 0.006600141525268555, 0.007388591766357422, 0.008177042007446289, 0.008965492248535156, 0.009753942489624023, 0.01054239273071289, 0.011330842971801758, 0.012119293212890625, 0.012907743453979492, 0.01369619369506836, 0.014484643936157227, 0.015273094177246094, 0.01606154441833496, 0.016849994659423828, 0.017638444900512695, 0.018426895141601562, 0.01921534538269043, 0.020003795623779297, 0.020792245864868164, 0.02158069610595703, 0.0223691463470459, 0.023157596588134766, 0.023946046829223633, 0.0247344970703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 0.0, 3.0, 6.0, 7.0, 6.0, 3.0, 7.0, 9.0, 9.0, 10.0, 19.0, 19.0, 129.0, 653.0, 16.0, 20.0, 9.0, 12.0, 7.0, 11.0, 7.0, 5.0, 3.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031833648681640625, -0.0030736923217773438, -0.002964019775390625, -0.0028543472290039062, -0.0027446746826171875, -0.0026350021362304688, -0.00252532958984375, -0.0024156570434570312, -0.0023059844970703125, -0.0021963119506835938, -0.002086639404296875, -0.0019769668579101562, -0.0018672943115234375, -0.0017576217651367188, -0.00164794921875, -0.0015382766723632812, -0.0014286041259765625, -0.0013189315795898438, -0.001209259033203125, -0.0010995864868164062, -0.0009899139404296875, -0.0008802413940429688, -0.00077056884765625, -0.0006608963012695312, -0.0005512237548828125, -0.00044155120849609375, -0.000331878662109375, -0.00022220611572265625, -0.0001125335693359375, -2.86102294921875e-06, 0.0001068115234375, 0.00021648406982421875, 0.0003261566162109375, 0.00043582916259765625, 0.000545501708984375, 0.0006551742553710938, 0.0007648468017578125, 0.0008745193481445312, 0.00098419189453125, 0.0010938644409179688, 0.0012035369873046875, 0.0013132095336914062, 0.001422882080078125, 0.0015325546264648438, 0.0016422271728515625, 0.0017518997192382812, 0.001861572265625, 0.0019712448120117188, 0.0020809173583984375, 0.0021905899047851562, 0.002300262451171875, 0.0024099349975585938, 0.0025196075439453125, 0.0026292800903320312, 0.00273895263671875, 0.0028486251831054688, 0.0029582977294921875, 0.0030679702758789062, 0.003177642822265625, 0.0032873153686523438, 0.0033969879150390625, 0.0035066604614257812, 0.0036163330078125, 0.0037260055541992188, 0.0038356781005859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 15.0, 18.0, 24.0, 47.0, 49.0, 101.0, 180.0, 308.0, 593.0, 1383.0, 3951.0, 18320.0, 230569.0, 3838787.0, 84409.0, 10692.0, 2693.0, 1014.0, 469.0, 243.0, 152.0, 67.0, 63.0, 35.0, 26.0, 21.0, 7.0, 14.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0513916015625, -0.0496978759765625, -0.048004150390625, -0.0463104248046875, -0.04461669921875, -0.0429229736328125, -0.041229248046875, -0.0395355224609375, -0.037841796875, -0.0361480712890625, -0.034454345703125, -0.0327606201171875, -0.03106689453125, -0.0293731689453125, -0.027679443359375, -0.0259857177734375, -0.0242919921875, -0.0225982666015625, -0.020904541015625, -0.0192108154296875, -0.01751708984375, -0.0158233642578125, -0.014129638671875, -0.0124359130859375, -0.0107421875, -0.0090484619140625, -0.007354736328125, -0.0056610107421875, -0.00396728515625, -0.0022735595703125, -0.000579833984375, 0.0011138916015625, 0.0028076171875, 0.0045013427734375, 0.006195068359375, 0.0078887939453125, 0.00958251953125, 0.0112762451171875, 0.012969970703125, 0.0146636962890625, 0.016357421875, 0.0180511474609375, 0.019744873046875, 0.0214385986328125, 0.02313232421875, 0.0248260498046875, 0.026519775390625, 0.0282135009765625, 0.0299072265625, 0.0316009521484375, 0.033294677734375, 0.0349884033203125, 0.03668212890625, 0.0383758544921875, 0.040069580078125, 0.0417633056640625, 0.04345703125, 0.0451507568359375, 0.046844482421875, 0.0485382080078125, 0.05023193359375, 0.0519256591796875, 0.053619384765625, 0.0553131103515625, 0.0570068359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 2.0, 11.0, 7.0, 19.0, 19.0, 24.0, 41.0, 49.0, 51.0, 79.0, 102.0, 147.0, 162.0, 287.0, 726.0, 1284.0, 319.0, 176.0, 123.0, 106.0, 73.0, 58.0, 53.0, 44.0, 23.0, 16.0, 15.0, 10.0, 10.0, 11.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00629425048828125, -0.006114959716796875, -0.0059356689453125, -0.005756378173828125, -0.00557708740234375, -0.005397796630859375, -0.005218505859375, -0.005039215087890625, -0.00485992431640625, -0.004680633544921875, -0.0045013427734375, -0.004322052001953125, -0.00414276123046875, -0.003963470458984375, -0.0037841796875, -0.003604888916015625, -0.00342559814453125, -0.003246307373046875, -0.0030670166015625, -0.002887725830078125, -0.00270843505859375, -0.002529144287109375, -0.002349853515625, -0.002170562744140625, -0.00199127197265625, -0.001811981201171875, -0.0016326904296875, -0.001453399658203125, -0.00127410888671875, -0.001094818115234375, -0.00091552734375, -0.000736236572265625, -0.00055694580078125, -0.000377655029296875, -0.0001983642578125, -1.9073486328125e-05, 0.00016021728515625, 0.000339508056640625, 0.000518798828125, 0.000698089599609375, 0.00087738037109375, 0.001056671142578125, 0.0012359619140625, 0.001415252685546875, 0.00159454345703125, 0.001773834228515625, 0.001953125, 0.002132415771484375, 0.00231170654296875, 0.002490997314453125, 0.0026702880859375, 0.002849578857421875, 0.00302886962890625, 0.003208160400390625, 0.003387451171875, 0.003566741943359375, 0.00374603271484375, 0.003925323486328125, 0.0041046142578125, 0.004283905029296875, 0.00446319580078125, 0.004642486572265625, 0.00482177734375, 0.005001068115234375, 0.00518035888671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 12.0, 34.0, 141.0, 344.0, 288.0, 117.0, 36.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10133396089076996, -0.0982494130730629, -0.09516487270593643, -0.09208032488822937, -0.08899577707052231, -0.08591122925281525, -0.08282668888568878, -0.07974214106798172, -0.07665759325027466, -0.0735730454325676, -0.07048850506544113, -0.06740395724773407, -0.06431940943002701, -0.061234865337610245, -0.05815032124519348, -0.05506577342748642, -0.051981229335069656, -0.04889668524265289, -0.04581213742494583, -0.04272759333252907, -0.039643045514822006, -0.03655850142240524, -0.03347395360469818, -0.030389409512281418, -0.027304863557219505, -0.024220317602157593, -0.02113577164709568, -0.018051225692033768, -0.01496668066829443, -0.011882134713232517, -0.00879758968949318, -0.005713043734431267, -0.0026284977793693542, 0.00045604794286191463, 0.0035405936650931835, 0.006625139154493809, 0.009709685109555721, 0.012794231064617634, 0.015878776088356972, 0.018963322043418884, 0.022047867998480797, 0.02513241395354271, 0.028216959908604622, 0.031301505863666534, 0.0343860499560833, 0.03747059777379036, 0.04055514186620712, 0.043639689683914185, 0.04672423377633095, 0.04980877786874771, 0.05289332568645477, 0.055977869778871536, 0.0590624175965786, 0.06214696168899536, 0.06523150950670242, 0.06831605732440948, 0.07140059769153595, 0.07448514550924301, 0.07756968587636948, 0.08065423369407654, 0.0837387815117836, 0.08682332932949066, 0.08990786969661713, 0.09299241751432419, 0.09607696533203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 7.0, 3.0, 9.0, 11.0, 16.0, 14.0, 19.0, 31.0, 26.0, 37.0, 38.0, 39.0, 41.0, 55.0, 66.0, 53.0, 60.0, 50.0, 60.0, 37.0, 51.0, 39.0, 38.0, 33.0, 23.0, 18.0, 20.0, 25.0, 15.0, 12.0, 7.0, 11.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.017923951148986816, -0.01731100305914879, -0.01669805683195591, -0.01608511060476303, -0.015472162514925003, -0.01485921535640955, -0.014246268197894096, -0.013633321039378643, -0.01302037388086319, -0.012407426722347736, -0.011794479563832283, -0.01118153240531683, -0.010568585246801376, -0.009955638088285923, -0.00934269092977047, -0.008729743771255016, -0.008116796612739563, -0.00750384945422411, -0.006890902295708656, -0.006277955137193203, -0.00566500797867775, -0.005052060820162296, -0.004439113661646843, -0.0038261665031313896, -0.0032132193446159363, -0.002600272186100483, -0.0019873250275850296, -0.0013743778690695763, -0.0007614307105541229, -0.00014848355203866959, 0.00046446360647678375, 0.001077410764992237, 0.0016903579235076904, 0.0023033050820231438, 0.002916252240538597, 0.0035291993990540504, 0.004142146557569504, 0.004755093716084957, 0.0053680408746004105, 0.005980988033115864, 0.006593935191631317, 0.0072068823501467705, 0.007819829508662224, 0.008432776667177677, 0.00904572382569313, 0.009658670984208584, 0.010271618142724037, 0.01088456530123949, 0.011497512459754944, 0.012110459618270397, 0.01272340677678585, 0.013336353935301304, 0.013949301093816757, 0.01456224825233221, 0.015175195410847664, 0.015788141638040543, 0.01640108972787857, 0.0170140378177166, 0.017626984044909477, 0.018239930272102356, 0.018852878361940384, 0.019465826451778412, 0.02007877267897129, 0.02069171890616417, 0.021304666996002197]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 4.0, 11.0, 13.0, 17.0, 18.0, 20.0, 34.0, 49.0, 76.0, 115.0, 130.0, 205.0, 274.0, 360.0, 512.0, 681.0, 1004.0, 1529.0, 2271.0, 3573.0, 5784.0, 10562.0, 23840.0, 621283.0, 327274.0, 22417.0, 10233.0, 5660.0, 3483.0, 2276.0, 1409.0, 970.0, 633.0, 487.0, 358.0, 244.0, 202.0, 146.0, 101.0, 86.0, 54.0, 38.0, 19.0, 31.0, 19.0, 7.0, 10.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.032440185546875, -0.03142547607421875, -0.0304107666015625, -0.02939605712890625, -0.02838134765625, -0.02736663818359375, -0.0263519287109375, -0.02533721923828125, -0.024322509765625, -0.02330780029296875, -0.0222930908203125, -0.02127838134765625, -0.020263671875, -0.01924896240234375, -0.0182342529296875, -0.01721954345703125, -0.016204833984375, -0.01519012451171875, -0.0141754150390625, -0.01316070556640625, -0.01214599609375, -0.01113128662109375, -0.0101165771484375, -0.00910186767578125, -0.008087158203125, -0.00707244873046875, -0.0060577392578125, -0.00504302978515625, -0.0040283203125, -0.00301361083984375, -0.0019989013671875, -0.00098419189453125, 3.0517578125e-05, 0.00104522705078125, 0.0020599365234375, 0.00307464599609375, 0.00408935546875, 0.00510406494140625, 0.0061187744140625, 0.00713348388671875, 0.008148193359375, 0.00916290283203125, 0.0101776123046875, 0.01119232177734375, 0.01220703125, 0.01322174072265625, 0.0142364501953125, 0.01525115966796875, 0.016265869140625, 0.01728057861328125, 0.0182952880859375, 0.01930999755859375, 0.02032470703125, 0.02133941650390625, 0.0223541259765625, 0.02336883544921875, 0.024383544921875, 0.02539825439453125, 0.0264129638671875, 0.02742767333984375, 0.0284423828125, 0.02945709228515625, 0.0304718017578125, 0.03148651123046875, 0.032501220703125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 5.0, 6.0, 4.0, 3.0, 7.0, 11.0, 6.0, 14.0, 14.0, 25.0, 178.0, 424.0, 174.0, 28.0, 21.0, 12.0, 8.0, 5.0, 8.0, 7.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0031185150146484375, -0.003015875816345215, -0.002913236618041992, -0.0028105974197387695, -0.002707958221435547, -0.0026053190231323242, -0.0025026798248291016, -0.002400040626525879, -0.0022974014282226562, -0.0021947622299194336, -0.002092123031616211, -0.0019894838333129883, -0.0018868446350097656, -0.001784205436706543, -0.0016815662384033203, -0.0015789270401000977, -0.001476287841796875, -0.0013736486434936523, -0.0012710094451904297, -0.001168370246887207, -0.0010657310485839844, -0.0009630918502807617, -0.0008604526519775391, -0.0007578134536743164, -0.0006551742553710938, -0.0005525350570678711, -0.00044989585876464844, -0.0003472566604614258, -0.0002446174621582031, -0.00014197826385498047, -3.933906555175781e-05, 6.330013275146484e-05, 0.0001659393310546875, 0.00026857852935791016, 0.0003712177276611328, 0.00047385692596435547, 0.0005764961242675781, 0.0006791353225708008, 0.0007817745208740234, 0.0008844137191772461, 0.0009870529174804688, 0.0010896921157836914, 0.001192331314086914, 0.0012949705123901367, 0.0013976097106933594, 0.001500248908996582, 0.0016028881072998047, 0.0017055273056030273, 0.00180816650390625, 0.0019108057022094727, 0.0020134449005126953, 0.002116084098815918, 0.0022187232971191406, 0.0023213624954223633, 0.002424001693725586, 0.0025266408920288086, 0.0026292800903320312, 0.002731919288635254, 0.0028345584869384766, 0.0029371976852416992, 0.003039836883544922, 0.0031424760818481445, 0.003245115280151367, 0.00334775447845459, 0.0034503936767578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 5.0, 5.0, 9.0, 20.0, 26.0, 31.0, 41.0, 57.0, 77.0, 122.0, 156.0, 199.0, 310.0, 446.0, 698.0, 1142.0, 2024.0, 3739.0, 8522.0, 30101.0, 618507.0, 341901.0, 24245.0, 7510.0, 3520.0, 1834.0, 1119.0, 712.0, 461.0, 265.0, 201.0, 150.0, 101.0, 63.0, 59.0, 39.0, 34.0, 30.0, 19.0, 9.0, 10.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0472412109375, -0.0456085205078125, -0.043975830078125, -0.0423431396484375, -0.04071044921875, -0.0390777587890625, -0.037445068359375, -0.0358123779296875, -0.0341796875, -0.0325469970703125, -0.030914306640625, -0.0292816162109375, -0.02764892578125, -0.0260162353515625, -0.024383544921875, -0.0227508544921875, -0.0211181640625, -0.0194854736328125, -0.017852783203125, -0.0162200927734375, -0.01458740234375, -0.0129547119140625, -0.011322021484375, -0.0096893310546875, -0.008056640625, -0.0064239501953125, -0.004791259765625, -0.0031585693359375, -0.00152587890625, 0.0001068115234375, 0.001739501953125, 0.0033721923828125, 0.0050048828125, 0.0066375732421875, 0.008270263671875, 0.0099029541015625, 0.01153564453125, 0.0131683349609375, 0.014801025390625, 0.0164337158203125, 0.01806640625, 0.0196990966796875, 0.021331787109375, 0.0229644775390625, 0.02459716796875, 0.0262298583984375, 0.027862548828125, 0.0294952392578125, 0.0311279296875, 0.0327606201171875, 0.034393310546875, 0.0360260009765625, 0.03765869140625, 0.0392913818359375, 0.040924072265625, 0.0425567626953125, 0.044189453125, 0.0458221435546875, 0.047454833984375, 0.0490875244140625, 0.05072021484375, 0.0523529052734375, 0.053985595703125, 0.0556182861328125, 0.0572509765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 4.0, 10.0, 10.0, 15.0, 11.0, 12.0, 16.0, 20.0, 34.0, 32.0, 44.0, 26.0, 39.0, 38.0, 43.0, 40.0, 46.0, 41.0, 48.0, 34.0, 40.0, 24.0, 33.0, 43.0, 47.0, 30.0, 22.0, 26.0, 29.0, 23.0, 9.0, 17.0, 15.0, 15.0, 10.0, 9.0, 8.0, 6.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0136871337890625, -0.01326000690460205, -0.012832880020141602, -0.012405753135681152, -0.011978626251220703, -0.011551499366760254, -0.011124372482299805, -0.010697245597839355, -0.010270118713378906, -0.009842991828918457, -0.009415864944458008, -0.008988738059997559, -0.00856161117553711, -0.00813448429107666, -0.007707357406616211, -0.007280230522155762, -0.0068531036376953125, -0.006425976753234863, -0.005998849868774414, -0.005571722984313965, -0.005144596099853516, -0.004717469215393066, -0.004290342330932617, -0.003863215446472168, -0.0034360885620117188, -0.0030089616775512695, -0.0025818347930908203, -0.002154707908630371, -0.0017275810241699219, -0.0013004541397094727, -0.0008733272552490234, -0.0004462003707885742, -1.9073486328125e-05, 0.0004080533981323242, 0.0008351802825927734, 0.0012623071670532227, 0.0016894340515136719, 0.002116560935974121, 0.0025436878204345703, 0.0029708147048950195, 0.0033979415893554688, 0.003825068473815918, 0.004252195358276367, 0.004679322242736816, 0.005106449127197266, 0.005533576011657715, 0.005960702896118164, 0.006387829780578613, 0.0068149566650390625, 0.007242083549499512, 0.007669210433959961, 0.00809633731842041, 0.00852346420288086, 0.008950591087341309, 0.009377717971801758, 0.009804844856262207, 0.010231971740722656, 0.010659098625183105, 0.011086225509643555, 0.011513352394104004, 0.011940479278564453, 0.012367606163024902, 0.012794733047485352, 0.0132218599319458, 0.01364898681640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 15.0, 10.0, 13.0, 18.0, 29.0, 57.0, 93.0, 120.0, 275.0, 585.0, 1659.0, 8468.0, 986241.0, 45734.0, 3417.0, 953.0, 391.0, 201.0, 97.0, 56.0, 32.0, 20.0, 12.0, 16.0, 12.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.10980224609375, -0.10689449310302734, -0.10398674011230469, -0.10107898712158203, -0.09817123413085938, -0.09526348114013672, -0.09235572814941406, -0.0894479751586914, -0.08654022216796875, -0.0836324691772461, -0.08072471618652344, -0.07781696319580078, -0.07490921020507812, -0.07200145721435547, -0.06909370422363281, -0.06618595123291016, -0.0632781982421875, -0.060370445251464844, -0.05746269226074219, -0.05455493927001953, -0.051647186279296875, -0.04873943328857422, -0.04583168029785156, -0.042923927307128906, -0.04001617431640625, -0.037108421325683594, -0.03420066833496094, -0.03129291534423828, -0.028385162353515625, -0.02547740936279297, -0.022569656372070312, -0.019661903381347656, -0.016754150390625, -0.013846397399902344, -0.010938644409179688, -0.008030891418457031, -0.005123138427734375, -0.0022153854370117188, 0.0006923675537109375, 0.0036001205444335938, 0.00650787353515625, 0.009415626525878906, 0.012323379516601562, 0.015231132507324219, 0.018138885498046875, 0.02104663848876953, 0.023954391479492188, 0.026862144470214844, 0.0297698974609375, 0.032677650451660156, 0.03558540344238281, 0.03849315643310547, 0.041400909423828125, 0.04430866241455078, 0.04721641540527344, 0.050124168395996094, 0.05303192138671875, 0.055939674377441406, 0.05884742736816406, 0.06175518035888672, 0.06466293334960938, 0.06757068634033203, 0.07047843933105469, 0.07338619232177734, 0.0762939453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 9.0, 7.0, 9.0, 14.0, 19.0, 24.0, 47.0, 57.0, 124.0, 168.0, 182.0, 120.0, 53.0, 33.0, 34.0, 19.0, 18.0, 11.0, 10.0, 8.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.832578659057617e-05, -3.728549927473068e-05, -3.624521195888519e-05, -3.52049246430397e-05, -3.4164637327194214e-05, -3.3124350011348724e-05, -3.2084062695503235e-05, -3.1043775379657745e-05, -3.0003488063812256e-05, -2.8963200747966766e-05, -2.7922913432121277e-05, -2.6882626116275787e-05, -2.5842338800430298e-05, -2.480205148458481e-05, -2.376176416873932e-05, -2.272147685289383e-05, -2.168118953704834e-05, -2.064090222120285e-05, -1.960061490535736e-05, -1.856032758951187e-05, -1.7520040273666382e-05, -1.6479752957820892e-05, -1.5439465641975403e-05, -1.4399178326129913e-05, -1.3358891010284424e-05, -1.2318603694438934e-05, -1.1278316378593445e-05, -1.0238029062747955e-05, -9.197741746902466e-06, -8.157454431056976e-06, -7.117167115211487e-06, -6.076879799365997e-06, -5.036592483520508e-06, -3.996305167675018e-06, -2.956017851829529e-06, -1.9157305359840393e-06, -8.754432201385498e-07, 1.648440957069397e-07, 1.2051314115524292e-06, 2.2454187273979187e-06, 3.285706043243408e-06, 4.325993359088898e-06, 5.366280674934387e-06, 6.406567990779877e-06, 7.446855306625366e-06, 8.487142622470856e-06, 9.527429938316345e-06, 1.0567717254161835e-05, 1.1608004570007324e-05, 1.2648291885852814e-05, 1.3688579201698303e-05, 1.4728866517543793e-05, 1.5769153833389282e-05, 1.6809441149234772e-05, 1.784972846508026e-05, 1.889001578092575e-05, 1.993030309677124e-05, 2.097059041261673e-05, 2.201087772846222e-05, 2.305116504430771e-05, 2.4091452360153198e-05, 2.5131739675998688e-05, 2.6172026991844177e-05, 2.7212314307689667e-05, 2.8252601623535156e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 5.0, 12.0, 16.0, 24.0, 39.0, 69.0, 60.0, 79.0, 175.0, 222.0, 371.0, 616.0, 1170.0, 2381.0, 5559.0, 16136.0, 96525.0, 869270.0, 38409.0, 9790.0, 3627.0, 1672.0, 901.0, 497.0, 314.0, 219.0, 115.0, 67.0, 71.0, 33.0, 21.0, 22.0, 8.0, 15.0, 5.0, 14.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061492919921875, -0.05939340591430664, -0.05729389190673828, -0.05519437789916992, -0.05309486389160156, -0.0509953498840332, -0.048895835876464844, -0.046796321868896484, -0.044696807861328125, -0.042597293853759766, -0.040497779846191406, -0.03839826583862305, -0.03629875183105469, -0.03419923782348633, -0.03209972381591797, -0.03000020980834961, -0.02790069580078125, -0.02580118179321289, -0.02370166778564453, -0.021602153778076172, -0.019502639770507812, -0.017403125762939453, -0.015303611755371094, -0.013204097747802734, -0.011104583740234375, -0.009005069732666016, -0.006905555725097656, -0.004806041717529297, -0.0027065277099609375, -0.0006070137023925781, 0.0014925003051757812, 0.0035920143127441406, 0.0056915283203125, 0.007791042327880859, 0.009890556335449219, 0.011990070343017578, 0.014089584350585938, 0.016189098358154297, 0.018288612365722656, 0.020388126373291016, 0.022487640380859375, 0.024587154388427734, 0.026686668395996094, 0.028786182403564453, 0.030885696411132812, 0.03298521041870117, 0.03508472442626953, 0.03718423843383789, 0.03928375244140625, 0.04138326644897461, 0.04348278045654297, 0.04558229446411133, 0.04768180847167969, 0.04978132247924805, 0.051880836486816406, 0.053980350494384766, 0.056079864501953125, 0.058179378509521484, 0.060278892517089844, 0.0623784065246582, 0.06447792053222656, 0.06657743453979492, 0.06867694854736328, 0.07077646255493164, 0.0728759765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 4.0, 12.0, 12.0, 18.0, 23.0, 18.0, 45.0, 66.0, 384.0, 173.0, 56.0, 36.0, 24.0, 14.0, 17.0, 15.0, 15.0, 5.0, 9.0, 7.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06103515625, -0.05933094024658203, -0.05762672424316406, -0.055922508239746094, -0.054218292236328125, -0.052514076232910156, -0.05080986022949219, -0.04910564422607422, -0.04740142822265625, -0.04569721221923828, -0.04399299621582031, -0.042288780212402344, -0.040584564208984375, -0.038880348205566406, -0.03717613220214844, -0.03547191619873047, -0.0337677001953125, -0.03206348419189453, -0.030359268188476562, -0.028655052185058594, -0.026950836181640625, -0.025246620178222656, -0.023542404174804688, -0.02183818817138672, -0.02013397216796875, -0.01842975616455078, -0.016725540161132812, -0.015021324157714844, -0.013317108154296875, -0.011612892150878906, -0.009908676147460938, -0.008204460144042969, -0.006500244140625, -0.004796028137207031, -0.0030918121337890625, -0.0013875961303710938, 0.000316619873046875, 0.0020208358764648438, 0.0037250518798828125, 0.005429267883300781, 0.00713348388671875, 0.008837699890136719, 0.010541915893554688, 0.012246131896972656, 0.013950347900390625, 0.015654563903808594, 0.017358779907226562, 0.01906299591064453, 0.0207672119140625, 0.02247142791748047, 0.024175643920898438, 0.025879859924316406, 0.027584075927734375, 0.029288291931152344, 0.030992507934570312, 0.03269672393798828, 0.03440093994140625, 0.03610515594482422, 0.03780937194824219, 0.039513587951660156, 0.041217803955078125, 0.042922019958496094, 0.04462623596191406, 0.04633045196533203, 0.04803466796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 12.0, 15.0, 56.0, 576.0, 278.0, 32.0, 5.0, 10.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.000304102897644, -0.9707699418067932, -0.9412357807159424, -0.9117015600204468, -0.882167398929596, -0.8526332378387451, -0.8230990767478943, -0.7935649156570435, -0.7640306949615479, -0.734496533870697, -0.7049623727798462, -0.6754281520843506, -0.6458939909934998, -0.6163598299026489, -0.5868256688117981, -0.5572915077209473, -0.5277572870254517, -0.49822312593460083, -0.4686889350414276, -0.4391547739505768, -0.40962058305740356, -0.38008642196655273, -0.3505522608757019, -0.3210180699825287, -0.29148393869400024, -0.2619497776031494, -0.2324155867099762, -0.20288142561912537, -0.17334723472595215, -0.14381307363510132, -0.1142788976430893, -0.08474472165107727, -0.05521053075790405, -0.025676356628537178, 0.0038578175008296967, 0.03339198976755142, 0.06292616575956345, 0.09246033430099487, 0.1219945102930069, 0.15152868628501892, 0.18106286227703094, 0.21059703826904297, 0.240131214261055, 0.269665390253067, 0.29919955134391785, 0.32873374223709106, 0.3582679033279419, 0.3878020644187927, 0.41733625531196594, 0.4468704164028168, 0.47640460729599, 0.5059387683868408, 0.5354729294776917, 0.5650070905685425, 0.5945413112640381, 0.6240754723548889, 0.6536096334457397, 0.6831437945365906, 0.7126779556274414, 0.742212176322937, 0.7717463374137878, 0.8012804985046387, 0.8308146595954895, 0.8603488206863403, 0.8898830413818359]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 3.0, 6.0, 7.0, 7.0, 12.0, 17.0, 30.0, 48.0, 80.0, 92.0, 136.0, 131.0, 104.0, 94.0, 59.0, 39.0, 33.0, 23.0, 11.0, 12.0, 8.0, 7.0, 8.0, 4.0, 3.0, 2.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2899765372276306, -0.2810823321342468, -0.27218812704086304, -0.26329392194747925, -0.25439971685409546, -0.24550551176071167, -0.23661132156848907, -0.22771711647510529, -0.2188229113817215, -0.2099287062883377, -0.20103450119495392, -0.19214029610157013, -0.18324610590934753, -0.17435190081596375, -0.16545769572257996, -0.15656349062919617, -0.14766928553581238, -0.1387750804424286, -0.1298808753490448, -0.12098667770624161, -0.11209247261285782, -0.10319826751947403, -0.09430406987667084, -0.08540986478328705, -0.07651565968990326, -0.06762145459651947, -0.05872725322842598, -0.04983305186033249, -0.0409388467669487, -0.03204464167356491, -0.02315044030547142, -0.01425623893737793, -0.005362033843994141, 0.003532169386744499, 0.012426372617483139, 0.02132057584822178, 0.03021477907896042, 0.03910898417234421, 0.0480031855404377, 0.05689738690853119, 0.06579159200191498, 0.07468579709529877, 0.08358000218868256, 0.09247419983148575, 0.10136840492486954, 0.11026261001825333, 0.11915680766105652, 0.1280510127544403, 0.1369452178478241, 0.14583942294120789, 0.15473362803459167, 0.16362783312797546, 0.17252203822135925, 0.18141624331474304, 0.19031043350696564, 0.19920463860034943, 0.20809884369373322, 0.216993048787117, 0.2258872538805008, 0.23478145897388458, 0.24367564916610718, 0.25256985425949097, 0.26146405935287476, 0.27035826444625854, 0.27925246953964233]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 14.0, 16.0, 17.0, 18.0, 38.0, 49.0, 134.0, 1372.0, 4027697.0, 163736.0, 892.0, 104.0, 45.0, 31.0, 16.0, 18.0, 13.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.819122314453125, -2.72808837890625, -2.637054443359375, -2.5460205078125, -2.454986572265625, -2.36395263671875, -2.272918701171875, -2.181884765625, -2.090850830078125, -1.99981689453125, -1.908782958984375, -1.8177490234375, -1.726715087890625, -1.63568115234375, -1.544647216796875, -1.45361328125, -1.362579345703125, -1.27154541015625, -1.180511474609375, -1.0894775390625, -0.998443603515625, -0.90740966796875, -0.816375732421875, -0.725341796875, -0.634307861328125, -0.54327392578125, -0.452239990234375, -0.3612060546875, -0.270172119140625, -0.17913818359375, -0.088104248046875, 0.0029296875, 0.093963623046875, 0.18499755859375, 0.276031494140625, 0.3670654296875, 0.458099365234375, 0.54913330078125, 0.640167236328125, 0.731201171875, 0.822235107421875, 0.91326904296875, 1.004302978515625, 1.0953369140625, 1.186370849609375, 1.27740478515625, 1.368438720703125, 1.45947265625, 1.550506591796875, 1.64154052734375, 1.732574462890625, 1.8236083984375, 1.914642333984375, 2.00567626953125, 2.096710205078125, 2.187744140625, 2.278778076171875, 2.36981201171875, 2.460845947265625, 2.5518798828125, 2.642913818359375, 2.73394775390625, 2.824981689453125, 2.916015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 7.0, 6.0, 3.0, 6.0, 6.0, 7.0, 16.0, 11.0, 28.0, 61.0, 137.0, 223.0, 209.0, 120.0, 53.0, 21.0, 14.0, 6.0, 13.0, 7.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002197265625, -0.00211256742477417, -0.00202786922454834, -0.0019431710243225098, -0.0018584728240966797, -0.0017737746238708496, -0.0016890764236450195, -0.0016043782234191895, -0.0015196800231933594, -0.0014349818229675293, -0.0013502836227416992, -0.0012655854225158691, -0.001180887222290039, -0.001096189022064209, -0.001011490821838379, -0.0009267926216125488, -0.0008420944213867188, -0.0007573962211608887, -0.0006726980209350586, -0.0005879998207092285, -0.0005033016204833984, -0.00041860342025756836, -0.0003339052200317383, -0.0002492070198059082, -0.00016450881958007812, -7.981061935424805e-05, 4.887580871582031e-06, 8.958578109741211e-05, 0.0001742839813232422, 0.00025898218154907227, 0.00034368038177490234, 0.0004283785820007324, 0.0005130767822265625, 0.0005977749824523926, 0.0006824731826782227, 0.0007671713829040527, 0.0008518695831298828, 0.0009365677833557129, 0.001021265983581543, 0.001105964183807373, 0.0011906623840332031, 0.0012753605842590332, 0.0013600587844848633, 0.0014447569847106934, 0.0015294551849365234, 0.0016141533851623535, 0.0016988515853881836, 0.0017835497856140137, 0.0018682479858398438, 0.0019529461860656738, 0.002037644386291504, 0.002122342586517334, 0.002207040786743164, 0.002291738986968994, 0.0023764371871948242, 0.0024611353874206543, 0.0025458335876464844, 0.0026305317878723145, 0.0027152299880981445, 0.0027999281883239746, 0.0028846263885498047, 0.0029693245887756348, 0.003054022789001465, 0.003138720989227295, 0.003223419189453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 9.0, 3.0, 6.0, 10.0, 6.0, 12.0, 9.0, 15.0, 30.0, 39.0, 42.0, 48.0, 49.0, 83.0, 98.0, 100.0, 163.0, 504.0, 19392.0, 4166344.0, 6101.0, 314.0, 150.0, 132.0, 115.0, 106.0, 94.0, 59.0, 67.0, 55.0, 33.0, 25.0, 19.0, 17.0, 6.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.50634765625, -0.4920387268066406, -0.47772979736328125, -0.4634208679199219, -0.4491119384765625, -0.4348030090332031, -0.42049407958984375, -0.4061851501464844, -0.391876220703125, -0.3775672912597656, -0.36325836181640625, -0.3489494323730469, -0.3346405029296875, -0.3203315734863281, -0.30602264404296875, -0.2917137145996094, -0.27740478515625, -0.2630958557128906, -0.24878692626953125, -0.23447799682617188, -0.2201690673828125, -0.20586013793945312, -0.19155120849609375, -0.17724227905273438, -0.162933349609375, -0.14862442016601562, -0.13431549072265625, -0.12000656127929688, -0.1056976318359375, -0.09138870239257812, -0.07707977294921875, -0.06277084350585938, -0.0484619140625, -0.034152984619140625, -0.01984405517578125, -0.005535125732421875, 0.0087738037109375, 0.023082733154296875, 0.03739166259765625, 0.051700592041015625, 0.066009521484375, 0.08031845092773438, 0.09462738037109375, 0.10893630981445312, 0.1232452392578125, 0.13755416870117188, 0.15186309814453125, 0.16617202758789062, 0.18048095703125, 0.19478988647460938, 0.20909881591796875, 0.22340774536132812, 0.2377166748046875, 0.2520256042480469, 0.26633453369140625, 0.2806434631347656, 0.294952392578125, 0.3092613220214844, 0.32357025146484375, 0.3378791809082031, 0.3521881103515625, 0.3664970397949219, 0.38080596923828125, 0.3951148986816406, 0.409423828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 2.0, 6.0, 5.0, 2.0, 5.0, 10.0, 18.0, 13.0, 17.0, 19.0, 26.0, 22.0, 29.0, 39.0, 60.0, 57.0, 77.0, 93.0, 123.0, 158.0, 156.0, 183.0, 268.0, 1017.0, 337.0, 204.0, 168.0, 162.0, 113.0, 127.0, 104.0, 85.0, 86.0, 59.0, 40.0, 40.0, 36.0, 28.0, 13.0, 15.0, 9.0, 10.0, 7.0, 6.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.004314422607421875, -0.004196733236312866, -0.004079043865203857, -0.003961354494094849, -0.00384366512298584, -0.003725975751876831, -0.0036082863807678223, -0.0034905970096588135, -0.0033729076385498047, -0.003255218267440796, -0.003137528896331787, -0.0030198395252227783, -0.0029021501541137695, -0.0027844607830047607, -0.002666771411895752, -0.002549082040786743, -0.0024313926696777344, -0.0023137032985687256, -0.002196013927459717, -0.002078324556350708, -0.0019606351852416992, -0.0018429458141326904, -0.0017252564430236816, -0.0016075670719146729, -0.001489877700805664, -0.0013721883296966553, -0.0012544989585876465, -0.0011368095874786377, -0.001019120216369629, -0.0009014308452606201, -0.0007837414741516113, -0.0006660521030426025, -0.0005483627319335938, -0.00043067336082458496, -0.00031298398971557617, -0.00019529461860656738, -7.76052474975586e-05, 4.0084123611450195e-05, 0.00015777349472045898, 0.0002754628658294678, 0.00039315223693847656, 0.0005108416080474854, 0.0006285309791564941, 0.0007462203502655029, 0.0008639097213745117, 0.0009815990924835205, 0.0010992884635925293, 0.001216977834701538, 0.0013346672058105469, 0.0014523565769195557, 0.0015700459480285645, 0.0016877353191375732, 0.001805424690246582, 0.0019231140613555908, 0.0020408034324645996, 0.0021584928035736084, 0.002276182174682617, 0.002393871545791626, 0.0025115609169006348, 0.0026292502880096436, 0.0027469396591186523, 0.002864629030227661, 0.00298231840133667, 0.0031000077724456787, 0.0032176971435546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 66.0, 947.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1739683449268341, -0.132224440574646, -0.09048055112361908, -0.04873666167259216, -0.006992757320404053, 0.03475114703178406, 0.07649502158164978, 0.11823892593383789, 0.159982830286026, 0.2017267346382141, 0.24347062408924103, 0.28521451354026794, 0.32695841789245605, 0.36870232224464417, 0.4104461967945099, 0.452190101146698, 0.4939340054988861, 0.5356779098510742, 0.5774217844009399, 0.6191656589508057, 0.6609095931053162, 0.7026535272598267, 0.7443974018096924, 0.7861412763595581, 0.8278851509094238, 0.8696290254592896, 0.9113729596138, 0.9531168341636658, 0.9948607683181763, 1.036604642868042, 1.0783485174179077, 1.1200923919677734, 1.1618363857269287, 1.2035802602767944, 1.2453241348266602, 1.2870681285858154, 1.3288120031356812, 1.3705558776855469, 1.4122997522354126, 1.4540436267852783, 1.4957876205444336, 1.5375314950942993, 1.579275369644165, 1.6210193634033203, 1.662763237953186, 1.7045071125030518, 1.7462509870529175, 1.7879948616027832, 1.829738736152649, 1.8714826107025146, 1.9132264852523804, 1.954970359802246, 1.9967143535614014, 2.0384583473205566, 2.080202102661133, 2.121946096420288, 2.1636898517608643, 2.2054338455200195, 2.2471776008605957, 2.288921594619751, 2.330665349960327, 2.3724093437194824, 2.4141530990600586, 2.455897092819214, 2.497641086578369]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 10.0, 21.0, 38.0, 79.0, 127.0, 144.0, 155.0, 135.0, 127.0, 71.0, 41.0, 25.0, 21.0, 12.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03615427017211914, -0.03323473781347275, -0.030315201729536057, -0.027395667508244514, -0.024476133286952972, -0.02155659906566143, -0.01863706484436989, -0.015717530623078346, -0.012797996401786804, -0.009878462180495262, -0.00695892795920372, -0.004039393737912178, -0.001119859516620636, 0.001799674704670906, 0.004719208925962448, 0.00763874314725399, 0.010558277368545532, 0.013477811589837074, 0.016397345811128616, 0.01931688003242016, 0.0222364142537117, 0.025155948475003242, 0.028075482696294785, 0.030995016917586327, 0.03391455113887787, 0.03683408349752426, 0.03975361958146095, 0.042673155665397644, 0.04559268802404404, 0.04851222038269043, 0.05143175646662712, 0.05435129255056381, 0.057270824909210205, 0.0601903572678566, 0.06310988962650299, 0.06602942943572998, 0.06894896179437637, 0.07186849415302277, 0.07478803396224976, 0.07770756632089615, 0.08062709867954254, 0.08354663103818893, 0.08646616339683533, 0.08938570320606232, 0.09230523556470871, 0.0952247679233551, 0.09814430773258209, 0.10106384009122849, 0.10398337244987488, 0.10690290480852127, 0.10982243716716766, 0.11274197697639465, 0.11566150933504105, 0.11858104169368744, 0.12150058150291443, 0.12442011386156082, 0.12733964622020721, 0.1302591860294342, 0.1331787109375, 0.136098250746727, 0.13901779055595398, 0.14193731546401978, 0.14485685527324677, 0.14777638018131256, 0.15069591999053955]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 5.0, 8.0, 18.0, 9.0, 25.0, 28.0, 49.0, 68.0, 91.0, 135.0, 158.0, 228.0, 338.0, 489.0, 715.0, 933.0, 1445.0, 2005.0, 3130.0, 4919.0, 8208.0, 15719.0, 43284.0, 526241.0, 366703.0, 36963.0, 14619.0, 7875.0, 4595.0, 3042.0, 1979.0, 1363.0, 907.0, 646.0, 477.0, 321.0, 230.0, 155.0, 126.0, 97.0, 56.0, 43.0, 31.0, 22.0, 13.0, 13.0, 5.0, 8.0, 8.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.032501220703125, -0.031514644622802734, -0.03052806854248047, -0.029541492462158203, -0.028554916381835938, -0.027568340301513672, -0.026581764221191406, -0.02559518814086914, -0.024608612060546875, -0.02362203598022461, -0.022635459899902344, -0.021648883819580078, -0.020662307739257812, -0.019675731658935547, -0.01868915557861328, -0.017702579498291016, -0.01671600341796875, -0.015729427337646484, -0.014742851257324219, -0.013756275177001953, -0.012769699096679688, -0.011783123016357422, -0.010796546936035156, -0.00980997085571289, -0.008823394775390625, -0.00783681869506836, -0.006850242614746094, -0.005863666534423828, -0.0048770904541015625, -0.003890514373779297, -0.0029039382934570312, -0.0019173622131347656, -0.0009307861328125, 5.5789947509765625e-05, 0.0010423660278320312, 0.002028942108154297, 0.0030155181884765625, 0.004002094268798828, 0.004988670349121094, 0.005975246429443359, 0.006961822509765625, 0.00794839859008789, 0.008934974670410156, 0.009921550750732422, 0.010908126831054688, 0.011894702911376953, 0.012881278991699219, 0.013867855072021484, 0.01485443115234375, 0.015841007232666016, 0.01682758331298828, 0.017814159393310547, 0.018800735473632812, 0.019787311553955078, 0.020773887634277344, 0.02176046371459961, 0.022747039794921875, 0.02373361587524414, 0.024720191955566406, 0.025706768035888672, 0.026693344116210938, 0.027679920196533203, 0.02866649627685547, 0.029653072357177734, 0.0306396484375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 7.0, 2.0, 6.0, 10.0, 10.0, 21.0, 23.0, 36.0, 69.0, 85.0, 97.0, 104.0, 131.0, 127.0, 86.0, 52.0, 34.0, 23.0, 9.0, 5.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002086639404296875, -0.0020141303539276123, -0.0019416213035583496, -0.001869112253189087, -0.0017966032028198242, -0.0017240941524505615, -0.0016515851020812988, -0.0015790760517120361, -0.0015065670013427734, -0.0014340579509735107, -0.001361548900604248, -0.0012890398502349854, -0.0012165307998657227, -0.00114402174949646, -0.0010715126991271973, -0.0009990036487579346, -0.0009264945983886719, -0.0008539855480194092, -0.0007814764976501465, -0.0007089674472808838, -0.0006364583969116211, -0.0005639493465423584, -0.0004914402961730957, -0.000418931245803833, -0.0003464221954345703, -0.0002739131450653076, -0.00020140409469604492, -0.00012889504432678223, -5.638599395751953e-05, 1.6123056411743164e-05, 8.863210678100586e-05, 0.00016114115715026855, 0.00023365020751953125, 0.00030615925788879395, 0.00037866830825805664, 0.00045117735862731934, 0.000523686408996582, 0.0005961954593658447, 0.0006687045097351074, 0.0007412135601043701, 0.0008137226104736328, 0.0008862316608428955, 0.0009587407112121582, 0.001031249761581421, 0.0011037588119506836, 0.0011762678623199463, 0.001248776912689209, 0.0013212859630584717, 0.0013937950134277344, 0.001466304063796997, 0.0015388131141662598, 0.0016113221645355225, 0.0016838312149047852, 0.0017563402652740479, 0.0018288493156433105, 0.0019013583660125732, 0.001973867416381836, 0.0020463764667510986, 0.0021188855171203613, 0.002191394567489624, 0.0022639036178588867, 0.0023364126682281494, 0.002408921718597412, 0.002481430768966675, 0.0025539398193359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 11.0, 8.0, 7.0, 11.0, 13.0, 14.0, 20.0, 17.0, 27.0, 32.0, 42.0, 34.0, 68.0, 80.0, 304.0, 1985.0, 49145.0, 985310.0, 10048.0, 843.0, 169.0, 68.0, 39.0, 36.0, 36.0, 33.0, 27.0, 29.0, 19.0, 12.0, 10.0, 10.0, 11.0, 10.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10650634765625, -0.10299205780029297, -0.09947776794433594, -0.0959634780883789, -0.09244918823242188, -0.08893489837646484, -0.08542060852050781, -0.08190631866455078, -0.07839202880859375, -0.07487773895263672, -0.07136344909667969, -0.06784915924072266, -0.06433486938476562, -0.060820579528808594, -0.05730628967285156, -0.05379199981689453, -0.0502777099609375, -0.04676342010498047, -0.04324913024902344, -0.039734840393066406, -0.036220550537109375, -0.032706260681152344, -0.029191970825195312, -0.02567768096923828, -0.02216339111328125, -0.01864910125732422, -0.015134811401367188, -0.011620521545410156, -0.008106231689453125, -0.004591941833496094, -0.0010776519775390625, 0.0024366378784179688, 0.005950927734375, 0.009465217590332031, 0.012979507446289062, 0.016493797302246094, 0.020008087158203125, 0.023522377014160156, 0.027036666870117188, 0.03055095672607422, 0.03406524658203125, 0.03757953643798828, 0.04109382629394531, 0.044608116149902344, 0.048122406005859375, 0.051636695861816406, 0.05515098571777344, 0.05866527557373047, 0.0621795654296875, 0.06569385528564453, 0.06920814514160156, 0.0727224349975586, 0.07623672485351562, 0.07975101470947266, 0.08326530456542969, 0.08677959442138672, 0.09029388427734375, 0.09380817413330078, 0.09732246398925781, 0.10083675384521484, 0.10435104370117188, 0.1078653335571289, 0.11137962341308594, 0.11489391326904297, 0.118408203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 4.0, 15.0, 20.0, 15.0, 20.0, 16.0, 18.0, 29.0, 29.0, 47.0, 41.0, 45.0, 45.0, 50.0, 56.0, 50.0, 37.0, 37.0, 35.0, 48.0, 40.0, 34.0, 42.0, 42.0, 31.0, 21.0, 26.0, 16.0, 9.0, 5.0, 13.0, 10.0, 6.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00942230224609375, -0.009146571159362793, -0.008870840072631836, -0.008595108985900879, -0.008319377899169922, -0.008043646812438965, -0.007767915725708008, -0.007492184638977051, -0.007216453552246094, -0.006940722465515137, -0.00666499137878418, -0.006389260292053223, -0.006113529205322266, -0.005837798118591309, -0.0055620670318603516, -0.0052863359451293945, -0.0050106048583984375, -0.0047348737716674805, -0.0044591426849365234, -0.004183411598205566, -0.003907680511474609, -0.0036319494247436523, -0.0033562183380126953, -0.0030804872512817383, -0.0028047561645507812, -0.0025290250778198242, -0.002253293991088867, -0.00197756290435791, -0.0017018318176269531, -0.001426100730895996, -0.001150369644165039, -0.000874638557434082, -0.000598907470703125, -0.00032317638397216797, -4.744529724121094e-05, 0.0002282857894897461, 0.0005040168762207031, 0.0007797479629516602, 0.0010554790496826172, 0.0013312101364135742, 0.0016069412231445312, 0.0018826723098754883, 0.0021584033966064453, 0.0024341344833374023, 0.0027098655700683594, 0.0029855966567993164, 0.0032613277435302734, 0.0035370588302612305, 0.0038127899169921875, 0.0040885210037231445, 0.0043642520904541016, 0.004639983177185059, 0.004915714263916016, 0.005191445350646973, 0.00546717643737793, 0.005742907524108887, 0.006018638610839844, 0.006294369697570801, 0.006570100784301758, 0.006845831871032715, 0.007121562957763672, 0.007397294044494629, 0.007673025131225586, 0.007948756217956543, 0.0082244873046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 9.0, 11.0, 21.0, 48.0, 292.0, 262673.0, 785084.0, 321.0, 47.0, 25.0, 11.0, 7.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24242019653320312, -0.22727203369140625, -0.21212387084960938, -0.1969757080078125, -0.18182754516601562, -0.16667938232421875, -0.15153121948242188, -0.136383056640625, -0.12123489379882812, -0.10608673095703125, -0.09093856811523438, -0.0757904052734375, -0.060642242431640625, -0.04549407958984375, -0.030345916748046875, -0.01519775390625, -4.9591064453125e-05, 0.01509857177734375, 0.030246734619140625, 0.0453948974609375, 0.060543060302734375, 0.07569122314453125, 0.09083938598632812, 0.105987548828125, 0.12113571166992188, 0.13628387451171875, 0.15143203735351562, 0.1665802001953125, 0.18172836303710938, 0.19687652587890625, 0.21202468872070312, 0.2271728515625, 0.24232101440429688, 0.25746917724609375, 0.2726173400878906, 0.2877655029296875, 0.3029136657714844, 0.31806182861328125, 0.3332099914550781, 0.348358154296875, 0.3635063171386719, 0.37865447998046875, 0.3938026428222656, 0.4089508056640625, 0.4240989685058594, 0.43924713134765625, 0.4543952941894531, 0.46954345703125, 0.4846916198730469, 0.49983978271484375, 0.5149879455566406, 0.5301361083984375, 0.5452842712402344, 0.5604324340820312, 0.5755805969238281, 0.590728759765625, 0.6058769226074219, 0.6210250854492188, 0.6361732482910156, 0.6513214111328125, 0.6664695739746094, 0.6816177368164062, 0.6967658996582031, 0.7119140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 8.0, 8.0, 14.0, 14.0, 32.0, 37.0, 64.0, 114.0, 300.0, 170.0, 84.0, 46.0, 18.0, 21.0, 14.0, 12.0, 9.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012183189392089844, -0.0001156739890575409, -0.00010951608419418335, -0.0001033581793308258, -9.720027446746826e-05, -9.104236960411072e-05, -8.488446474075317e-05, -7.872655987739563e-05, -7.256865501403809e-05, -6.641075015068054e-05, -6.0252845287323e-05, -5.4094940423965454e-05, -4.793703556060791e-05, -4.1779130697250366e-05, -3.562122583389282e-05, -2.946332097053528e-05, -2.3305416107177734e-05, -1.714751124382019e-05, -1.0989606380462646e-05, -4.8317015171051025e-06, 1.3262033462524414e-06, 7.484108209609985e-06, 1.364201307296753e-05, 1.9799917936325073e-05, 2.5957822799682617e-05, 3.211572766304016e-05, 3.8273632526397705e-05, 4.443153738975525e-05, 5.058944225311279e-05, 5.674734711647034e-05, 6.290525197982788e-05, 6.906315684318542e-05, 7.522106170654297e-05, 8.137896656990051e-05, 8.753687143325806e-05, 9.36947762966156e-05, 9.985268115997314e-05, 0.00010601058602333069, 0.00011216849088668823, 0.00011832639575004578, 0.00012448430061340332, 0.00013064220547676086, 0.0001368001103401184, 0.00014295801520347595, 0.0001491159200668335, 0.00015527382493019104, 0.00016143172979354858, 0.00016758963465690613, 0.00017374753952026367, 0.00017990544438362122, 0.00018606334924697876, 0.0001922212541103363, 0.00019837915897369385, 0.0002045370638370514, 0.00021069496870040894, 0.00021685287356376648, 0.00022301077842712402, 0.00022916868329048157, 0.0002353265881538391, 0.00024148449301719666, 0.0002476423978805542, 0.00025380030274391174, 0.0002599582076072693, 0.00026611611247062683, 0.0002722740173339844]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 10.0, 16.0, 19.0, 31.0, 34.0, 61.0, 90.0, 122.0, 187.0, 272.0, 463.0, 900.0, 2173.0, 8301.0, 202034.0, 818072.0, 10527.0, 2621.0, 1096.0, 539.0, 344.0, 214.0, 143.0, 81.0, 48.0, 50.0, 33.0, 19.0, 11.0, 7.0, 7.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0777587890625, -0.07540702819824219, -0.07305526733398438, -0.07070350646972656, -0.06835174560546875, -0.06599998474121094, -0.06364822387695312, -0.06129646301269531, -0.0589447021484375, -0.05659294128417969, -0.054241180419921875, -0.05188941955566406, -0.04953765869140625, -0.04718589782714844, -0.044834136962890625, -0.04248237609863281, -0.040130615234375, -0.03777885437011719, -0.035427093505859375, -0.03307533264160156, -0.03072357177734375, -0.028371810913085938, -0.026020050048828125, -0.023668289184570312, -0.0213165283203125, -0.018964767456054688, -0.016613006591796875, -0.014261245727539062, -0.01190948486328125, -0.009557723999023438, -0.007205963134765625, -0.0048542022705078125, -0.00250244140625, -0.0001506805419921875, 0.002201080322265625, 0.0045528411865234375, 0.00690460205078125, 0.009256362915039062, 0.011608123779296875, 0.013959884643554688, 0.0163116455078125, 0.018663406372070312, 0.021015167236328125, 0.023366928100585938, 0.02571868896484375, 0.028070449829101562, 0.030422210693359375, 0.03277397155761719, 0.035125732421875, 0.03747749328613281, 0.039829254150390625, 0.04218101501464844, 0.04453277587890625, 0.04688453674316406, 0.049236297607421875, 0.05158805847167969, 0.0539398193359375, 0.05629158020019531, 0.058643341064453125, 0.06099510192871094, 0.06334686279296875, 0.06569862365722656, 0.06805038452148438, 0.07040214538574219, 0.07275390625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 7.0, 24.0, 45.0, 93.0, 539.0, 166.0, 57.0, 26.0, 11.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054412841796875, -0.05288553237915039, -0.05135822296142578, -0.04983091354370117, -0.04830360412597656, -0.04677629470825195, -0.045248985290527344, -0.043721675872802734, -0.042194366455078125, -0.040667057037353516, -0.039139747619628906, -0.0376124382019043, -0.03608512878417969, -0.03455781936645508, -0.03303050994873047, -0.03150320053100586, -0.02997589111328125, -0.02844858169555664, -0.02692127227783203, -0.025393962860107422, -0.023866653442382812, -0.022339344024658203, -0.020812034606933594, -0.019284725189208984, -0.017757415771484375, -0.016230106353759766, -0.014702796936035156, -0.013175487518310547, -0.011648178100585938, -0.010120868682861328, -0.008593559265136719, -0.007066249847412109, -0.0055389404296875, -0.004011631011962891, -0.0024843215942382812, -0.0009570121765136719, 0.0005702972412109375, 0.002097606658935547, 0.0036249160766601562, 0.005152225494384766, 0.006679534912109375, 0.008206844329833984, 0.009734153747558594, 0.011261463165283203, 0.012788772583007812, 0.014316082000732422, 0.01584339141845703, 0.01737070083618164, 0.01889801025390625, 0.02042531967163086, 0.02195262908935547, 0.023479938507080078, 0.025007247924804688, 0.026534557342529297, 0.028061866760253906, 0.029589176177978516, 0.031116485595703125, 0.032643795013427734, 0.034171104431152344, 0.03569841384887695, 0.03722572326660156, 0.03875303268432617, 0.04028034210205078, 0.04180765151977539, 0.0433349609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 11.0, 21.0, 57.0, 173.0, 398.0, 228.0, 66.0, 18.0, 12.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12946845591068268, -0.12167449295520782, -0.11388052254915237, -0.10608655959367752, -0.09829258918762207, -0.09049862623214722, -0.08270466327667236, -0.07491070032119751, -0.06711672991514206, -0.05932276323437691, -0.051528796553611755, -0.0437348335981369, -0.03594086691737175, -0.028146900236606598, -0.020352937281131744, -0.012558970600366592, -0.00476500391960144, 0.003028961829841137, 0.010822927579283714, 0.018616892397403717, 0.02641085907816887, 0.03420482575893402, 0.041998788714408875, 0.049792755395174026, 0.05758672207593918, 0.06538068503141403, 0.07317465543746948, 0.08096861839294434, 0.08876258134841919, 0.09655655175447464, 0.1043505147099495, 0.11214448511600494, 0.11993846297264099, 0.12773242592811584, 0.1355263888835907, 0.14332035183906555, 0.1511143296957016, 0.15890829265117645, 0.1667022556066513, 0.17449621856212616, 0.1822901964187622, 0.19008415937423706, 0.19787812232971191, 0.20567208528518677, 0.21346606314182281, 0.22126002609729767, 0.22905398905277252, 0.23684795200824738, 0.24464191496372223, 0.2524358928203583, 0.26022985577583313, 0.268023818731308, 0.27581778168678284, 0.2836117446422577, 0.29140570759773254, 0.2991996705532074, 0.30699363350868225, 0.3147875964641571, 0.32258155941963196, 0.3303755223751068, 0.33816948533058167, 0.3459634780883789, 0.35375744104385376, 0.3615514039993286, 0.36934536695480347]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 13.0, 19.0, 34.0, 43.0, 47.0, 50.0, 65.0, 99.0, 107.0, 96.0, 122.0, 65.0, 65.0, 50.0, 45.0, 27.0, 15.0, 14.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07828134298324585, -0.07420427352190018, -0.0701272040605545, -0.06605012714862823, -0.06197305768728256, -0.05789598822593689, -0.05381891503930092, -0.04974184185266495, -0.045664772391319275, -0.0415877029299736, -0.03751062974333763, -0.03343355655670166, -0.029356487095355988, -0.025279415771365166, -0.021202344447374344, -0.017125273123383522, -0.0130482017993927, -0.008971130475401878, -0.0048940591514110565, -0.0008169878274202347, 0.003260083496570587, 0.007337154820561409, 0.01141422614455223, 0.015491297468543053, 0.019568368792533875, 0.023645440116524696, 0.027722511440515518, 0.03179958462715149, 0.03587665408849716, 0.039953723549842834, 0.044030796736478806, 0.04810786992311478, 0.05218493938446045, 0.05626200884580612, 0.06033908203244209, 0.06441615521907806, 0.06849322468042374, 0.07257029414176941, 0.07664737105369568, 0.08072444051504135, 0.08480150997638702, 0.0888785794377327, 0.09295564889907837, 0.09703272581100464, 0.10110979527235031, 0.10518686473369598, 0.10926394164562225, 0.11334101110696793, 0.1174180805683136, 0.12149515002965927, 0.12557221949100494, 0.1296492964029312, 0.1337263584136963, 0.13780343532562256, 0.14188051223754883, 0.1459575742483139, 0.15003465116024017, 0.15411172807216644, 0.15818879008293152, 0.1622658669948578, 0.16634294390678406, 0.17042000591754913, 0.1744970828294754, 0.17857414484024048, 0.18265122175216675]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 6.0, 8.0, 6.0, 2.0, 6.0, 2.0, 4.0, 6.0, 6.0, 4.0, 12.0, 12.0, 18.0, 12.0, 12.0, 12.0, 24.0, 22.0, 18.0, 20.0, 152.0, 4193344.0, 368.0, 40.0, 20.0, 38.0, 16.0, 12.0, 4.0, 20.0, 8.0, 4.0, 8.0, 10.0, 2.0, 6.0, 6.0, 2.0, 6.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.544921875, -1.484222412109375, -1.42352294921875, -1.362823486328125, -1.3021240234375, -1.241424560546875, -1.18072509765625, -1.120025634765625, -1.059326171875, -0.998626708984375, -0.93792724609375, -0.877227783203125, -0.8165283203125, -0.755828857421875, -0.69512939453125, -0.634429931640625, -0.57373046875, -0.513031005859375, -0.45233154296875, -0.391632080078125, -0.3309326171875, -0.270233154296875, -0.20953369140625, -0.148834228515625, -0.088134765625, -0.027435302734375, 0.03326416015625, 0.093963623046875, 0.1546630859375, 0.215362548828125, 0.27606201171875, 0.336761474609375, 0.3974609375, 0.458160400390625, 0.51885986328125, 0.579559326171875, 0.6402587890625, 0.700958251953125, 0.76165771484375, 0.822357177734375, 0.883056640625, 0.943756103515625, 1.00445556640625, 1.065155029296875, 1.1258544921875, 1.186553955078125, 1.24725341796875, 1.307952880859375, 1.36865234375, 1.429351806640625, 1.49005126953125, 1.550750732421875, 1.6114501953125, 1.672149658203125, 1.73284912109375, 1.793548583984375, 1.854248046875, 1.914947509765625, 1.97564697265625, 2.036346435546875, 2.0970458984375, 2.157745361328125, 2.21844482421875, 2.279144287109375, 2.33984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 11.0, 5.0, 12.0, 28.0, 52.0, 105.0, 171.0, 208.0, 179.0, 119.0, 45.0, 17.0, 9.0, 7.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019664764404296875, -0.001839965581893921, -0.0017134547233581543, -0.0015869438648223877, -0.001460433006286621, -0.0013339221477508545, -0.0012074112892150879, -0.0010809004306793213, -0.0009543895721435547, -0.0008278787136077881, -0.0007013678550720215, -0.0005748569965362549, -0.0004483461380004883, -0.0003218352794647217, -0.00019532442092895508, -6.881356239318848e-05, 5.7697296142578125e-05, 0.00018420815467834473, 0.00031071901321411133, 0.00043722987174987793, 0.0005637407302856445, 0.0006902515888214111, 0.0008167624473571777, 0.0009432733058929443, 0.001069784164428711, 0.0011962950229644775, 0.0013228058815002441, 0.0014493167400360107, 0.0015758275985717773, 0.001702338457107544, 0.0018288493156433105, 0.001955360174179077, 0.0020818710327148438, 0.0022083818912506104, 0.002334892749786377, 0.0024614036083221436, 0.00258791446685791, 0.0027144253253936768, 0.0028409361839294434, 0.00296744704246521, 0.0030939579010009766, 0.003220468759536743, 0.0033469796180725098, 0.0034734904766082764, 0.003600001335144043, 0.0037265121936798096, 0.003853023052215576, 0.003979533910751343, 0.004106044769287109, 0.004232555627822876, 0.004359066486358643, 0.004485577344894409, 0.004612088203430176, 0.004738599061965942, 0.004865109920501709, 0.004991620779037476, 0.005118131637573242, 0.005244642496109009, 0.005371153354644775, 0.005497664213180542, 0.005624175071716309, 0.005750685930252075, 0.005877196788787842, 0.006003707647323608, 0.006130218505859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 11.0, 10.0, 19.0, 46.0, 73.0, 167.0, 976.0, 4191515.0, 1085.0, 187.0, 100.0, 45.0, 23.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33203125, -1.3033905029296875, -1.274749755859375, -1.2461090087890625, -1.21746826171875, -1.1888275146484375, -1.160186767578125, -1.1315460205078125, -1.1029052734375, -1.0742645263671875, -1.045623779296875, -1.0169830322265625, -0.98834228515625, -0.9597015380859375, -0.931060791015625, -0.9024200439453125, -0.873779296875, -0.8451385498046875, -0.816497802734375, -0.7878570556640625, -0.75921630859375, -0.7305755615234375, -0.701934814453125, -0.6732940673828125, -0.6446533203125, -0.6160125732421875, -0.587371826171875, -0.5587310791015625, -0.53009033203125, -0.5014495849609375, -0.472808837890625, -0.4441680908203125, -0.41552734375, -0.3868865966796875, -0.358245849609375, -0.3296051025390625, -0.30096435546875, -0.2723236083984375, -0.243682861328125, -0.2150421142578125, -0.1864013671875, -0.1577606201171875, -0.129119873046875, -0.1004791259765625, -0.07183837890625, -0.0431976318359375, -0.014556884765625, 0.0140838623046875, 0.042724609375, 0.0713653564453125, 0.100006103515625, 0.1286468505859375, 0.15728759765625, 0.1859283447265625, 0.214569091796875, 0.2432098388671875, 0.2718505859375, 0.3004913330078125, 0.329132080078125, 0.3577728271484375, 0.38641357421875, 0.4150543212890625, 0.443695068359375, 0.4723358154296875, 0.5009765625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 8.0, 9.0, 9.0, 22.0, 54.0, 68.0, 184.0, 398.0, 2133.0, 667.0, 252.0, 113.0, 67.0, 31.0, 21.0, 13.0, 9.0, 4.0, 5.0, 0.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01451873779296875, -0.014143943786621094, -0.013769149780273438, -0.013394355773925781, -0.013019561767578125, -0.012644767761230469, -0.012269973754882812, -0.011895179748535156, -0.0115203857421875, -0.011145591735839844, -0.010770797729492188, -0.010396003723144531, -0.010021209716796875, -0.009646415710449219, -0.009271621704101562, -0.008896827697753906, -0.00852203369140625, -0.008147239685058594, -0.0077724456787109375, -0.007397651672363281, -0.007022857666015625, -0.006648063659667969, -0.0062732696533203125, -0.005898475646972656, -0.005523681640625, -0.005148887634277344, -0.0047740936279296875, -0.004399299621582031, -0.004024505615234375, -0.0036497116088867188, -0.0032749176025390625, -0.0029001235961914062, -0.00252532958984375, -0.0021505355834960938, -0.0017757415771484375, -0.0014009475708007812, -0.001026153564453125, -0.0006513595581054688, -0.0002765655517578125, 9.822845458984375e-05, 0.0004730224609375, 0.0008478164672851562, 0.0012226104736328125, 0.0015974044799804688, 0.001972198486328125, 0.0023469924926757812, 0.0027217864990234375, 0.0030965805053710938, 0.00347137451171875, 0.0038461685180664062, 0.0042209625244140625, 0.004595756530761719, 0.004970550537109375, 0.005345344543457031, 0.0057201385498046875, 0.006094932556152344, 0.0064697265625, 0.006844520568847656, 0.0072193145751953125, 0.007594108581542969, 0.007968902587890625, 0.008343696594238281, 0.008718490600585938, 0.009093284606933594, 0.00946807861328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 29.0, 989.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.1909985542297363, -3.1370694637298584, -3.0831403732299805, -3.0292112827301025, -2.9752821922302246, -2.9213531017303467, -2.8674240112304688, -2.8134946823120117, -2.759565591812134, -2.705636501312256, -2.651707410812378, -2.5977783203125, -2.543849229812622, -2.489920139312744, -2.435990810394287, -2.3820619583129883, -2.3281328678131104, -2.2742037773132324, -2.2202746868133545, -2.1663455963134766, -2.1124165058135986, -2.0584874153137207, -2.0045580863952637, -1.9506291151046753, -1.8966999053955078, -1.8427708148956299, -1.788841724395752, -1.734912633895874, -1.6809834241867065, -1.6270543336868286, -1.5731252431869507, -1.5191961526870728, -1.4652670621871948, -1.411337971687317, -1.357408881187439, -1.3034796714782715, -1.2495505809783936, -1.1956214904785156, -1.1416923999786377, -1.0877633094787598, -1.0338342189788818, -0.9799051284790039, -0.9259759783744812, -0.8720468878746033, -0.8181177973747253, -0.7641886472702026, -0.7102595567703247, -0.6563304662704468, -0.6024013757705688, -0.5484722852706909, -0.4945431649684906, -0.4406140446662903, -0.38668495416641235, -0.33275583386421204, -0.2788267135620117, -0.2248976230621338, -0.17096847295761108, -0.11703936755657196, -0.06311025470495224, -0.00918114185333252, 0.044747963547706604, 0.09867706894874573, 0.15260618925094604, 0.20653527975082397, 0.2604644000530243]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 12.0, 14.0, 40.0, 63.0, 146.0, 176.0, 196.0, 160.0, 104.0, 54.0, 23.0, 18.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.29174840450286865, -0.2863435745239258, -0.2809387743473053, -0.2755339741706848, -0.27012914419174194, -0.2647243142127991, -0.2593195140361786, -0.2539147138595581, -0.24850988388061523, -0.24310506880283356, -0.23770025372505188, -0.2322954386472702, -0.22689062356948853, -0.22148580849170685, -0.21608099341392517, -0.2106761783361435, -0.20527136325836182, -0.19986654818058014, -0.19446173310279846, -0.18905691802501678, -0.1836521029472351, -0.17824728786945343, -0.17284247279167175, -0.16743765771389008, -0.1620328426361084, -0.15662802755832672, -0.15122321248054504, -0.14581839740276337, -0.1404135823249817, -0.1350087672472, -0.12960395216941833, -0.12419913709163666, -0.11879432201385498, -0.1133895069360733, -0.10798469185829163, -0.10257987678050995, -0.09717506170272827, -0.0917702466249466, -0.08636543154716492, -0.08096061646938324, -0.07555580139160156, -0.07015098631381989, -0.06474617123603821, -0.05934135615825653, -0.053936541080474854, -0.048531726002693176, -0.0431269109249115, -0.03772209584712982, -0.032317280769348145, -0.026912465691566467, -0.02150765061378479, -0.016102835536003113, -0.010698020458221436, -0.005293205380439758, 0.00011160969734191895, 0.005516424775123596, 0.010921239852905273, 0.01632605493068695, 0.021730870008468628, 0.027135685086250305, 0.03254050016403198, 0.03794531524181366, 0.04335013031959534, 0.048754945397377014, 0.05415976047515869]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 11.0, 11.0, 15.0, 20.0, 30.0, 24.0, 45.0, 30.0, 50.0, 38.0, 50.0, 62.0, 329.0, 477158.0, 569928.0, 339.0, 59.0, 62.0, 55.0, 40.0, 29.0, 27.0, 23.0, 16.0, 16.0, 16.0, 10.0, 9.0, 5.0, 3.0, 4.0, 5.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.214111328125, -0.20672988891601562, -0.19934844970703125, -0.19196701049804688, -0.1845855712890625, -0.17720413208007812, -0.16982269287109375, -0.16244125366210938, -0.155059814453125, -0.14767837524414062, -0.14029693603515625, -0.13291549682617188, -0.1255340576171875, -0.11815261840820312, -0.11077117919921875, -0.10338973999023438, -0.09600830078125, -0.08862686157226562, -0.08124542236328125, -0.07386398315429688, -0.0664825439453125, -0.059101104736328125, -0.05171966552734375, -0.044338226318359375, -0.036956787109375, -0.029575347900390625, -0.02219390869140625, -0.014812469482421875, -0.0074310302734375, -4.9591064453125e-05, 0.00733184814453125, 0.014713287353515625, 0.0220947265625, 0.029476165771484375, 0.03685760498046875, 0.044239044189453125, 0.0516204833984375, 0.059001922607421875, 0.06638336181640625, 0.07376480102539062, 0.081146240234375, 0.08852767944335938, 0.09590911865234375, 0.10329055786132812, 0.1106719970703125, 0.11805343627929688, 0.12543487548828125, 0.13281631469726562, 0.14019775390625, 0.14757919311523438, 0.15496063232421875, 0.16234207153320312, 0.1697235107421875, 0.17710494995117188, 0.18448638916015625, 0.19186782836914062, 0.199249267578125, 0.20663070678710938, 0.21401214599609375, 0.22139358520507812, 0.2287750244140625, 0.23615646362304688, 0.24353790283203125, 0.2509193420410156, 0.25830078125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 84.0, 485.0, 369.0, 65.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.061767578125, -0.06069976091384888, -0.059631943702697754, -0.05856412649154663, -0.05749630928039551, -0.056428492069244385, -0.05536067485809326, -0.05429285764694214, -0.053225040435791016, -0.05215722322463989, -0.05108940601348877, -0.050021588802337646, -0.04895377159118652, -0.0478859543800354, -0.04681813716888428, -0.045750319957733154, -0.04468250274658203, -0.04361468553543091, -0.042546868324279785, -0.04147905111312866, -0.04041123390197754, -0.039343416690826416, -0.03827559947967529, -0.03720778226852417, -0.03613996505737305, -0.035072147846221924, -0.0340043306350708, -0.03293651342391968, -0.031868696212768555, -0.03080087900161743, -0.02973306179046631, -0.028665244579315186, -0.027597427368164062, -0.02652961015701294, -0.025461792945861816, -0.024393975734710693, -0.02332615852355957, -0.022258341312408447, -0.021190524101257324, -0.0201227068901062, -0.019054889678955078, -0.017987072467803955, -0.016919255256652832, -0.01585143804550171, -0.014783620834350586, -0.013715803623199463, -0.01264798641204834, -0.011580169200897217, -0.010512351989746094, -0.00944453477859497, -0.008376717567443848, -0.007308900356292725, -0.0062410831451416016, -0.0051732659339904785, -0.0041054487228393555, -0.0030376315116882324, -0.0019698143005371094, -0.0009019970893859863, 0.00016582012176513672, 0.0012336373329162598, 0.002301454544067383, 0.003369271755218506, 0.004437088966369629, 0.005504906177520752, 0.006572723388671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 5.0, 6.0, 9.0, 14.0, 10.0, 10.0, 19.0, 18.0, 37.0, 52.0, 69.0, 112.0, 212.0, 468.0, 1888.0, 33472.0, 974300.0, 34796.0, 1997.0, 455.0, 206.0, 117.0, 74.0, 54.0, 32.0, 48.0, 15.0, 9.0, 11.0, 7.0, 5.0, 9.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1279296875, -0.12359428405761719, -0.11925888061523438, -0.11492347717285156, -0.11058807373046875, -0.10625267028808594, -0.10191726684570312, -0.09758186340332031, -0.0932464599609375, -0.08891105651855469, -0.08457565307617188, -0.08024024963378906, -0.07590484619140625, -0.07156944274902344, -0.06723403930664062, -0.06289863586425781, -0.058563232421875, -0.05422782897949219, -0.049892425537109375, -0.04555702209472656, -0.04122161865234375, -0.03688621520996094, -0.032550811767578125, -0.028215408325195312, -0.0238800048828125, -0.019544601440429688, -0.015209197998046875, -0.010873794555664062, -0.00653839111328125, -0.0022029876708984375, 0.002132415771484375, 0.0064678192138671875, 0.01080322265625, 0.015138626098632812, 0.019474029541015625, 0.023809432983398438, 0.02814483642578125, 0.03248023986816406, 0.036815643310546875, 0.04115104675292969, 0.0454864501953125, 0.04982185363769531, 0.054157257080078125, 0.05849266052246094, 0.06282806396484375, 0.06716346740722656, 0.07149887084960938, 0.07583427429199219, 0.080169677734375, 0.08450508117675781, 0.08884048461914062, 0.09317588806152344, 0.09751129150390625, 0.10184669494628906, 0.10618209838867188, 0.11051750183105469, 0.1148529052734375, 0.11918830871582031, 0.12352371215820312, 0.12785911560058594, 0.13219451904296875, 0.13652992248535156, 0.14086532592773438, 0.1452007293701172, 0.1495361328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 13.0, 17.0, 16.0, 13.0, 17.0, 22.0, 35.0, 43.0, 49.0, 58.0, 64.0, 63.0, 69.0, 58.0, 64.0, 68.0, 53.0, 45.0, 51.0, 34.0, 38.0, 20.0, 12.0, 13.0, 10.0, 13.0, 6.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038665771484375, -0.03717327117919922, -0.03568077087402344, -0.034188270568847656, -0.032695770263671875, -0.031203269958496094, -0.029710769653320312, -0.02821826934814453, -0.02672576904296875, -0.02523326873779297, -0.023740768432617188, -0.022248268127441406, -0.020755767822265625, -0.019263267517089844, -0.017770767211914062, -0.01627826690673828, -0.0147857666015625, -0.013293266296386719, -0.011800765991210938, -0.010308265686035156, -0.008815765380859375, -0.007323265075683594, -0.0058307647705078125, -0.004338264465332031, -0.00284576416015625, -0.0013532638549804688, 0.0001392364501953125, 0.0016317367553710938, 0.003124237060546875, 0.004616737365722656, 0.0061092376708984375, 0.007601737976074219, 0.00909423828125, 0.010586738586425781, 0.012079238891601562, 0.013571739196777344, 0.015064239501953125, 0.016556739807128906, 0.018049240112304688, 0.01954174041748047, 0.02103424072265625, 0.02252674102783203, 0.024019241333007812, 0.025511741638183594, 0.027004241943359375, 0.028496742248535156, 0.029989242553710938, 0.03148174285888672, 0.0329742431640625, 0.03446674346923828, 0.03595924377441406, 0.037451744079589844, 0.038944244384765625, 0.040436744689941406, 0.04192924499511719, 0.04342174530029297, 0.04491424560546875, 0.04640674591064453, 0.04789924621582031, 0.049391746520996094, 0.050884246826171875, 0.052376747131347656, 0.05386924743652344, 0.05536174774169922, 0.056854248046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 9.0, 20.0, 18.0, 23.0, 34.0, 55.0, 150.0, 343.0, 1832.0, 44282.0, 994770.0, 5744.0, 762.0, 234.0, 79.0, 54.0, 38.0, 18.0, 16.0, 13.0, 5.0, 7.0, 6.0, 4.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1590576171875, -0.15379905700683594, -0.14854049682617188, -0.1432819366455078, -0.13802337646484375, -0.1327648162841797, -0.12750625610351562, -0.12224769592285156, -0.1169891357421875, -0.11173057556152344, -0.10647201538085938, -0.10121345520019531, -0.09595489501953125, -0.09069633483886719, -0.08543777465820312, -0.08017921447753906, -0.074920654296875, -0.06966209411621094, -0.06440353393554688, -0.05914497375488281, -0.05388641357421875, -0.04862785339355469, -0.043369293212890625, -0.03811073303222656, -0.0328521728515625, -0.027593612670898438, -0.022335052490234375, -0.017076492309570312, -0.01181793212890625, -0.0065593719482421875, -0.001300811767578125, 0.0039577484130859375, 0.00921630859375, 0.014474868774414062, 0.019733428955078125, 0.024991989135742188, 0.03025054931640625, 0.03550910949707031, 0.040767669677734375, 0.04602622985839844, 0.0512847900390625, 0.05654335021972656, 0.061801910400390625, 0.06706047058105469, 0.07231903076171875, 0.07757759094238281, 0.08283615112304688, 0.08809471130371094, 0.093353271484375, 0.09861183166503906, 0.10387039184570312, 0.10912895202636719, 0.11438751220703125, 0.11964607238769531, 0.12490463256835938, 0.13016319274902344, 0.1354217529296875, 0.14068031311035156, 0.14593887329101562, 0.1511974334716797, 0.15645599365234375, 0.1617145538330078, 0.16697311401367188, 0.17223167419433594, 0.177490234375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 6.0, 15.0, 7.0, 14.0, 19.0, 23.0, 42.0, 77.0, 160.0, 216.0, 163.0, 106.0, 42.0, 31.0, 19.0, 9.0, 8.0, 8.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4139881134033203e-05, -2.332311123609543e-05, -2.2506341338157654e-05, -2.168957144021988e-05, -2.0872801542282104e-05, -2.005603164434433e-05, -1.9239261746406555e-05, -1.842249184846878e-05, -1.7605721950531006e-05, -1.678895205259323e-05, -1.5972182154655457e-05, -1.5155412256717682e-05, -1.4338642358779907e-05, -1.3521872460842133e-05, -1.2705102562904358e-05, -1.1888332664966583e-05, -1.1071562767028809e-05, -1.0254792869091034e-05, -9.43802297115326e-06, -8.621253073215485e-06, -7.80448317527771e-06, -6.987713277339935e-06, -6.170943379402161e-06, -5.354173481464386e-06, -4.537403583526611e-06, -3.7206336855888367e-06, -2.903863787651062e-06, -2.0870938897132874e-06, -1.2703239917755127e-06, -4.5355409383773804e-07, 3.632158041000366e-07, 1.1799857020378113e-06, 1.996755599975586e-06, 2.8135254979133606e-06, 3.6302953958511353e-06, 4.44706529378891e-06, 5.2638351917266846e-06, 6.080605089664459e-06, 6.897374987602234e-06, 7.714144885540009e-06, 8.530914783477783e-06, 9.347684681415558e-06, 1.0164454579353333e-05, 1.0981224477291107e-05, 1.1797994375228882e-05, 1.2614764273166656e-05, 1.3431534171104431e-05, 1.4248304069042206e-05, 1.506507396697998e-05, 1.5881843864917755e-05, 1.669861376285553e-05, 1.7515383660793304e-05, 1.833215355873108e-05, 1.9148923456668854e-05, 1.996569335460663e-05, 2.0782463252544403e-05, 2.1599233150482178e-05, 2.2416003048419952e-05, 2.3232772946357727e-05, 2.4049542844295502e-05, 2.4866312742233276e-05, 2.568308264017105e-05, 2.6499852538108826e-05, 2.73166224360466e-05, 2.8133392333984375e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 5.0, 2.0, 6.0, 14.0, 18.0, 22.0, 47.0, 115.0, 296.0, 1800.0, 76930.0, 965120.0, 3385.0, 464.0, 151.0, 73.0, 35.0, 20.0, 12.0, 13.0, 9.0, 3.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29052734375, -0.2817573547363281, -0.27298736572265625, -0.2642173767089844, -0.2554473876953125, -0.24667739868164062, -0.23790740966796875, -0.22913742065429688, -0.220367431640625, -0.21159744262695312, -0.20282745361328125, -0.19405746459960938, -0.1852874755859375, -0.17651748657226562, -0.16774749755859375, -0.15897750854492188, -0.15020751953125, -0.14143753051757812, -0.13266754150390625, -0.12389755249023438, -0.1151275634765625, -0.10635757446289062, -0.09758758544921875, -0.08881759643554688, -0.080047607421875, -0.07127761840820312, -0.06250762939453125, -0.053737640380859375, -0.0449676513671875, -0.036197662353515625, -0.02742767333984375, -0.018657684326171875, -0.0098876953125, -0.001117706298828125, 0.00765228271484375, 0.016422271728515625, 0.0251922607421875, 0.033962249755859375, 0.04273223876953125, 0.051502227783203125, 0.060272216796875, 0.06904220581054688, 0.07781219482421875, 0.08658218383789062, 0.0953521728515625, 0.10412216186523438, 0.11289215087890625, 0.12166213989257812, 0.13043212890625, 0.13920211791992188, 0.14797210693359375, 0.15674209594726562, 0.1655120849609375, 0.17428207397460938, 0.18305206298828125, 0.19182205200195312, 0.200592041015625, 0.20936203002929688, 0.21813201904296875, 0.22690200805664062, 0.2356719970703125, 0.24444198608398438, 0.25321197509765625, 0.2619819641113281, 0.270751953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 2.0, 4.0, 11.0, 8.0, 19.0, 32.0, 99.0, 314.0, 334.0, 82.0, 31.0, 15.0, 11.0, 11.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05743408203125, -0.05456829071044922, -0.05170249938964844, -0.048836708068847656, -0.045970916748046875, -0.043105125427246094, -0.04023933410644531, -0.03737354278564453, -0.03450775146484375, -0.03164196014404297, -0.028776168823242188, -0.025910377502441406, -0.023044586181640625, -0.020178794860839844, -0.017313003540039062, -0.014447212219238281, -0.0115814208984375, -0.008715629577636719, -0.0058498382568359375, -0.0029840469360351562, -0.000118255615234375, 0.0027475357055664062, 0.0056133270263671875, 0.008479118347167969, 0.01134490966796875, 0.014210700988769531, 0.017076492309570312, 0.019942283630371094, 0.022808074951171875, 0.025673866271972656, 0.028539657592773438, 0.03140544891357422, 0.034271240234375, 0.03713703155517578, 0.04000282287597656, 0.042868614196777344, 0.045734405517578125, 0.048600196838378906, 0.05146598815917969, 0.05433177947998047, 0.05719757080078125, 0.06006336212158203, 0.06292915344238281, 0.0657949447631836, 0.06866073608398438, 0.07152652740478516, 0.07439231872558594, 0.07725811004638672, 0.0801239013671875, 0.08298969268798828, 0.08585548400878906, 0.08872127532958984, 0.09158706665039062, 0.0944528579711914, 0.09731864929199219, 0.10018444061279297, 0.10305023193359375, 0.10591602325439453, 0.10878181457519531, 0.1116476058959961, 0.11451339721679688, 0.11737918853759766, 0.12024497985839844, 0.12311077117919922, 0.1259765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 753.0, 253.0, 5.0, 3.0, 1.0], "bins": [-7.7874979972839355, -7.657405853271484, -7.527313709259033, -7.397221088409424, -7.267128944396973, -7.1370368003845215, -7.00694465637207, -6.876852512359619, -6.746760368347168, -6.616668224334717, -6.486576080322266, -6.356483459472656, -6.226391315460205, -6.096299171447754, -5.966207027435303, -5.836114883422852, -5.706022262573242, -5.575930118560791, -5.44583797454834, -5.3157453536987305, -5.185653209686279, -5.055561065673828, -4.925468921661377, -4.795376777648926, -4.665284156799316, -4.535192012786865, -4.405099868774414, -4.275007247924805, -4.1449151039123535, -4.014822959899902, -3.884730815887451, -3.754638671875, -3.624547004699707, -3.494454860687256, -3.3643624782562256, -3.2342703342437744, -3.104177951812744, -2.974085807800293, -2.843993663787842, -2.7139015197753906, -2.5838091373443604, -2.453716993331909, -2.323624610900879, -2.1935324668884277, -2.0634403228759766, -1.9333479404449463, -1.8032557964324951, -1.6731635332107544, -1.5430712699890137, -1.412979006767273, -1.2828867435455322, -1.152794599533081, -1.0227023363113403, -0.8926100730895996, -0.7625178694725037, -0.6324256658554077, -0.5023333430290222, -0.3722411096096039, -0.24214887619018555, -0.11205664277076721, 0.018035590648651123, 0.14812785387039185, 0.2782200574874878, 0.40831226110458374, 0.5384045243263245]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 15.0, 25.0, 35.0, 55.0, 69.0, 95.0, 113.0, 122.0, 104.0, 108.0, 86.0, 57.0, 44.0, 34.0, 23.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9329677224159241, -0.9136562943458557, -0.8943448066711426, -0.8750333786010742, -0.8557219505310059, -0.8364104628562927, -0.8170990347862244, -0.7977875471115112, -0.7784761190414429, -0.7591646909713745, -0.7398532032966614, -0.720541775226593, -0.7012302875518799, -0.6819188594818115, -0.6626074314117432, -0.6432960033416748, -0.6239845156669617, -0.6046730875968933, -0.5853615999221802, -0.5660501718521118, -0.5467387437820435, -0.5274272561073303, -0.508115828037262, -0.4888043701648712, -0.46949291229248047, -0.4501814544200897, -0.430869996547699, -0.4115585684776306, -0.39224711060523987, -0.3729356527328491, -0.35362422466278076, -0.33431276679039, -0.31500130891799927, -0.2956898510456085, -0.2763783931732178, -0.2570669651031494, -0.23775550723075867, -0.21844404935836792, -0.19913260638713837, -0.1798211634159088, -0.16050970554351807, -0.14119824767112732, -0.12188680469989777, -0.10257535427808762, -0.08326390385627747, -0.06395245343446732, -0.044641003012657166, -0.025329560041427612, -0.006018102169036865, 0.013293348252773285, 0.032604798674583435, 0.051916249096393585, 0.07122769951820374, 0.09053914994001389, 0.10985060036182404, 0.1291620433330536, 0.14847350120544434, 0.16778495907783508, 0.18709640204906464, 0.2064078450202942, 0.22571930289268494, 0.24503076076507568, 0.26434218883514404, 0.2836536467075348, 0.30296510457992554]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 19.0, 62.0, 137.0, 558.0, 4109777.0, 83426.0, 261.0, 35.0, 8.0, 3.0, 1.0, 1.0], "bins": [-2.09375, -2.0569839477539062, -2.0202178955078125, -1.9834518432617188, -1.946685791015625, -1.9099197387695312, -1.8731536865234375, -1.8363876342773438, -1.79962158203125, -1.7628555297851562, -1.7260894775390625, -1.6893234252929688, -1.652557373046875, -1.6157913208007812, -1.5790252685546875, -1.5422592163085938, -1.5054931640625, -1.4687271118164062, -1.4319610595703125, -1.3951950073242188, -1.358428955078125, -1.3216629028320312, -1.2848968505859375, -1.2481307983398438, -1.21136474609375, -1.1745986938476562, -1.1378326416015625, -1.1010665893554688, -1.064300537109375, -1.0275344848632812, -0.9907684326171875, -0.9540023803710938, -0.917236328125, -0.8804702758789062, -0.8437042236328125, -0.8069381713867188, -0.770172119140625, -0.7334060668945312, -0.6966400146484375, -0.6598739624023438, -0.62310791015625, -0.5863418579101562, -0.5495758056640625, -0.5128097534179688, -0.476043701171875, -0.43927764892578125, -0.4025115966796875, -0.36574554443359375, -0.3289794921875, -0.29221343994140625, -0.2554473876953125, -0.21868133544921875, -0.181915283203125, -0.14514923095703125, -0.1083831787109375, -0.07161712646484375, -0.03485107421875, 0.00191497802734375, 0.0386810302734375, 0.07544708251953125, 0.112213134765625, 0.14897918701171875, 0.1857452392578125, 0.22251129150390625, 0.25927734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 15.0, 63.0, 236.0, 385.0, 218.0, 87.0, 10.0, 4.0, 0.0, 1.0], "bins": [-0.06884765625, -0.06764960289001465, -0.0664515495300293, -0.06525349617004395, -0.0640554428100586, -0.06285738945007324, -0.06165933609008789, -0.06046128273010254, -0.05926322937011719, -0.058065176010131836, -0.056867122650146484, -0.05566906929016113, -0.05447101593017578, -0.05327296257019043, -0.05207490921020508, -0.05087685585021973, -0.049678802490234375, -0.04848074913024902, -0.04728269577026367, -0.04608464241027832, -0.04488658905029297, -0.04368853569030762, -0.042490482330322266, -0.041292428970336914, -0.04009437561035156, -0.03889632225036621, -0.03769826889038086, -0.03650021553039551, -0.035302162170410156, -0.034104108810424805, -0.03290605545043945, -0.0317080020904541, -0.03050994873046875, -0.0293118953704834, -0.028113842010498047, -0.026915788650512695, -0.025717735290527344, -0.024519681930541992, -0.02332162857055664, -0.02212357521057129, -0.020925521850585938, -0.019727468490600586, -0.018529415130615234, -0.017331361770629883, -0.01613330841064453, -0.01493525505065918, -0.013737201690673828, -0.012539148330688477, -0.011341094970703125, -0.010143041610717773, -0.008944988250732422, -0.00774693489074707, -0.006548881530761719, -0.005350828170776367, -0.004152774810791016, -0.002954721450805664, -0.0017566680908203125, -0.0005586147308349609, 0.0006394386291503906, 0.0018374919891357422, 0.0030355453491210938, 0.004233598709106445, 0.005431652069091797, 0.0066297054290771484, 0.0078277587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 19.0, 55.0, 107.0, 171.0, 265.0, 446.0, 4189889.0, 2756.0, 348.0, 123.0, 66.0, 24.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.560546875, -2.499267578125, -2.43798828125, -2.376708984375, -2.3154296875, -2.254150390625, -2.19287109375, -2.131591796875, -2.0703125, -2.009033203125, -1.94775390625, -1.886474609375, -1.8251953125, -1.763916015625, -1.70263671875, -1.641357421875, -1.580078125, -1.518798828125, -1.45751953125, -1.396240234375, -1.3349609375, -1.273681640625, -1.21240234375, -1.151123046875, -1.08984375, -1.028564453125, -0.96728515625, -0.906005859375, -0.8447265625, -0.783447265625, -0.72216796875, -0.660888671875, -0.599609375, -0.538330078125, -0.47705078125, -0.415771484375, -0.3544921875, -0.293212890625, -0.23193359375, -0.170654296875, -0.109375, -0.048095703125, 0.01318359375, 0.074462890625, 0.1357421875, 0.197021484375, 0.25830078125, 0.319580078125, 0.380859375, 0.442138671875, 0.50341796875, 0.564697265625, 0.6259765625, 0.687255859375, 0.74853515625, 0.809814453125, 0.87109375, 0.932373046875, 0.99365234375, 1.054931640625, 1.1162109375, 1.177490234375, 1.23876953125, 1.300048828125, 1.361328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 19.0, 3827.0, 217.0, 21.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366455078125, -0.3589305877685547, -0.3514060974121094, -0.34388160705566406, -0.33635711669921875, -0.32883262634277344, -0.3213081359863281, -0.3137836456298828, -0.3062591552734375, -0.2987346649169922, -0.2912101745605469, -0.28368568420410156, -0.27616119384765625, -0.26863670349121094, -0.2611122131347656, -0.2535877227783203, -0.246063232421875, -0.2385387420654297, -0.23101425170898438, -0.22348976135253906, -0.21596527099609375, -0.20844078063964844, -0.20091629028320312, -0.1933917999267578, -0.1858673095703125, -0.1783428192138672, -0.17081832885742188, -0.16329383850097656, -0.15576934814453125, -0.14824485778808594, -0.14072036743164062, -0.1331958770751953, -0.12567138671875, -0.11814689636230469, -0.11062240600585938, -0.10309791564941406, -0.09557342529296875, -0.08804893493652344, -0.08052444458007812, -0.07299995422363281, -0.0654754638671875, -0.05795097351074219, -0.050426483154296875, -0.04290199279785156, -0.03537750244140625, -0.027853012084960938, -0.020328521728515625, -0.012804031372070312, -0.005279541015625, 0.0022449493408203125, 0.009769439697265625, 0.017293930053710938, 0.02481842041015625, 0.03234291076660156, 0.039867401123046875, 0.04739189147949219, 0.0549163818359375, 0.06244087219238281, 0.06996536254882812, 0.07748985290527344, 0.08501434326171875, 0.09253883361816406, 0.10006332397460938, 0.10758781433105469, 0.1151123046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 62.0, 910.0, 36.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.599719524383545, -4.4937334060668945, -4.387746810913086, -4.2817606925964355, -4.175774097442627, -4.069787979125977, -3.963801383972168, -3.8578152656555176, -3.751828908920288, -3.6458425521850586, -3.539856195449829, -3.4338698387145996, -3.32788348197937, -3.2218971252441406, -3.1159110069274902, -3.0099246501922607, -2.9039382934570312, -2.7979519367218018, -2.6919655799865723, -2.5859792232513428, -2.4799928665161133, -2.374006748199463, -2.2680201530456543, -2.162034034729004, -2.0560474395751953, -1.9500610828399658, -1.8440747261047363, -1.7380883693695068, -1.632102131843567, -1.5261157751083374, -1.420129418373108, -1.314143180847168, -1.2081568241119385, -1.102170467376709, -0.9961841702461243, -0.8901978135108948, -0.7842115163803101, -0.6782251596450806, -0.5722388029098511, -0.46625250577926636, -0.36026614904403687, -0.25427982211112976, -0.14829348027706146, -0.042307138442993164, 0.06367918848991394, 0.16966551542282104, 0.27565187215805054, 0.38163816928863525, 0.48762452602386475, 0.5936108827590942, 0.699597179889679, 0.8055835366249084, 0.9115698337554932, 1.0175561904907227, 1.1235425472259521, 1.2295289039611816, 1.3355152606964111, 1.4415016174316406, 1.5474879741668701, 1.6534743309020996, 1.7594605684280396, 1.865446925163269, 1.9714332818984985, 2.0774195194244385, 2.183405876159668]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 23.0, 27.0, 56.0, 112.0, 145.0, 153.0, 170.0, 105.0, 83.0, 69.0, 32.0, 5.0, 11.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943914890289307, -1.155416488647461, -1.1164414882659912, -1.077466368675232, -1.0384913682937622, -0.9995163679122925, -0.9605413675308228, -0.9215663075447083, -0.8825912475585938, -0.843616247177124, -0.8046411871910095, -0.7656661868095398, -0.7266911268234253, -0.6877161264419556, -0.6487411260604858, -0.6097660660743713, -0.5707910656929016, -0.5318160653114319, -0.4928410053253174, -0.45386600494384766, -0.41489094495773315, -0.3759159445762634, -0.3369409143924713, -0.2979658842086792, -0.2589908540248871, -0.22001582384109497, -0.18104079365730286, -0.14206577837467194, -0.10309074819087982, -0.06411571800708771, -0.025140702724456787, 0.013834327459335327, 0.05280935764312744, 0.09178438782691956, 0.13075941801071167, 0.1697344332933426, 0.2087094634771347, 0.24768449366092682, 0.28665950894355774, 0.32563453912734985, 0.36460956931114197, 0.4035845994949341, 0.4425596296787262, 0.4815346598625183, 0.520509660243988, 0.5594847202301025, 0.5984597206115723, 0.637434720993042, 0.6764097809791565, 0.7153847813606262, 0.7543598413467407, 0.7933348417282104, 0.832309901714325, 0.8712849020957947, 0.9102599620819092, 0.9492349624633789, 0.9882099628448486, 1.0271849632263184, 1.066159963607788, 1.1051350831985474, 1.144110083580017, 1.1830850839614868, 1.2220600843429565, 1.2610352039337158, 1.3000102043151855]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 13.0, 18.0, 29.0, 42.0, 69.0, 117.0, 330.0, 1255.0, 9866.0, 967527.0, 65575.0, 2699.0, 599.0, 186.0, 77.0, 53.0, 30.0, 26.0, 12.0, 4.0, 5.0, 7.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.489501953125, -0.4740715026855469, -0.45864105224609375, -0.4432106018066406, -0.4277801513671875, -0.4123497009277344, -0.39691925048828125, -0.3814888000488281, -0.366058349609375, -0.3506278991699219, -0.33519744873046875, -0.3197669982910156, -0.3043365478515625, -0.2889060974121094, -0.27347564697265625, -0.2580451965332031, -0.24261474609375, -0.22718429565429688, -0.21175384521484375, -0.19632339477539062, -0.1808929443359375, -0.16546249389648438, -0.15003204345703125, -0.13460159301757812, -0.119171142578125, -0.10374069213867188, -0.08831024169921875, -0.07287979125976562, -0.0574493408203125, -0.042018890380859375, -0.02658843994140625, -0.011157989501953125, 0.0042724609375, 0.019702911376953125, 0.03513336181640625, 0.050563812255859375, 0.0659942626953125, 0.08142471313476562, 0.09685516357421875, 0.11228561401367188, 0.127716064453125, 0.14314651489257812, 0.15857696533203125, 0.17400741577148438, 0.1894378662109375, 0.20486831665039062, 0.22029876708984375, 0.23572921752929688, 0.25115966796875, 0.2665901184082031, 0.28202056884765625, 0.2974510192871094, 0.3128814697265625, 0.3283119201660156, 0.34374237060546875, 0.3591728210449219, 0.374603271484375, 0.3900337219238281, 0.40546417236328125, 0.4208946228027344, 0.4363250732421875, 0.4517555236816406, 0.46718597412109375, 0.4826164245605469, 0.498046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 10.0, 33.0, 44.0, 114.0, 150.0, 202.0, 166.0, 122.0, 90.0, 39.0, 25.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09674072265625, -0.0947122573852539, -0.09268379211425781, -0.09065532684326172, -0.08862686157226562, -0.08659839630126953, -0.08456993103027344, -0.08254146575927734, -0.08051300048828125, -0.07848453521728516, -0.07645606994628906, -0.07442760467529297, -0.07239913940429688, -0.07037067413330078, -0.06834220886230469, -0.0663137435913086, -0.0642852783203125, -0.062256813049316406, -0.06022834777832031, -0.05819988250732422, -0.056171417236328125, -0.05414295196533203, -0.05211448669433594, -0.050086021423339844, -0.04805755615234375, -0.046029090881347656, -0.04400062561035156, -0.04197216033935547, -0.039943695068359375, -0.03791522979736328, -0.03588676452636719, -0.033858299255371094, -0.031829833984375, -0.029801368713378906, -0.027772903442382812, -0.02574443817138672, -0.023715972900390625, -0.02168750762939453, -0.019659042358398438, -0.017630577087402344, -0.01560211181640625, -0.013573646545410156, -0.011545181274414062, -0.009516716003417969, -0.007488250732421875, -0.005459785461425781, -0.0034313201904296875, -0.0014028549194335938, 0.0006256103515625, 0.0026540756225585938, 0.0046825408935546875, 0.006711006164550781, 0.008739471435546875, 0.010767936706542969, 0.012796401977539062, 0.014824867248535156, 0.01685333251953125, 0.018881797790527344, 0.020910263061523438, 0.02293872833251953, 0.024967193603515625, 0.02699565887451172, 0.029024124145507812, 0.031052589416503906, 0.0330810546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 8.0, 8.0, 12.0, 16.0, 15.0, 29.0, 34.0, 41.0, 65.0, 121.0, 254.0, 706.0, 5342.0, 809154.0, 228728.0, 2927.0, 505.0, 225.0, 114.0, 64.0, 44.0, 34.0, 29.0, 15.0, 11.0, 9.0, 11.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32275390625, -0.313232421875, -0.3037109375, -0.294189453125, -0.28466796875, -0.275146484375, -0.265625, -0.256103515625, -0.24658203125, -0.237060546875, -0.2275390625, -0.218017578125, -0.20849609375, -0.198974609375, -0.189453125, -0.179931640625, -0.17041015625, -0.160888671875, -0.1513671875, -0.141845703125, -0.13232421875, -0.122802734375, -0.11328125, -0.103759765625, -0.09423828125, -0.084716796875, -0.0751953125, -0.065673828125, -0.05615234375, -0.046630859375, -0.037109375, -0.027587890625, -0.01806640625, -0.008544921875, 0.0009765625, 0.010498046875, 0.02001953125, 0.029541015625, 0.0390625, 0.048583984375, 0.05810546875, 0.067626953125, 0.0771484375, 0.086669921875, 0.09619140625, 0.105712890625, 0.115234375, 0.124755859375, 0.13427734375, 0.143798828125, 0.1533203125, 0.162841796875, 0.17236328125, 0.181884765625, 0.19140625, 0.200927734375, 0.21044921875, 0.219970703125, 0.2294921875, 0.239013671875, 0.24853515625, 0.258056640625, 0.267578125, 0.277099609375, 0.28662109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 9.0, 10.0, 11.0, 11.0, 18.0, 21.0, 38.0, 35.0, 30.0, 40.0, 43.0, 53.0, 61.0, 62.0, 67.0, 58.0, 55.0, 58.0, 50.0, 42.0, 43.0, 32.0, 33.0, 35.0, 14.0, 16.0, 9.0, 18.0, 7.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11346435546875, -0.11010932922363281, -0.10675430297851562, -0.10339927673339844, -0.10004425048828125, -0.09668922424316406, -0.09333419799804688, -0.08997917175292969, -0.0866241455078125, -0.08326911926269531, -0.07991409301757812, -0.07655906677246094, -0.07320404052734375, -0.06984901428222656, -0.06649398803710938, -0.06313896179199219, -0.059783935546875, -0.05642890930175781, -0.053073883056640625, -0.04971885681152344, -0.04636383056640625, -0.04300880432128906, -0.039653778076171875, -0.03629875183105469, -0.0329437255859375, -0.029588699340820312, -0.026233673095703125, -0.022878646850585938, -0.01952362060546875, -0.016168594360351562, -0.012813568115234375, -0.009458541870117188, -0.006103515625, -0.0027484893798828125, 0.000606536865234375, 0.0039615631103515625, 0.00731658935546875, 0.010671615600585938, 0.014026641845703125, 0.017381668090820312, 0.0207366943359375, 0.024091720581054688, 0.027446746826171875, 0.030801773071289062, 0.03415679931640625, 0.03751182556152344, 0.040866851806640625, 0.04422187805175781, 0.047576904296875, 0.05093193054199219, 0.054286956787109375, 0.05764198303222656, 0.06099700927734375, 0.06435203552246094, 0.06770706176757812, 0.07106208801269531, 0.0744171142578125, 0.07777214050292969, 0.08112716674804688, 0.08448219299316406, 0.08783721923828125, 0.09119224548339844, 0.09454727172851562, 0.09790229797363281, 0.10125732421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 10.0, 11.0, 20.0, 30.0, 45.0, 85.0, 177.0, 340.0, 962.0, 3994.0, 59826.0, 955153.0, 23853.0, 2691.0, 676.0, 304.0, 136.0, 66.0, 49.0, 37.0, 23.0, 17.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.0855569839477539, -0.08218574523925781, -0.07881450653076172, -0.07544326782226562, -0.07207202911376953, -0.06870079040527344, -0.06532955169677734, -0.06195831298828125, -0.058587074279785156, -0.05521583557128906, -0.05184459686279297, -0.048473358154296875, -0.04510211944580078, -0.04173088073730469, -0.038359642028808594, -0.0349884033203125, -0.031617164611816406, -0.028245925903320312, -0.02487468719482422, -0.021503448486328125, -0.01813220977783203, -0.014760971069335938, -0.011389732360839844, -0.00801849365234375, -0.004647254943847656, -0.0012760162353515625, 0.0020952224731445312, 0.005466461181640625, 0.008837699890136719, 0.012208938598632812, 0.015580177307128906, 0.018951416015625, 0.022322654724121094, 0.025693893432617188, 0.02906513214111328, 0.032436370849609375, 0.03580760955810547, 0.03917884826660156, 0.042550086975097656, 0.04592132568359375, 0.049292564392089844, 0.05266380310058594, 0.05603504180908203, 0.059406280517578125, 0.06277751922607422, 0.06614875793457031, 0.0695199966430664, 0.0728912353515625, 0.0762624740600586, 0.07963371276855469, 0.08300495147705078, 0.08637619018554688, 0.08974742889404297, 0.09311866760253906, 0.09648990631103516, 0.09986114501953125, 0.10323238372802734, 0.10660362243652344, 0.10997486114501953, 0.11334609985351562, 0.11671733856201172, 0.12008857727050781, 0.1234598159790039, 0.1268310546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 2.0, 11.0, 8.0, 11.0, 7.0, 15.0, 17.0, 23.0, 39.0, 52.0, 65.0, 73.0, 104.0, 94.0, 93.0, 80.0, 70.0, 49.0, 35.0, 34.0, 24.0, 16.0, 13.0, 11.0, 15.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.2874603271484375e-05, -1.2501142919063568e-05, -1.2127682566642761e-05, -1.1754222214221954e-05, -1.1380761861801147e-05, -1.100730150938034e-05, -1.0633841156959534e-05, -1.0260380804538727e-05, -9.88692045211792e-06, -9.513460099697113e-06, -9.139999747276306e-06, -8.7665393948555e-06, -8.393079042434692e-06, -8.019618690013885e-06, -7.646158337593079e-06, -7.272697985172272e-06, -6.899237632751465e-06, -6.525777280330658e-06, -6.152316927909851e-06, -5.778856575489044e-06, -5.405396223068237e-06, -5.03193587064743e-06, -4.6584755182266235e-06, -4.285015165805817e-06, -3.91155481338501e-06, -3.538094460964203e-06, -3.164634108543396e-06, -2.791173756122589e-06, -2.4177134037017822e-06, -2.0442530512809753e-06, -1.6707926988601685e-06, -1.2973323464393616e-06, -9.238719940185547e-07, -5.504116415977478e-07, -1.7695128917694092e-07, 1.9650906324386597e-07, 5.699694156646729e-07, 9.434297680854797e-07, 1.3168901205062866e-06, 1.6903504729270935e-06, 2.0638108253479004e-06, 2.4372711777687073e-06, 2.810731530189514e-06, 3.184191882610321e-06, 3.557652235031128e-06, 3.931112587451935e-06, 4.304572939872742e-06, 4.678033292293549e-06, 5.0514936447143555e-06, 5.424953997135162e-06, 5.798414349555969e-06, 6.171874701976776e-06, 6.545335054397583e-06, 6.91879540681839e-06, 7.292255759239197e-06, 7.665716111660004e-06, 8.03917646408081e-06, 8.412636816501617e-06, 8.786097168922424e-06, 9.159557521343231e-06, 9.533017873764038e-06, 9.906478226184845e-06, 1.0279938578605652e-05, 1.0653398931026459e-05, 1.1026859283447266e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 16.0, 23.0, 30.0, 83.0, 188.0, 546.0, 2733.0, 310573.0, 729882.0, 3527.0, 604.0, 175.0, 81.0, 36.0, 15.0, 7.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1842041015625, -0.1786327362060547, -0.17306137084960938, -0.16749000549316406, -0.16191864013671875, -0.15634727478027344, -0.15077590942382812, -0.1452045440673828, -0.1396331787109375, -0.1340618133544922, -0.12849044799804688, -0.12291908264160156, -0.11734771728515625, -0.11177635192871094, -0.10620498657226562, -0.10063362121582031, -0.095062255859375, -0.08949089050292969, -0.08391952514648438, -0.07834815979003906, -0.07277679443359375, -0.06720542907714844, -0.061634063720703125, -0.05606269836425781, -0.0504913330078125, -0.04491996765136719, -0.039348602294921875, -0.03377723693847656, -0.02820587158203125, -0.022634506225585938, -0.017063140869140625, -0.011491775512695312, -0.00592041015625, -0.0003490447998046875, 0.005222320556640625, 0.010793685913085938, 0.01636505126953125, 0.021936416625976562, 0.027507781982421875, 0.03307914733886719, 0.0386505126953125, 0.04422187805175781, 0.049793243408203125, 0.05536460876464844, 0.06093597412109375, 0.06650733947753906, 0.07207870483398438, 0.07765007019042969, 0.083221435546875, 0.08879280090332031, 0.09436416625976562, 0.09993553161621094, 0.10550689697265625, 0.11107826232910156, 0.11664962768554688, 0.12222099304199219, 0.1277923583984375, 0.1333637237548828, 0.13893508911132812, 0.14450645446777344, 0.15007781982421875, 0.15564918518066406, 0.16122055053710938, 0.1667919158935547, 0.17236328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 12.0, 21.0, 40.0, 58.0, 106.0, 212.0, 217.0, 149.0, 80.0, 46.0, 25.0, 14.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11199951171875, -0.1092829704284668, -0.1065664291381836, -0.10384988784790039, -0.10113334655761719, -0.09841680526733398, -0.09570026397705078, -0.09298372268676758, -0.09026718139648438, -0.08755064010620117, -0.08483409881591797, -0.08211755752563477, -0.07940101623535156, -0.07668447494506836, -0.07396793365478516, -0.07125139236450195, -0.06853485107421875, -0.06581830978393555, -0.06310176849365234, -0.06038522720336914, -0.05766868591308594, -0.054952144622802734, -0.05223560333251953, -0.04951906204223633, -0.046802520751953125, -0.04408597946166992, -0.04136943817138672, -0.038652896881103516, -0.03593635559082031, -0.03321981430053711, -0.030503273010253906, -0.027786731719970703, -0.0250701904296875, -0.022353649139404297, -0.019637107849121094, -0.01692056655883789, -0.014204025268554688, -0.011487483978271484, -0.008770942687988281, -0.006054401397705078, -0.003337860107421875, -0.0006213188171386719, 0.0020952224731445312, 0.004811763763427734, 0.0075283050537109375, 0.01024484634399414, 0.012961387634277344, 0.015677928924560547, 0.01839447021484375, 0.021111011505126953, 0.023827552795410156, 0.02654409408569336, 0.029260635375976562, 0.031977176666259766, 0.03469371795654297, 0.03741025924682617, 0.040126800537109375, 0.04284334182739258, 0.04555988311767578, 0.048276424407958984, 0.05099296569824219, 0.05370950698852539, 0.056426048278808594, 0.0591425895690918, 0.061859130859375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 8.0, 9.0, 15.0, 44.0, 135.0, 314.0, 261.0, 125.0, 36.0, 26.0, 15.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21256709098815918, -0.19015376269817352, -0.16774044930934906, -0.1453271210193634, -0.12291380017995834, -0.10050047934055328, -0.07808715105056763, -0.055673837661743164, -0.03326050937175751, -0.010847186669707298, 0.01156613603234291, 0.03397946059703827, 0.05639278143644333, 0.07880610227584839, 0.10121943056583405, 0.12363274395465851, 0.14604607224464417, 0.16845940053462982, 0.19087271392345428, 0.21328604221343994, 0.2356993556022644, 0.25811266899108887, 0.2805260121822357, 0.3029393255710602, 0.32535266876220703, 0.3477659821510315, 0.37017932534217834, 0.3925926387310028, 0.41500595211982727, 0.4374192953109741, 0.4598326086997986, 0.48224592208862305, 0.5046592354774475, 0.527072548866272, 0.5494858622550964, 0.5718991756439209, 0.5943125486373901, 0.6167258620262146, 0.6391391754150391, 0.6615524888038635, 0.683965802192688, 0.7063791155815125, 0.7287924289703369, 0.7512058019638062, 0.7736191153526306, 0.7960324287414551, 0.8184457421302795, 0.840859055519104, 0.8632724285125732, 0.8856857419013977, 0.9080990552902222, 0.9305124282836914, 0.9529257416725159, 0.9753390550613403, 0.9977523684501648, 1.0201656818389893, 1.042578935623169, 1.0649923086166382, 1.0874055624008179, 1.109818935394287, 1.1322321891784668, 1.154645562171936, 1.1770589351654053, 1.199472188949585, 1.2218855619430542]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 10.0, 8.0, 12.0, 16.0, 23.0, 23.0, 39.0, 48.0, 47.0, 57.0, 72.0, 60.0, 71.0, 72.0, 73.0, 61.0, 54.0, 52.0, 40.0, 43.0, 26.0, 17.0, 20.0, 21.0, 8.0, 7.0, 8.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8293816447257996, -0.8047731518745422, -0.7801646590232849, -0.7555562257766724, -0.730947732925415, -0.7063392400741577, -0.6817307472229004, -0.6571222543716431, -0.6325137615203857, -0.6079052686691284, -0.5832967758178711, -0.5586882829666138, -0.5340798497200012, -0.5094713568687439, -0.4848628640174866, -0.46025437116622925, -0.4356459379196167, -0.4110374450683594, -0.38642898201942444, -0.3618204891681671, -0.3372120261192322, -0.31260353326797485, -0.28799504041671753, -0.2633865475654602, -0.23877808451652527, -0.21416960656642914, -0.189561128616333, -0.16495263576507568, -0.14034415781497955, -0.11573567986488342, -0.0911271870136261, -0.06651870906352997, -0.04191017150878906, -0.017301689833402634, 0.007306791841983795, 0.03191527724266052, 0.05652375519275665, 0.08113223314285278, 0.10574072599411011, 0.13034920394420624, 0.15495768189430237, 0.1795661598443985, 0.20417463779449463, 0.22878313064575195, 0.2533916234970093, 0.2780000865459442, 0.30260857939720154, 0.3272170424461365, 0.3518255352973938, 0.3764340281486511, 0.40104249119758606, 0.4256509840488434, 0.4502594470977783, 0.47486793994903564, 0.49947643280029297, 0.5240849256515503, 0.5486934185028076, 0.5733019113540649, 0.5979104042053223, 0.6225188970565796, 0.6471273303031921, 0.6717358231544495, 0.6963443160057068, 0.7209528088569641, 0.7455612421035767]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 11.0, 4.0, 21.0, 21.0, 42.0, 52.0, 56.0, 87.0, 153.0, 290.0, 557.0, 1746.0, 9990.0, 785290.0, 3381647.0, 12367.0, 1447.0, 295.0, 99.0, 43.0, 29.0, 9.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.5849609375, -0.5737209320068359, -0.5624809265136719, -0.5512409210205078, -0.5400009155273438, -0.5287609100341797, -0.5175209045410156, -0.5062808990478516, -0.4950408935546875, -0.48380088806152344, -0.4725608825683594, -0.4613208770751953, -0.45008087158203125, -0.4388408660888672, -0.4276008605957031, -0.41636085510253906, -0.405120849609375, -0.39388084411621094, -0.3826408386230469, -0.3714008331298828, -0.36016082763671875, -0.3489208221435547, -0.3376808166503906, -0.32644081115722656, -0.3152008056640625, -0.30396080017089844, -0.2927207946777344, -0.2814807891845703, -0.27024078369140625, -0.2590007781982422, -0.24776077270507812, -0.23652076721191406, -0.22528076171875, -0.21404075622558594, -0.20280075073242188, -0.1915607452392578, -0.18032073974609375, -0.1690807342529297, -0.15784072875976562, -0.14660072326660156, -0.1353607177734375, -0.12412071228027344, -0.11288070678710938, -0.10164070129394531, -0.09040069580078125, -0.07916069030761719, -0.06792068481445312, -0.05668067932128906, -0.045440673828125, -0.03420066833496094, -0.022960662841796875, -0.011720657348632812, -0.00048065185546875, 0.010759353637695312, 0.021999359130859375, 0.03323936462402344, 0.0444793701171875, 0.05571937561035156, 0.06695938110351562, 0.07819938659667969, 0.08943939208984375, 0.10067939758300781, 0.11191940307617188, 0.12315940856933594, 0.1343994140625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 9.0, 22.0, 59.0, 83.0, 129.0, 180.0, 179.0, 124.0, 86.0, 70.0, 34.0, 11.0, 9.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.10028076171875, -0.0983879566192627, -0.09649515151977539, -0.09460234642028809, -0.09270954132080078, -0.09081673622131348, -0.08892393112182617, -0.08703112602233887, -0.08513832092285156, -0.08324551582336426, -0.08135271072387695, -0.07945990562438965, -0.07756710052490234, -0.07567429542541504, -0.07378149032592773, -0.07188868522644043, -0.06999588012695312, -0.06810307502746582, -0.06621026992797852, -0.06431746482849121, -0.062424659729003906, -0.0605318546295166, -0.0586390495300293, -0.05674624443054199, -0.05485343933105469, -0.05296063423156738, -0.05106782913208008, -0.04917502403259277, -0.04728221893310547, -0.045389413833618164, -0.04349660873413086, -0.041603803634643555, -0.03971099853515625, -0.037818193435668945, -0.03592538833618164, -0.034032583236694336, -0.03213977813720703, -0.030246973037719727, -0.028354167938232422, -0.026461362838745117, -0.024568557739257812, -0.022675752639770508, -0.020782947540283203, -0.0188901424407959, -0.016997337341308594, -0.015104532241821289, -0.013211727142333984, -0.01131892204284668, -0.009426116943359375, -0.00753331184387207, -0.005640506744384766, -0.003747701644897461, -0.0018548965454101562, 3.790855407714844e-05, 0.0019307136535644531, 0.003823518753051758, 0.0057163238525390625, 0.007609128952026367, 0.009501934051513672, 0.011394739151000977, 0.013287544250488281, 0.015180349349975586, 0.01707315444946289, 0.018965959548950195, 0.0208587646484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 14.0, 73.0, 210.0, 1393.0, 4190742.0, 1645.0, 140.0, 41.0, 10.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.802734375, -2.7438430786132812, -2.6849517822265625, -2.6260604858398438, -2.567169189453125, -2.5082778930664062, -2.4493865966796875, -2.3904953002929688, -2.33160400390625, -2.2727127075195312, -2.2138214111328125, -2.1549301147460938, -2.096038818359375, -2.0371475219726562, -1.9782562255859375, -1.9193649291992188, -1.8604736328125, -1.8015823364257812, -1.7426910400390625, -1.6837997436523438, -1.624908447265625, -1.5660171508789062, -1.5071258544921875, -1.4482345581054688, -1.38934326171875, -1.3304519653320312, -1.2715606689453125, -1.2126693725585938, -1.153778076171875, -1.0948867797851562, -1.0359954833984375, -0.9771041870117188, -0.918212890625, -0.8593215942382812, -0.8004302978515625, -0.7415390014648438, -0.682647705078125, -0.6237564086914062, -0.5648651123046875, -0.5059738159179688, -0.44708251953125, -0.38819122314453125, -0.3292999267578125, -0.27040863037109375, -0.211517333984375, -0.15262603759765625, -0.0937347412109375, -0.03484344482421875, 0.0240478515625, 0.08293914794921875, 0.1418304443359375, 0.20072174072265625, 0.259613037109375, 0.31850433349609375, 0.3773956298828125, 0.43628692626953125, 0.49517822265625, 0.5540695190429688, 0.6129608154296875, 0.6718521118164062, 0.730743408203125, 0.7896347045898438, 0.8485260009765625, 0.9074172973632812, 0.96630859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 17.0, 39.0, 157.0, 3182.0, 542.0, 70.0, 39.0, 15.0, 7.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.283447265625, -0.2782754898071289, -0.2731037139892578, -0.2679319381713867, -0.2627601623535156, -0.25758838653564453, -0.25241661071777344, -0.24724483489990234, -0.24207305908203125, -0.23690128326416016, -0.23172950744628906, -0.22655773162841797, -0.22138595581054688, -0.21621417999267578, -0.2110424041748047, -0.2058706283569336, -0.2006988525390625, -0.1955270767211914, -0.1903553009033203, -0.18518352508544922, -0.18001174926757812, -0.17483997344970703, -0.16966819763183594, -0.16449642181396484, -0.15932464599609375, -0.15415287017822266, -0.14898109436035156, -0.14380931854248047, -0.13863754272460938, -0.13346576690673828, -0.1282939910888672, -0.1231222152709961, -0.117950439453125, -0.1127786636352539, -0.10760688781738281, -0.10243511199951172, -0.09726333618164062, -0.09209156036376953, -0.08691978454589844, -0.08174800872802734, -0.07657623291015625, -0.07140445709228516, -0.06623268127441406, -0.06106090545654297, -0.055889129638671875, -0.05071735382080078, -0.04554557800292969, -0.040373802185058594, -0.0352020263671875, -0.030030250549316406, -0.024858474731445312, -0.01968669891357422, -0.014514923095703125, -0.009343147277832031, -0.0041713714599609375, 0.0010004043579101562, 0.00617218017578125, 0.011343955993652344, 0.016515731811523438, 0.02168750762939453, 0.026859283447265625, 0.03203105926513672, 0.03720283508300781, 0.042374610900878906, 0.04754638671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 21.0, 162.0, 803.0, 17.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.861103892326355, -0.8010647892951965, -0.7410256862640381, -0.6809866428375244, -0.620947539806366, -0.5609084367752075, -0.5008693933486938, -0.4408302903175354, -0.38079118728637695, -0.3207520842552185, -0.26071301102638245, -0.2006739228963852, -0.14063483476638794, -0.08059573173522949, -0.020556658506393433, 0.03948241472244263, 0.09952151775360107, 0.15956060588359833, 0.21959969401359558, 0.27963876724243164, 0.3396778702735901, 0.39971697330474854, 0.4597560465335846, 0.5197951197624207, 0.5798342227935791, 0.6398733258247375, 0.699912428855896, 0.7599514722824097, 0.8199905753135681, 0.8800296783447266, 0.9400687217712402, 1.000107765197754, 1.0601468086242676, 1.1201858520507812, 1.1802250146865845, 1.2402640581130981, 1.3003032207489014, 1.360342264175415, 1.4203813076019287, 1.4804203510284424, 1.5404595136642456, 1.6004985570907593, 1.6605377197265625, 1.7205767631530762, 1.7806158065795898, 1.840654969215393, 1.9006940126419067, 1.96073317527771, 2.0207722187042236, 2.0808112621307373, 2.140850305557251, 2.2008895874023438, 2.2609286308288574, 2.320967674255371, 2.3810067176818848, 2.4410457611083984, 2.501084804534912, 2.561123847961426, 2.6211628913879395, 2.6812021732330322, 2.741241216659546, 2.8012802600860596, 2.8613193035125732, 2.921358346939087, 2.9813976287841797]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 8.0, 12.0, 21.0, 32.0, 44.0, 63.0, 83.0, 112.0, 91.0, 117.0, 98.0, 88.0, 76.0, 48.0, 44.0, 23.0, 14.0, 9.0, 9.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6856005191802979, -0.6661354303359985, -0.6466703414916992, -0.6272052526473999, -0.6077401638031006, -0.5882750749588013, -0.568809986114502, -0.5493448972702026, -0.5298798084259033, -0.510414719581604, -0.4909496307373047, -0.47148454189300537, -0.45201945304870605, -0.43255436420440674, -0.41308924555778503, -0.3936241567134857, -0.374159038066864, -0.3546939492225647, -0.3352288603782654, -0.31576377153396606, -0.29629868268966675, -0.27683359384536743, -0.2573684751987457, -0.2379033863544464, -0.2184382975101471, -0.19897320866584778, -0.17950811982154846, -0.16004301607608795, -0.14057792723178864, -0.12111283838748932, -0.1016477420926094, -0.08218264579772949, -0.06271755695343018, -0.04325246438384056, -0.023787371814250946, -0.004322279244661331, 0.015142813324928284, 0.0346079021692276, 0.05407299846410751, 0.07353809475898743, 0.09300318360328674, 0.11246827244758606, 0.13193336129188538, 0.1513984650373459, 0.1708635538816452, 0.19032864272594452, 0.20979374647140503, 0.22925883531570435, 0.24872392416000366, 0.268189013004303, 0.2876541018486023, 0.3071191906929016, 0.3265842795372009, 0.34604936838150024, 0.36551448702812195, 0.38497957587242126, 0.4044446647167206, 0.4239097535610199, 0.4433748424053192, 0.46283993124961853, 0.48230504989624023, 0.5017701387405396, 0.5212352275848389, 0.5407003164291382, 0.5601654052734375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 8.0, 8.0, 19.0, 23.0, 20.0, 34.0, 37.0, 41.0, 85.0, 109.0, 164.0, 262.0, 514.0, 1157.0, 3239.0, 13378.0, 80990.0, 746152.0, 171981.0, 22165.0, 4963.0, 1544.0, 674.0, 294.0, 202.0, 138.0, 96.0, 60.0, 43.0, 38.0, 19.0, 15.0, 14.0, 15.0, 8.0, 11.0, 7.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.15127182006835938, -0.14617156982421875, -0.14107131958007812, -0.1359710693359375, -0.13087081909179688, -0.12577056884765625, -0.12067031860351562, -0.115570068359375, -0.11046981811523438, -0.10536956787109375, -0.10026931762695312, -0.0951690673828125, -0.09006881713867188, -0.08496856689453125, -0.07986831665039062, -0.07476806640625, -0.06966781616210938, -0.06456756591796875, -0.059467315673828125, -0.0543670654296875, -0.049266815185546875, -0.04416656494140625, -0.039066314697265625, -0.033966064453125, -0.028865814208984375, -0.02376556396484375, -0.018665313720703125, -0.0135650634765625, -0.008464813232421875, -0.00336456298828125, 0.001735687255859375, 0.0068359375, 0.011936187744140625, 0.01703643798828125, 0.022136688232421875, 0.0272369384765625, 0.032337188720703125, 0.03743743896484375, 0.042537689208984375, 0.047637939453125, 0.052738189697265625, 0.05783843994140625, 0.06293869018554688, 0.0680389404296875, 0.07313919067382812, 0.07823944091796875, 0.08333969116210938, 0.08843994140625, 0.09354019165039062, 0.09864044189453125, 0.10374069213867188, 0.1088409423828125, 0.11394119262695312, 0.11904144287109375, 0.12414169311523438, 0.129241943359375, 0.13434219360351562, 0.13944244384765625, 0.14454269409179688, 0.1496429443359375, 0.15474319458007812, 0.15984344482421875, 0.16494369506835938, 0.1700439453125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 12.0, 11.0, 24.0, 49.0, 58.0, 75.0, 120.0, 135.0, 132.0, 122.0, 84.0, 65.0, 49.0, 27.0, 18.0, 12.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.09234619140625, -0.09038352966308594, -0.08842086791992188, -0.08645820617675781, -0.08449554443359375, -0.08253288269042969, -0.08057022094726562, -0.07860755920410156, -0.0766448974609375, -0.07468223571777344, -0.07271957397460938, -0.07075691223144531, -0.06879425048828125, -0.06683158874511719, -0.06486892700195312, -0.06290626525878906, -0.060943603515625, -0.05898094177246094, -0.057018280029296875, -0.05505561828613281, -0.05309295654296875, -0.05113029479980469, -0.049167633056640625, -0.04720497131347656, -0.0452423095703125, -0.04327964782714844, -0.041316986083984375, -0.03935432434082031, -0.03739166259765625, -0.03542900085449219, -0.033466339111328125, -0.03150367736816406, -0.029541015625, -0.027578353881835938, -0.025615692138671875, -0.023653030395507812, -0.02169036865234375, -0.019727706909179688, -0.017765045166015625, -0.015802383422851562, -0.0138397216796875, -0.011877059936523438, -0.009914398193359375, -0.007951736450195312, -0.00598907470703125, -0.0040264129638671875, -0.002063751220703125, -0.0001010894775390625, 0.001861572265625, 0.0038242340087890625, 0.005786895751953125, 0.0077495574951171875, 0.00971221923828125, 0.011674880981445312, 0.013637542724609375, 0.015600204467773438, 0.0175628662109375, 0.019525527954101562, 0.021488189697265625, 0.023450851440429688, 0.02541351318359375, 0.027376174926757812, 0.029338836669921875, 0.03130149841308594, 0.03326416015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 9.0, 4.0, 11.0, 12.0, 21.0, 30.0, 32.0, 33.0, 66.0, 119.0, 227.0, 480.0, 1441.0, 9410.0, 238905.0, 773633.0, 20518.0, 2343.0, 613.0, 229.0, 124.0, 93.0, 37.0, 34.0, 37.0, 28.0, 12.0, 11.0, 13.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16072463989257812, -0.15433502197265625, -0.14794540405273438, -0.1415557861328125, -0.13516616821289062, -0.12877655029296875, -0.12238693237304688, -0.115997314453125, -0.10960769653320312, -0.10321807861328125, -0.09682846069335938, -0.0904388427734375, -0.08404922485351562, -0.07765960693359375, -0.07126998901367188, -0.06488037109375, -0.058490753173828125, -0.05210113525390625, -0.045711517333984375, -0.0393218994140625, -0.032932281494140625, -0.02654266357421875, -0.020153045654296875, -0.013763427734375, -0.007373809814453125, -0.00098419189453125, 0.005405426025390625, 0.0117950439453125, 0.018184661865234375, 0.02457427978515625, 0.030963897705078125, 0.037353515625, 0.043743133544921875, 0.05013275146484375, 0.056522369384765625, 0.0629119873046875, 0.06930160522460938, 0.07569122314453125, 0.08208084106445312, 0.088470458984375, 0.09486007690429688, 0.10124969482421875, 0.10763931274414062, 0.1140289306640625, 0.12041854858398438, 0.12680816650390625, 0.13319778442382812, 0.13958740234375, 0.14597702026367188, 0.15236663818359375, 0.15875625610351562, 0.1651458740234375, 0.17153549194335938, 0.17792510986328125, 0.18431472778320312, 0.190704345703125, 0.19709396362304688, 0.20348358154296875, 0.20987319946289062, 0.2162628173828125, 0.22265243530273438, 0.22904205322265625, 0.23543167114257812, 0.2418212890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 13.0, 13.0, 24.0, 20.0, 24.0, 29.0, 37.0, 41.0, 41.0, 64.0, 49.0, 62.0, 50.0, 52.0, 59.0, 49.0, 59.0, 45.0, 46.0, 36.0, 24.0, 23.0, 31.0, 29.0, 9.0, 10.0, 11.0, 7.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09743309020996094, -0.09354782104492188, -0.08966255187988281, -0.08577728271484375, -0.08189201354980469, -0.07800674438476562, -0.07412147521972656, -0.0702362060546875, -0.06635093688964844, -0.062465667724609375, -0.05858039855957031, -0.05469512939453125, -0.05080986022949219, -0.046924591064453125, -0.04303932189941406, -0.039154052734375, -0.03526878356933594, -0.031383514404296875, -0.027498245239257812, -0.02361297607421875, -0.019727706909179688, -0.015842437744140625, -0.011957168579101562, -0.0080718994140625, -0.0041866302490234375, -0.000301361083984375, 0.0035839080810546875, 0.00746917724609375, 0.011354446411132812, 0.015239715576171875, 0.019124984741210938, 0.02301025390625, 0.026895523071289062, 0.030780792236328125, 0.03466606140136719, 0.03855133056640625, 0.04243659973144531, 0.046321868896484375, 0.05020713806152344, 0.0540924072265625, 0.05797767639160156, 0.061862945556640625, 0.06574821472167969, 0.06963348388671875, 0.07351875305175781, 0.07740402221679688, 0.08128929138183594, 0.085174560546875, 0.08905982971191406, 0.09294509887695312, 0.09683036804199219, 0.10071563720703125, 0.10460090637207031, 0.10848617553710938, 0.11237144470214844, 0.1162567138671875, 0.12014198303222656, 0.12402725219726562, 0.1279125213623047, 0.13179779052734375, 0.1356830596923828, 0.13956832885742188, 0.14345359802246094, 0.1473388671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 1.0, 5.0, 3.0, 4.0, 14.0, 12.0, 13.0, 17.0, 34.0, 64.0, 111.0, 213.0, 538.0, 1728.0, 7575.0, 93907.0, 858221.0, 76728.0, 6775.0, 1573.0, 532.0, 210.0, 108.0, 52.0, 31.0, 22.0, 13.0, 15.0, 10.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05474853515625, -0.05316019058227539, -0.05157184600830078, -0.04998350143432617, -0.04839515686035156, -0.04680681228637695, -0.045218467712402344, -0.043630123138427734, -0.042041778564453125, -0.040453433990478516, -0.038865089416503906, -0.0372767448425293, -0.03568840026855469, -0.03410005569458008, -0.03251171112060547, -0.03092336654663086, -0.02933502197265625, -0.02774667739868164, -0.02615833282470703, -0.024569988250732422, -0.022981643676757812, -0.021393299102783203, -0.019804954528808594, -0.018216609954833984, -0.016628265380859375, -0.015039920806884766, -0.013451576232910156, -0.011863231658935547, -0.010274887084960938, -0.008686542510986328, -0.007098197937011719, -0.005509853363037109, -0.0039215087890625, -0.0023331642150878906, -0.0007448196411132812, 0.0008435249328613281, 0.0024318695068359375, 0.004020214080810547, 0.005608558654785156, 0.007196903228759766, 0.008785247802734375, 0.010373592376708984, 0.011961936950683594, 0.013550281524658203, 0.015138626098632812, 0.016726970672607422, 0.01831531524658203, 0.01990365982055664, 0.02149200439453125, 0.02308034896850586, 0.02466869354248047, 0.026257038116455078, 0.027845382690429688, 0.029433727264404297, 0.031022071838378906, 0.032610416412353516, 0.034198760986328125, 0.035787105560302734, 0.037375450134277344, 0.03896379470825195, 0.04055213928222656, 0.04214048385620117, 0.04372882843017578, 0.04531717300415039, 0.046905517578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 9.0, 9.0, 13.0, 31.0, 17.0, 31.0, 34.0, 49.0, 47.0, 47.0, 79.0, 58.0, 56.0, 77.0, 53.0, 69.0, 42.0, 51.0, 44.0, 43.0, 18.0, 25.0, 19.0, 16.0, 18.0, 10.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.52346420288086e-06, -8.305534720420837e-06, -8.087605237960815e-06, -7.869675755500793e-06, -7.651746273040771e-06, -7.4338167905807495e-06, -7.2158873081207275e-06, -6.9979578256607056e-06, -6.780028343200684e-06, -6.562098860740662e-06, -6.34416937828064e-06, -6.126239895820618e-06, -5.908310413360596e-06, -5.690380930900574e-06, -5.472451448440552e-06, -5.25452196598053e-06, -5.036592483520508e-06, -4.818663001060486e-06, -4.600733518600464e-06, -4.382804036140442e-06, -4.16487455368042e-06, -3.946945071220398e-06, -3.729015588760376e-06, -3.511086106300354e-06, -3.293156623840332e-06, -3.07522714138031e-06, -2.857297658920288e-06, -2.639368176460266e-06, -2.421438694000244e-06, -2.203509211540222e-06, -1.9855797290802e-06, -1.7676502466201782e-06, -1.5497207641601562e-06, -1.3317912817001343e-06, -1.1138617992401123e-06, -8.959323167800903e-07, -6.780028343200684e-07, -4.600733518600464e-07, -2.421438694000244e-07, -2.421438694000244e-08, 1.9371509552001953e-07, 4.116445779800415e-07, 6.295740604400635e-07, 8.475035429000854e-07, 1.0654330253601074e-06, 1.2833625078201294e-06, 1.5012919902801514e-06, 1.7192214727401733e-06, 1.9371509552001953e-06, 2.1550804376602173e-06, 2.3730099201202393e-06, 2.5909394025802612e-06, 2.808868885040283e-06, 3.026798367500305e-06, 3.244727849960327e-06, 3.462657332420349e-06, 3.680586814880371e-06, 3.898516297340393e-06, 4.116445779800415e-06, 4.334375262260437e-06, 4.552304744720459e-06, 4.770234227180481e-06, 4.988163709640503e-06, 5.206093192100525e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 5.0, 11.0, 12.0, 22.0, 31.0, 37.0, 65.0, 113.0, 234.0, 477.0, 1202.0, 5043.0, 48652.0, 828236.0, 151788.0, 9455.0, 1844.0, 633.0, 301.0, 139.0, 80.0, 51.0, 32.0, 24.0, 20.0, 4.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055938720703125, -0.05422639846801758, -0.052514076232910156, -0.050801753997802734, -0.04908943176269531, -0.04737710952758789, -0.04566478729248047, -0.04395246505737305, -0.042240142822265625, -0.0405278205871582, -0.03881549835205078, -0.03710317611694336, -0.03539085388183594, -0.033678531646728516, -0.031966209411621094, -0.030253887176513672, -0.02854156494140625, -0.026829242706298828, -0.025116920471191406, -0.023404598236083984, -0.021692276000976562, -0.01997995376586914, -0.01826763153076172, -0.016555309295654297, -0.014842987060546875, -0.013130664825439453, -0.011418342590332031, -0.00970602035522461, -0.007993698120117188, -0.006281375885009766, -0.004569053649902344, -0.002856731414794922, -0.0011444091796875, 0.0005679130554199219, 0.0022802352905273438, 0.003992557525634766, 0.0057048797607421875, 0.007417201995849609, 0.009129524230957031, 0.010841846466064453, 0.012554168701171875, 0.014266490936279297, 0.01597881317138672, 0.01769113540649414, 0.019403457641601562, 0.021115779876708984, 0.022828102111816406, 0.024540424346923828, 0.02625274658203125, 0.027965068817138672, 0.029677391052246094, 0.031389713287353516, 0.03310203552246094, 0.03481435775756836, 0.03652667999267578, 0.0382390022277832, 0.039951324462890625, 0.04166364669799805, 0.04337596893310547, 0.04508829116821289, 0.04680061340332031, 0.048512935638427734, 0.050225257873535156, 0.05193758010864258, 0.05364990234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 8.0, 9.0, 18.0, 28.0, 35.0, 48.0, 56.0, 80.0, 86.0, 108.0, 94.0, 78.0, 79.0, 60.0, 47.0, 37.0, 25.0, 20.0, 20.0, 12.0, 6.0, 11.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034210205078125, -0.03320884704589844, -0.032207489013671875, -0.031206130981445312, -0.03020477294921875, -0.029203414916992188, -0.028202056884765625, -0.027200698852539062, -0.0261993408203125, -0.025197982788085938, -0.024196624755859375, -0.023195266723632812, -0.02219390869140625, -0.021192550659179688, -0.020191192626953125, -0.019189834594726562, -0.0181884765625, -0.017187118530273438, -0.016185760498046875, -0.015184402465820312, -0.01418304443359375, -0.013181686401367188, -0.012180328369140625, -0.011178970336914062, -0.0101776123046875, -0.009176254272460938, -0.008174896240234375, -0.0071735382080078125, -0.00617218017578125, -0.0051708221435546875, -0.004169464111328125, -0.0031681060791015625, -0.002166748046875, -0.0011653900146484375, -0.000164031982421875, 0.0008373260498046875, 0.00183868408203125, 0.0028400421142578125, 0.003841400146484375, 0.0048427581787109375, 0.0058441162109375, 0.0068454742431640625, 0.007846832275390625, 0.008848190307617188, 0.00984954833984375, 0.010850906372070312, 0.011852264404296875, 0.012853622436523438, 0.01385498046875, 0.014856338500976562, 0.015857696533203125, 0.016859054565429688, 0.01786041259765625, 0.018861770629882812, 0.019863128662109375, 0.020864486694335938, 0.0218658447265625, 0.022867202758789062, 0.023868560791015625, 0.024869918823242188, 0.02587127685546875, 0.026872634887695312, 0.027873992919921875, 0.028875350952148438, 0.029876708984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 62.0, 871.0, 66.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.035308361053467, -2.9287521839141846, -2.8221962451934814, -2.715640068054199, -2.609083890914917, -2.5025277137756348, -2.3959717750549316, -2.2894155979156494, -2.182859420776367, -2.076303243637085, -1.9697471857070923, -1.8631911277770996, -1.7566349506378174, -1.6500788927078247, -1.543522834777832, -1.4369666576385498, -1.3304107189178467, -1.223854660987854, -1.1172984838485718, -1.010742425918579, -0.9041863083839417, -0.7976301908493042, -0.6910741329193115, -0.5845180153846741, -0.4779618978500366, -0.37140578031539917, -0.2648496925830841, -0.15829360485076904, -0.05173748731613159, 0.05481863021850586, 0.16137468814849854, 0.267930805683136, 0.37448692321777344, 0.4810430407524109, 0.5875991582870483, 0.694155216217041, 0.8007113337516785, 0.9072674512863159, 1.0138235092163086, 1.1203796863555908, 1.2269357442855835, 1.3334918022155762, 1.4400479793548584, 1.546604037284851, 1.6531600952148438, 1.759716272354126, 1.8662723302841187, 1.9728283882141113, 2.0793845653533936, 2.185940742492676, 2.292496681213379, 2.399052858352661, 2.5056090354919434, 2.6121649742126465, 2.7187211513519287, 2.825277328491211, 2.931833267211914, 3.0383894443511963, 3.1449453830718994, 3.2515015602111816, 3.358057737350464, 3.464613914489746, 3.571169853210449, 3.6777260303497314, 3.7842822074890137]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 4.0, 16.0, 11.0, 21.0, 17.0, 21.0, 36.0, 28.0, 38.0, 37.0, 46.0, 59.0, 57.0, 76.0, 65.0, 70.0, 57.0, 63.0, 56.0, 42.0, 31.0, 26.0, 21.0, 22.0, 22.0, 17.0, 10.0, 10.0, 8.0, 2.0, 0.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6639466881752014, -0.6416165232658386, -0.6192863583564758, -0.596956193447113, -0.5746260285377502, -0.5522958636283875, -0.5299657583236694, -0.5076355934143066, -0.48530539870262146, -0.46297523379325867, -0.4406450688838959, -0.41831493377685547, -0.3959847688674927, -0.3736546039581299, -0.3513244390487671, -0.3289942741394043, -0.3066641092300415, -0.2843339443206787, -0.2620037794113159, -0.23967362940311432, -0.21734346449375153, -0.19501329958438873, -0.17268314957618713, -0.15035298466682434, -0.12802281975746155, -0.10569265484809875, -0.08336249738931656, -0.06103233993053436, -0.03870217502117157, -0.016372010111808777, 0.005958139896392822, 0.028288304805755615, 0.050618529319763184, 0.07294869422912598, 0.09527885168790817, 0.11760900914669037, 0.13993917405605316, 0.16226933896541595, 0.18459948897361755, 0.20692965388298035, 0.22925981879234314, 0.25158998370170593, 0.2739201486110687, 0.29625028371810913, 0.3185804486274719, 0.3409106135368347, 0.3632407784461975, 0.3855709433555603, 0.4079011082649231, 0.4302312731742859, 0.4525614380836487, 0.4748916029930115, 0.49722176790237427, 0.5195519328117371, 0.5418820381164551, 0.5642122030258179, 0.5865423679351807, 0.6088725328445435, 0.6312026977539062, 0.653532862663269, 0.6758630275726318, 0.6981931924819946, 0.7205233573913574, 0.7428535223007202, 0.765183687210083]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 10.0, 9.0, 7.0, 19.0, 28.0, 48.0, 62.0, 106.0, 194.0, 351.0, 655.0, 1790.0, 8108.0, 125745.0, 4011643.0, 39600.0, 4316.0, 952.0, 327.0, 141.0, 68.0, 36.0, 23.0, 8.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.35009765625, -0.34201812744140625, -0.3339385986328125, -0.32585906982421875, -0.317779541015625, -0.30970001220703125, -0.3016204833984375, -0.29354095458984375, -0.28546142578125, -0.27738189697265625, -0.2693023681640625, -0.26122283935546875, -0.253143310546875, -0.24506378173828125, -0.2369842529296875, -0.22890472412109375, -0.2208251953125, -0.21274566650390625, -0.2046661376953125, -0.19658660888671875, -0.188507080078125, -0.18042755126953125, -0.1723480224609375, -0.16426849365234375, -0.15618896484375, -0.14810943603515625, -0.1400299072265625, -0.13195037841796875, -0.123870849609375, -0.11579132080078125, -0.1077117919921875, -0.09963226318359375, -0.091552734375, -0.08347320556640625, -0.0753936767578125, -0.06731414794921875, -0.059234619140625, -0.05115509033203125, -0.0430755615234375, -0.03499603271484375, -0.02691650390625, -0.01883697509765625, -0.0107574462890625, -0.00267791748046875, 0.005401611328125, 0.01348114013671875, 0.0215606689453125, 0.02964019775390625, 0.0377197265625, 0.04579925537109375, 0.0538787841796875, 0.06195831298828125, 0.070037841796875, 0.07811737060546875, 0.0861968994140625, 0.09427642822265625, 0.10235595703125, 0.11043548583984375, 0.1185150146484375, 0.12659454345703125, 0.134674072265625, 0.14275360107421875, 0.1508331298828125, 0.15891265869140625, 0.1669921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 10.0, 19.0, 37.0, 55.0, 76.0, 122.0, 137.0, 117.0, 124.0, 94.0, 72.0, 57.0, 29.0, 22.0, 12.0, 7.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09088134765625, -0.08891868591308594, -0.08695602416992188, -0.08499336242675781, -0.08303070068359375, -0.08106803894042969, -0.07910537719726562, -0.07714271545410156, -0.0751800537109375, -0.07321739196777344, -0.07125473022460938, -0.06929206848144531, -0.06732940673828125, -0.06536674499511719, -0.06340408325195312, -0.06144142150878906, -0.059478759765625, -0.05751609802246094, -0.055553436279296875, -0.05359077453613281, -0.05162811279296875, -0.04966545104980469, -0.047702789306640625, -0.04574012756347656, -0.0437774658203125, -0.04181480407714844, -0.039852142333984375, -0.03788948059082031, -0.03592681884765625, -0.03396415710449219, -0.032001495361328125, -0.030038833618164062, -0.028076171875, -0.026113510131835938, -0.024150848388671875, -0.022188186645507812, -0.02022552490234375, -0.018262863159179688, -0.016300201416015625, -0.014337539672851562, -0.0123748779296875, -0.010412216186523438, -0.008449554443359375, -0.0064868927001953125, -0.00452423095703125, -0.0025615692138671875, -0.000598907470703125, 0.0013637542724609375, 0.003326416015625, 0.0052890777587890625, 0.007251739501953125, 0.009214401245117188, 0.01117706298828125, 0.013139724731445312, 0.015102386474609375, 0.017065048217773438, 0.0190277099609375, 0.020990371704101562, 0.022953033447265625, 0.024915695190429688, 0.02687835693359375, 0.028841018676757812, 0.030803680419921875, 0.03276634216308594, 0.03472900390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 28.0, 47.0, 153.0, 733.0, 4190489.0, 2329.0, 254.0, 112.0, 79.0, 30.0, 16.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7218093872070312, -0.6784820556640625, -0.6351547241210938, -0.591827392578125, -0.5485000610351562, -0.5051727294921875, -0.46184539794921875, -0.41851806640625, -0.37519073486328125, -0.3318634033203125, -0.28853607177734375, -0.245208740234375, -0.20188140869140625, -0.1585540771484375, -0.11522674560546875, -0.0718994140625, -0.02857208251953125, 0.0147552490234375, 0.05808258056640625, 0.101409912109375, 0.14473724365234375, 0.1880645751953125, 0.23139190673828125, 0.27471923828125, 0.31804656982421875, 0.3613739013671875, 0.40470123291015625, 0.448028564453125, 0.49135589599609375, 0.5346832275390625, 0.5780105590820312, 0.621337890625, 0.6646652221679688, 0.7079925537109375, 0.7513198852539062, 0.794647216796875, 0.8379745483398438, 0.8813018798828125, 0.9246292114257812, 0.96795654296875, 1.0112838745117188, 1.0546112060546875, 1.0979385375976562, 1.141265869140625, 1.1845932006835938, 1.2279205322265625, 1.2712478637695312, 1.3145751953125, 1.3579025268554688, 1.4012298583984375, 1.4445571899414062, 1.487884521484375, 1.5312118530273438, 1.5745391845703125, 1.6178665161132812, 1.66119384765625, 1.7045211791992188, 1.7478485107421875, 1.7911758422851562, 1.834503173828125, 1.8778305053710938, 1.9211578369140625, 1.9644851684570312, 2.0078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 32.0, 304.0, 3633.0, 92.0, 15.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.12891197204589844, -0.12147140502929688, -0.11403083801269531, -0.10659027099609375, -0.09914970397949219, -0.09170913696289062, -0.08426856994628906, -0.0768280029296875, -0.06938743591308594, -0.061946868896484375, -0.05450630187988281, -0.04706573486328125, -0.03962516784667969, -0.032184600830078125, -0.024744033813476562, -0.017303466796875, -0.009862899780273438, -0.002422332763671875, 0.0050182342529296875, 0.01245880126953125, 0.019899368286132812, 0.027339935302734375, 0.03478050231933594, 0.0422210693359375, 0.04966163635253906, 0.057102203369140625, 0.06454277038574219, 0.07198333740234375, 0.07942390441894531, 0.08686447143554688, 0.09430503845214844, 0.10174560546875, 0.10918617248535156, 0.11662673950195312, 0.12406730651855469, 0.13150787353515625, 0.1389484405517578, 0.14638900756835938, 0.15382957458496094, 0.1612701416015625, 0.16871070861816406, 0.17615127563476562, 0.1835918426513672, 0.19103240966796875, 0.1984729766845703, 0.20591354370117188, 0.21335411071777344, 0.220794677734375, 0.22823524475097656, 0.23567581176757812, 0.2431163787841797, 0.25055694580078125, 0.2579975128173828, 0.2654380798339844, 0.27287864685058594, 0.2803192138671875, 0.28775978088378906, 0.2952003479003906, 0.3026409149169922, 0.31008148193359375, 0.3175220489501953, 0.3249626159667969, 0.33240318298339844, 0.33984375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 963.0, 52.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.079771041870117, -6.937816619873047, -6.795862674713135, -6.653908729553223, -6.511954307556152, -6.369999885559082, -6.22804594039917, -6.086091995239258, -5.9441375732421875, -5.802183151245117, -5.660229206085205, -5.518275260925293, -5.376320838928223, -5.234366416931152, -5.09241247177124, -4.950458526611328, -4.808504104614258, -4.6665496826171875, -4.524595737457275, -4.382641792297363, -4.240687370300293, -4.098732948303223, -3.9567790031433105, -3.8148248195648193, -3.672870635986328, -3.530916452407837, -3.3889622688293457, -3.2470080852508545, -3.1050539016723633, -2.963099718093872, -2.821145534515381, -2.6791913509368896, -2.5372371673583984, -2.3952829837799072, -2.253328800201416, -2.111374616622925, -1.9694204330444336, -1.8274662494659424, -1.6855120658874512, -1.54355788230896, -1.4016036987304688, -1.2596495151519775, -1.1176953315734863, -0.9757411479949951, -0.8337869644165039, -0.6918327808380127, -0.5498785972595215, -0.4079244136810303, -0.26597023010253906, -0.12401604652404785, 0.01793813705444336, 0.15989232063293457, 0.3018465042114258, 0.443800687789917, 0.5857548713684082, 0.7277090549468994, 0.8696632385253906, 1.0116174221038818, 1.153571605682373, 1.2955257892608643, 1.4374799728393555, 1.5794341564178467, 1.721388339996338, 1.863342523574829, 2.0052967071533203]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 24.0, 29.0, 72.0, 95.0, 113.0, 136.0, 130.0, 126.0, 109.0, 83.0, 36.0, 22.0, 14.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5395345091819763, -0.5260591506958008, -0.5125837922096252, -0.4991084635257721, -0.48563313484191895, -0.4721577763557434, -0.45868241786956787, -0.4452070891857147, -0.4317317605018616, -0.41825640201568604, -0.4047810733318329, -0.39130571484565735, -0.3778303861618042, -0.36435502767562866, -0.3508796691894531, -0.3374043405056, -0.32392898201942444, -0.3104536235332489, -0.29697829484939575, -0.2835029363632202, -0.27002760767936707, -0.25655224919319153, -0.24307690560817719, -0.22960156202316284, -0.2161262184381485, -0.20265087485313416, -0.1891755312681198, -0.17570018768310547, -0.16222482919692993, -0.14874950051307678, -0.13527414202690125, -0.1217987984418869, -0.10832345485687256, -0.09484811127185822, -0.08137276768684387, -0.06789741665124893, -0.05442207306623459, -0.040946729481220245, -0.027471378445625305, -0.013996034860610962, -0.0005206912755966187, 0.012954654172062874, 0.026429999619722366, 0.03990534693002701, 0.05338069051504135, 0.0668560341000557, 0.08033138513565063, 0.09380672872066498, 0.10728207230567932, 0.12075741589069366, 0.134232759475708, 0.14770811796188354, 0.1611834466457367, 0.17465880513191223, 0.18813414871692657, 0.20160949230194092, 0.21508483588695526, 0.2285601794719696, 0.24203552305698395, 0.2555108666419983, 0.26898622512817383, 0.282461553812027, 0.2959369122982025, 0.30941224098205566, 0.3228875994682312]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 13.0, 10.0, 15.0, 18.0, 27.0, 32.0, 56.0, 79.0, 151.0, 254.0, 493.0, 1077.0, 3112.0, 13626.0, 114256.0, 792856.0, 104271.0, 13080.0, 2974.0, 1060.0, 472.0, 214.0, 143.0, 79.0, 64.0, 41.0, 25.0, 18.0, 9.0, 7.0, 10.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.16063594818115234, -0.1562328338623047, -0.15182971954345703, -0.14742660522460938, -0.14302349090576172, -0.13862037658691406, -0.1342172622680664, -0.12981414794921875, -0.1254110336303711, -0.12100791931152344, -0.11660480499267578, -0.11220169067382812, -0.10779857635498047, -0.10339546203613281, -0.09899234771728516, -0.0945892333984375, -0.09018611907958984, -0.08578300476074219, -0.08137989044189453, -0.07697677612304688, -0.07257366180419922, -0.06817054748535156, -0.0637674331665039, -0.05936431884765625, -0.054961204528808594, -0.05055809020996094, -0.04615497589111328, -0.041751861572265625, -0.03734874725341797, -0.03294563293457031, -0.028542518615722656, -0.024139404296875, -0.019736289978027344, -0.015333175659179688, -0.010930061340332031, -0.006526947021484375, -0.0021238327026367188, 0.0022792816162109375, 0.006682395935058594, 0.01108551025390625, 0.015488624572753906, 0.019891738891601562, 0.02429485321044922, 0.028697967529296875, 0.03310108184814453, 0.03750419616699219, 0.041907310485839844, 0.0463104248046875, 0.050713539123535156, 0.05511665344238281, 0.05951976776123047, 0.06392288208007812, 0.06832599639892578, 0.07272911071777344, 0.0771322250366211, 0.08153533935546875, 0.0859384536743164, 0.09034156799316406, 0.09474468231201172, 0.09914779663085938, 0.10355091094970703, 0.10795402526855469, 0.11235713958740234, 0.11676025390625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 18.0, 11.0, 32.0, 53.0, 57.0, 80.0, 100.0, 118.0, 121.0, 92.0, 102.0, 72.0, 44.0, 32.0, 21.0, 22.0, 10.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.07476806640625, -0.07318234443664551, -0.07159662246704102, -0.07001090049743652, -0.06842517852783203, -0.06683945655822754, -0.06525373458862305, -0.06366801261901855, -0.06208229064941406, -0.06049656867980957, -0.05891084671020508, -0.057325124740600586, -0.055739402770996094, -0.0541536808013916, -0.05256795883178711, -0.05098223686218262, -0.049396514892578125, -0.04781079292297363, -0.04622507095336914, -0.04463934898376465, -0.043053627014160156, -0.041467905044555664, -0.03988218307495117, -0.03829646110534668, -0.03671073913574219, -0.035125017166137695, -0.0335392951965332, -0.03195357322692871, -0.03036785125732422, -0.028782129287719727, -0.027196407318115234, -0.025610685348510742, -0.02402496337890625, -0.022439241409301758, -0.020853519439697266, -0.019267797470092773, -0.01768207550048828, -0.01609635353088379, -0.014510631561279297, -0.012924909591674805, -0.011339187622070312, -0.00975346565246582, -0.008167743682861328, -0.006582021713256836, -0.004996299743652344, -0.0034105777740478516, -0.0018248558044433594, -0.0002391338348388672, 0.001346588134765625, 0.002932310104370117, 0.004518032073974609, 0.0061037540435791016, 0.007689476013183594, 0.009275197982788086, 0.010860919952392578, 0.01244664192199707, 0.014032363891601562, 0.015618085861206055, 0.017203807830810547, 0.01878952980041504, 0.02037525177001953, 0.021960973739624023, 0.023546695709228516, 0.025132417678833008, 0.0267181396484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 18.0, 15.0, 23.0, 18.0, 51.0, 78.0, 143.0, 276.0, 822.0, 3069.0, 28211.0, 886803.0, 120278.0, 6538.0, 1296.0, 445.0, 183.0, 78.0, 60.0, 41.0, 29.0, 24.0, 7.0, 10.0, 4.0, 1.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.25048828125, -0.2440166473388672, -0.23754501342773438, -0.23107337951660156, -0.22460174560546875, -0.21813011169433594, -0.21165847778320312, -0.2051868438720703, -0.1987152099609375, -0.1922435760498047, -0.18577194213867188, -0.17930030822753906, -0.17282867431640625, -0.16635704040527344, -0.15988540649414062, -0.1534137725830078, -0.146942138671875, -0.1404705047607422, -0.13399887084960938, -0.12752723693847656, -0.12105560302734375, -0.11458396911621094, -0.10811233520507812, -0.10164070129394531, -0.0951690673828125, -0.08869743347167969, -0.08222579956054688, -0.07575416564941406, -0.06928253173828125, -0.06281089782714844, -0.056339263916015625, -0.04986763000488281, -0.04339599609375, -0.03692436218261719, -0.030452728271484375, -0.023981094360351562, -0.01750946044921875, -0.011037826538085938, -0.004566192626953125, 0.0019054412841796875, 0.0083770751953125, 0.014848709106445312, 0.021320343017578125, 0.027791976928710938, 0.03426361083984375, 0.04073524475097656, 0.047206878662109375, 0.05367851257324219, 0.060150146484375, 0.06662178039550781, 0.07309341430664062, 0.07956504821777344, 0.08603668212890625, 0.09250831604003906, 0.09897994995117188, 0.10545158386230469, 0.1119232177734375, 0.11839485168457031, 0.12486648559570312, 0.13133811950683594, 0.13780975341796875, 0.14428138732910156, 0.15075302124023438, 0.1572246551513672, 0.1636962890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 7.0, 11.0, 10.0, 16.0, 19.0, 17.0, 30.0, 47.0, 50.0, 48.0, 78.0, 77.0, 90.0, 81.0, 86.0, 58.0, 67.0, 47.0, 40.0, 29.0, 23.0, 24.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.198974609375, -0.19386863708496094, -0.18876266479492188, -0.1836566925048828, -0.17855072021484375, -0.1734447479248047, -0.16833877563476562, -0.16323280334472656, -0.1581268310546875, -0.15302085876464844, -0.14791488647460938, -0.1428089141845703, -0.13770294189453125, -0.1325969696044922, -0.12749099731445312, -0.12238502502441406, -0.117279052734375, -0.11217308044433594, -0.10706710815429688, -0.10196113586425781, -0.09685516357421875, -0.09174919128417969, -0.08664321899414062, -0.08153724670410156, -0.0764312744140625, -0.07132530212402344, -0.06621932983398438, -0.06111335754394531, -0.05600738525390625, -0.05090141296386719, -0.045795440673828125, -0.04068946838378906, -0.03558349609375, -0.030477523803710938, -0.025371551513671875, -0.020265579223632812, -0.01515960693359375, -0.010053634643554688, -0.004947662353515625, 0.0001583099365234375, 0.0052642822265625, 0.010370254516601562, 0.015476226806640625, 0.020582199096679688, 0.02568817138671875, 0.030794143676757812, 0.035900115966796875, 0.04100608825683594, 0.046112060546875, 0.05121803283691406, 0.056324005126953125, 0.06142997741699219, 0.06653594970703125, 0.07164192199707031, 0.07674789428710938, 0.08185386657714844, 0.0869598388671875, 0.09206581115722656, 0.09717178344726562, 0.10227775573730469, 0.10738372802734375, 0.11248970031738281, 0.11759567260742188, 0.12270164489746094, 0.1278076171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 14.0, 12.0, 26.0, 29.0, 65.0, 100.0, 280.0, 700.0, 2657.0, 21964.0, 868791.0, 145656.0, 6325.0, 1179.0, 390.0, 151.0, 89.0, 38.0, 30.0, 14.0, 16.0, 13.0, 5.0, 2.0, 9.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040191650390625, -0.038342952728271484, -0.03649425506591797, -0.03464555740356445, -0.03279685974121094, -0.030948162078857422, -0.029099464416503906, -0.02725076675415039, -0.025402069091796875, -0.02355337142944336, -0.021704673767089844, -0.019855976104736328, -0.018007278442382812, -0.016158580780029297, -0.014309883117675781, -0.012461185455322266, -0.01061248779296875, -0.008763790130615234, -0.006915092468261719, -0.005066394805908203, -0.0032176971435546875, -0.0013689994812011719, 0.00047969818115234375, 0.0023283958435058594, 0.004177093505859375, 0.006025791168212891, 0.007874488830566406, 0.009723186492919922, 0.011571884155273438, 0.013420581817626953, 0.015269279479980469, 0.017117977142333984, 0.0189666748046875, 0.020815372467041016, 0.02266407012939453, 0.024512767791748047, 0.026361465454101562, 0.028210163116455078, 0.030058860778808594, 0.03190755844116211, 0.033756256103515625, 0.03560495376586914, 0.037453651428222656, 0.03930234909057617, 0.04115104675292969, 0.0429997444152832, 0.04484844207763672, 0.046697139739990234, 0.04854583740234375, 0.050394535064697266, 0.05224323272705078, 0.0540919303894043, 0.05594062805175781, 0.05778932571411133, 0.059638023376464844, 0.06148672103881836, 0.06333541870117188, 0.06518411636352539, 0.0670328140258789, 0.06888151168823242, 0.07073020935058594, 0.07257890701293945, 0.07442760467529297, 0.07627630233764648, 0.078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 10.0, 15.0, 30.0, 44.0, 52.0, 83.0, 75.0, 83.0, 107.0, 98.0, 67.0, 93.0, 82.0, 52.0, 26.0, 32.0, 9.0, 11.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-06, -8.063390851020813e-06, -7.782131433486938e-06, -7.500872015953064e-06, -7.2196125984191895e-06, -6.938353180885315e-06, -6.6570937633514404e-06, -6.375834345817566e-06, -6.094574928283691e-06, -5.813315510749817e-06, -5.532056093215942e-06, -5.250796675682068e-06, -4.969537258148193e-06, -4.688277840614319e-06, -4.407018423080444e-06, -4.12575900554657e-06, -3.844499588012695e-06, -3.563240170478821e-06, -3.2819807529449463e-06, -3.0007213354110718e-06, -2.7194619178771973e-06, -2.4382025003433228e-06, -2.1569430828094482e-06, -1.8756836652755737e-06, -1.5944242477416992e-06, -1.3131648302078247e-06, -1.0319054126739502e-06, -7.506459951400757e-07, -4.6938657760620117e-07, -1.8812716007232666e-07, 9.313225746154785e-08, 3.7439167499542236e-07, 6.556510925292969e-07, 9.369105100631714e-07, 1.218169927597046e-06, 1.4994293451309204e-06, 1.780688762664795e-06, 2.0619481801986694e-06, 2.343207597732544e-06, 2.6244670152664185e-06, 2.905726432800293e-06, 3.1869858503341675e-06, 3.468245267868042e-06, 3.7495046854019165e-06, 4.030764102935791e-06, 4.3120235204696655e-06, 4.59328293800354e-06, 4.8745423555374146e-06, 5.155801773071289e-06, 5.4370611906051636e-06, 5.718320608139038e-06, 5.999580025672913e-06, 6.280839443206787e-06, 6.562098860740662e-06, 6.843358278274536e-06, 7.124617695808411e-06, 7.405877113342285e-06, 7.68713653087616e-06, 7.968395948410034e-06, 8.249655365943909e-06, 8.530914783477783e-06, 8.812174201011658e-06, 9.093433618545532e-06, 9.374693036079407e-06, 9.655952453613281e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 3.0, 10.0, 10.0, 16.0, 23.0, 44.0, 69.0, 150.0, 384.0, 1130.0, 7111.0, 550662.0, 480634.0, 6544.0, 1033.0, 386.0, 142.0, 73.0, 42.0, 25.0, 19.0, 11.0, 7.0, 9.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06982421875, -0.06757068634033203, -0.06531715393066406, -0.0630636215209961, -0.060810089111328125, -0.058556556701660156, -0.05630302429199219, -0.05404949188232422, -0.05179595947265625, -0.04954242706298828, -0.04728889465332031, -0.045035362243652344, -0.042781829833984375, -0.040528297424316406, -0.03827476501464844, -0.03602123260498047, -0.0337677001953125, -0.03151416778564453, -0.029260635375976562, -0.027007102966308594, -0.024753570556640625, -0.022500038146972656, -0.020246505737304688, -0.01799297332763672, -0.01573944091796875, -0.013485908508300781, -0.011232376098632812, -0.008978843688964844, -0.006725311279296875, -0.004471778869628906, -0.0022182464599609375, 3.528594970703125e-05, 0.002288818359375, 0.004542350769042969, 0.0067958831787109375, 0.009049415588378906, 0.011302947998046875, 0.013556480407714844, 0.015810012817382812, 0.01806354522705078, 0.02031707763671875, 0.02257061004638672, 0.024824142456054688, 0.027077674865722656, 0.029331207275390625, 0.031584739685058594, 0.03383827209472656, 0.03609180450439453, 0.0383453369140625, 0.04059886932373047, 0.04285240173339844, 0.045105934143066406, 0.047359466552734375, 0.049612998962402344, 0.05186653137207031, 0.05412006378173828, 0.05637359619140625, 0.05862712860107422, 0.06088066101074219, 0.06313419342041016, 0.06538772583007812, 0.0676412582397461, 0.06989479064941406, 0.07214832305908203, 0.07440185546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 14.0, 24.0, 29.0, 51.0, 111.0, 162.0, 209.0, 166.0, 106.0, 40.0, 32.0, 20.0, 15.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0491943359375, -0.04726123809814453, -0.04532814025878906, -0.043395042419433594, -0.041461944580078125, -0.039528846740722656, -0.03759574890136719, -0.03566265106201172, -0.03372955322265625, -0.03179645538330078, -0.029863357543945312, -0.027930259704589844, -0.025997161865234375, -0.024064064025878906, -0.022130966186523438, -0.02019786834716797, -0.0182647705078125, -0.01633167266845703, -0.014398574829101562, -0.012465476989746094, -0.010532379150390625, -0.008599281311035156, -0.0066661834716796875, -0.004733085632324219, -0.00279998779296875, -0.0008668899536132812, 0.0010662078857421875, 0.0029993057250976562, 0.004932403564453125, 0.006865501403808594, 0.008798599243164062, 0.010731697082519531, 0.012664794921875, 0.014597892761230469, 0.016530990600585938, 0.018464088439941406, 0.020397186279296875, 0.022330284118652344, 0.024263381958007812, 0.02619647979736328, 0.02812957763671875, 0.03006267547607422, 0.03199577331542969, 0.033928871154785156, 0.035861968994140625, 0.037795066833496094, 0.03972816467285156, 0.04166126251220703, 0.0435943603515625, 0.04552745819091797, 0.04746055603027344, 0.049393653869628906, 0.051326751708984375, 0.053259849548339844, 0.05519294738769531, 0.05712604522705078, 0.05905914306640625, 0.06099224090576172, 0.06292533874511719, 0.06485843658447266, 0.06679153442382812, 0.0687246322631836, 0.07065773010253906, 0.07259082794189453, 0.07452392578125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 57.0, 802.0, 134.0, 7.0, 3.0, 0.0, 1.0, 1.0], "bins": [-5.617735862731934, -5.520354270935059, -5.422972679138184, -5.325591087341309, -5.228209495544434, -5.130828380584717, -5.033446788787842, -4.936065196990967, -4.838683605194092, -4.741302013397217, -4.643920421600342, -4.546538829803467, -4.44915771484375, -4.351776123046875, -4.25439453125, -4.157012939453125, -4.05963134765625, -3.962249755859375, -3.8648681640625, -3.767486810684204, -3.670105218887329, -3.572723627090454, -3.475342273712158, -3.377960681915283, -3.280579090118408, -3.183197498321533, -3.085815906524658, -2.9884345531463623, -2.8910529613494873, -2.7936713695526123, -2.6962900161743164, -2.5989084243774414, -2.5015268325805664, -2.4041452407836914, -2.3067636489868164, -2.2093822956085205, -2.1120007038116455, -2.0146191120147705, -1.917237639427185, -1.8198561668395996, -1.7224745750427246, -1.6250929832458496, -1.5277115106582642, -1.4303300380706787, -1.3329484462738037, -1.2355668544769287, -1.1381853818893433, -1.0408039093017578, -0.9434223771095276, -0.8460408449172974, -0.7486593127250671, -0.6512777805328369, -0.5538962483406067, -0.45651471614837646, -0.35913318395614624, -0.261751651763916, -0.1643701195716858, -0.06698858737945557, 0.030392944812774658, 0.12777447700500488, 0.2251560091972351, 0.32253754138946533, 0.41991907358169556, 0.5173006057739258, 0.614682137966156]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 4.0, 10.0, 10.0, 13.0, 11.0, 15.0, 24.0, 12.0, 22.0, 31.0, 39.0, 42.0, 43.0, 53.0, 43.0, 48.0, 60.0, 46.0, 56.0, 48.0, 42.0, 49.0, 38.0, 38.0, 30.0, 26.0, 24.0, 25.0, 21.0, 9.0, 14.0, 9.0, 8.0, 8.0, 4.0, 8.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6214073896408081, -0.602865993976593, -0.5843246579170227, -0.5657832622528076, -0.5472419261932373, -0.5287005305290222, -0.5101591944694519, -0.4916177988052368, -0.4730764329433441, -0.4545350670814514, -0.4359937012195587, -0.417452335357666, -0.3989109396934509, -0.3803696036338806, -0.3618282079696655, -0.3432868421077728, -0.3247454762458801, -0.3062041103839874, -0.2876627445220947, -0.269121378660202, -0.2505800127983093, -0.23203863203525543, -0.21349725127220154, -0.19495588541030884, -0.17641451954841614, -0.15787315368652344, -0.13933178782463074, -0.12079040706157684, -0.10224904119968414, -0.08370767533779144, -0.06516630202531815, -0.04662492871284485, -0.02808356285095215, -0.00954219326376915, 0.008999176323413849, 0.027540545910596848, 0.046081915497779846, 0.06462328135967255, 0.08316465467214584, 0.10170602798461914, 0.12024739384651184, 0.13878875970840454, 0.15733012557029724, 0.17587150633335114, 0.19441287219524384, 0.21295423805713654, 0.23149561882019043, 0.25003698468208313, 0.26857835054397583, 0.28711971640586853, 0.30566108226776123, 0.32420244812965393, 0.34274381399154663, 0.3612852096557617, 0.3798265755176544, 0.3983679413795471, 0.4169093072414398, 0.4354506731033325, 0.4539920389652252, 0.4725334048271179, 0.491074800491333, 0.5096161365509033, 0.5281575322151184, 0.5466989278793335, 0.5652402639389038]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 7.0, 7.0, 9.0, 17.0, 25.0, 27.0, 52.0, 56.0, 104.0, 173.0, 260.0, 539.0, 1145.0, 2814.0, 9612.0, 65903.0, 3921633.0, 170905.0, 15050.0, 3604.0, 1310.0, 481.0, 242.0, 128.0, 57.0, 34.0, 31.0, 15.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2491455078125, -0.2431621551513672, -0.23717880249023438, -0.23119544982910156, -0.22521209716796875, -0.21922874450683594, -0.21324539184570312, -0.2072620391845703, -0.2012786865234375, -0.1952953338623047, -0.18931198120117188, -0.18332862854003906, -0.17734527587890625, -0.17136192321777344, -0.16537857055664062, -0.1593952178955078, -0.153411865234375, -0.1474285125732422, -0.14144515991210938, -0.13546180725097656, -0.12947845458984375, -0.12349510192871094, -0.11751174926757812, -0.11152839660644531, -0.1055450439453125, -0.09956169128417969, -0.09357833862304688, -0.08759498596191406, -0.08161163330078125, -0.07562828063964844, -0.06964492797851562, -0.06366157531738281, -0.05767822265625, -0.05169486999511719, -0.045711517333984375, -0.03972816467285156, -0.03374481201171875, -0.027761459350585938, -0.021778106689453125, -0.015794754028320312, -0.0098114013671875, -0.0038280487060546875, 0.002155303955078125, 0.008138656616210938, 0.01412200927734375, 0.020105361938476562, 0.026088714599609375, 0.03207206726074219, 0.038055419921875, 0.04403877258300781, 0.050022125244140625, 0.05600547790527344, 0.06198883056640625, 0.06797218322753906, 0.07395553588867188, 0.07993888854980469, 0.0859222412109375, 0.09190559387207031, 0.09788894653320312, 0.10387229919433594, 0.10985565185546875, 0.11583900451660156, 0.12182235717773438, 0.1278057098388672, 0.1337890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 11.0, 12.0, 32.0, 40.0, 47.0, 60.0, 87.0, 119.0, 124.0, 106.0, 91.0, 77.0, 79.0, 40.0, 32.0, 19.0, 15.0, 9.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.0750732421875, -0.0735311508178711, -0.07198905944824219, -0.07044696807861328, -0.06890487670898438, -0.06736278533935547, -0.06582069396972656, -0.06427860260009766, -0.06273651123046875, -0.061194419860839844, -0.05965232849121094, -0.05811023712158203, -0.056568145751953125, -0.05502605438232422, -0.05348396301269531, -0.051941871643066406, -0.0503997802734375, -0.048857688903808594, -0.04731559753417969, -0.04577350616455078, -0.044231414794921875, -0.04268932342529297, -0.04114723205566406, -0.039605140686035156, -0.03806304931640625, -0.036520957946777344, -0.03497886657714844, -0.03343677520751953, -0.031894683837890625, -0.03035259246826172, -0.028810501098632812, -0.027268409729003906, -0.025726318359375, -0.024184226989746094, -0.022642135620117188, -0.02110004425048828, -0.019557952880859375, -0.01801586151123047, -0.016473770141601562, -0.014931678771972656, -0.01338958740234375, -0.011847496032714844, -0.010305404663085938, -0.008763313293457031, -0.007221221923828125, -0.005679130554199219, -0.0041370391845703125, -0.0025949478149414062, -0.0010528564453125, 0.0004892349243164062, 0.0020313262939453125, 0.0035734176635742188, 0.005115509033203125, 0.006657600402832031, 0.008199691772460938, 0.009741783142089844, 0.01128387451171875, 0.012825965881347656, 0.014368057250976562, 0.01591014862060547, 0.017452239990234375, 0.01899433135986328, 0.020536422729492188, 0.022078514099121094, 0.02362060546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 9.0, 30.0, 34.0, 67.0, 87.0, 184.0, 485.0, 1849.0, 24486.0, 4149300.0, 15828.0, 1332.0, 315.0, 129.0, 59.0, 27.0, 23.0, 15.0, 7.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.40299224853515625, -0.3909454345703125, -0.37889862060546875, -0.366851806640625, -0.35480499267578125, -0.3427581787109375, -0.33071136474609375, -0.31866455078125, -0.30661773681640625, -0.2945709228515625, -0.28252410888671875, -0.270477294921875, -0.25843048095703125, -0.2463836669921875, -0.23433685302734375, -0.2222900390625, -0.21024322509765625, -0.1981964111328125, -0.18614959716796875, -0.174102783203125, -0.16205596923828125, -0.1500091552734375, -0.13796234130859375, -0.12591552734375, -0.11386871337890625, -0.1018218994140625, -0.08977508544921875, -0.077728271484375, -0.06568145751953125, -0.0536346435546875, -0.04158782958984375, -0.029541015625, -0.01749420166015625, -0.0054473876953125, 0.00659942626953125, 0.018646240234375, 0.03069305419921875, 0.0427398681640625, 0.05478668212890625, 0.06683349609375, 0.07888031005859375, 0.0909271240234375, 0.10297393798828125, 0.115020751953125, 0.12706756591796875, 0.1391143798828125, 0.15116119384765625, 0.1632080078125, 0.17525482177734375, 0.1873016357421875, 0.19934844970703125, 0.211395263671875, 0.22344207763671875, 0.2354888916015625, 0.24753570556640625, 0.25958251953125, 0.27162933349609375, 0.2836761474609375, 0.29572296142578125, 0.307769775390625, 0.31981658935546875, 0.3318634033203125, 0.34391021728515625, 0.35595703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 15.0, 19.0, 48.0, 140.0, 904.0, 2490.0, 281.0, 74.0, 43.0, 14.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 5.0], "bins": [-0.20458984375, -0.20059585571289062, -0.19660186767578125, -0.19260787963867188, -0.1886138916015625, -0.18461990356445312, -0.18062591552734375, -0.17663192749023438, -0.172637939453125, -0.16864395141601562, -0.16464996337890625, -0.16065597534179688, -0.1566619873046875, -0.15266799926757812, -0.14867401123046875, -0.14468002319335938, -0.14068603515625, -0.13669204711914062, -0.13269805908203125, -0.12870407104492188, -0.1247100830078125, -0.12071609497070312, -0.11672210693359375, -0.11272811889648438, -0.108734130859375, -0.10474014282226562, -0.10074615478515625, -0.09675216674804688, -0.0927581787109375, -0.08876419067382812, -0.08477020263671875, -0.08077621459960938, -0.0767822265625, -0.07278823852539062, -0.06879425048828125, -0.06480026245117188, -0.0608062744140625, -0.056812286376953125, -0.05281829833984375, -0.048824310302734375, -0.044830322265625, -0.040836334228515625, -0.03684234619140625, -0.032848358154296875, -0.0288543701171875, -0.024860382080078125, -0.02086639404296875, -0.016872406005859375, -0.01287841796875, -0.008884429931640625, -0.00489044189453125, -0.000896453857421875, 0.0030975341796875, 0.007091522216796875, 0.01108551025390625, 0.015079498291015625, 0.019073486328125, 0.023067474365234375, 0.02706146240234375, 0.031055450439453125, 0.0350494384765625, 0.039043426513671875, 0.04303741455078125, 0.047031402587890625, 0.051025390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 24.0, 572.0, 393.0, 15.0, 5.0, 1.0, 4.0], "bins": [-2.8906402587890625, -2.8415651321411133, -2.792490005493164, -2.7434146404266357, -2.6943395137786865, -2.6452643871307373, -2.596189022064209, -2.5471138954162598, -2.4980387687683105, -2.4489636421203613, -2.399888515472412, -2.350813150405884, -2.3017380237579346, -2.2526628971099854, -2.203587532043457, -2.154512405395508, -2.1054372787475586, -2.0563621520996094, -2.00728702545166, -1.9582116603851318, -1.9091365337371826, -1.8600614070892334, -1.8109861612319946, -1.7619109153747559, -1.7128357887268066, -1.6637606620788574, -1.6146854162216187, -1.5656101703643799, -1.5165350437164307, -1.4674599170684814, -1.4183846712112427, -1.369309425354004, -1.3202342987060547, -1.2711591720581055, -1.2220839262008667, -1.173008680343628, -1.1239335536956787, -1.0748584270477295, -1.0257831811904907, -0.9767079949378967, -0.9276328682899475, -0.8785576820373535, -0.8294824957847595, -0.7804073095321655, -0.7313321232795715, -0.6822569370269775, -0.6331817507743835, -0.5841065645217896, -0.5350313782691956, -0.48595619201660156, -0.43688100576400757, -0.3878058195114136, -0.3387306332588196, -0.2896554470062256, -0.2405802607536316, -0.1915050745010376, -0.1424298882484436, -0.09335470199584961, -0.044279515743255615, 0.004795670509338379, 0.05387085676193237, 0.10294604301452637, 0.15202122926712036, 0.20109641551971436, 0.25017160177230835]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 15.0, 25.0, 26.0, 50.0, 67.0, 82.0, 104.0, 114.0, 120.0, 88.0, 107.0, 70.0, 56.0, 30.0, 13.0, 16.0, 7.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765163064002991, -0.4609263241291046, -0.44533634185791016, -0.4297463893890381, -0.41415640711784363, -0.39856642484664917, -0.3829764425754547, -0.36738646030426025, -0.3517965078353882, -0.3362065255641937, -0.32061654329299927, -0.3050265908241272, -0.28943660855293274, -0.2738466262817383, -0.2582566440105438, -0.24266666173934937, -0.2270766794681549, -0.21148669719696045, -0.19589672982692719, -0.18030674755573273, -0.16471678018569946, -0.149126797914505, -0.13353681564331055, -0.11794684082269669, -0.10235686600208282, -0.08676689118146896, -0.0711769163608551, -0.055586934089660645, -0.03999695926904678, -0.024406984448432922, -0.008817002177238464, 0.006772972643375397, 0.022362947463989258, 0.03795292228460312, 0.05354290083050728, 0.06913287937641144, 0.0847228541970253, 0.10031282901763916, 0.11590281128883362, 0.13149279356002808, 0.14708276093006134, 0.1626727432012558, 0.17826271057128906, 0.19385269284248352, 0.20944267511367798, 0.22503264248371124, 0.2406226247549057, 0.25621259212493896, 0.2718025743961334, 0.2873925566673279, 0.30298253893852234, 0.3185725212097168, 0.33416247367858887, 0.3497524559497833, 0.3653424382209778, 0.38093242049217224, 0.3965224027633667, 0.41211238503456116, 0.4277023673057556, 0.4432923197746277, 0.45888230204582214, 0.4744722843170166, 0.49006226658821106, 0.5056522488594055, 0.5212422013282776]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 8.0, 8.0, 12.0, 23.0, 25.0, 31.0, 41.0, 66.0, 112.0, 152.0, 255.0, 534.0, 1081.0, 2894.0, 11898.0, 84208.0, 715814.0, 202119.0, 21780.0, 4532.0, 1417.0, 636.0, 309.0, 174.0, 134.0, 87.0, 52.0, 37.0, 20.0, 33.0, 14.0, 13.0, 18.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12555217742919922, -0.12170982360839844, -0.11786746978759766, -0.11402511596679688, -0.1101827621459961, -0.10634040832519531, -0.10249805450439453, -0.09865570068359375, -0.09481334686279297, -0.09097099304199219, -0.0871286392211914, -0.08328628540039062, -0.07944393157958984, -0.07560157775878906, -0.07175922393798828, -0.0679168701171875, -0.06407451629638672, -0.06023216247558594, -0.056389808654785156, -0.052547454833984375, -0.048705101013183594, -0.04486274719238281, -0.04102039337158203, -0.03717803955078125, -0.03333568572998047, -0.029493331909179688, -0.025650978088378906, -0.021808624267578125, -0.017966270446777344, -0.014123916625976562, -0.010281562805175781, -0.006439208984375, -0.0025968551635742188, 0.0012454986572265625, 0.005087852478027344, 0.008930206298828125, 0.012772560119628906, 0.016614913940429688, 0.02045726776123047, 0.02429962158203125, 0.02814197540283203, 0.03198432922363281, 0.035826683044433594, 0.039669036865234375, 0.043511390686035156, 0.04735374450683594, 0.05119609832763672, 0.0550384521484375, 0.05888080596923828, 0.06272315979003906, 0.06656551361083984, 0.07040786743164062, 0.0742502212524414, 0.07809257507324219, 0.08193492889404297, 0.08577728271484375, 0.08961963653564453, 0.09346199035644531, 0.0973043441772461, 0.10114669799804688, 0.10498905181884766, 0.10883140563964844, 0.11267375946044922, 0.11651611328125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 12.0, 19.0, 30.0, 39.0, 58.0, 69.0, 97.0, 106.0, 113.0, 106.0, 84.0, 85.0, 67.0, 42.0, 36.0, 10.0, 16.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.061370849609375, -0.059990882873535156, -0.05861091613769531, -0.05723094940185547, -0.055850982666015625, -0.05447101593017578, -0.05309104919433594, -0.051711082458496094, -0.05033111572265625, -0.048951148986816406, -0.04757118225097656, -0.04619121551513672, -0.044811248779296875, -0.04343128204345703, -0.04205131530761719, -0.040671348571777344, -0.0392913818359375, -0.037911415100097656, -0.03653144836425781, -0.03515148162841797, -0.033771514892578125, -0.03239154815673828, -0.031011581420898438, -0.029631614685058594, -0.02825164794921875, -0.026871681213378906, -0.025491714477539062, -0.02411174774169922, -0.022731781005859375, -0.02135181427001953, -0.019971847534179688, -0.018591880798339844, -0.0172119140625, -0.015831947326660156, -0.014451980590820312, -0.013072013854980469, -0.011692047119140625, -0.010312080383300781, -0.008932113647460938, -0.007552146911621094, -0.00617218017578125, -0.004792213439941406, -0.0034122467041015625, -0.0020322799682617188, -0.000652313232421875, 0.0007276535034179688, 0.0021076202392578125, 0.0034875869750976562, 0.0048675537109375, 0.006247520446777344, 0.0076274871826171875, 0.009007453918457031, 0.010387420654296875, 0.011767387390136719, 0.013147354125976562, 0.014527320861816406, 0.01590728759765625, 0.017287254333496094, 0.018667221069335938, 0.02004718780517578, 0.021427154541015625, 0.02280712127685547, 0.024187088012695312, 0.025567054748535156, 0.026947021484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 9.0, 15.0, 20.0, 38.0, 59.0, 89.0, 129.0, 207.0, 299.0, 559.0, 1106.0, 2405.0, 5978.0, 17021.0, 52773.0, 207313.0, 496022.0, 189882.0, 48567.0, 15794.0, 5531.0, 2288.0, 1033.0, 559.0, 314.0, 176.0, 114.0, 77.0, 62.0, 33.0, 24.0, 20.0, 12.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04803466796875, -0.04645824432373047, -0.04488182067871094, -0.043305397033691406, -0.041728973388671875, -0.040152549743652344, -0.03857612609863281, -0.03699970245361328, -0.03542327880859375, -0.03384685516357422, -0.03227043151855469, -0.030694007873535156, -0.029117584228515625, -0.027541160583496094, -0.025964736938476562, -0.02438831329345703, -0.0228118896484375, -0.02123546600341797, -0.019659042358398438, -0.018082618713378906, -0.016506195068359375, -0.014929771423339844, -0.013353347778320312, -0.011776924133300781, -0.01020050048828125, -0.008624076843261719, -0.0070476531982421875, -0.005471229553222656, -0.003894805908203125, -0.0023183822631835938, -0.0007419586181640625, 0.0008344650268554688, 0.002410888671875, 0.003987312316894531, 0.0055637359619140625, 0.007140159606933594, 0.008716583251953125, 0.010293006896972656, 0.011869430541992188, 0.013445854187011719, 0.01502227783203125, 0.01659870147705078, 0.018175125122070312, 0.019751548767089844, 0.021327972412109375, 0.022904396057128906, 0.024480819702148438, 0.02605724334716797, 0.0276336669921875, 0.02921009063720703, 0.030786514282226562, 0.032362937927246094, 0.033939361572265625, 0.035515785217285156, 0.03709220886230469, 0.03866863250732422, 0.04024505615234375, 0.04182147979736328, 0.04339790344238281, 0.044974327087402344, 0.046550750732421875, 0.048127174377441406, 0.04970359802246094, 0.05128002166748047, 0.0528564453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 2.0, 7.0, 11.0, 23.0, 18.0, 15.0, 23.0, 33.0, 40.0, 34.0, 40.0, 50.0, 54.0, 60.0, 68.0, 49.0, 60.0, 45.0, 50.0, 52.0, 54.0, 43.0, 33.0, 20.0, 24.0, 31.0, 17.0, 10.0, 10.0, 9.0, 14.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10089111328125, -0.09786510467529297, -0.09483909606933594, -0.0918130874633789, -0.08878707885742188, -0.08576107025146484, -0.08273506164550781, -0.07970905303955078, -0.07668304443359375, -0.07365703582763672, -0.07063102722167969, -0.06760501861572266, -0.06457901000976562, -0.061553001403808594, -0.05852699279785156, -0.05550098419189453, -0.0524749755859375, -0.04944896697998047, -0.04642295837402344, -0.043396949768066406, -0.040370941162109375, -0.037344932556152344, -0.03431892395019531, -0.03129291534423828, -0.02826690673828125, -0.02524089813232422, -0.022214889526367188, -0.019188880920410156, -0.016162872314453125, -0.013136863708496094, -0.010110855102539062, -0.007084846496582031, -0.004058837890625, -0.0010328292846679688, 0.0019931793212890625, 0.005019187927246094, 0.008045196533203125, 0.011071205139160156, 0.014097213745117188, 0.01712322235107422, 0.02014923095703125, 0.02317523956298828, 0.026201248168945312, 0.029227256774902344, 0.032253265380859375, 0.035279273986816406, 0.03830528259277344, 0.04133129119873047, 0.0443572998046875, 0.04738330841064453, 0.05040931701660156, 0.053435325622558594, 0.056461334228515625, 0.059487342834472656, 0.06251335144042969, 0.06553936004638672, 0.06856536865234375, 0.07159137725830078, 0.07461738586425781, 0.07764339447021484, 0.08066940307617188, 0.0836954116821289, 0.08672142028808594, 0.08974742889404297, 0.0927734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 6.0, 14.0, 23.0, 41.0, 74.0, 108.0, 203.0, 309.0, 633.0, 1448.0, 4747.0, 23493.0, 221114.0, 648173.0, 127022.0, 15378.0, 3365.0, 1147.0, 550.0, 286.0, 156.0, 104.0, 56.0, 42.0, 21.0, 15.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252227783203125, -0.024489164352416992, -0.023755550384521484, -0.023021936416625977, -0.02228832244873047, -0.02155470848083496, -0.020821094512939453, -0.020087480545043945, -0.019353866577148438, -0.01862025260925293, -0.017886638641357422, -0.017153024673461914, -0.016419410705566406, -0.0156857967376709, -0.01495218276977539, -0.014218568801879883, -0.013484954833984375, -0.012751340866088867, -0.01201772689819336, -0.011284112930297852, -0.010550498962402344, -0.009816884994506836, -0.009083271026611328, -0.00834965705871582, -0.0076160430908203125, -0.006882429122924805, -0.006148815155029297, -0.005415201187133789, -0.004681587219238281, -0.0039479732513427734, -0.0032143592834472656, -0.002480745315551758, -0.00174713134765625, -0.0010135173797607422, -0.0002799034118652344, 0.00045371055603027344, 0.0011873245239257812, 0.001920938491821289, 0.002654552459716797, 0.0033881664276123047, 0.0041217803955078125, 0.00485539436340332, 0.005589008331298828, 0.006322622299194336, 0.007056236267089844, 0.0077898502349853516, 0.00852346420288086, 0.009257078170776367, 0.009990692138671875, 0.010724306106567383, 0.01145792007446289, 0.012191534042358398, 0.012925148010253906, 0.013658761978149414, 0.014392375946044922, 0.01512598991394043, 0.015859603881835938, 0.016593217849731445, 0.017326831817626953, 0.01806044578552246, 0.01879405975341797, 0.019527673721313477, 0.020261287689208984, 0.020994901657104492, 0.021728515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 8.0, 6.0, 17.0, 17.0, 25.0, 24.0, 41.0, 50.0, 65.0, 49.0, 81.0, 89.0, 86.0, 79.0, 49.0, 50.0, 65.0, 47.0, 30.0, 36.0, 23.0, 18.0, 11.0, 15.0, 9.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.212162017822266e-06, -6.987713277339935e-06, -6.763264536857605e-06, -6.538815796375275e-06, -6.314367055892944e-06, -6.089918315410614e-06, -5.865469574928284e-06, -5.641020834445953e-06, -5.416572093963623e-06, -5.192123353481293e-06, -4.967674612998962e-06, -4.743225872516632e-06, -4.518777132034302e-06, -4.2943283915519714e-06, -4.069879651069641e-06, -3.845430910587311e-06, -3.6209821701049805e-06, -3.39653342962265e-06, -3.17208468914032e-06, -2.9476359486579895e-06, -2.723187208175659e-06, -2.498738467693329e-06, -2.2742897272109985e-06, -2.0498409867286682e-06, -1.8253922462463379e-06, -1.6009435057640076e-06, -1.3764947652816772e-06, -1.152046024799347e-06, -9.275972843170166e-07, -7.031485438346863e-07, -4.78699803352356e-07, -2.5425106287002563e-07, -2.9802322387695312e-08, 1.94646418094635e-07, 4.1909515857696533e-07, 6.435438990592957e-07, 8.67992639541626e-07, 1.0924413800239563e-06, 1.3168901205062866e-06, 1.541338860988617e-06, 1.7657876014709473e-06, 1.9902363419532776e-06, 2.214685082435608e-06, 2.4391338229179382e-06, 2.6635825634002686e-06, 2.888031303882599e-06, 3.112480044364929e-06, 3.3369287848472595e-06, 3.56137752532959e-06, 3.78582626581192e-06, 4.0102750062942505e-06, 4.234723746776581e-06, 4.459172487258911e-06, 4.6836212277412415e-06, 4.908069968223572e-06, 5.132518708705902e-06, 5.356967449188232e-06, 5.581416189670563e-06, 5.805864930152893e-06, 6.030313670635223e-06, 6.254762411117554e-06, 6.479211151599884e-06, 6.703659892082214e-06, 6.928108632564545e-06, 7.152557373046875e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 5.0, 20.0, 17.0, 24.0, 42.0, 96.0, 125.0, 254.0, 537.0, 1204.0, 3319.0, 11240.0, 67108.0, 450738.0, 434500.0, 63223.0, 10698.0, 3112.0, 1175.0, 503.0, 234.0, 149.0, 65.0, 54.0, 28.0, 14.0, 12.0, 10.0, 5.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.020751953125, -0.02008223533630371, -0.019412517547607422, -0.018742799758911133, -0.018073081970214844, -0.017403364181518555, -0.016733646392822266, -0.016063928604125977, -0.015394210815429688, -0.014724493026733398, -0.01405477523803711, -0.01338505744934082, -0.012715339660644531, -0.012045621871948242, -0.011375904083251953, -0.010706186294555664, -0.010036468505859375, -0.009366750717163086, -0.008697032928466797, -0.008027315139770508, -0.007357597351074219, -0.00668787956237793, -0.006018161773681641, -0.0053484439849853516, -0.0046787261962890625, -0.0040090084075927734, -0.0033392906188964844, -0.0026695728302001953, -0.0019998550415039062, -0.0013301372528076172, -0.0006604194641113281, 9.298324584960938e-06, 0.00067901611328125, 0.001348733901977539, 0.002018451690673828, 0.002688169479370117, 0.0033578872680664062, 0.004027605056762695, 0.004697322845458984, 0.0053670406341552734, 0.0060367584228515625, 0.0067064762115478516, 0.007376194000244141, 0.00804591178894043, 0.008715629577636719, 0.009385347366333008, 0.010055065155029297, 0.010724782943725586, 0.011394500732421875, 0.012064218521118164, 0.012733936309814453, 0.013403654098510742, 0.014073371887207031, 0.01474308967590332, 0.01541280746459961, 0.0160825252532959, 0.016752243041992188, 0.017421960830688477, 0.018091678619384766, 0.018761396408081055, 0.019431114196777344, 0.020100831985473633, 0.020770549774169922, 0.02144026756286621, 0.0221099853515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 17.0, 15.0, 35.0, 34.0, 48.0, 60.0, 72.0, 110.0, 97.0, 111.0, 108.0, 67.0, 58.0, 57.0, 26.0, 25.0, 18.0, 12.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0243682861328125, -0.02360367774963379, -0.022839069366455078, -0.022074460983276367, -0.021309852600097656, -0.020545244216918945, -0.019780635833740234, -0.019016027450561523, -0.018251419067382812, -0.0174868106842041, -0.01672220230102539, -0.01595759391784668, -0.015192985534667969, -0.014428377151489258, -0.013663768768310547, -0.012899160385131836, -0.012134552001953125, -0.011369943618774414, -0.010605335235595703, -0.009840726852416992, -0.009076118469238281, -0.00831151008605957, -0.007546901702880859, -0.0067822933197021484, -0.0060176849365234375, -0.0052530765533447266, -0.004488468170166016, -0.0037238597869873047, -0.0029592514038085938, -0.002194643020629883, -0.0014300346374511719, -0.0006654262542724609, 9.918212890625e-05, 0.0008637905120849609, 0.0016283988952636719, 0.002393007278442383, 0.0031576156616210938, 0.003922224044799805, 0.004686832427978516, 0.0054514408111572266, 0.0062160491943359375, 0.0069806575775146484, 0.007745265960693359, 0.00850987434387207, 0.009274482727050781, 0.010039091110229492, 0.010803699493408203, 0.011568307876586914, 0.012332916259765625, 0.013097524642944336, 0.013862133026123047, 0.014626741409301758, 0.015391349792480469, 0.01615595817565918, 0.01692056655883789, 0.0176851749420166, 0.018449783325195312, 0.019214391708374023, 0.019979000091552734, 0.020743608474731445, 0.021508216857910156, 0.022272825241088867, 0.023037433624267578, 0.02380204200744629, 0.024566650390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 6.0, 3.0, 4.0, 4.0, 8.0, 16.0, 23.0, 41.0, 79.0, 139.0, 151.0, 168.0, 135.0, 82.0, 57.0, 32.0, 21.0, 14.0, 9.0, 3.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1647200584411621, -0.15388451516628265, -0.143048956990242, -0.13221341371536255, -0.1213778704404831, -0.11054231971502304, -0.09970676898956299, -0.08887122571468353, -0.07803567498922348, -0.06720012426376343, -0.05636458098888397, -0.04552903026342392, -0.034693483263254166, -0.02385793626308441, -0.013022385537624359, -0.0021868422627449036, 0.008648708462715149, 0.019484255462884903, 0.030319804325699806, 0.04115535318851471, 0.051990900188684464, 0.06282644718885422, 0.07366199791431427, 0.08449754118919373, 0.09533309191465378, 0.10616864264011383, 0.11700418591499329, 0.12783974409103394, 0.1386752873659134, 0.14951083064079285, 0.1603463888168335, 0.17118191719055176, 0.1820174753665924, 0.19285301864147186, 0.2036885768175125, 0.21452412009239197, 0.22535966336727142, 0.23619520664215088, 0.24703076481819153, 0.2578663229942322, 0.26870185136795044, 0.2795374095439911, 0.29037293791770935, 0.30120849609375, 0.31204405426979065, 0.3228795826435089, 0.33371514081954956, 0.3445506691932678, 0.35538625717163086, 0.3662218153476715, 0.37705734372138977, 0.3878929018974304, 0.39872846007347107, 0.40956398844718933, 0.42039954662323, 0.43123507499694824, 0.4420706331729889, 0.45290619134902954, 0.4637417197227478, 0.47457727789878845, 0.4854128360748291, 0.49624836444854736, 0.5070838928222656, 0.5179194808006287, 0.5287550091743469]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 6.0, 5.0, 18.0, 13.0, 17.0, 20.0, 21.0, 25.0, 42.0, 38.0, 43.0, 49.0, 52.0, 68.0, 53.0, 49.0, 58.0, 65.0, 53.0, 59.0, 46.0, 36.0, 32.0, 27.0, 29.0, 24.0, 13.0, 13.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4435855746269226, -0.4261478781700134, -0.40871018171310425, -0.39127248525619507, -0.3738347887992859, -0.3563970923423767, -0.3389594256877899, -0.32152172923088074, -0.30408403277397156, -0.2866463363170624, -0.2692086398601532, -0.251770943403244, -0.23433326184749603, -0.21689556539058685, -0.19945788383483887, -0.1820201873779297, -0.1645824909210205, -0.14714479446411133, -0.12970709800720215, -0.11226941645145416, -0.09483171999454498, -0.0773940235376358, -0.05995633453130722, -0.04251864552497864, -0.025080949068069458, -0.007643256336450577, 0.009794436395168304, 0.027232129126787186, 0.04466982185840607, 0.06210751831531525, 0.07954520732164383, 0.09698289632797241, 0.11442053318023682, 0.131858229637146, 0.14929592609405518, 0.16673360764980316, 0.18417130410671234, 0.20160900056362152, 0.2190466821193695, 0.2364843785762787, 0.25392207503318787, 0.27135977149009705, 0.2887974679470062, 0.3062351644039154, 0.3236728310585022, 0.3411105275154114, 0.35854822397232056, 0.37598592042922974, 0.3934236168861389, 0.4108613133430481, 0.4282990097999573, 0.44573670625686646, 0.46317440271377563, 0.4806120991706848, 0.4980497658252716, 0.5154874324798584, 0.5329251289367676, 0.5503628253936768, 0.5678005218505859, 0.5852382183074951, 0.6026759147644043, 0.6201136112213135, 0.6375513076782227, 0.6549890041351318, 0.672426700592041]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 11.0, 14.0, 12.0, 29.0, 40.0, 53.0, 101.0, 289.0, 734.0, 2815.0, 20437.0, 3619122.0, 536030.0, 11921.0, 1844.0, 497.0, 159.0, 84.0, 48.0, 25.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.186767578125, -0.18260669708251953, -0.17844581604003906, -0.1742849349975586, -0.17012405395507812, -0.16596317291259766, -0.1618022918701172, -0.15764141082763672, -0.15348052978515625, -0.14931964874267578, -0.1451587677001953, -0.14099788665771484, -0.13683700561523438, -0.1326761245727539, -0.12851524353027344, -0.12435436248779297, -0.1201934814453125, -0.11603260040283203, -0.11187171936035156, -0.1077108383178711, -0.10354995727539062, -0.09938907623291016, -0.09522819519042969, -0.09106731414794922, -0.08690643310546875, -0.08274555206298828, -0.07858467102050781, -0.07442378997802734, -0.07026290893554688, -0.0661020278930664, -0.06194114685058594, -0.05778026580810547, -0.053619384765625, -0.04945850372314453, -0.04529762268066406, -0.041136741638183594, -0.036975860595703125, -0.032814979553222656, -0.028654098510742188, -0.02449321746826172, -0.02033233642578125, -0.01617145538330078, -0.012010574340820312, -0.007849693298339844, -0.003688812255859375, 0.00047206878662109375, 0.0046329498291015625, 0.008793830871582031, 0.0129547119140625, 0.01711559295654297, 0.021276473999023438, 0.025437355041503906, 0.029598236083984375, 0.033759117126464844, 0.03791999816894531, 0.04208087921142578, 0.04624176025390625, 0.05040264129638672, 0.05456352233886719, 0.058724403381347656, 0.06288528442382812, 0.0670461654663086, 0.07120704650878906, 0.07536792755126953, 0.07952880859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 15.0, 13.0, 14.0, 24.0, 38.0, 51.0, 65.0, 93.0, 102.0, 98.0, 95.0, 105.0, 90.0, 56.0, 49.0, 39.0, 25.0, 11.0, 12.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.05865478515625, -0.0573124885559082, -0.055970191955566406, -0.05462789535522461, -0.05328559875488281, -0.051943302154541016, -0.05060100555419922, -0.04925870895385742, -0.047916412353515625, -0.04657411575317383, -0.04523181915283203, -0.043889522552490234, -0.04254722595214844, -0.04120492935180664, -0.039862632751464844, -0.03852033615112305, -0.03717803955078125, -0.03583574295043945, -0.034493446350097656, -0.03315114974975586, -0.03180885314941406, -0.030466556549072266, -0.02912425994873047, -0.027781963348388672, -0.026439666748046875, -0.025097370147705078, -0.02375507354736328, -0.022412776947021484, -0.021070480346679688, -0.01972818374633789, -0.018385887145996094, -0.017043590545654297, -0.0157012939453125, -0.014358997344970703, -0.013016700744628906, -0.01167440414428711, -0.010332107543945312, -0.008989810943603516, -0.007647514343261719, -0.006305217742919922, -0.004962921142578125, -0.003620624542236328, -0.0022783279418945312, -0.0009360313415527344, 0.0004062652587890625, 0.0017485618591308594, 0.0030908584594726562, 0.004433155059814453, 0.00577545166015625, 0.007117748260498047, 0.008460044860839844, 0.00980234146118164, 0.011144638061523438, 0.012486934661865234, 0.013829231262207031, 0.015171527862548828, 0.016513824462890625, 0.017856121063232422, 0.01919841766357422, 0.020540714263916016, 0.021883010864257812, 0.02322530746459961, 0.024567604064941406, 0.025909900665283203, 0.027252197265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 25.0, 25.0, 52.0, 67.0, 149.0, 553.0, 10915.0, 4173265.0, 8117.0, 560.0, 216.0, 136.0, 77.0, 44.0, 29.0, 7.0, 11.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.336669921875, -0.32791709899902344, -0.3191642761230469, -0.3104114532470703, -0.30165863037109375, -0.2929058074951172, -0.2841529846191406, -0.27540016174316406, -0.2666473388671875, -0.25789451599121094, -0.24914169311523438, -0.2403888702392578, -0.23163604736328125, -0.2228832244873047, -0.21413040161132812, -0.20537757873535156, -0.196624755859375, -0.18787193298339844, -0.17911911010742188, -0.1703662872314453, -0.16161346435546875, -0.1528606414794922, -0.14410781860351562, -0.13535499572753906, -0.1266021728515625, -0.11784934997558594, -0.10909652709960938, -0.10034370422363281, -0.09159088134765625, -0.08283805847167969, -0.07408523559570312, -0.06533241271972656, -0.05657958984375, -0.04782676696777344, -0.039073944091796875, -0.030321121215820312, -0.02156829833984375, -0.012815475463867188, -0.004062652587890625, 0.0046901702880859375, 0.0134429931640625, 0.022195816040039062, 0.030948638916015625, 0.03970146179199219, 0.04845428466796875, 0.05720710754394531, 0.06595993041992188, 0.07471275329589844, 0.083465576171875, 0.09221839904785156, 0.10097122192382812, 0.10972404479980469, 0.11847686767578125, 0.1272296905517578, 0.13598251342773438, 0.14473533630371094, 0.1534881591796875, 0.16224098205566406, 0.17099380493164062, 0.1797466278076172, 0.18849945068359375, 0.1972522735595703, 0.20600509643554688, 0.21475791931152344, 0.2235107421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 18.0, 136.0, 2993.0, 813.0, 86.0, 18.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037841796875, -0.034336090087890625, -0.03083038330078125, -0.027324676513671875, -0.0238189697265625, -0.020313262939453125, -0.01680755615234375, -0.013301849365234375, -0.009796142578125, -0.006290435791015625, -0.00278472900390625, 0.000720977783203125, 0.0042266845703125, 0.007732391357421875, 0.01123809814453125, 0.014743804931640625, 0.01824951171875, 0.021755218505859375, 0.02526092529296875, 0.028766632080078125, 0.0322723388671875, 0.035778045654296875, 0.03928375244140625, 0.042789459228515625, 0.046295166015625, 0.049800872802734375, 0.05330657958984375, 0.056812286376953125, 0.0603179931640625, 0.06382369995117188, 0.06732940673828125, 0.07083511352539062, 0.0743408203125, 0.07784652709960938, 0.08135223388671875, 0.08485794067382812, 0.0883636474609375, 0.09186935424804688, 0.09537506103515625, 0.09888076782226562, 0.102386474609375, 0.10589218139648438, 0.10939788818359375, 0.11290359497070312, 0.1164093017578125, 0.11991500854492188, 0.12342071533203125, 0.12692642211914062, 0.13043212890625, 0.13393783569335938, 0.13744354248046875, 0.14094924926757812, 0.1444549560546875, 0.14796066284179688, 0.15146636962890625, 0.15497207641601562, 0.158477783203125, 0.16198348999023438, 0.16548919677734375, 0.16899490356445312, 0.1725006103515625, 0.17600631713867188, 0.17951202392578125, 0.18301773071289062, 0.1865234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 8.0, 750.0, 246.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5908468961715698, -1.5464011430740356, -1.501955509185791, -1.4575097560882568, -1.4130640029907227, -1.3686182498931885, -1.3241724967956543, -1.2797268629074097, -1.2352811098098755, -1.1908353567123413, -1.1463897228240967, -1.1019439697265625, -1.0574982166290283, -1.0130524635314941, -0.9686067700386047, -0.9241610765457153, -0.8797153234481812, -0.835269570350647, -0.7908238768577576, -0.7463781833648682, -0.701932430267334, -0.6574866771697998, -0.6130409836769104, -0.568595290184021, -0.5241495370864868, -0.479703813791275, -0.43525809049606323, -0.39081236720085144, -0.34636664390563965, -0.30192092061042786, -0.25747519731521606, -0.21302947402000427, -0.16858363151550293, -0.12413790822029114, -0.07969218492507935, -0.035246461629867554, 0.009199261665344238, 0.05364498496055603, 0.09809070825576782, 0.14253643155097961, 0.1869821548461914, 0.2314278781414032, 0.275873601436615, 0.3203193247318268, 0.3647650480270386, 0.40921077132225037, 0.45365649461746216, 0.49810221791267395, 0.5425479412078857, 0.5869936943054199, 0.6314393877983093, 0.6758850812911987, 0.7203308343887329, 0.7647765874862671, 0.8092222809791565, 0.8536679744720459, 0.8981137275695801, 0.9425594806671143, 0.9870051741600037, 1.031450867652893, 1.0758966207504272, 1.1203423738479614, 1.164788007736206, 1.2092337608337402, 1.2536795139312744]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 19.0, 49.0, 117.0, 168.0, 212.0, 195.0, 121.0, 68.0, 35.0, 14.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47874999046325684, -0.4631764590740204, -0.44760289788246155, -0.4320293664932251, -0.41645583510398865, -0.4008822739124298, -0.38530874252319336, -0.3697351813316345, -0.35416164994239807, -0.3385881185531616, -0.3230145573616028, -0.30744102597236633, -0.2918674945831299, -0.27629393339157104, -0.2607204020023346, -0.24514685571193695, -0.2295733243227005, -0.21399977803230286, -0.1984262466430664, -0.18285270035266876, -0.16727915406227112, -0.15170562267303467, -0.13613207638263702, -0.12055853009223938, -0.10498499125242233, -0.08941145241260529, -0.07383790612220764, -0.058264367282390594, -0.04269082471728325, -0.027117282152175903, -0.011543743312358856, 0.004029802978038788, 0.019603341817855835, 0.03517688438296318, 0.050750426948070526, 0.06632396578788757, 0.08189751207828522, 0.09747105091810226, 0.11304458975791931, 0.12861813604831696, 0.1441916823387146, 0.15976522862911224, 0.1753387600183487, 0.19091230630874634, 0.20648585259914398, 0.22205939888954163, 0.23763293027877808, 0.2532064914703369, 0.268779993057251, 0.2843535244464874, 0.29992708563804626, 0.3155006170272827, 0.33107414841651917, 0.346647709608078, 0.36222124099731445, 0.3777948021888733, 0.39336833357810974, 0.4089418649673462, 0.42451542615890503, 0.4400889575481415, 0.45566248893737793, 0.47123605012893677, 0.4868095815181732, 0.5023831129074097, 0.5179566740989685]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 9.0, 10.0, 20.0, 14.0, 27.0, 36.0, 43.0, 62.0, 81.0, 109.0, 137.0, 241.0, 425.0, 660.0, 1131.0, 2315.0, 5547.0, 16767.0, 59090.0, 269562.0, 500384.0, 139620.0, 34291.0, 10214.0, 3813.0, 1596.0, 838.0, 521.0, 330.0, 212.0, 112.0, 97.0, 62.0, 53.0, 28.0, 24.0, 20.0, 14.0, 7.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.066650390625, -0.06464815139770508, -0.06264591217041016, -0.060643672943115234, -0.05864143371582031, -0.05663919448852539, -0.05463695526123047, -0.05263471603393555, -0.050632476806640625, -0.0486302375793457, -0.04662799835205078, -0.04462575912475586, -0.04262351989746094, -0.040621280670166016, -0.038619041442871094, -0.03661680221557617, -0.03461456298828125, -0.03261232376098633, -0.030610084533691406, -0.028607845306396484, -0.026605606079101562, -0.02460336685180664, -0.02260112762451172, -0.020598888397216797, -0.018596649169921875, -0.016594409942626953, -0.014592170715332031, -0.01258993148803711, -0.010587692260742188, -0.008585453033447266, -0.006583213806152344, -0.004580974578857422, -0.0025787353515625, -0.0005764961242675781, 0.0014257431030273438, 0.0034279823303222656, 0.0054302215576171875, 0.007432460784912109, 0.009434700012207031, 0.011436939239501953, 0.013439178466796875, 0.015441417694091797, 0.01744365692138672, 0.01944589614868164, 0.021448135375976562, 0.023450374603271484, 0.025452613830566406, 0.027454853057861328, 0.02945709228515625, 0.03145933151245117, 0.033461570739746094, 0.035463809967041016, 0.03746604919433594, 0.03946828842163086, 0.04147052764892578, 0.0434727668762207, 0.045475006103515625, 0.04747724533081055, 0.04947948455810547, 0.05148172378540039, 0.05348396301269531, 0.055486202239990234, 0.057488441467285156, 0.05949068069458008, 0.061492919921875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 12.0, 8.0, 17.0, 25.0, 28.0, 33.0, 55.0, 66.0, 76.0, 84.0, 92.0, 73.0, 90.0, 84.0, 67.0, 54.0, 35.0, 37.0, 27.0, 14.0, 8.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.045989990234375, -0.04488992691040039, -0.04378986358642578, -0.04268980026245117, -0.04158973693847656, -0.04048967361450195, -0.039389610290527344, -0.038289546966552734, -0.037189483642578125, -0.036089420318603516, -0.034989356994628906, -0.0338892936706543, -0.03278923034667969, -0.03168916702270508, -0.03058910369873047, -0.02948904037475586, -0.02838897705078125, -0.02728891372680664, -0.02618885040283203, -0.025088787078857422, -0.023988723754882812, -0.022888660430908203, -0.021788597106933594, -0.020688533782958984, -0.019588470458984375, -0.018488407135009766, -0.017388343811035156, -0.016288280487060547, -0.015188217163085938, -0.014088153839111328, -0.012988090515136719, -0.01188802719116211, -0.0107879638671875, -0.00968790054321289, -0.008587837219238281, -0.007487773895263672, -0.0063877105712890625, -0.005287647247314453, -0.004187583923339844, -0.0030875205993652344, -0.001987457275390625, -0.0008873939514160156, 0.00021266937255859375, 0.0013127326965332031, 0.0024127960205078125, 0.003512859344482422, 0.004612922668457031, 0.005712985992431641, 0.00681304931640625, 0.00791311264038086, 0.009013175964355469, 0.010113239288330078, 0.011213302612304688, 0.012313365936279297, 0.013413429260253906, 0.014513492584228516, 0.015613555908203125, 0.016713619232177734, 0.017813682556152344, 0.018913745880126953, 0.020013809204101562, 0.021113872528076172, 0.02221393585205078, 0.02331399917602539, 0.0244140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 9.0, 13.0, 16.0, 22.0, 31.0, 37.0, 52.0, 79.0, 100.0, 180.0, 238.0, 375.0, 598.0, 1124.0, 2413.0, 5364.0, 13684.0, 41449.0, 151259.0, 450786.0, 273304.0, 70683.0, 21629.0, 7865.0, 3372.0, 1594.0, 837.0, 438.0, 323.0, 200.0, 127.0, 88.0, 50.0, 67.0, 33.0, 36.0, 16.0, 22.0, 8.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03851318359375, -0.037217140197753906, -0.03592109680175781, -0.03462505340576172, -0.033329010009765625, -0.03203296661376953, -0.030736923217773438, -0.029440879821777344, -0.02814483642578125, -0.026848793029785156, -0.025552749633789062, -0.02425670623779297, -0.022960662841796875, -0.02166461944580078, -0.020368576049804688, -0.019072532653808594, -0.0177764892578125, -0.016480445861816406, -0.015184402465820312, -0.013888359069824219, -0.012592315673828125, -0.011296272277832031, -0.010000228881835938, -0.008704185485839844, -0.00740814208984375, -0.006112098693847656, -0.0048160552978515625, -0.0035200119018554688, -0.002223968505859375, -0.0009279251098632812, 0.0003681182861328125, 0.0016641616821289062, 0.002960205078125, 0.004256248474121094, 0.0055522918701171875, 0.006848335266113281, 0.008144378662109375, 0.009440422058105469, 0.010736465454101562, 0.012032508850097656, 0.01332855224609375, 0.014624595642089844, 0.015920639038085938, 0.01721668243408203, 0.018512725830078125, 0.01980876922607422, 0.021104812622070312, 0.022400856018066406, 0.0236968994140625, 0.024992942810058594, 0.026288986206054688, 0.02758502960205078, 0.028881072998046875, 0.03017711639404297, 0.03147315979003906, 0.032769203186035156, 0.03406524658203125, 0.035361289978027344, 0.03665733337402344, 0.03795337677001953, 0.039249420166015625, 0.04054546356201172, 0.04184150695800781, 0.043137550354003906, 0.04443359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 6.0, 12.0, 10.0, 5.0, 11.0, 19.0, 25.0, 26.0, 30.0, 28.0, 33.0, 39.0, 39.0, 41.0, 44.0, 35.0, 42.0, 42.0, 53.0, 42.0, 34.0, 42.0, 45.0, 39.0, 39.0, 36.0, 22.0, 31.0, 18.0, 17.0, 15.0, 11.0, 10.0, 12.0, 8.0, 5.0, 4.0, 8.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06793212890625, -0.06571006774902344, -0.06348800659179688, -0.06126594543457031, -0.05904388427734375, -0.05682182312011719, -0.054599761962890625, -0.05237770080566406, -0.0501556396484375, -0.04793357849121094, -0.045711517333984375, -0.04348945617675781, -0.04126739501953125, -0.03904533386230469, -0.036823272705078125, -0.03460121154785156, -0.032379150390625, -0.030157089233398438, -0.027935028076171875, -0.025712966918945312, -0.02349090576171875, -0.021268844604492188, -0.019046783447265625, -0.016824722290039062, -0.0146026611328125, -0.012380599975585938, -0.010158538818359375, -0.007936477661132812, -0.00571441650390625, -0.0034923553466796875, -0.001270294189453125, 0.0009517669677734375, 0.003173828125, 0.0053958892822265625, 0.007617950439453125, 0.009840011596679688, 0.01206207275390625, 0.014284133911132812, 0.016506195068359375, 0.018728256225585938, 0.0209503173828125, 0.023172378540039062, 0.025394439697265625, 0.027616500854492188, 0.02983856201171875, 0.03206062316894531, 0.034282684326171875, 0.03650474548339844, 0.038726806640625, 0.04094886779785156, 0.043170928955078125, 0.04539299011230469, 0.04761505126953125, 0.04983711242675781, 0.052059173583984375, 0.05428123474121094, 0.0565032958984375, 0.05872535705566406, 0.060947418212890625, 0.06316947937011719, 0.06539154052734375, 0.06761360168457031, 0.06983566284179688, 0.07205772399902344, 0.07427978515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 6.0, 3.0, 11.0, 15.0, 27.0, 34.0, 52.0, 73.0, 143.0, 248.0, 386.0, 717.0, 1272.0, 2684.0, 6668.0, 27240.0, 249532.0, 626532.0, 108682.0, 15175.0, 4585.0, 2065.0, 1008.0, 567.0, 300.0, 187.0, 120.0, 57.0, 53.0, 31.0, 18.0, 15.0, 14.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.024993896484375, -0.024286270141601562, -0.023578643798828125, -0.022871017456054688, -0.02216339111328125, -0.021455764770507812, -0.020748138427734375, -0.020040512084960938, -0.0193328857421875, -0.018625259399414062, -0.017917633056640625, -0.017210006713867188, -0.01650238037109375, -0.015794754028320312, -0.015087127685546875, -0.014379501342773438, -0.013671875, -0.012964248657226562, -0.012256622314453125, -0.011548995971679688, -0.01084136962890625, -0.010133743286132812, -0.009426116943359375, -0.008718490600585938, -0.0080108642578125, -0.0073032379150390625, -0.006595611572265625, -0.0058879852294921875, -0.00518035888671875, -0.0044727325439453125, -0.003765106201171875, -0.0030574798583984375, -0.002349853515625, -0.0016422271728515625, -0.000934600830078125, -0.0002269744873046875, 0.00048065185546875, 0.0011882781982421875, 0.001895904541015625, 0.0026035308837890625, 0.0033111572265625, 0.0040187835693359375, 0.004726409912109375, 0.0054340362548828125, 0.00614166259765625, 0.0068492889404296875, 0.007556915283203125, 0.008264541625976562, 0.00897216796875, 0.009679794311523438, 0.010387420654296875, 0.011095046997070312, 0.01180267333984375, 0.012510299682617188, 0.013217926025390625, 0.013925552368164062, 0.0146331787109375, 0.015340805053710938, 0.016048431396484375, 0.016756057739257812, 0.01746368408203125, 0.018171310424804688, 0.018878936767578125, 0.019586563110351562, 0.020294189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 11.0, 14.0, 13.0, 14.0, 26.0, 45.0, 32.0, 43.0, 43.0, 50.0, 48.0, 61.0, 49.0, 69.0, 83.0, 53.0, 64.0, 45.0, 33.0, 40.0, 28.0, 29.0, 18.0, 21.0, 17.0, 10.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.496906280517578e-06, -6.311573088169098e-06, -6.126239895820618e-06, -5.9409067034721375e-06, -5.755573511123657e-06, -5.570240318775177e-06, -5.384907126426697e-06, -5.1995739340782166e-06, -5.014240741729736e-06, -4.828907549381256e-06, -4.643574357032776e-06, -4.458241164684296e-06, -4.2729079723358154e-06, -4.087574779987335e-06, -3.902241587638855e-06, -3.7169083952903748e-06, -3.5315752029418945e-06, -3.3462420105934143e-06, -3.160908818244934e-06, -2.975575625896454e-06, -2.7902424335479736e-06, -2.6049092411994934e-06, -2.419576048851013e-06, -2.234242856502533e-06, -2.0489096641540527e-06, -1.8635764718055725e-06, -1.6782432794570923e-06, -1.492910087108612e-06, -1.3075768947601318e-06, -1.1222437024116516e-06, -9.369105100631714e-07, -7.515773177146912e-07, -5.662441253662109e-07, -3.809109330177307e-07, -1.955777406692505e-07, -1.0244548320770264e-08, 1.7508864402770996e-07, 3.604218363761902e-07, 5.457550287246704e-07, 7.310882210731506e-07, 9.164214134216309e-07, 1.101754605770111e-06, 1.2870877981185913e-06, 1.4724209904670715e-06, 1.6577541828155518e-06, 1.843087375164032e-06, 2.028420567512512e-06, 2.2137537598609924e-06, 2.3990869522094727e-06, 2.584420144557953e-06, 2.769753336906433e-06, 2.9550865292549133e-06, 3.1404197216033936e-06, 3.3257529139518738e-06, 3.511086106300354e-06, 3.6964192986488342e-06, 3.8817524909973145e-06, 4.067085683345795e-06, 4.252418875694275e-06, 4.437752068042755e-06, 4.623085260391235e-06, 4.8084184527397156e-06, 4.993751645088196e-06, 5.179084837436676e-06, 5.364418029785156e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 9.0, 14.0, 23.0, 36.0, 49.0, 167.0, 694.0, 6819.0, 555744.0, 478106.0, 5945.0, 665.0, 133.0, 72.0, 19.0, 27.0, 16.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061553955078125, -0.05968761444091797, -0.05782127380371094, -0.055954933166503906, -0.054088592529296875, -0.052222251892089844, -0.05035591125488281, -0.04848957061767578, -0.04662322998046875, -0.04475688934326172, -0.04289054870605469, -0.041024208068847656, -0.039157867431640625, -0.037291526794433594, -0.03542518615722656, -0.03355884552001953, -0.0316925048828125, -0.02982616424560547, -0.027959823608398438, -0.026093482971191406, -0.024227142333984375, -0.022360801696777344, -0.020494461059570312, -0.01862812042236328, -0.01676177978515625, -0.014895439147949219, -0.013029098510742188, -0.011162757873535156, -0.009296417236328125, -0.007430076599121094, -0.0055637359619140625, -0.0036973953247070312, -0.0018310546875, 3.528594970703125e-05, 0.0019016265869140625, 0.0037679672241210938, 0.005634307861328125, 0.007500648498535156, 0.009366989135742188, 0.011233329772949219, 0.01309967041015625, 0.014966011047363281, 0.016832351684570312, 0.018698692321777344, 0.020565032958984375, 0.022431373596191406, 0.024297714233398438, 0.02616405487060547, 0.0280303955078125, 0.02989673614501953, 0.03176307678222656, 0.033629417419433594, 0.035495758056640625, 0.037362098693847656, 0.03922843933105469, 0.04109477996826172, 0.04296112060546875, 0.04482746124267578, 0.04669380187988281, 0.048560142517089844, 0.050426483154296875, 0.052292823791503906, 0.05415916442871094, 0.05602550506591797, 0.057891845703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 3.0, 7.0, 9.0, 15.0, 24.0, 21.0, 39.0, 53.0, 68.0, 103.0, 106.0, 129.0, 100.0, 99.0, 71.0, 49.0, 28.0, 24.0, 14.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186309814453125, -0.017795324325561523, -0.016959667205810547, -0.01612401008605957, -0.015288352966308594, -0.014452695846557617, -0.01361703872680664, -0.012781381607055664, -0.011945724487304688, -0.011110067367553711, -0.010274410247802734, -0.009438753128051758, -0.008603096008300781, -0.007767438888549805, -0.006931781768798828, -0.0060961246490478516, -0.005260467529296875, -0.0044248104095458984, -0.003589153289794922, -0.0027534961700439453, -0.0019178390502929688, -0.0010821819305419922, -0.0002465248107910156, 0.0005891323089599609, 0.0014247894287109375, 0.002260446548461914, 0.0030961036682128906, 0.003931760787963867, 0.004767417907714844, 0.00560307502746582, 0.006438732147216797, 0.0072743892669677734, 0.00811004638671875, 0.008945703506469727, 0.009781360626220703, 0.01061701774597168, 0.011452674865722656, 0.012288331985473633, 0.01312398910522461, 0.013959646224975586, 0.014795303344726562, 0.01563096046447754, 0.016466617584228516, 0.017302274703979492, 0.01813793182373047, 0.018973588943481445, 0.019809246063232422, 0.0206449031829834, 0.021480560302734375, 0.02231621742248535, 0.023151874542236328, 0.023987531661987305, 0.02482318878173828, 0.025658845901489258, 0.026494503021240234, 0.02733016014099121, 0.028165817260742188, 0.029001474380493164, 0.02983713150024414, 0.030672788619995117, 0.031508445739746094, 0.03234410285949707, 0.03317975997924805, 0.03401541709899902, 0.03485107421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 9.0, 30.0, 82.0, 224.0, 321.0, 202.0, 81.0, 28.0, 18.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7022692561149597, -0.6824743151664734, -0.6626793742179871, -0.6428844332695007, -0.6230895519256592, -0.6032946109771729, -0.5834996700286865, -0.5637047290802002, -0.5439097881317139, -0.5241148471832275, -0.5043199062347412, -0.48452499508857727, -0.46473005414009094, -0.4449351131916046, -0.4251402020454407, -0.40534526109695435, -0.385550320148468, -0.3657553791999817, -0.34596043825149536, -0.3261655271053314, -0.3063705861568451, -0.28657564520835876, -0.2667807340621948, -0.2469857931137085, -0.22719085216522217, -0.20739591121673584, -0.1876009851694107, -0.16780605912208557, -0.14801111817359924, -0.12821617722511292, -0.10842125117778778, -0.08862632513046265, -0.06883132457733154, -0.04903639107942581, -0.02924145758152008, -0.00944652408361435, 0.010348409414291382, 0.030143342912197113, 0.049938276410102844, 0.06973320245742798, 0.0895281434059143, 0.10932307690382004, 0.12911801040172577, 0.1489129364490509, 0.16870787739753723, 0.18850281834602356, 0.2082977443933487, 0.22809267044067383, 0.24788761138916016, 0.2676825523376465, 0.2874774932861328, 0.30727240443229675, 0.3270673453807831, 0.3468622863292694, 0.36665719747543335, 0.3864521384239197, 0.406247079372406, 0.42604202032089233, 0.44583696126937866, 0.4656318724155426, 0.48542681336402893, 0.5052217245101929, 0.5250166654586792, 0.5448116064071655, 0.5646065473556519]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 3.0, 7.0, 12.0, 16.0, 13.0, 20.0, 26.0, 26.0, 21.0, 34.0, 38.0, 49.0, 56.0, 42.0, 57.0, 52.0, 47.0, 50.0, 54.0, 48.0, 40.0, 47.0, 38.0, 28.0, 35.0, 26.0, 24.0, 21.0, 14.0, 11.0, 6.0, 9.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3448348641395569, -0.3308033347129822, -0.31677180528640747, -0.30274027585983276, -0.28870871663093567, -0.27467718720436096, -0.26064565777778625, -0.24661412835121155, -0.23258259892463684, -0.21855106949806213, -0.20451952517032623, -0.19048799574375153, -0.17645646631717682, -0.16242492198944092, -0.1483933925628662, -0.1343618631362915, -0.1203303188085556, -0.1062987819314003, -0.09226725250482559, -0.07823571562767029, -0.06420418620109558, -0.05017264932394028, -0.03614111244678497, -0.022109583020210266, -0.008078046143054962, 0.005953487940132618, 0.019985022023320198, 0.03401655703783035, 0.04804809018969536, 0.062079623341560364, 0.07611116021871567, 0.09014268964529037, 0.10417422652244568, 0.11820576339960098, 0.1322373002767563, 0.146268829703331, 0.1603003591299057, 0.1743319034576416, 0.1883634328842163, 0.20239496231079102, 0.21642649173736572, 0.23045802116394043, 0.24448956549167633, 0.25852108001708984, 0.27255263924598694, 0.28658416867256165, 0.30061569809913635, 0.31464722752571106, 0.32867878675460815, 0.34271031618118286, 0.35674184560775757, 0.3707733750343323, 0.38480493426322937, 0.3988364636898041, 0.4128679931163788, 0.4268995225429535, 0.4409310519695282, 0.4549625813961029, 0.4689941108226776, 0.4830256700515747, 0.4970571994781494, 0.5110887289047241, 0.5251202583312988, 0.5391517877578735, 0.5531833171844482]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 19.0, 30.0, 79.0, 174.0, 1916.0, 4188842.0, 2890.0, 182.0, 77.0, 38.0, 17.0, 10.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.7956886291503906, -0.7774124145507812, -0.7591361999511719, -0.7408599853515625, -0.7225837707519531, -0.7043075561523438, -0.6860313415527344, -0.667755126953125, -0.6494789123535156, -0.6312026977539062, -0.6129264831542969, -0.5946502685546875, -0.5763740539550781, -0.5580978393554688, -0.5398216247558594, -0.52154541015625, -0.5032691955566406, -0.48499298095703125, -0.4667167663574219, -0.4484405517578125, -0.4301643371582031, -0.41188812255859375, -0.3936119079589844, -0.375335693359375, -0.3570594787597656, -0.33878326416015625, -0.3205070495605469, -0.3022308349609375, -0.2839546203613281, -0.26567840576171875, -0.24740219116210938, -0.2291259765625, -0.21084976196289062, -0.19257354736328125, -0.17429733276367188, -0.1560211181640625, -0.13774490356445312, -0.11946868896484375, -0.10119247436523438, -0.082916259765625, -0.06464004516601562, -0.04636383056640625, -0.028087615966796875, -0.0098114013671875, 0.008464813232421875, 0.02674102783203125, 0.045017242431640625, 0.06329345703125, 0.08156967163085938, 0.09984588623046875, 0.11812210083007812, 0.1363983154296875, 0.15467453002929688, 0.17295074462890625, 0.19122695922851562, 0.209503173828125, 0.22777938842773438, 0.24605560302734375, 0.2643318176269531, 0.2826080322265625, 0.3008842468261719, 0.31916046142578125, 0.3374366760253906, 0.355712890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 9.0, 12.0, 13.0, 19.0, 24.0, 30.0, 32.0, 40.0, 52.0, 51.0, 65.0, 65.0, 81.0, 82.0, 88.0, 69.0, 64.0, 50.0, 43.0, 32.0, 27.0, 20.0, 10.0, 7.0, 9.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.04150390625, -0.0404815673828125, -0.039459228515625, -0.0384368896484375, -0.03741455078125, -0.0363922119140625, -0.035369873046875, -0.0343475341796875, -0.0333251953125, -0.0323028564453125, -0.031280517578125, -0.0302581787109375, -0.02923583984375, -0.0282135009765625, -0.027191162109375, -0.0261688232421875, -0.025146484375, -0.0241241455078125, -0.023101806640625, -0.0220794677734375, -0.02105712890625, -0.0200347900390625, -0.019012451171875, -0.0179901123046875, -0.0169677734375, -0.0159454345703125, -0.014923095703125, -0.0139007568359375, -0.01287841796875, -0.0118560791015625, -0.010833740234375, -0.0098114013671875, -0.0087890625, -0.0077667236328125, -0.006744384765625, -0.0057220458984375, -0.00469970703125, -0.0036773681640625, -0.002655029296875, -0.0016326904296875, -0.0006103515625, 0.0004119873046875, 0.001434326171875, 0.0024566650390625, 0.00347900390625, 0.0045013427734375, 0.005523681640625, 0.0065460205078125, 0.007568359375, 0.0085906982421875, 0.009613037109375, 0.0106353759765625, 0.01165771484375, 0.0126800537109375, 0.013702392578125, 0.0147247314453125, 0.0157470703125, 0.0167694091796875, 0.017791748046875, 0.0188140869140625, 0.01983642578125, 0.0208587646484375, 0.021881103515625, 0.0229034423828125, 0.02392578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 14.0, 23.0, 78.0, 183.0, 787.0, 7173.0, 2932048.0, 1246585.0, 6115.0, 920.0, 220.0, 65.0, 30.0, 12.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16552734375, -0.16079330444335938, -0.15605926513671875, -0.15132522583007812, -0.1465911865234375, -0.14185714721679688, -0.13712310791015625, -0.13238906860351562, -0.127655029296875, -0.12292098999023438, -0.11818695068359375, -0.11345291137695312, -0.1087188720703125, -0.10398483276367188, -0.09925079345703125, -0.09451675415039062, -0.08978271484375, -0.08504867553710938, -0.08031463623046875, -0.07558059692382812, -0.0708465576171875, -0.06611251831054688, -0.06137847900390625, -0.056644439697265625, -0.051910400390625, -0.047176361083984375, -0.04244232177734375, -0.037708282470703125, -0.0329742431640625, -0.028240203857421875, -0.02350616455078125, -0.018772125244140625, -0.0140380859375, -0.009304046630859375, -0.00457000732421875, 0.000164031982421875, 0.0048980712890625, 0.009632110595703125, 0.01436614990234375, 0.019100189208984375, 0.023834228515625, 0.028568267822265625, 0.03330230712890625, 0.038036346435546875, 0.0427703857421875, 0.047504425048828125, 0.05223846435546875, 0.056972503662109375, 0.06170654296875, 0.06644058227539062, 0.07117462158203125, 0.07590866088867188, 0.0806427001953125, 0.08537673950195312, 0.09011077880859375, 0.09484481811523438, 0.099578857421875, 0.10431289672851562, 0.10904693603515625, 0.11378097534179688, 0.1185150146484375, 0.12324905395507812, 0.12798309326171875, 0.13271713256835938, 0.137451171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 11.0, 17.0, 23.0, 36.0, 100.0, 248.0, 799.0, 1963.0, 527.0, 161.0, 75.0, 41.0, 23.0, 13.0, 6.0, 5.0, 5.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249481201171875, -0.02365708351135254, -0.022366046905517578, -0.021075010299682617, -0.019783973693847656, -0.018492937088012695, -0.017201900482177734, -0.015910863876342773, -0.014619827270507812, -0.013328790664672852, -0.01203775405883789, -0.01074671745300293, -0.009455680847167969, -0.008164644241333008, -0.006873607635498047, -0.005582571029663086, -0.004291534423828125, -0.003000497817993164, -0.0017094612121582031, -0.0004184246063232422, 0.0008726119995117188, 0.0021636486053466797, 0.0034546852111816406, 0.0047457218170166016, 0.0060367584228515625, 0.0073277950286865234, 0.008618831634521484, 0.009909868240356445, 0.011200904846191406, 0.012491941452026367, 0.013782978057861328, 0.015074014663696289, 0.01636505126953125, 0.01765608787536621, 0.018947124481201172, 0.020238161087036133, 0.021529197692871094, 0.022820234298706055, 0.024111270904541016, 0.025402307510375977, 0.026693344116210938, 0.0279843807220459, 0.02927541732788086, 0.03056645393371582, 0.03185749053955078, 0.03314852714538574, 0.0344395637512207, 0.035730600357055664, 0.037021636962890625, 0.038312673568725586, 0.03960371017456055, 0.04089474678039551, 0.04218578338623047, 0.04347681999206543, 0.04476785659790039, 0.04605889320373535, 0.04734992980957031, 0.04864096641540527, 0.049932003021240234, 0.051223039627075195, 0.052514076232910156, 0.05380511283874512, 0.05509614944458008, 0.05638718605041504, 0.05767822265625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 20.0, 902.0, 82.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18834048509597778, -0.14718113839626312, -0.10602179914712906, -0.064862459897995, -0.023703113198280334, 0.017456233501434326, 0.05861556529998779, 0.09977492690086365, 0.14093425869941711, 0.18209360539913177, 0.22325295209884644, 0.2644122838973999, 0.30557161569595337, 0.3467309772968292, 0.3878903090953827, 0.42904967069625854, 0.470209002494812, 0.5113683342933655, 0.552527666091919, 0.5936870574951172, 0.6348463892936707, 0.6760057210922241, 0.7171650528907776, 0.758324384689331, 0.7994837760925293, 0.8406431078910828, 0.8818024396896362, 0.9229618310928345, 0.9641211628913879, 1.0052804946899414, 1.0464398860931396, 1.0875991582870483, 1.1287585496902466, 1.1699179410934448, 1.2110772132873535, 1.2522366046905518, 1.2933958768844604, 1.3345552682876587, 1.3757145404815674, 1.4168739318847656, 1.4580333232879639, 1.499192714691162, 1.5403519868850708, 1.581511378288269, 1.6226706504821777, 1.663830041885376, 1.7049894332885742, 1.746148705482483, 1.7873079776763916, 1.8284673690795898, 1.8696266412734985, 1.9107860326766968, 1.9519453048706055, 1.9931046962738037, 2.034264087677002, 2.0754234790802, 2.1165828704833984, 2.1577422618865967, 2.198901653289795, 2.240060806274414, 2.2812201976776123, 2.3223795890808105, 2.363538980484009, 2.404698371887207, 2.445857524871826]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 8.0, 13.0, 19.0, 21.0, 13.0, 31.0, 33.0, 39.0, 43.0, 52.0, 61.0, 57.0, 78.0, 73.0, 68.0, 69.0, 52.0, 48.0, 53.0, 48.0, 24.0, 31.0, 15.0, 16.0, 15.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07955443859100342, -0.07560592144727707, -0.07165740430355072, -0.06770889461040497, -0.06376037746667862, -0.05981186032295227, -0.05586334690451622, -0.05191483348608017, -0.04796631634235382, -0.04401779919862747, -0.04006928578019142, -0.03612077236175537, -0.03217225521802902, -0.028223739936947823, -0.024275224655866623, -0.020326709374785423, -0.016378194093704224, -0.012429678812623024, -0.008481163531541824, -0.004532648250460625, -0.000584132969379425, 0.0033643823117017746, 0.007312897592782974, 0.011261412873864174, 0.015209928154945374, 0.019158443436026573, 0.023106958717107773, 0.027055473998188972, 0.031003989279270172, 0.03495250642299652, 0.03890101984143257, 0.04284953325986862, 0.04679805040359497, 0.05074656754732132, 0.05469508096575737, 0.05864359438419342, 0.06259211152791977, 0.06654062867164612, 0.07048913836479187, 0.07443765550851822, 0.07838617265224457, 0.08233468979597092, 0.08628320693969727, 0.09023171663284302, 0.09418023377656937, 0.09812875092029572, 0.10207726061344147, 0.10602577775716782, 0.10997429490089417, 0.11392281204462051, 0.11787132918834686, 0.12181983888149261, 0.12576836347579956, 0.1297168731689453, 0.13366538286209106, 0.137613907456398, 0.14156241714954376, 0.14551092684268951, 0.14945945143699646, 0.1534079611301422, 0.15735647082328796, 0.1613049954175949, 0.16525350511074066, 0.1692020297050476, 0.17315053939819336]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 12.0, 4.0, 7.0, 6.0, 13.0, 27.0, 33.0, 70.0, 150.0, 243.0, 479.0, 1146.0, 3104.0, 10879.0, 71022.0, 666336.0, 259871.0, 26368.0, 5593.0, 1756.0, 725.0, 345.0, 144.0, 88.0, 52.0, 26.0, 22.0, 12.0, 7.0, 4.0, 6.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10211181640625, -0.09879207611083984, -0.09547233581542969, -0.09215259552001953, -0.08883285522460938, -0.08551311492919922, -0.08219337463378906, -0.0788736343383789, -0.07555389404296875, -0.0722341537475586, -0.06891441345214844, -0.06559467315673828, -0.062274932861328125, -0.05895519256591797, -0.05563545227050781, -0.052315711975097656, -0.0489959716796875, -0.045676231384277344, -0.04235649108886719, -0.03903675079345703, -0.035717010498046875, -0.03239727020263672, -0.029077529907226562, -0.025757789611816406, -0.02243804931640625, -0.019118309020996094, -0.015798568725585938, -0.012478828430175781, -0.009159088134765625, -0.005839347839355469, -0.0025196075439453125, 0.0008001327514648438, 0.004119873046875, 0.007439613342285156, 0.010759353637695312, 0.014079093933105469, 0.017398834228515625, 0.02071857452392578, 0.024038314819335938, 0.027358055114746094, 0.03067779541015625, 0.033997535705566406, 0.03731727600097656, 0.04063701629638672, 0.043956756591796875, 0.04727649688720703, 0.05059623718261719, 0.053915977478027344, 0.0572357177734375, 0.060555458068847656, 0.06387519836425781, 0.06719493865966797, 0.07051467895507812, 0.07383441925048828, 0.07715415954589844, 0.0804738998413086, 0.08379364013671875, 0.0871133804321289, 0.09043312072753906, 0.09375286102294922, 0.09707260131835938, 0.10039234161376953, 0.10371208190917969, 0.10703182220458984, 0.1103515625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 14.0, 8.0, 13.0, 19.0, 22.0, 19.0, 32.0, 48.0, 43.0, 47.0, 55.0, 58.0, 81.0, 80.0, 72.0, 65.0, 69.0, 55.0, 40.0, 39.0, 27.0, 32.0, 21.0, 11.0, 12.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0360107421875, -0.03508877754211426, -0.034166812896728516, -0.03324484825134277, -0.03232288360595703, -0.03140091896057129, -0.030478954315185547, -0.029556989669799805, -0.028635025024414062, -0.02771306037902832, -0.026791095733642578, -0.025869131088256836, -0.024947166442871094, -0.02402520179748535, -0.02310323715209961, -0.022181272506713867, -0.021259307861328125, -0.020337343215942383, -0.01941537857055664, -0.0184934139251709, -0.017571449279785156, -0.016649484634399414, -0.015727519989013672, -0.01480555534362793, -0.013883590698242188, -0.012961626052856445, -0.012039661407470703, -0.011117696762084961, -0.010195732116699219, -0.009273767471313477, -0.008351802825927734, -0.007429838180541992, -0.00650787353515625, -0.005585908889770508, -0.004663944244384766, -0.0037419795989990234, -0.0028200149536132812, -0.001898050308227539, -0.0009760856628417969, -5.412101745605469e-05, 0.0008678436279296875, 0.0017898082733154297, 0.002711772918701172, 0.003633737564086914, 0.004555702209472656, 0.0054776668548583984, 0.006399631500244141, 0.007321596145629883, 0.008243560791015625, 0.009165525436401367, 0.01008749008178711, 0.011009454727172852, 0.011931419372558594, 0.012853384017944336, 0.013775348663330078, 0.01469731330871582, 0.015619277954101562, 0.016541242599487305, 0.017463207244873047, 0.01838517189025879, 0.01930713653564453, 0.020229101181030273, 0.021151065826416016, 0.022073030471801758, 0.0229949951171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 8.0, 11.0, 10.0, 13.0, 32.0, 30.0, 61.0, 96.0, 127.0, 208.0, 310.0, 614.0, 1333.0, 3211.0, 9954.0, 39689.0, 246651.0, 586287.0, 125107.0, 23582.0, 6537.0, 2338.0, 995.0, 488.0, 302.0, 163.0, 108.0, 80.0, 61.0, 33.0, 22.0, 19.0, 18.0, 12.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.054412841796875, -0.05261850357055664, -0.05082416534423828, -0.04902982711791992, -0.04723548889160156, -0.0454411506652832, -0.043646812438964844, -0.041852474212646484, -0.040058135986328125, -0.038263797760009766, -0.036469459533691406, -0.03467512130737305, -0.03288078308105469, -0.031086444854736328, -0.02929210662841797, -0.02749776840209961, -0.02570343017578125, -0.02390909194946289, -0.02211475372314453, -0.020320415496826172, -0.018526077270507812, -0.016731739044189453, -0.014937400817871094, -0.013143062591552734, -0.011348724365234375, -0.009554386138916016, -0.007760047912597656, -0.005965709686279297, -0.0041713714599609375, -0.002377033233642578, -0.0005826950073242188, 0.0012116432189941406, 0.0030059814453125, 0.004800319671630859, 0.006594657897949219, 0.008388996124267578, 0.010183334350585938, 0.011977672576904297, 0.013772010803222656, 0.015566349029541016, 0.017360687255859375, 0.019155025482177734, 0.020949363708496094, 0.022743701934814453, 0.024538040161132812, 0.026332378387451172, 0.02812671661376953, 0.02992105484008789, 0.03171539306640625, 0.03350973129272461, 0.03530406951904297, 0.03709840774536133, 0.03889274597167969, 0.04068708419799805, 0.042481422424316406, 0.044275760650634766, 0.046070098876953125, 0.047864437103271484, 0.049658775329589844, 0.0514531135559082, 0.05324745178222656, 0.05504179000854492, 0.05683612823486328, 0.05863046646118164, 0.0604248046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 9.0, 7.0, 6.0, 9.0, 9.0, 10.0, 12.0, 17.0, 22.0, 38.0, 31.0, 35.0, 44.0, 37.0, 37.0, 46.0, 58.0, 64.0, 57.0, 61.0, 49.0, 38.0, 48.0, 44.0, 42.0, 20.0, 26.0, 20.0, 16.0, 23.0, 17.0, 9.0, 9.0, 5.0, 10.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077880859375, -0.07527542114257812, -0.07266998291015625, -0.07006454467773438, -0.0674591064453125, -0.06485366821289062, -0.06224822998046875, -0.059642791748046875, -0.057037353515625, -0.054431915283203125, -0.05182647705078125, -0.049221038818359375, -0.0466156005859375, -0.044010162353515625, -0.04140472412109375, -0.038799285888671875, -0.03619384765625, -0.033588409423828125, -0.03098297119140625, -0.028377532958984375, -0.0257720947265625, -0.023166656494140625, -0.02056121826171875, -0.017955780029296875, -0.015350341796875, -0.012744903564453125, -0.01013946533203125, -0.007534027099609375, -0.0049285888671875, -0.002323150634765625, 0.00028228759765625, 0.002887725830078125, 0.0054931640625, 0.008098602294921875, 0.01070404052734375, 0.013309478759765625, 0.0159149169921875, 0.018520355224609375, 0.02112579345703125, 0.023731231689453125, 0.026336669921875, 0.028942108154296875, 0.03154754638671875, 0.034152984619140625, 0.0367584228515625, 0.039363861083984375, 0.04196929931640625, 0.044574737548828125, 0.04718017578125, 0.049785614013671875, 0.05239105224609375, 0.054996490478515625, 0.0576019287109375, 0.060207366943359375, 0.06281280517578125, 0.06541824340820312, 0.068023681640625, 0.07062911987304688, 0.07323455810546875, 0.07583999633789062, 0.0784454345703125, 0.08105087280273438, 0.08365631103515625, 0.08626174926757812, 0.0888671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 19.0, 24.0, 31.0, 56.0, 110.0, 197.0, 303.0, 598.0, 1244.0, 3851.0, 21307.0, 215129.0, 657853.0, 128830.0, 13757.0, 2948.0, 1132.0, 517.0, 247.0, 144.0, 95.0, 42.0, 35.0, 23.0, 17.0, 10.0, 4.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.021392822265625, -0.020770788192749023, -0.020148754119873047, -0.01952672004699707, -0.018904685974121094, -0.018282651901245117, -0.01766061782836914, -0.017038583755493164, -0.016416549682617188, -0.01579451560974121, -0.015172481536865234, -0.014550447463989258, -0.013928413391113281, -0.013306379318237305, -0.012684345245361328, -0.012062311172485352, -0.011440277099609375, -0.010818243026733398, -0.010196208953857422, -0.009574174880981445, -0.008952140808105469, -0.008330106735229492, -0.007708072662353516, -0.007086038589477539, -0.0064640045166015625, -0.005841970443725586, -0.005219936370849609, -0.004597902297973633, -0.003975868225097656, -0.0033538341522216797, -0.002731800079345703, -0.0021097660064697266, -0.00148773193359375, -0.0008656978607177734, -0.00024366378784179688, 0.0003783702850341797, 0.0010004043579101562, 0.0016224384307861328, 0.0022444725036621094, 0.002866506576538086, 0.0034885406494140625, 0.004110574722290039, 0.004732608795166016, 0.005354642868041992, 0.005976676940917969, 0.006598711013793945, 0.007220745086669922, 0.007842779159545898, 0.008464813232421875, 0.009086847305297852, 0.009708881378173828, 0.010330915451049805, 0.010952949523925781, 0.011574983596801758, 0.012197017669677734, 0.012819051742553711, 0.013441085815429688, 0.014063119888305664, 0.01468515396118164, 0.015307188034057617, 0.015929222106933594, 0.01655125617980957, 0.017173290252685547, 0.017795324325561523, 0.0184173583984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 23.0, 25.0, 44.0, 55.0, 46.0, 53.0, 88.0, 85.0, 91.0, 113.0, 85.0, 75.0, 50.0, 46.0, 39.0, 24.0, 16.0, 13.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.404254913330078e-06, -8.14627856016159e-06, -7.888302206993103e-06, -7.630325853824615e-06, -7.372349500656128e-06, -7.11437314748764e-06, -6.856396794319153e-06, -6.598420441150665e-06, -6.340444087982178e-06, -6.08246773481369e-06, -5.824491381645203e-06, -5.566515028476715e-06, -5.3085386753082275e-06, -5.05056232213974e-06, -4.7925859689712524e-06, -4.534609615802765e-06, -4.276633262634277e-06, -4.01865690946579e-06, -3.7606805562973022e-06, -3.5027042031288147e-06, -3.244727849960327e-06, -2.9867514967918396e-06, -2.728775143623352e-06, -2.4707987904548645e-06, -2.212822437286377e-06, -1.9548460841178894e-06, -1.6968697309494019e-06, -1.4388933777809143e-06, -1.1809170246124268e-06, -9.229406714439392e-07, -6.649643182754517e-07, -4.069879651069641e-07, -1.4901161193847656e-07, 1.0896474123001099e-07, 3.6694109439849854e-07, 6.249174475669861e-07, 8.828938007354736e-07, 1.1408701539039612e-06, 1.3988465070724487e-06, 1.6568228602409363e-06, 1.914799213409424e-06, 2.1727755665779114e-06, 2.430751919746399e-06, 2.6887282729148865e-06, 2.946704626083374e-06, 3.2046809792518616e-06, 3.462657332420349e-06, 3.7206336855888367e-06, 3.978610038757324e-06, 4.236586391925812e-06, 4.494562745094299e-06, 4.752539098262787e-06, 5.010515451431274e-06, 5.268491804599762e-06, 5.5264681577682495e-06, 5.784444510936737e-06, 6.042420864105225e-06, 6.300397217273712e-06, 6.5583735704422e-06, 6.816349923610687e-06, 7.074326276779175e-06, 7.332302629947662e-06, 7.59027898311615e-06, 7.848255336284637e-06, 8.106231689453125e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 0.0, 3.0, 6.0, 10.0, 8.0, 15.0, 11.0, 14.0, 36.0, 41.0, 74.0, 102.0, 138.0, 245.0, 404.0, 992.0, 2776.0, 11884.0, 92047.0, 610995.0, 288980.0, 31153.0, 5425.0, 1672.0, 684.0, 303.0, 172.0, 114.0, 93.0, 37.0, 35.0, 29.0, 19.0, 12.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01776123046875, -0.01714348793029785, -0.016525745391845703, -0.015908002853393555, -0.015290260314941406, -0.014672517776489258, -0.01405477523803711, -0.013437032699584961, -0.012819290161132812, -0.012201547622680664, -0.011583805084228516, -0.010966062545776367, -0.010348320007324219, -0.00973057746887207, -0.009112834930419922, -0.008495092391967773, -0.007877349853515625, -0.0072596073150634766, -0.006641864776611328, -0.00602412223815918, -0.005406379699707031, -0.004788637161254883, -0.004170894622802734, -0.003553152084350586, -0.0029354095458984375, -0.002317667007446289, -0.0016999244689941406, -0.0010821819305419922, -0.00046443939208984375, 0.0001533031463623047, 0.0007710456848144531, 0.0013887882232666016, 0.00200653076171875, 0.0026242733001708984, 0.003242015838623047, 0.0038597583770751953, 0.004477500915527344, 0.005095243453979492, 0.005712985992431641, 0.006330728530883789, 0.0069484710693359375, 0.007566213607788086, 0.008183956146240234, 0.008801698684692383, 0.009419441223144531, 0.01003718376159668, 0.010654926300048828, 0.011272668838500977, 0.011890411376953125, 0.012508153915405273, 0.013125896453857422, 0.01374363899230957, 0.014361381530761719, 0.014979124069213867, 0.015596866607666016, 0.016214609146118164, 0.016832351684570312, 0.01745009422302246, 0.01806783676147461, 0.018685579299926758, 0.019303321838378906, 0.019921064376831055, 0.020538806915283203, 0.02115654945373535, 0.0217742919921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 9.0, 5.0, 18.0, 25.0, 29.0, 33.0, 55.0, 69.0, 96.0, 126.0, 124.0, 98.0, 81.0, 77.0, 47.0, 28.0, 25.0, 15.0, 11.0, 5.0, 6.0, 8.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02886962890625, -0.028093814849853516, -0.02731800079345703, -0.026542186737060547, -0.025766372680664062, -0.024990558624267578, -0.024214744567871094, -0.02343893051147461, -0.022663116455078125, -0.02188730239868164, -0.021111488342285156, -0.020335674285888672, -0.019559860229492188, -0.018784046173095703, -0.01800823211669922, -0.017232418060302734, -0.01645660400390625, -0.015680789947509766, -0.014904975891113281, -0.014129161834716797, -0.013353347778320312, -0.012577533721923828, -0.011801719665527344, -0.01102590560913086, -0.010250091552734375, -0.00947427749633789, -0.008698463439941406, -0.007922649383544922, -0.0071468353271484375, -0.006371021270751953, -0.005595207214355469, -0.004819393157958984, -0.0040435791015625, -0.0032677650451660156, -0.0024919509887695312, -0.0017161369323730469, -0.0009403228759765625, -0.00016450881958007812, 0.0006113052368164062, 0.0013871192932128906, 0.002162933349609375, 0.0029387474060058594, 0.0037145614624023438, 0.004490375518798828, 0.0052661895751953125, 0.006042003631591797, 0.006817817687988281, 0.007593631744384766, 0.00836944580078125, 0.009145259857177734, 0.009921073913574219, 0.010696887969970703, 0.011472702026367188, 0.012248516082763672, 0.013024330139160156, 0.01380014419555664, 0.014575958251953125, 0.01535177230834961, 0.016127586364746094, 0.016903400421142578, 0.017679214477539062, 0.018455028533935547, 0.01923084259033203, 0.020006656646728516, 0.020782470703125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 15.0, 37.0, 92.0, 234.0, 289.0, 202.0, 73.0, 29.0, 13.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4369722008705139, -0.41969966888427734, -0.40242716670036316, -0.3851546347141266, -0.3678821325302124, -0.35060960054397583, -0.33333706855773926, -0.3160645365715027, -0.2987920343875885, -0.28151950240135193, -0.26424700021743774, -0.24697446823120117, -0.2297019511461258, -0.21242943406105042, -0.19515690207481384, -0.17788438498973846, -0.16061186790466309, -0.1433393508195877, -0.12606683373451233, -0.10879430174827576, -0.09152178466320038, -0.074249267578125, -0.056976743042469025, -0.03970421850681305, -0.02243170142173767, -0.005159180611371994, 0.012113340198993683, 0.02938586100935936, 0.04665838181972504, 0.06393089890480042, 0.08120342344045639, 0.09847594797611237, 0.11574852466583252, 0.1330210417509079, 0.15029355883598328, 0.16756609082221985, 0.18483860790729523, 0.2021111249923706, 0.21938365697860718, 0.23665617406368256, 0.25392869114875793, 0.2712012231349945, 0.2884737253189087, 0.30574625730514526, 0.32301878929138184, 0.340291291475296, 0.3575638234615326, 0.3748363256454468, 0.39210885763168335, 0.4093813896179199, 0.4266538918018341, 0.4439264237880707, 0.46119892597198486, 0.47847145795822144, 0.495743989944458, 0.5130165219306946, 0.5302890539169312, 0.5475615859031677, 0.5648341178894043, 0.5821065902709961, 0.5993791222572327, 0.6166516542434692, 0.6339241862297058, 0.6511967182159424, 0.6684691905975342]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 8.0, 5.0, 9.0, 8.0, 10.0, 13.0, 11.0, 13.0, 16.0, 24.0, 22.0, 37.0, 41.0, 30.0, 35.0, 32.0, 50.0, 37.0, 32.0, 41.0, 38.0, 45.0, 36.0, 38.0, 49.0, 31.0, 21.0, 39.0, 34.0, 34.0, 24.0, 22.0, 11.0, 12.0, 17.0, 12.0, 4.0, 7.0, 14.0, 12.0, 10.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3165345788002014, -0.30662062764167786, -0.2967066764831543, -0.28679272532463074, -0.2768787741661072, -0.26696479320526123, -0.25705087184906006, -0.2471368908882141, -0.23722293972969055, -0.227308988571167, -0.21739503741264343, -0.20748108625411987, -0.19756712019443512, -0.18765316903591156, -0.177739217877388, -0.16782525181770325, -0.15791131556034088, -0.14799736440181732, -0.13808341324329376, -0.128169447183609, -0.11825549602508545, -0.10834154486656189, -0.09842759370803833, -0.08851363509893417, -0.07859968394041061, -0.06868573278188705, -0.0587717741727829, -0.04885782301425934, -0.03894386813044548, -0.029029913246631622, -0.019115962088108063, -0.009202003479003906, 0.0007119476795196533, 0.010625901632010937, 0.02053985558450222, 0.03045380860567093, 0.04036776348948479, 0.050281718373298645, 0.060195669531822205, 0.07010962814092636, 0.08002357929944992, 0.08993753045797348, 0.09985148906707764, 0.1097654402256012, 0.11967939138412476, 0.12959334254264832, 0.13950729370117188, 0.14942125976085663, 0.1593352109193802, 0.16924916207790375, 0.1791631132364273, 0.18907707929611206, 0.19899103045463562, 0.20890498161315918, 0.21881893277168274, 0.2287328839302063, 0.23864683508872986, 0.24856078624725342, 0.258474737405777, 0.26838868856430054, 0.2783026397228241, 0.28821659088134766, 0.2981305718421936, 0.30804452300071716, 0.3179584741592407]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 12.0, 12.0, 10.0, 11.0, 25.0, 23.0, 42.0, 61.0, 100.0, 129.0, 215.0, 317.0, 544.0, 977.0, 1727.0, 3421.0, 8211.0, 26452.0, 179388.0, 3647017.0, 273334.0, 33800.0, 9715.0, 4029.0, 1957.0, 1061.0, 595.0, 397.0, 233.0, 162.0, 93.0, 68.0, 32.0, 23.0, 21.0, 23.0, 6.0, 10.0, 7.0, 2.0, 9.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0], "bins": [-0.0474853515625, -0.046112060546875, -0.04473876953125, -0.043365478515625, -0.0419921875, -0.040618896484375, -0.03924560546875, -0.037872314453125, -0.0364990234375, -0.035125732421875, -0.03375244140625, -0.032379150390625, -0.031005859375, -0.029632568359375, -0.02825927734375, -0.026885986328125, -0.0255126953125, -0.024139404296875, -0.02276611328125, -0.021392822265625, -0.02001953125, -0.018646240234375, -0.01727294921875, -0.015899658203125, -0.0145263671875, -0.013153076171875, -0.01177978515625, -0.010406494140625, -0.009033203125, -0.007659912109375, -0.00628662109375, -0.004913330078125, -0.0035400390625, -0.002166748046875, -0.00079345703125, 0.000579833984375, 0.001953125, 0.003326416015625, 0.00469970703125, 0.006072998046875, 0.0074462890625, 0.008819580078125, 0.01019287109375, 0.011566162109375, 0.012939453125, 0.014312744140625, 0.01568603515625, 0.017059326171875, 0.0184326171875, 0.019805908203125, 0.02117919921875, 0.022552490234375, 0.02392578125, 0.025299072265625, 0.02667236328125, 0.028045654296875, 0.0294189453125, 0.030792236328125, 0.03216552734375, 0.033538818359375, 0.034912109375, 0.036285400390625, 0.03765869140625, 0.039031982421875, 0.0404052734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 14.0, 15.0, 25.0, 20.0, 28.0, 32.0, 42.0, 52.0, 57.0, 55.0, 85.0, 83.0, 78.0, 80.0, 73.0, 63.0, 49.0, 39.0, 30.0, 22.0, 20.0, 17.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0413818359375, -0.0403599739074707, -0.039338111877441406, -0.03831624984741211, -0.03729438781738281, -0.036272525787353516, -0.03525066375732422, -0.03422880172729492, -0.033206939697265625, -0.03218507766723633, -0.03116321563720703, -0.030141353607177734, -0.029119491577148438, -0.02809762954711914, -0.027075767517089844, -0.026053905487060547, -0.02503204345703125, -0.024010181427001953, -0.022988319396972656, -0.02196645736694336, -0.020944595336914062, -0.019922733306884766, -0.01890087127685547, -0.017879009246826172, -0.016857147216796875, -0.015835285186767578, -0.014813423156738281, -0.013791561126708984, -0.012769699096679688, -0.01174783706665039, -0.010725975036621094, -0.009704113006591797, -0.0086822509765625, -0.007660388946533203, -0.006638526916503906, -0.005616664886474609, -0.0045948028564453125, -0.0035729408264160156, -0.0025510787963867188, -0.0015292167663574219, -0.000507354736328125, 0.0005145072937011719, 0.0015363693237304688, 0.0025582313537597656, 0.0035800933837890625, 0.004601955413818359, 0.005623817443847656, 0.006645679473876953, 0.00766754150390625, 0.008689403533935547, 0.009711265563964844, 0.01073312759399414, 0.011754989624023438, 0.012776851654052734, 0.013798713684082031, 0.014820575714111328, 0.015842437744140625, 0.016864299774169922, 0.01788616180419922, 0.018908023834228516, 0.019929885864257812, 0.02095174789428711, 0.021973609924316406, 0.022995471954345703, 0.024017333984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 9.0, 6.0, 10.0, 19.0, 38.0, 62.0, 97.0, 204.0, 401.0, 967.0, 3117.0, 23058.0, 2597241.0, 1542096.0, 21649.0, 3268.0, 993.0, 433.0, 267.0, 137.0, 101.0, 49.0, 28.0, 12.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.094970703125, -0.0922555923461914, -0.08954048156738281, -0.08682537078857422, -0.08411026000976562, -0.08139514923095703, -0.07868003845214844, -0.07596492767333984, -0.07324981689453125, -0.07053470611572266, -0.06781959533691406, -0.06510448455810547, -0.062389373779296875, -0.05967426300048828, -0.05695915222167969, -0.054244041442871094, -0.0515289306640625, -0.048813819885253906, -0.04609870910644531, -0.04338359832763672, -0.040668487548828125, -0.03795337677001953, -0.03523826599121094, -0.032523155212402344, -0.02980804443359375, -0.027092933654785156, -0.024377822875976562, -0.02166271209716797, -0.018947601318359375, -0.01623249053955078, -0.013517379760742188, -0.010802268981933594, -0.008087158203125, -0.005372047424316406, -0.0026569366455078125, 5.817413330078125e-05, 0.002773284912109375, 0.005488395690917969, 0.008203506469726562, 0.010918617248535156, 0.01363372802734375, 0.016348838806152344, 0.019063949584960938, 0.02177906036376953, 0.024494171142578125, 0.02720928192138672, 0.029924392700195312, 0.032639503479003906, 0.0353546142578125, 0.038069725036621094, 0.04078483581542969, 0.04349994659423828, 0.046215057373046875, 0.04893016815185547, 0.05164527893066406, 0.054360389709472656, 0.05707550048828125, 0.059790611267089844, 0.06250572204589844, 0.06522083282470703, 0.06793594360351562, 0.07065105438232422, 0.07336616516113281, 0.0760812759399414, 0.07879638671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 10.0, 17.0, 45.0, 108.0, 456.0, 2503.0, 633.0, 172.0, 72.0, 25.0, 13.0, 9.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.037017822265625, -0.035678863525390625, -0.03433990478515625, -0.033000946044921875, -0.0316619873046875, -0.030323028564453125, -0.02898406982421875, -0.027645111083984375, -0.02630615234375, -0.024967193603515625, -0.02362823486328125, -0.022289276123046875, -0.0209503173828125, -0.019611358642578125, -0.01827239990234375, -0.016933441162109375, -0.015594482421875, -0.014255523681640625, -0.01291656494140625, -0.011577606201171875, -0.0102386474609375, -0.008899688720703125, -0.00756072998046875, -0.006221771240234375, -0.0048828125, -0.003543853759765625, -0.00220489501953125, -0.000865936279296875, 0.0004730224609375, 0.001811981201171875, 0.00315093994140625, 0.004489898681640625, 0.005828857421875, 0.007167816162109375, 0.00850677490234375, 0.009845733642578125, 0.0111846923828125, 0.012523651123046875, 0.01386260986328125, 0.015201568603515625, 0.01654052734375, 0.017879486083984375, 0.01921844482421875, 0.020557403564453125, 0.0218963623046875, 0.023235321044921875, 0.02457427978515625, 0.025913238525390625, 0.027252197265625, 0.028591156005859375, 0.02993011474609375, 0.031269073486328125, 0.0326080322265625, 0.033946990966796875, 0.03528594970703125, 0.036624908447265625, 0.0379638671875, 0.039302825927734375, 0.04064178466796875, 0.041980743408203125, 0.0433197021484375, 0.044658660888671875, 0.04599761962890625, 0.047336578369140625, 0.048675537109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 4.0, 41.0, 461.0, 429.0, 44.0, 18.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06264618784189224, -0.04683995991945267, -0.031033731997013092, -0.015227504074573517, 0.0005787238478660583, 0.016384951770305634, 0.03219117969274521, 0.047997407615184784, 0.06380363553762436, 0.07960986346006393, 0.09541609138250351, 0.11122231930494308, 0.12702855467796326, 0.14283478260040283, 0.1586410105228424, 0.17444723844528198, 0.19025346636772156, 0.20605969429016113, 0.2218659222126007, 0.23767215013504028, 0.25347837805747986, 0.26928460597991943, 0.285090833902359, 0.3008970618247986, 0.31670328974723816, 0.33250951766967773, 0.3483157455921173, 0.3641219735145569, 0.37992820143699646, 0.39573442935943604, 0.4115406572818756, 0.4273468852043152, 0.4431530833244324, 0.45895931124687195, 0.4747655391693115, 0.4905717670917511, 0.5063779950141907, 0.5221842527389526, 0.5379904508590698, 0.553796648979187, 0.569602906703949, 0.5854091644287109, 0.6012153625488281, 0.6170215606689453, 0.6328278183937073, 0.6486340761184692, 0.6644402742385864, 0.6802464723587036, 0.6960527300834656, 0.7118589878082275, 0.7276651859283447, 0.7434713840484619, 0.7592776417732239, 0.7750838994979858, 0.790890097618103, 0.8066962957382202, 0.8225025534629822, 0.8383088111877441, 0.8541150093078613, 0.8699212074279785, 0.8857274651527405, 0.9015337228775024, 0.9173399209976196, 0.9331461191177368, 0.9489523768424988]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 10.0, 13.0, 23.0, 40.0, 54.0, 76.0, 117.0, 117.0, 124.0, 130.0, 102.0, 58.0, 61.0, 31.0, 23.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1265823245048523, -0.12119630724191666, -0.11581028997898102, -0.11042426526546478, -0.10503824800252914, -0.0996522307395935, -0.09426620602607727, -0.08888018876314163, -0.083494171500206, -0.07810815423727036, -0.07272213697433472, -0.06733611226081848, -0.06195009499788284, -0.056564077734947205, -0.05117805674672127, -0.04579203575849533, -0.04040601849555969, -0.035020001232624054, -0.029633980244398117, -0.02424796111881733, -0.018861941993236542, -0.013475922867655754, -0.008089903742074966, -0.0027038827538490295, 0.002682134509086609, 0.008068153634667397, 0.013454172760248184, 0.018840191885828972, 0.02422621101140976, 0.029612230136990547, 0.034998249262571335, 0.04038427025079727, 0.04577028751373291, 0.05115630477666855, 0.056542325764894485, 0.06192834675312042, 0.06731436401605606, 0.0727003812789917, 0.07808640599250793, 0.08347242325544357, 0.08885844051837921, 0.09424445778131485, 0.09963047504425049, 0.10501649975776672, 0.11040251702070236, 0.115788534283638, 0.12117455899715424, 0.12656056880950928, 0.1319465935230255, 0.13733261823654175, 0.1427186280488968, 0.14810465276241302, 0.15349066257476807, 0.1588766872882843, 0.16426271200180054, 0.16964873671531677, 0.17503474652767181, 0.18042077124118805, 0.1858067810535431, 0.19119280576705933, 0.19657883048057556, 0.2019648402929306, 0.20735086500644684, 0.21273687481880188, 0.21812289953231812]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 12.0, 11.0, 14.0, 21.0, 41.0, 90.0, 134.0, 305.0, 563.0, 1290.0, 3685.0, 14865.0, 97800.0, 639264.0, 250368.0, 30334.0, 6273.0, 1920.0, 773.0, 355.0, 188.0, 93.0, 66.0, 38.0, 17.0, 15.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0943603515625, -0.09171772003173828, -0.08907508850097656, -0.08643245697021484, -0.08378982543945312, -0.0811471939086914, -0.07850456237792969, -0.07586193084716797, -0.07321929931640625, -0.07057666778564453, -0.06793403625488281, -0.0652914047241211, -0.06264877319335938, -0.060006141662597656, -0.05736351013183594, -0.05472087860107422, -0.0520782470703125, -0.04943561553955078, -0.04679298400878906, -0.044150352478027344, -0.041507720947265625, -0.038865089416503906, -0.03622245788574219, -0.03357982635498047, -0.03093719482421875, -0.02829456329345703, -0.025651931762695312, -0.023009300231933594, -0.020366668701171875, -0.017724037170410156, -0.015081405639648438, -0.012438774108886719, -0.009796142578125, -0.007153511047363281, -0.0045108795166015625, -0.0018682479858398438, 0.000774383544921875, 0.0034170150756835938, 0.0060596466064453125, 0.008702278137207031, 0.01134490966796875, 0.013987541198730469, 0.016630172729492188, 0.019272804260253906, 0.021915435791015625, 0.024558067321777344, 0.027200698852539062, 0.02984333038330078, 0.0324859619140625, 0.03512859344482422, 0.03777122497558594, 0.040413856506347656, 0.043056488037109375, 0.045699119567871094, 0.04834175109863281, 0.05098438262939453, 0.05362701416015625, 0.05626964569091797, 0.05891227722167969, 0.061554908752441406, 0.06419754028320312, 0.06684017181396484, 0.06948280334472656, 0.07212543487548828, 0.07476806640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 11.0, 14.0, 10.0, 18.0, 35.0, 27.0, 34.0, 30.0, 53.0, 63.0, 53.0, 55.0, 73.0, 72.0, 70.0, 69.0, 58.0, 53.0, 39.0, 38.0, 30.0, 26.0, 18.0, 17.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0321044921875, -0.031208038330078125, -0.03031158447265625, -0.029415130615234375, -0.0285186767578125, -0.027622222900390625, -0.02672576904296875, -0.025829315185546875, -0.024932861328125, -0.024036407470703125, -0.02313995361328125, -0.022243499755859375, -0.0213470458984375, -0.020450592041015625, -0.01955413818359375, -0.018657684326171875, -0.01776123046875, -0.016864776611328125, -0.01596832275390625, -0.015071868896484375, -0.0141754150390625, -0.013278961181640625, -0.01238250732421875, -0.011486053466796875, -0.010589599609375, -0.009693145751953125, -0.00879669189453125, -0.007900238037109375, -0.0070037841796875, -0.006107330322265625, -0.00521087646484375, -0.004314422607421875, -0.00341796875, -0.002521514892578125, -0.00162506103515625, -0.000728607177734375, 0.0001678466796875, 0.001064300537109375, 0.00196075439453125, 0.002857208251953125, 0.003753662109375, 0.004650115966796875, 0.00554656982421875, 0.006443023681640625, 0.0073394775390625, 0.008235931396484375, 0.00913238525390625, 0.010028839111328125, 0.01092529296875, 0.011821746826171875, 0.01271820068359375, 0.013614654541015625, 0.0145111083984375, 0.015407562255859375, 0.01630401611328125, 0.017200469970703125, 0.018096923828125, 0.018993377685546875, 0.01988983154296875, 0.020786285400390625, 0.0216827392578125, 0.022579193115234375, 0.02347564697265625, 0.024372100830078125, 0.0252685546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 2.0, 8.0, 14.0, 16.0, 7.0, 17.0, 20.0, 36.0, 27.0, 73.0, 93.0, 132.0, 249.0, 402.0, 869.0, 1901.0, 4577.0, 12770.0, 42052.0, 172781.0, 498144.0, 233090.0, 55057.0, 16070.0, 5581.0, 2236.0, 998.0, 501.0, 266.0, 181.0, 103.0, 56.0, 40.0, 49.0, 24.0, 24.0, 10.0, 16.0, 10.0, 15.0, 13.0, 9.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0435791015625, -0.04220008850097656, -0.040821075439453125, -0.03944206237792969, -0.03806304931640625, -0.03668403625488281, -0.035305023193359375, -0.03392601013183594, -0.0325469970703125, -0.031167984008789062, -0.029788970947265625, -0.028409957885742188, -0.02703094482421875, -0.025651931762695312, -0.024272918701171875, -0.022893905639648438, -0.021514892578125, -0.020135879516601562, -0.018756866455078125, -0.017377853393554688, -0.01599884033203125, -0.014619827270507812, -0.013240814208984375, -0.011861801147460938, -0.0104827880859375, -0.009103775024414062, -0.007724761962890625, -0.0063457489013671875, -0.00496673583984375, -0.0035877227783203125, -0.002208709716796875, -0.0008296966552734375, 0.00054931640625, 0.0019283294677734375, 0.003307342529296875, 0.0046863555908203125, 0.00606536865234375, 0.0074443817138671875, 0.008823394775390625, 0.010202407836914062, 0.0115814208984375, 0.012960433959960938, 0.014339447021484375, 0.015718460083007812, 0.01709747314453125, 0.018476486206054688, 0.019855499267578125, 0.021234512329101562, 0.022613525390625, 0.023992538452148438, 0.025371551513671875, 0.026750564575195312, 0.02812957763671875, 0.029508590698242188, 0.030887603759765625, 0.03226661682128906, 0.0336456298828125, 0.03502464294433594, 0.036403656005859375, 0.03778266906738281, 0.03916168212890625, 0.04054069519042969, 0.041919708251953125, 0.04329872131347656, 0.044677734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 10.0, 14.0, 16.0, 16.0, 30.0, 25.0, 35.0, 35.0, 25.0, 35.0, 31.0, 45.0, 43.0, 50.0, 43.0, 48.0, 46.0, 48.0, 34.0, 34.0, 31.0, 33.0, 39.0, 23.0, 25.0, 29.0, 21.0, 11.0, 16.0, 14.0, 14.0, 8.0, 15.0, 10.0, 5.0, 2.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.07421875, -0.07204246520996094, -0.06986618041992188, -0.06768989562988281, -0.06551361083984375, -0.06333732604980469, -0.061161041259765625, -0.05898475646972656, -0.0568084716796875, -0.05463218688964844, -0.052455902099609375, -0.05027961730957031, -0.04810333251953125, -0.04592704772949219, -0.043750762939453125, -0.04157447814941406, -0.039398193359375, -0.03722190856933594, -0.035045623779296875, -0.03286933898925781, -0.03069305419921875, -0.028516769409179688, -0.026340484619140625, -0.024164199829101562, -0.0219879150390625, -0.019811630249023438, -0.017635345458984375, -0.015459060668945312, -0.01328277587890625, -0.011106491088867188, -0.008930206298828125, -0.0067539215087890625, -0.00457763671875, -0.0024013519287109375, -0.000225067138671875, 0.0019512176513671875, 0.00412750244140625, 0.0063037872314453125, 0.008480072021484375, 0.010656356811523438, 0.0128326416015625, 0.015008926391601562, 0.017185211181640625, 0.019361495971679688, 0.02153778076171875, 0.023714065551757812, 0.025890350341796875, 0.028066635131835938, 0.030242919921875, 0.03241920471191406, 0.034595489501953125, 0.03677177429199219, 0.03894805908203125, 0.04112434387207031, 0.043300628662109375, 0.04547691345214844, 0.0476531982421875, 0.04982948303222656, 0.052005767822265625, 0.05418205261230469, 0.05635833740234375, 0.05853462219238281, 0.060710906982421875, 0.06288719177246094, 0.0650634765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 8.0, 8.0, 19.0, 16.0, 40.0, 46.0, 71.0, 111.0, 198.0, 313.0, 528.0, 1090.0, 2708.0, 9040.0, 47239.0, 290663.0, 531507.0, 134577.0, 21774.0, 5006.0, 1658.0, 805.0, 446.0, 238.0, 157.0, 96.0, 55.0, 40.0, 40.0, 13.0, 16.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015838623046875, -0.015315532684326172, -0.014792442321777344, -0.014269351959228516, -0.013746261596679688, -0.01322317123413086, -0.012700080871582031, -0.012176990509033203, -0.011653900146484375, -0.011130809783935547, -0.010607719421386719, -0.01008462905883789, -0.009561538696289062, -0.009038448333740234, -0.008515357971191406, -0.007992267608642578, -0.00746917724609375, -0.006946086883544922, -0.006422996520996094, -0.005899906158447266, -0.0053768157958984375, -0.004853725433349609, -0.004330635070800781, -0.003807544708251953, -0.003284454345703125, -0.002761363983154297, -0.0022382736206054688, -0.0017151832580566406, -0.0011920928955078125, -0.0006690025329589844, -0.00014591217041015625, 0.0003771781921386719, 0.0009002685546875, 0.0014233589172363281, 0.0019464492797851562, 0.0024695396423339844, 0.0029926300048828125, 0.0035157203674316406, 0.004038810729980469, 0.004561901092529297, 0.005084991455078125, 0.005608081817626953, 0.006131172180175781, 0.006654262542724609, 0.0071773529052734375, 0.007700443267822266, 0.008223533630371094, 0.008746623992919922, 0.00926971435546875, 0.009792804718017578, 0.010315895080566406, 0.010838985443115234, 0.011362075805664062, 0.01188516616821289, 0.012408256530761719, 0.012931346893310547, 0.013454437255859375, 0.013977527618408203, 0.014500617980957031, 0.01502370834350586, 0.015546798706054688, 0.016069889068603516, 0.016592979431152344, 0.017116069793701172, 0.01763916015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 17.0, 8.0, 8.0, 14.0, 17.0, 11.0, 36.0, 45.0, 32.0, 39.0, 35.0, 49.0, 58.0, 35.0, 71.0, 45.0, 65.0, 41.0, 46.0, 62.0, 37.0, 47.0, 17.0, 29.0, 13.0, 32.0, 19.0, 12.0, 17.0, 3.0, 4.0, 5.0, 8.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.351139068603516e-06, -4.197470843791962e-06, -4.043802618980408e-06, -3.890134394168854e-06, -3.7364661693573e-06, -3.582797944545746e-06, -3.429129719734192e-06, -3.275461494922638e-06, -3.121793270111084e-06, -2.96812504529953e-06, -2.814456820487976e-06, -2.660788595676422e-06, -2.507120370864868e-06, -2.353452146053314e-06, -2.1997839212417603e-06, -2.0461156964302063e-06, -1.8924474716186523e-06, -1.7387792468070984e-06, -1.5851110219955444e-06, -1.4314427971839905e-06, -1.2777745723724365e-06, -1.1241063475608826e-06, -9.704381227493286e-07, -8.167698979377747e-07, -6.631016731262207e-07, -5.094334483146667e-07, -3.557652235031128e-07, -2.0209699869155884e-07, -4.842877388000488e-08, 1.0523945093154907e-07, 2.5890767574310303e-07, 4.12575900554657e-07, 5.662441253662109e-07, 7.199123501777649e-07, 8.735805749893188e-07, 1.0272487998008728e-06, 1.1809170246124268e-06, 1.3345852494239807e-06, 1.4882534742355347e-06, 1.6419216990470886e-06, 1.7955899238586426e-06, 1.9492581486701965e-06, 2.1029263734817505e-06, 2.2565945982933044e-06, 2.4102628231048584e-06, 2.5639310479164124e-06, 2.7175992727279663e-06, 2.8712674975395203e-06, 3.0249357223510742e-06, 3.178603947162628e-06, 3.332272171974182e-06, 3.485940396785736e-06, 3.63960862159729e-06, 3.793276846408844e-06, 3.946945071220398e-06, 4.100613296031952e-06, 4.254281520843506e-06, 4.40794974565506e-06, 4.561617970466614e-06, 4.715286195278168e-06, 4.868954420089722e-06, 5.022622644901276e-06, 5.17629086971283e-06, 5.3299590945243835e-06, 5.4836273193359375e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 22.0, 38.0, 60.0, 93.0, 219.0, 390.0, 856.0, 2103.0, 8503.0, 68218.0, 556448.0, 367046.0, 35960.0, 5485.0, 1598.0, 693.0, 389.0, 179.0, 97.0, 46.0, 28.0, 21.0, 13.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0207366943359375, -0.020064830780029297, -0.019392967224121094, -0.01872110366821289, -0.018049240112304688, -0.017377376556396484, -0.01670551300048828, -0.016033649444580078, -0.015361785888671875, -0.014689922332763672, -0.014018058776855469, -0.013346195220947266, -0.012674331665039062, -0.01200246810913086, -0.011330604553222656, -0.010658740997314453, -0.00998687744140625, -0.009315013885498047, -0.008643150329589844, -0.00797128677368164, -0.0072994232177734375, -0.006627559661865234, -0.005955696105957031, -0.005283832550048828, -0.004611968994140625, -0.003940105438232422, -0.0032682418823242188, -0.0025963783264160156, -0.0019245147705078125, -0.0012526512145996094, -0.0005807876586914062, 9.107589721679688e-05, 0.000762939453125, 0.0014348030090332031, 0.0021066665649414062, 0.0027785301208496094, 0.0034503936767578125, 0.004122257232666016, 0.004794120788574219, 0.005465984344482422, 0.006137847900390625, 0.006809711456298828, 0.007481575012207031, 0.008153438568115234, 0.008825302124023438, 0.00949716567993164, 0.010169029235839844, 0.010840892791748047, 0.01151275634765625, 0.012184619903564453, 0.012856483459472656, 0.01352834701538086, 0.014200210571289062, 0.014872074127197266, 0.015543937683105469, 0.016215801239013672, 0.016887664794921875, 0.017559528350830078, 0.01823139190673828, 0.018903255462646484, 0.019575119018554688, 0.02024698257446289, 0.020918846130371094, 0.021590709686279297, 0.0222625732421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 9.0, 5.0, 19.0, 26.0, 38.0, 46.0, 72.0, 68.0, 105.0, 128.0, 102.0, 101.0, 81.0, 57.0, 46.0, 30.0, 18.0, 16.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0184783935546875, -0.017759084701538086, -0.017039775848388672, -0.016320466995239258, -0.015601158142089844, -0.01488184928894043, -0.014162540435791016, -0.013443231582641602, -0.012723922729492188, -0.012004613876342773, -0.01128530502319336, -0.010565996170043945, -0.009846687316894531, -0.009127378463745117, -0.008408069610595703, -0.007688760757446289, -0.006969451904296875, -0.006250143051147461, -0.005530834197998047, -0.004811525344848633, -0.004092216491699219, -0.0033729076385498047, -0.0026535987854003906, -0.0019342899322509766, -0.0012149810791015625, -0.0004956722259521484, 0.00022363662719726562, 0.0009429454803466797, 0.0016622543334960938, 0.002381563186645508, 0.003100872039794922, 0.003820180892944336, 0.00453948974609375, 0.005258798599243164, 0.005978107452392578, 0.006697416305541992, 0.007416725158691406, 0.00813603401184082, 0.008855342864990234, 0.009574651718139648, 0.010293960571289062, 0.011013269424438477, 0.01173257827758789, 0.012451887130737305, 0.013171195983886719, 0.013890504837036133, 0.014609813690185547, 0.015329122543334961, 0.016048431396484375, 0.01676774024963379, 0.017487049102783203, 0.018206357955932617, 0.01892566680908203, 0.019644975662231445, 0.02036428451538086, 0.021083593368530273, 0.021802902221679688, 0.0225222110748291, 0.023241519927978516, 0.02396082878112793, 0.024680137634277344, 0.025399446487426758, 0.026118755340576172, 0.026838064193725586, 0.027557373046875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 33.0, 344.0, 559.0, 63.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7394766807556152, -0.6938133835792542, -0.6481500864028931, -0.602486789226532, -0.5568234920501709, -0.5111601948738098, -0.4654969274997711, -0.41983363032341003, -0.37417033314704895, -0.32850703597068787, -0.2828437387943268, -0.2371804565191269, -0.1915171593427658, -0.14585386216640472, -0.10019057989120483, -0.05452728271484375, -0.008863985538482666, 0.03679930791258812, 0.0824626013636589, 0.1281258910894394, 0.17378918826580048, 0.21945248544216156, 0.26511576771736145, 0.31077906489372253, 0.3564423620700836, 0.4021056592464447, 0.4477689564228058, 0.4934322237968445, 0.5390955209732056, 0.5847588181495667, 0.6304221153259277, 0.6760854125022888, 0.7217487096786499, 0.767412006855011, 0.8130753040313721, 0.8587386012077332, 0.9044018983840942, 0.9500651955604553, 0.9957284927368164, 1.0413917303085327, 1.0870550870895386, 1.1327183246612549, 1.1783816814422607, 1.224044919013977, 1.269708275794983, 1.3153715133666992, 1.361034870147705, 1.4066981077194214, 1.4523613452911377, 1.498024582862854, 1.5436879396438599, 1.5893511772155762, 1.635014533996582, 1.6806777715682983, 1.7263411283493042, 1.7720043659210205, 1.8176677227020264, 1.8633309602737427, 1.9089943170547485, 1.9546575546264648, 2.0003209114074707, 2.0459842681884766, 2.0916473865509033, 2.137310743331909, 2.182974100112915]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 12.0, 2.0, 6.0, 6.0, 3.0, 17.0, 15.0, 15.0, 16.0, 22.0, 23.0, 20.0, 32.0, 26.0, 36.0, 37.0, 46.0, 40.0, 49.0, 38.0, 38.0, 47.0, 36.0, 44.0, 35.0, 31.0, 33.0, 29.0, 33.0, 37.0, 19.0, 31.0, 10.0, 16.0, 23.0, 11.0, 14.0, 13.0, 6.0, 9.0, 3.0, 5.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30336302518844604, -0.2935250997543335, -0.28368720412254333, -0.2738492786884308, -0.2640113830566406, -0.2541734576225281, -0.24433556199073792, -0.23449763655662537, -0.2246597409248352, -0.21482183039188385, -0.2049839198589325, -0.19514600932598114, -0.18530809879302979, -0.17547018826007843, -0.16563227772712708, -0.15579435229301453, -0.14595644176006317, -0.13611853122711182, -0.12628062069416046, -0.1164427101612091, -0.10660479962825775, -0.0967668890953064, -0.08692897111177444, -0.07709106057882309, -0.06725315004587173, -0.05741523951292038, -0.047577328979969025, -0.03773941472172737, -0.027901504188776016, -0.01806359365582466, -0.008225679397583008, 0.0016122311353683472, 0.011450141668319702, 0.021288052201271057, 0.03112596459686756, 0.040963876992464066, 0.05080178752541542, 0.060639698058366776, 0.07047761231660843, 0.08031552284955978, 0.09015343338251114, 0.0999913439154625, 0.10982925444841385, 0.1196671724319458, 0.12950508296489716, 0.1393429934978485, 0.14918090403079987, 0.15901881456375122, 0.16885672509670258, 0.17869463562965393, 0.18853254616260529, 0.19837045669555664, 0.208208367228508, 0.21804627776145935, 0.2278842031955719, 0.23772209882736206, 0.2475600242614746, 0.25739794969558716, 0.2672358453273773, 0.27707377076148987, 0.28691166639328003, 0.2967495918273926, 0.30658748745918274, 0.3164254128932953, 0.32626330852508545]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 8.0, 10.0, 19.0, 27.0, 42.0, 85.0, 174.0, 342.0, 716.0, 1950.0, 6463.0, 31811.0, 3375929.0, 742746.0, 25204.0, 5469.0, 1783.0, 747.0, 336.0, 168.0, 104.0, 56.0, 29.0, 25.0, 16.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10137939453125, -0.09870719909667969, -0.09603500366210938, -0.09336280822753906, -0.09069061279296875, -0.08801841735839844, -0.08534622192382812, -0.08267402648925781, -0.0800018310546875, -0.07732963562011719, -0.07465744018554688, -0.07198524475097656, -0.06931304931640625, -0.06664085388183594, -0.06396865844726562, -0.06129646301269531, -0.058624267578125, -0.05595207214355469, -0.053279876708984375, -0.05060768127441406, -0.04793548583984375, -0.04526329040527344, -0.042591094970703125, -0.03991889953613281, -0.0372467041015625, -0.03457450866699219, -0.031902313232421875, -0.029230117797851562, -0.02655792236328125, -0.023885726928710938, -0.021213531494140625, -0.018541336059570312, -0.015869140625, -0.013196945190429688, -0.010524749755859375, -0.007852554321289062, -0.00518035888671875, -0.0025081634521484375, 0.000164031982421875, 0.0028362274169921875, 0.0055084228515625, 0.008180618286132812, 0.010852813720703125, 0.013525009155273438, 0.01619720458984375, 0.018869400024414062, 0.021541595458984375, 0.024213790893554688, 0.026885986328125, 0.029558181762695312, 0.032230377197265625, 0.03490257263183594, 0.03757476806640625, 0.04024696350097656, 0.042919158935546875, 0.04559135437011719, 0.0482635498046875, 0.05093574523925781, 0.053607940673828125, 0.05628013610839844, 0.05895233154296875, 0.06162452697753906, 0.06429672241210938, 0.06696891784667969, 0.06964111328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 10.0, 15.0, 9.0, 16.0, 30.0, 43.0, 40.0, 37.0, 48.0, 60.0, 46.0, 71.0, 65.0, 68.0, 66.0, 55.0, 58.0, 45.0, 41.0, 43.0, 23.0, 20.0, 18.0, 14.0, 11.0, 9.0, 4.0, 10.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02850341796875, -0.027657747268676758, -0.026812076568603516, -0.025966405868530273, -0.02512073516845703, -0.02427506446838379, -0.023429393768310547, -0.022583723068237305, -0.021738052368164062, -0.02089238166809082, -0.020046710968017578, -0.019201040267944336, -0.018355369567871094, -0.01750969886779785, -0.01666402816772461, -0.015818357467651367, -0.014972686767578125, -0.014127016067504883, -0.01328134536743164, -0.012435674667358398, -0.011590003967285156, -0.010744333267211914, -0.009898662567138672, -0.00905299186706543, -0.008207321166992188, -0.007361650466918945, -0.006515979766845703, -0.005670309066772461, -0.004824638366699219, -0.0039789676666259766, -0.0031332969665527344, -0.002287626266479492, -0.00144195556640625, -0.0005962848663330078, 0.0002493858337402344, 0.0010950565338134766, 0.0019407272338867188, 0.002786397933959961, 0.003632068634033203, 0.004477739334106445, 0.0053234100341796875, 0.00616908073425293, 0.007014751434326172, 0.007860422134399414, 0.008706092834472656, 0.009551763534545898, 0.01039743423461914, 0.011243104934692383, 0.012088775634765625, 0.012934446334838867, 0.01378011703491211, 0.014625787734985352, 0.015471458435058594, 0.016317129135131836, 0.017162799835205078, 0.01800847053527832, 0.018854141235351562, 0.019699811935424805, 0.020545482635498047, 0.02139115333557129, 0.02223682403564453, 0.023082494735717773, 0.023928165435791016, 0.024773836135864258, 0.0256195068359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 16.0, 20.0, 43.0, 38.0, 90.0, 177.0, 399.0, 916.0, 2276.0, 6582.0, 24623.0, 235620.0, 3799735.0, 99496.0, 15934.0, 4880.0, 1850.0, 811.0, 366.0, 166.0, 88.0, 50.0, 34.0, 18.0, 15.0, 8.0, 9.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05792236328125, -0.05594921112060547, -0.05397605895996094, -0.052002906799316406, -0.050029754638671875, -0.048056602478027344, -0.04608345031738281, -0.04411029815673828, -0.04213714599609375, -0.04016399383544922, -0.03819084167480469, -0.036217689514160156, -0.034244537353515625, -0.032271385192871094, -0.030298233032226562, -0.02832508087158203, -0.0263519287109375, -0.02437877655029297, -0.022405624389648438, -0.020432472229003906, -0.018459320068359375, -0.016486167907714844, -0.014513015747070312, -0.012539863586425781, -0.01056671142578125, -0.008593559265136719, -0.0066204071044921875, -0.004647254943847656, -0.002674102783203125, -0.0007009506225585938, 0.0012722015380859375, 0.0032453536987304688, 0.005218505859375, 0.007191658020019531, 0.009164810180664062, 0.011137962341308594, 0.013111114501953125, 0.015084266662597656, 0.017057418823242188, 0.01903057098388672, 0.02100372314453125, 0.02297687530517578, 0.024950027465820312, 0.026923179626464844, 0.028896331787109375, 0.030869483947753906, 0.03284263610839844, 0.03481578826904297, 0.0367889404296875, 0.03876209259033203, 0.04073524475097656, 0.042708396911621094, 0.044681549072265625, 0.046654701232910156, 0.04862785339355469, 0.05060100555419922, 0.05257415771484375, 0.05454730987548828, 0.05652046203613281, 0.058493614196777344, 0.060466766357421875, 0.062439918518066406, 0.06441307067871094, 0.06638622283935547, 0.068359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 8.0, 6.0, 7.0, 11.0, 9.0, 20.0, 57.0, 93.0, 311.0, 2374.0, 823.0, 190.0, 72.0, 33.0, 14.0, 9.0, 15.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0202484130859375, -0.019223928451538086, -0.018199443817138672, -0.017174959182739258, -0.016150474548339844, -0.01512598991394043, -0.014101505279541016, -0.013077020645141602, -0.012052536010742188, -0.011028051376342773, -0.01000356674194336, -0.008979082107543945, -0.007954597473144531, -0.006930112838745117, -0.005905628204345703, -0.004881143569946289, -0.003856658935546875, -0.002832174301147461, -0.0018076896667480469, -0.0007832050323486328, 0.00024127960205078125, 0.0012657642364501953, 0.0022902488708496094, 0.0033147335052490234, 0.0043392181396484375, 0.0053637027740478516, 0.006388187408447266, 0.00741267204284668, 0.008437156677246094, 0.009461641311645508, 0.010486125946044922, 0.011510610580444336, 0.01253509521484375, 0.013559579849243164, 0.014584064483642578, 0.015608549118041992, 0.016633033752441406, 0.01765751838684082, 0.018682003021240234, 0.01970648765563965, 0.020730972290039062, 0.021755456924438477, 0.02277994155883789, 0.023804426193237305, 0.02482891082763672, 0.025853395462036133, 0.026877880096435547, 0.02790236473083496, 0.028926849365234375, 0.02995133399963379, 0.030975818634033203, 0.03200030326843262, 0.03302478790283203, 0.034049272537231445, 0.03507375717163086, 0.03609824180603027, 0.03712272644042969, 0.0381472110748291, 0.039171695709228516, 0.04019618034362793, 0.041220664978027344, 0.04224514961242676, 0.04326963424682617, 0.044294118881225586, 0.045318603515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 58.0, 305.0, 416.0, 170.0, 23.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.39603090286254883, -0.3859335482120514, -0.37583622336387634, -0.3657388687133789, -0.35564151406288147, -0.3455441892147064, -0.335446834564209, -0.32534950971603394, -0.3152521550655365, -0.30515480041503906, -0.295057475566864, -0.2849601209163666, -0.27486276626586914, -0.2647654414176941, -0.25466808676719666, -0.2445707470178604, -0.23447339236736298, -0.22437605261802673, -0.2142786979675293, -0.20418135821819305, -0.1940840184688568, -0.18398666381835938, -0.17388932406902313, -0.1637919843196869, -0.15369462966918945, -0.1435972899198532, -0.13349993526935577, -0.12340259552001953, -0.11330525577068329, -0.10320790857076645, -0.09311056137084961, -0.08301322162151337, -0.07291588187217712, -0.06281853467226028, -0.05272119492292404, -0.0426238477230072, -0.03252650424838066, -0.02242916077375412, -0.01233181357383728, -0.0022344738245010376, 0.007862873375415802, 0.017960216850042343, 0.028057562187314034, 0.038154907524585724, 0.048252250999212265, 0.058349594473838806, 0.06844694167375565, 0.07854428142309189, 0.08864162862300873, 0.09873897582292557, 0.10883631557226181, 0.11893366277217865, 0.1290310025215149, 0.13912835717201233, 0.14922569692134857, 0.15932303667068481, 0.16942039132118225, 0.1795177310705185, 0.18961508572101593, 0.19971242547035217, 0.20980976521968842, 0.21990710496902466, 0.2300044596195221, 0.24010179936885834, 0.2501991391181946]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 18.0, 21.0, 20.0, 30.0, 46.0, 58.0, 65.0, 63.0, 83.0, 78.0, 87.0, 66.0, 67.0, 73.0, 46.0, 42.0, 33.0, 28.0, 25.0, 11.0, 13.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09769409894943237, -0.09455743432044983, -0.09142076224088669, -0.08828409016132355, -0.085147425532341, -0.08201076090335846, -0.07887408882379532, -0.07573741674423218, -0.07260075211524963, -0.06946408748626709, -0.06632741540670395, -0.06319074332714081, -0.060054078698158264, -0.05691741034388542, -0.05378074198961258, -0.05064407363533974, -0.047507405281066895, -0.04437073692679405, -0.04123406857252121, -0.03809740021824837, -0.034960731863975525, -0.03182406350970268, -0.02868739515542984, -0.025550726801156998, -0.022414058446884155, -0.019277390092611313, -0.01614072173833847, -0.013004053384065628, -0.009867385029792786, -0.006730716675519943, -0.003594048321247101, -0.0004573799669742584, 0.002679288387298584, 0.005815956741571426, 0.008952625095844269, 0.012089293450117111, 0.015225961804389954, 0.018362630158662796, 0.02149929851293564, 0.02463596686720848, 0.027772635221481323, 0.030909303575754166, 0.03404597193002701, 0.03718264028429985, 0.04031930863857269, 0.043455976992845535, 0.04659264534711838, 0.04972931370139122, 0.05286598205566406, 0.056002650409936905, 0.05913931876420975, 0.06227598711848259, 0.06541265547275543, 0.06854932010173798, 0.07168599218130112, 0.07482266426086426, 0.0779593288898468, 0.08109599351882935, 0.08423266559839249, 0.08736933767795563, 0.09050600230693817, 0.09364266693592072, 0.09677933901548386, 0.099916011095047, 0.10305267572402954]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 4.0, 9.0, 13.0, 18.0, 26.0, 29.0, 46.0, 46.0, 96.0, 117.0, 168.0, 228.0, 361.0, 607.0, 923.0, 1535.0, 2599.0, 4962.0, 10121.0, 22360.0, 56371.0, 154344.0, 344481.0, 272475.0, 104016.0, 39207.0, 16260.0, 7746.0, 3902.0, 2071.0, 1227.0, 708.0, 481.0, 299.0, 201.0, 137.0, 104.0, 63.0, 52.0, 30.0, 28.0, 24.0, 13.0, 5.0, 11.0, 9.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.03662109375, -0.03543233871459961, -0.03424358367919922, -0.03305482864379883, -0.03186607360839844, -0.030677318572998047, -0.029488563537597656, -0.028299808502197266, -0.027111053466796875, -0.025922298431396484, -0.024733543395996094, -0.023544788360595703, -0.022356033325195312, -0.021167278289794922, -0.01997852325439453, -0.01878976821899414, -0.01760101318359375, -0.01641225814819336, -0.015223503112792969, -0.014034748077392578, -0.012845993041992188, -0.011657238006591797, -0.010468482971191406, -0.009279727935791016, -0.008090972900390625, -0.006902217864990234, -0.005713462829589844, -0.004524707794189453, -0.0033359527587890625, -0.002147197723388672, -0.0009584426879882812, 0.00023031234741210938, 0.0014190673828125, 0.0026078224182128906, 0.0037965774536132812, 0.004985332489013672, 0.0061740875244140625, 0.007362842559814453, 0.008551597595214844, 0.009740352630615234, 0.010929107666015625, 0.012117862701416016, 0.013306617736816406, 0.014495372772216797, 0.015684127807617188, 0.016872882843017578, 0.01806163787841797, 0.01925039291381836, 0.02043914794921875, 0.02162790298461914, 0.02281665802001953, 0.024005413055419922, 0.025194168090820312, 0.026382923126220703, 0.027571678161621094, 0.028760433197021484, 0.029949188232421875, 0.031137943267822266, 0.032326698303222656, 0.03351545333862305, 0.03470420837402344, 0.03589296340942383, 0.03708171844482422, 0.03827047348022461, 0.039459228515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 11.0, 9.0, 13.0, 13.0, 27.0, 20.0, 29.0, 44.0, 35.0, 55.0, 57.0, 43.0, 56.0, 71.0, 65.0, 64.0, 59.0, 55.0, 44.0, 45.0, 33.0, 31.0, 23.0, 22.0, 12.0, 10.0, 12.0, 13.0, 2.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0264434814453125, -0.02563929557800293, -0.02483510971069336, -0.02403092384338379, -0.02322673797607422, -0.02242255210876465, -0.021618366241455078, -0.020814180374145508, -0.020009994506835938, -0.019205808639526367, -0.018401622772216797, -0.017597436904907227, -0.016793251037597656, -0.015989065170288086, -0.015184879302978516, -0.014380693435668945, -0.013576507568359375, -0.012772321701049805, -0.011968135833740234, -0.011163949966430664, -0.010359764099121094, -0.009555578231811523, -0.008751392364501953, -0.007947206497192383, -0.0071430206298828125, -0.006338834762573242, -0.005534648895263672, -0.0047304630279541016, -0.003926277160644531, -0.003122091293334961, -0.0023179054260253906, -0.0015137195587158203, -0.00070953369140625, 9.465217590332031e-05, 0.0008988380432128906, 0.001703023910522461, 0.0025072097778320312, 0.0033113956451416016, 0.004115581512451172, 0.004919767379760742, 0.0057239532470703125, 0.006528139114379883, 0.007332324981689453, 0.008136510848999023, 0.008940696716308594, 0.009744882583618164, 0.010549068450927734, 0.011353254318237305, 0.012157440185546875, 0.012961626052856445, 0.013765811920166016, 0.014569997787475586, 0.015374183654785156, 0.016178369522094727, 0.016982555389404297, 0.017786741256713867, 0.018590927124023438, 0.019395112991333008, 0.020199298858642578, 0.02100348472595215, 0.02180767059326172, 0.02261185646057129, 0.02341604232788086, 0.02422022819519043, 0.0250244140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 9.0, 8.0, 14.0, 23.0, 26.0, 47.0, 55.0, 79.0, 78.0, 139.0, 217.0, 325.0, 589.0, 1109.0, 2596.0, 7215.0, 24932.0, 108784.0, 454501.0, 346439.0, 73361.0, 18143.0, 5428.0, 2068.0, 945.0, 497.0, 288.0, 180.0, 127.0, 91.0, 69.0, 36.0, 28.0, 19.0, 20.0, 10.0, 6.0, 9.0, 9.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.0501708984375, -0.048689842224121094, -0.04720878601074219, -0.04572772979736328, -0.044246673583984375, -0.04276561737060547, -0.04128456115722656, -0.039803504943847656, -0.03832244873046875, -0.036841392517089844, -0.03536033630371094, -0.03387928009033203, -0.032398223876953125, -0.03091716766357422, -0.029436111450195312, -0.027955055236816406, -0.0264739990234375, -0.024992942810058594, -0.023511886596679688, -0.02203083038330078, -0.020549774169921875, -0.01906871795654297, -0.017587661743164062, -0.016106605529785156, -0.01462554931640625, -0.013144493103027344, -0.011663436889648438, -0.010182380676269531, -0.008701324462890625, -0.007220268249511719, -0.0057392120361328125, -0.004258155822753906, -0.002777099609375, -0.0012960433959960938, 0.0001850128173828125, 0.0016660690307617188, 0.003147125244140625, 0.004628181457519531, 0.0061092376708984375, 0.007590293884277344, 0.00907135009765625, 0.010552406311035156, 0.012033462524414062, 0.013514518737792969, 0.014995574951171875, 0.01647663116455078, 0.017957687377929688, 0.019438743591308594, 0.0209197998046875, 0.022400856018066406, 0.023881912231445312, 0.02536296844482422, 0.026844024658203125, 0.02832508087158203, 0.029806137084960938, 0.031287193298339844, 0.03276824951171875, 0.034249305725097656, 0.03573036193847656, 0.03721141815185547, 0.038692474365234375, 0.04017353057861328, 0.04165458679199219, 0.043135643005371094, 0.04461669921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 6.0, 4.0, 10.0, 11.0, 14.0, 16.0, 20.0, 16.0, 30.0, 25.0, 30.0, 22.0, 36.0, 32.0, 38.0, 38.0, 36.0, 43.0, 31.0, 33.0, 37.0, 34.0, 51.0, 28.0, 31.0, 24.0, 33.0, 41.0, 17.0, 28.0, 27.0, 20.0, 13.0, 21.0, 12.0, 15.0, 11.0, 9.0, 7.0, 4.0, 6.0, 10.0, 6.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.062225341796875, -0.06016397476196289, -0.05810260772705078, -0.05604124069213867, -0.05397987365722656, -0.05191850662231445, -0.049857139587402344, -0.047795772552490234, -0.045734405517578125, -0.043673038482666016, -0.041611671447753906, -0.0395503044128418, -0.03748893737792969, -0.03542757034301758, -0.03336620330810547, -0.03130483627319336, -0.02924346923828125, -0.02718210220336914, -0.02512073516845703, -0.023059368133544922, -0.020998001098632812, -0.018936634063720703, -0.016875267028808594, -0.014813899993896484, -0.012752532958984375, -0.010691165924072266, -0.008629798889160156, -0.006568431854248047, -0.0045070648193359375, -0.002445697784423828, -0.00038433074951171875, 0.0016770362854003906, 0.0037384033203125, 0.005799770355224609, 0.007861137390136719, 0.009922504425048828, 0.011983871459960938, 0.014045238494873047, 0.016106605529785156, 0.018167972564697266, 0.020229339599609375, 0.022290706634521484, 0.024352073669433594, 0.026413440704345703, 0.028474807739257812, 0.030536174774169922, 0.03259754180908203, 0.03465890884399414, 0.03672027587890625, 0.03878164291381836, 0.04084300994873047, 0.04290437698364258, 0.04496574401855469, 0.0470271110534668, 0.049088478088378906, 0.051149845123291016, 0.053211212158203125, 0.055272579193115234, 0.057333946228027344, 0.05939531326293945, 0.06145668029785156, 0.06351804733276367, 0.06557941436767578, 0.06764078140258789, 0.0697021484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 3.0, 18.0, 25.0, 43.0, 63.0, 170.0, 402.0, 1057.0, 3031.0, 11441.0, 78957.0, 620057.0, 294456.0, 30033.0, 5813.0, 1773.0, 657.0, 270.0, 118.0, 63.0, 30.0, 19.0, 10.0, 9.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.0291290283203125, -0.028377771377563477, -0.027626514434814453, -0.02687525749206543, -0.026124000549316406, -0.025372743606567383, -0.02462148666381836, -0.023870229721069336, -0.023118972778320312, -0.02236771583557129, -0.021616458892822266, -0.020865201950073242, -0.02011394500732422, -0.019362688064575195, -0.018611431121826172, -0.01786017417907715, -0.017108917236328125, -0.0163576602935791, -0.015606403350830078, -0.014855146408081055, -0.014103889465332031, -0.013352632522583008, -0.012601375579833984, -0.011850118637084961, -0.011098861694335938, -0.010347604751586914, -0.00959634780883789, -0.008845090866088867, -0.008093833923339844, -0.00734257698059082, -0.006591320037841797, -0.0058400630950927734, -0.00508880615234375, -0.0043375492095947266, -0.003586292266845703, -0.0028350353240966797, -0.0020837783813476562, -0.0013325214385986328, -0.0005812644958496094, 0.00016999244689941406, 0.0009212493896484375, 0.001672506332397461, 0.0024237632751464844, 0.003175020217895508, 0.003926277160644531, 0.004677534103393555, 0.005428791046142578, 0.0061800479888916016, 0.006931304931640625, 0.0076825618743896484, 0.008433818817138672, 0.009185075759887695, 0.009936332702636719, 0.010687589645385742, 0.011438846588134766, 0.012190103530883789, 0.012941360473632812, 0.013692617416381836, 0.01444387435913086, 0.015195131301879883, 0.015946388244628906, 0.01669764518737793, 0.017448902130126953, 0.018200159072875977, 0.018951416015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 7.0, 18.0, 17.0, 22.0, 23.0, 25.0, 27.0, 44.0, 51.0, 46.0, 74.0, 71.0, 96.0, 67.0, 86.0, 54.0, 68.0, 42.0, 37.0, 27.0, 24.0, 24.0, 10.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.987022399902344e-06, -7.780268788337708e-06, -7.573515176773071e-06, -7.366761565208435e-06, -7.160007953643799e-06, -6.953254342079163e-06, -6.746500730514526e-06, -6.53974711894989e-06, -6.332993507385254e-06, -6.126239895820618e-06, -5.9194862842559814e-06, -5.712732672691345e-06, -5.505979061126709e-06, -5.299225449562073e-06, -5.0924718379974365e-06, -4.8857182264328e-06, -4.678964614868164e-06, -4.472211003303528e-06, -4.265457391738892e-06, -4.058703780174255e-06, -3.851950168609619e-06, -3.645196557044983e-06, -3.4384429454803467e-06, -3.2316893339157104e-06, -3.0249357223510742e-06, -2.818182110786438e-06, -2.6114284992218018e-06, -2.4046748876571655e-06, -2.1979212760925293e-06, -1.991167664527893e-06, -1.7844140529632568e-06, -1.5776604413986206e-06, -1.3709068298339844e-06, -1.1641532182693481e-06, -9.57399606704712e-07, -7.506459951400757e-07, -5.438923835754395e-07, -3.371387720108032e-07, -1.30385160446167e-07, 7.636845111846924e-08, 2.8312206268310547e-07, 4.898756742477417e-07, 6.966292858123779e-07, 9.033828973770142e-07, 1.1101365089416504e-06, 1.3168901205062866e-06, 1.5236437320709229e-06, 1.730397343635559e-06, 1.9371509552001953e-06, 2.1439045667648315e-06, 2.3506581783294678e-06, 2.557411789894104e-06, 2.7641654014587402e-06, 2.9709190130233765e-06, 3.1776726245880127e-06, 3.384426236152649e-06, 3.591179847717285e-06, 3.7979334592819214e-06, 4.004687070846558e-06, 4.211440682411194e-06, 4.41819429397583e-06, 4.624947905540466e-06, 4.8317015171051025e-06, 5.038455128669739e-06, 5.245208740234375e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 12.0, 24.0, 25.0, 42.0, 76.0, 144.0, 425.0, 1231.0, 6620.0, 74499.0, 686944.0, 257038.0, 17893.0, 2496.0, 588.0, 235.0, 127.0, 51.0, 41.0, 16.0, 13.0, 9.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036651611328125, -0.03572893142700195, -0.034806251525878906, -0.03388357162475586, -0.03296089172363281, -0.032038211822509766, -0.03111553192138672, -0.030192852020263672, -0.029270172119140625, -0.028347492218017578, -0.02742481231689453, -0.026502132415771484, -0.025579452514648438, -0.02465677261352539, -0.023734092712402344, -0.022811412811279297, -0.02188873291015625, -0.020966053009033203, -0.020043373107910156, -0.01912069320678711, -0.018198013305664062, -0.017275333404541016, -0.01635265350341797, -0.015429973602294922, -0.014507293701171875, -0.013584613800048828, -0.012661933898925781, -0.011739253997802734, -0.010816574096679688, -0.00989389419555664, -0.008971214294433594, -0.008048534393310547, -0.0071258544921875, -0.006203174591064453, -0.005280494689941406, -0.004357814788818359, -0.0034351348876953125, -0.0025124549865722656, -0.0015897750854492188, -0.0006670951843261719, 0.000255584716796875, 0.0011782646179199219, 0.0021009445190429688, 0.0030236244201660156, 0.0039463043212890625, 0.004868984222412109, 0.005791664123535156, 0.006714344024658203, 0.00763702392578125, 0.008559703826904297, 0.009482383728027344, 0.01040506362915039, 0.011327743530273438, 0.012250423431396484, 0.013173103332519531, 0.014095783233642578, 0.015018463134765625, 0.015941143035888672, 0.01686382293701172, 0.017786502838134766, 0.018709182739257812, 0.01963186264038086, 0.020554542541503906, 0.021477222442626953, 0.02239990234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 8.0, 6.0, 10.0, 13.0, 24.0, 14.0, 51.0, 36.0, 66.0, 85.0, 74.0, 80.0, 91.0, 73.0, 76.0, 52.0, 42.0, 39.0, 50.0, 23.0, 16.0, 14.0, 12.0, 14.0, 8.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019775390625, -0.01919865608215332, -0.01862192153930664, -0.01804518699645996, -0.01746845245361328, -0.0168917179107666, -0.016314983367919922, -0.015738248825073242, -0.015161514282226562, -0.014584779739379883, -0.014008045196533203, -0.013431310653686523, -0.012854576110839844, -0.012277841567993164, -0.011701107025146484, -0.011124372482299805, -0.010547637939453125, -0.009970903396606445, -0.009394168853759766, -0.008817434310913086, -0.008240699768066406, -0.0076639652252197266, -0.007087230682373047, -0.006510496139526367, -0.0059337615966796875, -0.005357027053833008, -0.004780292510986328, -0.0042035579681396484, -0.0036268234252929688, -0.003050088882446289, -0.0024733543395996094, -0.0018966197967529297, -0.00131988525390625, -0.0007431507110595703, -0.00016641616821289062, 0.00041031837463378906, 0.0009870529174804688, 0.0015637874603271484, 0.002140522003173828, 0.002717256546020508, 0.0032939910888671875, 0.003870725631713867, 0.004447460174560547, 0.0050241947174072266, 0.005600929260253906, 0.006177663803100586, 0.006754398345947266, 0.007331132888793945, 0.007907867431640625, 0.008484601974487305, 0.009061336517333984, 0.009638071060180664, 0.010214805603027344, 0.010791540145874023, 0.011368274688720703, 0.011945009231567383, 0.012521743774414062, 0.013098478317260742, 0.013675212860107422, 0.014251947402954102, 0.014828681945800781, 0.015405416488647461, 0.01598215103149414, 0.01655888557434082, 0.0171356201171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 10.0, 19.0, 42.0, 132.0, 272.0, 292.0, 142.0, 63.0, 17.0, 8.0, 10.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28774282336235046, -0.2661486864089966, -0.2445545494556427, -0.22296041250228882, -0.20136627554893494, -0.17977213859558105, -0.15817798674106598, -0.1365838497877121, -0.11498971283435822, -0.09339557588100433, -0.07180143892765045, -0.05020729452371597, -0.02861315757036209, -0.007019020617008209, 0.01457512378692627, 0.03616926074028015, 0.05776339769363403, 0.07935753464698792, 0.1009516716003418, 0.12254581600427628, 0.14413994550704956, 0.16573408246040344, 0.18732823431491852, 0.2089223712682724, 0.23051650822162628, 0.25211066007614136, 0.27370479702949524, 0.2952989339828491, 0.316893070936203, 0.3384872078895569, 0.36008134484291077, 0.38167548179626465, 0.40326958894729614, 0.42486372590065, 0.4464578628540039, 0.4680519998073578, 0.48964613676071167, 0.5112403035163879, 0.5328344106674194, 0.5544285774230957, 0.5760226845741272, 0.5976168513298035, 0.619210958480835, 0.6408051252365112, 0.6623992323875427, 0.683993399143219, 0.7055875062942505, 0.7271816730499268, 0.748775839805603, 0.7703700065612793, 0.7919641137123108, 0.8135582804679871, 0.8351523876190186, 0.8567465543746948, 0.8783406615257263, 0.8999348282814026, 0.9215289354324341, 0.9431231021881104, 0.9647172093391418, 0.9863113760948181, 1.0079054832458496, 1.0294996500015259, 1.0510938167572021, 1.0726878643035889, 1.0942820310592651]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 4.0, 7.0, 15.0, 5.0, 11.0, 14.0, 13.0, 17.0, 27.0, 28.0, 23.0, 25.0, 31.0, 30.0, 39.0, 42.0, 36.0, 25.0, 35.0, 47.0, 48.0, 42.0, 27.0, 41.0, 47.0, 34.0, 29.0, 33.0, 29.0, 23.0, 18.0, 22.0, 18.0, 21.0, 15.0, 9.0, 16.0, 11.0, 10.0, 7.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3345339298248291, -0.3238120675086975, -0.31309017539024353, -0.30236831307411194, -0.29164645075798035, -0.28092455863952637, -0.2702026963233948, -0.2594808340072632, -0.2487589418888092, -0.23803706467151642, -0.22731520235538483, -0.21659332513809204, -0.20587144792079926, -0.19514957070350647, -0.18442770838737488, -0.1737058311700821, -0.1629839688539505, -0.15226209163665771, -0.14154022932052612, -0.13081835210323334, -0.12009647488594055, -0.10937460511922836, -0.09865273535251617, -0.08793085813522339, -0.0772089883685112, -0.06648711860179901, -0.055765241384506226, -0.04504337161779404, -0.03432149812579155, -0.023599624633789062, -0.012877754867076874, -0.002155877649784088, 0.0085659921169281, 0.019287865608930588, 0.030009737238287926, 0.040731608867645264, 0.05145348235964775, 0.06217535585165024, 0.07289722561836243, 0.08361910283565521, 0.0943409726023674, 0.10506284236907959, 0.11578471958637238, 0.12650659680366516, 0.13722845911979675, 0.14795033633708954, 0.15867221355438232, 0.16939407587051392, 0.1801159530878067, 0.1908378303050995, 0.20155969262123108, 0.21228156983852386, 0.22300344705581665, 0.23372530937194824, 0.24444718658924103, 0.2551690638065338, 0.2658909261226654, 0.276612788438797, 0.287334680557251, 0.29805654287338257, 0.30877840518951416, 0.31950029730796814, 0.33022215962409973, 0.3409440517425537, 0.3516659140586853]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 10.0, 12.0, 17.0, 28.0, 30.0, 69.0, 108.0, 148.0, 306.0, 547.0, 1108.0, 3121.0, 13680.0, 350522.0, 3793652.0, 23430.0, 4334.0, 1551.0, 694.0, 323.0, 213.0, 122.0, 87.0, 61.0, 31.0, 25.0, 7.0, 12.0, 5.0, 13.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06964111328125, -0.06686973571777344, -0.06409835815429688, -0.06132698059082031, -0.05855560302734375, -0.05578422546386719, -0.053012847900390625, -0.05024147033691406, -0.0474700927734375, -0.04469871520996094, -0.041927337646484375, -0.03915596008300781, -0.03638458251953125, -0.03361320495605469, -0.030841827392578125, -0.028070449829101562, -0.025299072265625, -0.022527694702148438, -0.019756317138671875, -0.016984939575195312, -0.01421356201171875, -0.011442184448242188, -0.008670806884765625, -0.0058994293212890625, -0.0031280517578125, -0.0003566741943359375, 0.002414703369140625, 0.0051860809326171875, 0.00795745849609375, 0.010728836059570312, 0.013500213623046875, 0.016271591186523438, 0.01904296875, 0.021814346313476562, 0.024585723876953125, 0.027357101440429688, 0.03012847900390625, 0.03289985656738281, 0.035671234130859375, 0.03844261169433594, 0.0412139892578125, 0.04398536682128906, 0.046756744384765625, 0.04952812194824219, 0.05229949951171875, 0.05507087707519531, 0.057842254638671875, 0.06061363220214844, 0.063385009765625, 0.06615638732910156, 0.06892776489257812, 0.07169914245605469, 0.07447052001953125, 0.07724189758300781, 0.08001327514648438, 0.08278465270996094, 0.0855560302734375, 0.08832740783691406, 0.09109878540039062, 0.09387016296386719, 0.09664154052734375, 0.09941291809082031, 0.10218429565429688, 0.10495567321777344, 0.10772705078125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 9.0, 4.0, 20.0, 22.0, 15.0, 25.0, 35.0, 23.0, 45.0, 50.0, 46.0, 67.0, 73.0, 58.0, 62.0, 51.0, 70.0, 52.0, 51.0, 39.0, 44.0, 30.0, 30.0, 15.0, 10.0, 17.0, 8.0, 6.0, 7.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0274505615234375, -0.026618480682373047, -0.025786399841308594, -0.02495431900024414, -0.024122238159179688, -0.023290157318115234, -0.02245807647705078, -0.021625995635986328, -0.020793914794921875, -0.019961833953857422, -0.01912975311279297, -0.018297672271728516, -0.017465591430664062, -0.01663351058959961, -0.015801429748535156, -0.014969348907470703, -0.01413726806640625, -0.013305187225341797, -0.012473106384277344, -0.01164102554321289, -0.010808944702148438, -0.009976863861083984, -0.009144783020019531, -0.008312702178955078, -0.007480621337890625, -0.006648540496826172, -0.005816459655761719, -0.004984378814697266, -0.0041522979736328125, -0.0033202171325683594, -0.0024881362915039062, -0.0016560554504394531, -0.000823974609375, 8.106231689453125e-06, 0.0008401870727539062, 0.0016722679138183594, 0.0025043487548828125, 0.0033364295959472656, 0.004168510437011719, 0.005000591278076172, 0.005832672119140625, 0.006664752960205078, 0.007496833801269531, 0.008328914642333984, 0.009160995483398438, 0.00999307632446289, 0.010825157165527344, 0.011657238006591797, 0.01248931884765625, 0.013321399688720703, 0.014153480529785156, 0.01498556137084961, 0.015817642211914062, 0.016649723052978516, 0.01748180389404297, 0.018313884735107422, 0.019145965576171875, 0.019978046417236328, 0.02081012725830078, 0.021642208099365234, 0.022474288940429688, 0.02330636978149414, 0.024138450622558594, 0.024970531463623047, 0.0258026123046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 10.0, 22.0, 34.0, 33.0, 72.0, 102.0, 120.0, 239.0, 354.0, 742.0, 1528.0, 4014.0, 14490.0, 91537.0, 3862428.0, 187701.0, 21613.0, 5328.0, 1949.0, 814.0, 424.0, 238.0, 151.0, 101.0, 78.0, 37.0, 31.0, 26.0, 12.0, 12.0, 5.0, 3.0, 8.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05914306640625, -0.057211875915527344, -0.05528068542480469, -0.05334949493408203, -0.051418304443359375, -0.04948711395263672, -0.04755592346191406, -0.045624732971191406, -0.04369354248046875, -0.041762351989746094, -0.03983116149902344, -0.03789997100830078, -0.035968780517578125, -0.03403759002685547, -0.03210639953613281, -0.030175209045410156, -0.0282440185546875, -0.026312828063964844, -0.024381637573242188, -0.02245044708251953, -0.020519256591796875, -0.01858806610107422, -0.016656875610351562, -0.014725685119628906, -0.01279449462890625, -0.010863304138183594, -0.008932113647460938, -0.007000923156738281, -0.005069732666015625, -0.0031385421752929688, -0.0012073516845703125, 0.0007238388061523438, 0.002655029296875, 0.004586219787597656, 0.0065174102783203125, 0.008448600769042969, 0.010379791259765625, 0.012310981750488281, 0.014242172241210938, 0.016173362731933594, 0.01810455322265625, 0.020035743713378906, 0.021966934204101562, 0.02389812469482422, 0.025829315185546875, 0.02776050567626953, 0.029691696166992188, 0.031622886657714844, 0.0335540771484375, 0.035485267639160156, 0.03741645812988281, 0.03934764862060547, 0.041278839111328125, 0.04321002960205078, 0.04514122009277344, 0.047072410583496094, 0.04900360107421875, 0.050934791564941406, 0.05286598205566406, 0.05479717254638672, 0.056728363037109375, 0.05865955352783203, 0.06059074401855469, 0.06252193450927734, 0.064453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 12.0, 23.0, 45.0, 75.0, 239.0, 2288.0, 1047.0, 163.0, 59.0, 33.0, 17.0, 19.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.023651123046875, -0.022460460662841797, -0.021269798278808594, -0.02007913589477539, -0.018888473510742188, -0.017697811126708984, -0.01650714874267578, -0.015316486358642578, -0.014125823974609375, -0.012935161590576172, -0.011744499206542969, -0.010553836822509766, -0.009363174438476562, -0.00817251205444336, -0.006981849670410156, -0.005791187286376953, -0.00460052490234375, -0.003409862518310547, -0.0022192001342773438, -0.0010285377502441406, 0.0001621246337890625, 0.0013527870178222656, 0.0025434494018554688, 0.003734111785888672, 0.004924774169921875, 0.006115436553955078, 0.007306098937988281, 0.008496761322021484, 0.009687423706054688, 0.01087808609008789, 0.012068748474121094, 0.013259410858154297, 0.0144500732421875, 0.015640735626220703, 0.016831398010253906, 0.01802206039428711, 0.019212722778320312, 0.020403385162353516, 0.02159404754638672, 0.022784709930419922, 0.023975372314453125, 0.025166034698486328, 0.02635669708251953, 0.027547359466552734, 0.028738021850585938, 0.02992868423461914, 0.031119346618652344, 0.03231000900268555, 0.03350067138671875, 0.03469133377075195, 0.035881996154785156, 0.03707265853881836, 0.03826332092285156, 0.039453983306884766, 0.04064464569091797, 0.04183530807495117, 0.043025970458984375, 0.04421663284301758, 0.04540729522705078, 0.046597957611083984, 0.04778861999511719, 0.04897928237915039, 0.050169944763183594, 0.0513606071472168, 0.05255126953125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 20.0, 144.0, 450.0, 298.0, 60.0, 14.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26207125186920166, -0.24944326281547546, -0.23681528866291046, -0.22418729960918427, -0.21155932545661926, -0.19893133640289307, -0.18630334734916687, -0.17367535829544067, -0.16104738414287567, -0.14841939508914948, -0.13579142093658447, -0.12316343188285828, -0.11053545027971268, -0.09790746867656708, -0.08527947962284088, -0.07265149801969528, -0.06002351641654968, -0.04739553481340408, -0.034767549484968185, -0.022139564156532288, -0.009511582553386688, 0.003116399049758911, 0.015744388103485107, 0.028372369706630707, 0.041000351309776306, 0.053628332912921906, 0.0662563145160675, 0.0788843035697937, 0.0915122851729393, 0.1041402667760849, 0.1167682558298111, 0.1293962299823761, 0.1420242190361023, 0.1546522080898285, 0.1672801822423935, 0.1799081712961197, 0.1925361454486847, 0.2051641345024109, 0.21779212355613708, 0.23042011260986328, 0.24304808676242828, 0.2556760609149933, 0.2683040499687195, 0.2809320390224457, 0.2935600280761719, 0.3061879873275757, 0.31881600618362427, 0.3314439654350281, 0.3440719544887543, 0.35669994354248047, 0.36932793259620667, 0.38195592164993286, 0.39458388090133667, 0.40721186995506287, 0.41983985900878906, 0.43246784806251526, 0.44509583711624146, 0.45772382616996765, 0.47035181522369385, 0.48297977447509766, 0.49560776352882385, 0.50823575258255, 0.5208637714385986, 0.5334917306900024, 0.5461196899414062]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 9.0, 12.0, 20.0, 18.0, 39.0, 45.0, 52.0, 70.0, 58.0, 92.0, 88.0, 86.0, 66.0, 67.0, 70.0, 46.0, 48.0, 39.0, 28.0, 8.0, 5.0, 6.0, 10.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.13454782962799072, -0.13068975508213043, -0.12683166563510895, -0.12297359108924866, -0.11911550909280777, -0.11525742709636688, -0.11139935255050659, -0.1075412705540657, -0.10368318855762482, -0.09982510656118393, -0.09596702456474304, -0.09210895001888275, -0.08825086802244186, -0.08439278602600098, -0.08053471148014069, -0.0766766294836998, -0.07281854748725891, -0.06896046549081802, -0.06510238349437714, -0.061244308948516846, -0.05738622695207596, -0.05352814495563507, -0.04967006668448448, -0.04581198841333389, -0.041953906416893005, -0.03809582442045212, -0.03423774614930153, -0.03037966601550579, -0.026521585881710052, -0.022663505747914314, -0.018805425614118576, -0.014947345480322838, -0.0110892653465271, -0.007231185212731361, -0.003373105078935623, 0.00048497505486011505, 0.004343055188655853, 0.008201135322451591, 0.01205921545624733, 0.015917295590043068, 0.019775375723838806, 0.023633455857634544, 0.027491535991430283, 0.03134961426258087, 0.03520769625902176, 0.039065778255462646, 0.042923856526613235, 0.046781934797763824, 0.05064001679420471, 0.0544980987906456, 0.05835617706179619, 0.06221425533294678, 0.06607233732938766, 0.06993041932582855, 0.07378849387168884, 0.07764657586812973, 0.08150465786457062, 0.0853627398610115, 0.08922082185745239, 0.09307889640331268, 0.09693697839975357, 0.10079506039619446, 0.10465313494205475, 0.10851121693849564, 0.11236929893493652]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 1.0, 3.0, 6.0, 16.0, 11.0, 16.0, 23.0, 48.0, 91.0, 127.0, 201.0, 345.0, 639.0, 1245.0, 2924.0, 7850.0, 29015.0, 147735.0, 578610.0, 221797.0, 40926.0, 10189.0, 3522.0, 1490.0, 755.0, 398.0, 225.0, 122.0, 64.0, 55.0, 23.0, 29.0, 19.0, 13.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06231689453125, -0.06034564971923828, -0.05837440490722656, -0.056403160095214844, -0.054431915283203125, -0.052460670471191406, -0.05048942565917969, -0.04851818084716797, -0.04654693603515625, -0.04457569122314453, -0.04260444641113281, -0.040633201599121094, -0.038661956787109375, -0.036690711975097656, -0.03471946716308594, -0.03274822235107422, -0.0307769775390625, -0.02880573272705078, -0.026834487915039062, -0.024863243103027344, -0.022891998291015625, -0.020920753479003906, -0.018949508666992188, -0.01697826385498047, -0.01500701904296875, -0.013035774230957031, -0.011064529418945312, -0.009093284606933594, -0.007122039794921875, -0.005150794982910156, -0.0031795501708984375, -0.0012083053588867188, 0.000762939453125, 0.0027341842651367188, 0.0047054290771484375, 0.006676673889160156, 0.008647918701171875, 0.010619163513183594, 0.012590408325195312, 0.014561653137207031, 0.01653289794921875, 0.01850414276123047, 0.020475387573242188, 0.022446632385253906, 0.024417877197265625, 0.026389122009277344, 0.028360366821289062, 0.03033161163330078, 0.0323028564453125, 0.03427410125732422, 0.03624534606933594, 0.038216590881347656, 0.040187835693359375, 0.042159080505371094, 0.04413032531738281, 0.04610157012939453, 0.04807281494140625, 0.05004405975341797, 0.05201530456542969, 0.053986549377441406, 0.055957794189453125, 0.057929039001464844, 0.05990028381347656, 0.06187152862548828, 0.0638427734375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 9.0, 10.0, 7.0, 19.0, 19.0, 24.0, 28.0, 29.0, 39.0, 48.0, 50.0, 62.0, 66.0, 61.0, 77.0, 64.0, 73.0, 44.0, 46.0, 43.0, 41.0, 40.0, 19.0, 19.0, 15.0, 13.0, 7.0, 9.0, 4.0, 1.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02972412109375, -0.028853893280029297, -0.027983665466308594, -0.02711343765258789, -0.026243209838867188, -0.025372982025146484, -0.02450275421142578, -0.023632526397705078, -0.022762298583984375, -0.021892070770263672, -0.02102184295654297, -0.020151615142822266, -0.019281387329101562, -0.01841115951538086, -0.017540931701660156, -0.016670703887939453, -0.01580047607421875, -0.014930248260498047, -0.014060020446777344, -0.01318979263305664, -0.012319564819335938, -0.011449337005615234, -0.010579109191894531, -0.009708881378173828, -0.008838653564453125, -0.007968425750732422, -0.007098197937011719, -0.006227970123291016, -0.0053577423095703125, -0.004487514495849609, -0.0036172866821289062, -0.002747058868408203, -0.0018768310546875, -0.0010066032409667969, -0.00013637542724609375, 0.0007338523864746094, 0.0016040802001953125, 0.0024743080139160156, 0.0033445358276367188, 0.004214763641357422, 0.005084991455078125, 0.005955219268798828, 0.006825447082519531, 0.007695674896240234, 0.008565902709960938, 0.00943613052368164, 0.010306358337402344, 0.011176586151123047, 0.01204681396484375, 0.012917041778564453, 0.013787269592285156, 0.01465749740600586, 0.015527725219726562, 0.016397953033447266, 0.01726818084716797, 0.018138408660888672, 0.019008636474609375, 0.019878864288330078, 0.02074909210205078, 0.021619319915771484, 0.022489547729492188, 0.02335977554321289, 0.024230003356933594, 0.025100231170654297, 0.025970458984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 14.0, 8.0, 12.0, 16.0, 14.0, 25.0, 42.0, 52.0, 57.0, 126.0, 121.0, 201.0, 346.0, 639.0, 1357.0, 3687.0, 13434.0, 68146.0, 465816.0, 415873.0, 60254.0, 12024.0, 3370.0, 1283.0, 572.0, 347.0, 193.0, 157.0, 97.0, 65.0, 49.0, 46.0, 21.0, 21.0, 13.0, 8.0, 12.0, 10.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05548095703125, -0.053745269775390625, -0.05200958251953125, -0.050273895263671875, -0.0485382080078125, -0.046802520751953125, -0.04506683349609375, -0.043331146240234375, -0.041595458984375, -0.039859771728515625, -0.03812408447265625, -0.036388397216796875, -0.0346527099609375, -0.032917022705078125, -0.03118133544921875, -0.029445648193359375, -0.0277099609375, -0.025974273681640625, -0.02423858642578125, -0.022502899169921875, -0.0207672119140625, -0.019031524658203125, -0.01729583740234375, -0.015560150146484375, -0.013824462890625, -0.012088775634765625, -0.01035308837890625, -0.008617401123046875, -0.0068817138671875, -0.005146026611328125, -0.00341033935546875, -0.001674652099609375, 6.103515625e-05, 0.001796722412109375, 0.00353240966796875, 0.005268096923828125, 0.0070037841796875, 0.008739471435546875, 0.01047515869140625, 0.012210845947265625, 0.013946533203125, 0.015682220458984375, 0.01741790771484375, 0.019153594970703125, 0.0208892822265625, 0.022624969482421875, 0.02436065673828125, 0.026096343994140625, 0.02783203125, 0.029567718505859375, 0.03130340576171875, 0.033039093017578125, 0.0347747802734375, 0.036510467529296875, 0.03824615478515625, 0.039981842041015625, 0.041717529296875, 0.043453216552734375, 0.04518890380859375, 0.046924591064453125, 0.0486602783203125, 0.050395965576171875, 0.05213165283203125, 0.053867340087890625, 0.05560302734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 8.0, 4.0, 3.0, 9.0, 9.0, 16.0, 9.0, 14.0, 15.0, 20.0, 30.0, 27.0, 26.0, 28.0, 39.0, 49.0, 43.0, 34.0, 39.0, 37.0, 45.0, 44.0, 41.0, 38.0, 40.0, 41.0, 45.0, 24.0, 28.0, 27.0, 16.0, 23.0, 29.0, 13.0, 17.0, 15.0, 10.0, 9.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06768798828125, -0.06540966033935547, -0.06313133239746094, -0.060853004455566406, -0.058574676513671875, -0.056296348571777344, -0.05401802062988281, -0.05173969268798828, -0.04946136474609375, -0.04718303680419922, -0.04490470886230469, -0.042626380920410156, -0.040348052978515625, -0.038069725036621094, -0.03579139709472656, -0.03351306915283203, -0.0312347412109375, -0.02895641326904297, -0.026678085327148438, -0.024399757385253906, -0.022121429443359375, -0.019843101501464844, -0.017564773559570312, -0.015286445617675781, -0.01300811767578125, -0.010729789733886719, -0.008451461791992188, -0.006173133850097656, -0.003894805908203125, -0.0016164779663085938, 0.0006618499755859375, 0.0029401779174804688, 0.005218505859375, 0.007496833801269531, 0.009775161743164062, 0.012053489685058594, 0.014331817626953125, 0.016610145568847656, 0.018888473510742188, 0.02116680145263672, 0.02344512939453125, 0.02572345733642578, 0.028001785278320312, 0.030280113220214844, 0.032558441162109375, 0.034836769104003906, 0.03711509704589844, 0.03939342498779297, 0.0416717529296875, 0.04395008087158203, 0.04622840881347656, 0.048506736755371094, 0.050785064697265625, 0.053063392639160156, 0.05534172058105469, 0.05762004852294922, 0.05989837646484375, 0.06217670440673828, 0.06445503234863281, 0.06673336029052734, 0.06901168823242188, 0.0712900161743164, 0.07356834411621094, 0.07584667205810547, 0.078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 9.0, 16.0, 20.0, 24.0, 43.0, 84.0, 94.0, 178.0, 354.0, 744.0, 1986.0, 6817.0, 42397.0, 834653.0, 143448.0, 12478.0, 3088.0, 1039.0, 445.0, 247.0, 140.0, 93.0, 59.0, 34.0, 22.0, 9.0, 11.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.041290283203125, -0.04016518592834473, -0.03904008865356445, -0.03791499137878418, -0.036789894104003906, -0.03566479682922363, -0.03453969955444336, -0.033414602279663086, -0.03228950500488281, -0.03116440773010254, -0.030039310455322266, -0.028914213180541992, -0.02778911590576172, -0.026664018630981445, -0.025538921356201172, -0.0244138240814209, -0.023288726806640625, -0.02216362953186035, -0.021038532257080078, -0.019913434982299805, -0.01878833770751953, -0.017663240432739258, -0.016538143157958984, -0.015413045883178711, -0.014287948608398438, -0.013162851333618164, -0.01203775405883789, -0.010912656784057617, -0.009787559509277344, -0.00866246223449707, -0.007537364959716797, -0.0064122676849365234, -0.00528717041015625, -0.0041620731353759766, -0.003036975860595703, -0.0019118785858154297, -0.0007867813110351562, 0.0003383159637451172, 0.0014634132385253906, 0.002588510513305664, 0.0037136077880859375, 0.004838705062866211, 0.005963802337646484, 0.007088899612426758, 0.008213996887207031, 0.009339094161987305, 0.010464191436767578, 0.011589288711547852, 0.012714385986328125, 0.013839483261108398, 0.014964580535888672, 0.016089677810668945, 0.01721477508544922, 0.018339872360229492, 0.019464969635009766, 0.02059006690979004, 0.021715164184570312, 0.022840261459350586, 0.02396535873413086, 0.025090456008911133, 0.026215553283691406, 0.02734065055847168, 0.028465747833251953, 0.029590845108032227, 0.0307159423828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 6.0, 6.0, 11.0, 18.0, 8.0, 23.0, 34.0, 28.0, 39.0, 41.0, 47.0, 47.0, 47.0, 63.0, 79.0, 84.0, 51.0, 65.0, 64.0, 46.0, 34.0, 32.0, 37.0, 22.0, 19.0, 11.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.821456968784332e-06, -4.636123776435852e-06, -4.450790584087372e-06, -4.265457391738892e-06, -4.080124199390411e-06, -3.894791007041931e-06, -3.709457814693451e-06, -3.5241246223449707e-06, -3.3387914299964905e-06, -3.1534582376480103e-06, -2.96812504529953e-06, -2.78279185295105e-06, -2.5974586606025696e-06, -2.4121254682540894e-06, -2.226792275905609e-06, -2.041459083557129e-06, -1.8561258912086487e-06, -1.6707926988601685e-06, -1.4854595065116882e-06, -1.300126314163208e-06, -1.1147931218147278e-06, -9.294599294662476e-07, -7.441267371177673e-07, -5.587935447692871e-07, -3.734603524208069e-07, -1.8812716007232666e-07, -2.7939677238464355e-09, 1.825392246246338e-07, 3.67872416973114e-07, 5.532056093215942e-07, 7.385388016700745e-07, 9.238719940185547e-07, 1.109205186367035e-06, 1.2945383787155151e-06, 1.4798715710639954e-06, 1.6652047634124756e-06, 1.8505379557609558e-06, 2.035871148109436e-06, 2.2212043404579163e-06, 2.4065375328063965e-06, 2.5918707251548767e-06, 2.777203917503357e-06, 2.962537109851837e-06, 3.1478703022003174e-06, 3.3332034945487976e-06, 3.518536686897278e-06, 3.703869879245758e-06, 3.889203071594238e-06, 4.0745362639427185e-06, 4.259869456291199e-06, 4.445202648639679e-06, 4.630535840988159e-06, 4.815869033336639e-06, 5.00120222568512e-06, 5.1865354180336e-06, 5.37186861038208e-06, 5.55720180273056e-06, 5.7425349950790405e-06, 5.927868187427521e-06, 6.113201379776001e-06, 6.298534572124481e-06, 6.4838677644729614e-06, 6.669200956821442e-06, 6.854534149169922e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 13.0, 14.0, 23.0, 34.0, 67.0, 171.0, 343.0, 755.0, 2018.0, 8886.0, 91243.0, 864300.0, 69783.0, 7771.0, 1903.0, 649.0, 262.0, 127.0, 77.0, 46.0, 23.0, 15.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0460205078125, -0.044883012771606445, -0.04374551773071289, -0.042608022689819336, -0.04147052764892578, -0.04033303260803223, -0.03919553756713867, -0.03805804252624512, -0.03692054748535156, -0.03578305244445801, -0.03464555740356445, -0.0335080623626709, -0.032370567321777344, -0.03123307228088379, -0.030095577239990234, -0.02895808219909668, -0.027820587158203125, -0.02668309211730957, -0.025545597076416016, -0.02440810203552246, -0.023270606994628906, -0.02213311195373535, -0.020995616912841797, -0.019858121871948242, -0.018720626831054688, -0.017583131790161133, -0.016445636749267578, -0.015308141708374023, -0.014170646667480469, -0.013033151626586914, -0.01189565658569336, -0.010758161544799805, -0.00962066650390625, -0.008483171463012695, -0.007345676422119141, -0.006208181381225586, -0.005070686340332031, -0.0039331912994384766, -0.002795696258544922, -0.0016582012176513672, -0.0005207061767578125, 0.0006167888641357422, 0.0017542839050292969, 0.0028917789459228516, 0.004029273986816406, 0.005166769027709961, 0.006304264068603516, 0.00744175910949707, 0.008579254150390625, 0.00971674919128418, 0.010854244232177734, 0.011991739273071289, 0.013129234313964844, 0.014266729354858398, 0.015404224395751953, 0.016541719436645508, 0.017679214477539062, 0.018816709518432617, 0.019954204559326172, 0.021091699600219727, 0.02222919464111328, 0.023366689682006836, 0.02450418472290039, 0.025641679763793945, 0.0267791748046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 1.0, 7.0, 14.0, 19.0, 62.0, 117.0, 179.0, 251.0, 174.0, 89.0, 28.0, 18.0, 10.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06011962890625, -0.05862712860107422, -0.05713462829589844, -0.055642127990722656, -0.054149627685546875, -0.052657127380371094, -0.05116462707519531, -0.04967212677001953, -0.04817962646484375, -0.04668712615966797, -0.04519462585449219, -0.043702125549316406, -0.042209625244140625, -0.040717124938964844, -0.03922462463378906, -0.03773212432861328, -0.0362396240234375, -0.03474712371826172, -0.03325462341308594, -0.031762123107910156, -0.030269622802734375, -0.028777122497558594, -0.027284622192382812, -0.02579212188720703, -0.02429962158203125, -0.02280712127685547, -0.021314620971679688, -0.019822120666503906, -0.018329620361328125, -0.016837120056152344, -0.015344619750976562, -0.013852119445800781, -0.012359619140625, -0.010867118835449219, -0.009374618530273438, -0.007882118225097656, -0.006389617919921875, -0.004897117614746094, -0.0034046173095703125, -0.0019121170043945312, -0.00041961669921875, 0.0010728836059570312, 0.0025653839111328125, 0.004057884216308594, 0.005550384521484375, 0.007042884826660156, 0.008535385131835938, 0.010027885437011719, 0.0115203857421875, 0.013012886047363281, 0.014505386352539062, 0.015997886657714844, 0.017490386962890625, 0.018982887268066406, 0.020475387573242188, 0.02196788787841797, 0.02346038818359375, 0.02495288848876953, 0.026445388793945312, 0.027937889099121094, 0.029430389404296875, 0.030922889709472656, 0.03241539001464844, 0.03390789031982422, 0.035400390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 12.0, 15.0, 20.0, 42.0, 92.0, 214.0, 247.0, 182.0, 89.0, 55.0, 22.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28669309616088867, -0.2693149149417877, -0.25193676352500916, -0.2345585823059082, -0.21718040108680725, -0.1998022347688675, -0.18242406845092773, -0.16504588723182678, -0.14766772091388702, -0.13028955459594727, -0.11291137337684631, -0.09553320705890656, -0.0781550332903862, -0.060776859521865845, -0.043398693203926086, -0.02602051943540573, -0.008642345666885376, 0.00873582623898983, 0.026113998144865036, 0.04349216818809509, 0.06087034195661545, 0.0782485157251358, 0.09562668204307556, 0.11300485581159592, 0.13038302958011627, 0.14776119589805603, 0.16513937711715698, 0.18251754343509674, 0.1998957097530365, 0.21727389097213745, 0.2346520572900772, 0.25203022360801697, 0.2694084048271179, 0.28678658604621887, 0.30416473746299744, 0.3215429186820984, 0.33892109990119934, 0.3562992811203003, 0.37367743253707886, 0.3910556137561798, 0.40843379497528076, 0.4258119761943817, 0.4431901276111603, 0.46056830883026123, 0.4779464900493622, 0.49532467126846313, 0.5127028226852417, 0.5300809741020203, 0.5474591255187988, 0.5648372769355774, 0.5822154879570007, 0.5995936393737793, 0.6169717907905579, 0.6343500018119812, 0.6517281532287598, 0.6691063046455383, 0.6864845156669617, 0.7038626670837402, 0.7212408781051636, 0.7386190295219421, 0.7559971809387207, 0.773375391960144, 0.7907535433769226, 0.8081316947937012, 0.8255099058151245]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 8.0, 13.0, 10.0, 14.0, 12.0, 17.0, 18.0, 24.0, 25.0, 32.0, 31.0, 29.0, 36.0, 46.0, 42.0, 38.0, 37.0, 41.0, 52.0, 59.0, 46.0, 37.0, 33.0, 32.0, 36.0, 27.0, 28.0, 31.0, 16.0, 20.0, 16.0, 13.0, 12.0, 11.0, 14.0, 7.0, 4.0, 7.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.33788788318634033, -0.32666054368019104, -0.31543317437171936, -0.30420583486557007, -0.2929784953594208, -0.2817511558532715, -0.2705237865447998, -0.2592964470386505, -0.24806909263134003, -0.23684173822402954, -0.22561439871788025, -0.21438704431056976, -0.20315968990325928, -0.19193235039710999, -0.1807049959897995, -0.169477641582489, -0.15825030207633972, -0.14702294766902924, -0.13579560816287994, -0.12456825375556946, -0.11334090679883957, -0.10211355984210968, -0.0908862054347992, -0.0796588584780693, -0.06843151152133942, -0.05720416456460953, -0.04597681388258934, -0.03474946320056915, -0.023522116243839264, -0.012294769287109375, -0.0010674148797988892, 0.010159932076931, 0.02138727903366089, 0.03261462599039078, 0.043841976672410965, 0.05506932735443115, 0.06629667431116104, 0.07752402126789093, 0.08875137567520142, 0.0999787226319313, 0.1112060695886612, 0.12243341654539108, 0.13366076350212097, 0.14488811790943146, 0.15611547231674194, 0.16734281182289124, 0.17857016623020172, 0.1897975206375122, 0.2010248601436615, 0.21225221455097198, 0.22347955405712128, 0.23470690846443176, 0.24593424797058105, 0.25716161727905273, 0.268388956785202, 0.2796162962913513, 0.290843665599823, 0.3020710051059723, 0.31329837441444397, 0.32452571392059326, 0.33575305342674255, 0.34698039293289185, 0.3582077622413635, 0.3694351017475128, 0.3806624412536621]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 13.0, 15.0, 12.0, 33.0, 53.0, 50.0, 85.0, 106.0, 193.0, 384.0, 891.0, 2594.0, 15698.0, 4143698.0, 25089.0, 3251.0, 1043.0, 432.0, 220.0, 112.0, 87.0, 63.0, 33.0, 30.0, 19.0, 27.0, 13.0, 2.0, 11.0, 2.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0765380859375, -0.07365798950195312, -0.07077789306640625, -0.06789779663085938, -0.0650177001953125, -0.062137603759765625, -0.05925750732421875, -0.056377410888671875, -0.053497314453125, -0.050617218017578125, -0.04773712158203125, -0.044857025146484375, -0.0419769287109375, -0.039096832275390625, -0.03621673583984375, -0.033336639404296875, -0.03045654296875, -0.027576446533203125, -0.02469635009765625, -0.021816253662109375, -0.0189361572265625, -0.016056060791015625, -0.01317596435546875, -0.010295867919921875, -0.007415771484375, -0.004535675048828125, -0.00165557861328125, 0.001224517822265625, 0.0041046142578125, 0.006984710693359375, 0.00986480712890625, 0.012744903564453125, 0.015625, 0.018505096435546875, 0.02138519287109375, 0.024265289306640625, 0.0271453857421875, 0.030025482177734375, 0.03290557861328125, 0.035785675048828125, 0.038665771484375, 0.041545867919921875, 0.04442596435546875, 0.047306060791015625, 0.0501861572265625, 0.053066253662109375, 0.05594635009765625, 0.058826446533203125, 0.06170654296875, 0.06458663940429688, 0.06746673583984375, 0.07034683227539062, 0.0732269287109375, 0.07610702514648438, 0.07898712158203125, 0.08186721801757812, 0.084747314453125, 0.08762741088867188, 0.09050750732421875, 0.09338760375976562, 0.0962677001953125, 0.09914779663085938, 0.10202789306640625, 0.10490798950195312, 0.1077880859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 13.0, 11.0, 13.0, 23.0, 20.0, 24.0, 31.0, 40.0, 38.0, 46.0, 58.0, 63.0, 59.0, 83.0, 61.0, 61.0, 57.0, 57.0, 42.0, 34.0, 36.0, 29.0, 21.0, 15.0, 15.0, 14.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0307159423828125, -0.029825687408447266, -0.02893543243408203, -0.028045177459716797, -0.027154922485351562, -0.026264667510986328, -0.025374412536621094, -0.02448415756225586, -0.023593902587890625, -0.02270364761352539, -0.021813392639160156, -0.020923137664794922, -0.020032882690429688, -0.019142627716064453, -0.01825237274169922, -0.017362117767333984, -0.01647186279296875, -0.015581607818603516, -0.014691352844238281, -0.013801097869873047, -0.012910842895507812, -0.012020587921142578, -0.011130332946777344, -0.01024007797241211, -0.009349822998046875, -0.00845956802368164, -0.007569313049316406, -0.006679058074951172, -0.0057888031005859375, -0.004898548126220703, -0.004008293151855469, -0.0031180381774902344, -0.002227783203125, -0.0013375282287597656, -0.00044727325439453125, 0.0004429817199707031, 0.0013332366943359375, 0.002223491668701172, 0.0031137466430664062, 0.004004001617431641, 0.004894256591796875, 0.005784511566162109, 0.006674766540527344, 0.007565021514892578, 0.008455276489257812, 0.009345531463623047, 0.010235786437988281, 0.011126041412353516, 0.01201629638671875, 0.012906551361083984, 0.013796806335449219, 0.014687061309814453, 0.015577316284179688, 0.016467571258544922, 0.017357826232910156, 0.01824808120727539, 0.019138336181640625, 0.02002859115600586, 0.020918846130371094, 0.021809101104736328, 0.022699356079101562, 0.023589611053466797, 0.02447986602783203, 0.025370121002197266, 0.0262603759765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 7.0, 8.0, 12.0, 13.0, 22.0, 25.0, 33.0, 41.0, 60.0, 82.0, 99.0, 135.0, 210.0, 325.0, 529.0, 925.0, 1825.0, 4233.0, 12561.0, 87541.0, 4025023.0, 44161.0, 9301.0, 3435.0, 1482.0, 811.0, 432.0, 280.0, 180.0, 139.0, 92.0, 66.0, 57.0, 30.0, 27.0, 18.0, 16.0, 9.0, 7.0, 5.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04443359375, -0.0430607795715332, -0.041687965393066406, -0.04031515121459961, -0.03894233703613281, -0.037569522857666016, -0.03619670867919922, -0.03482389450073242, -0.033451080322265625, -0.03207826614379883, -0.03070545196533203, -0.029332637786865234, -0.027959823608398438, -0.02658700942993164, -0.025214195251464844, -0.023841381072998047, -0.02246856689453125, -0.021095752716064453, -0.019722938537597656, -0.01835012435913086, -0.016977310180664062, -0.015604496002197266, -0.014231681823730469, -0.012858867645263672, -0.011486053466796875, -0.010113239288330078, -0.008740425109863281, -0.007367610931396484, -0.0059947967529296875, -0.004621982574462891, -0.0032491683959960938, -0.0018763542175292969, -0.0005035400390625, 0.0008692741394042969, 0.0022420883178710938, 0.0036149024963378906, 0.0049877166748046875, 0.006360530853271484, 0.007733345031738281, 0.009106159210205078, 0.010478973388671875, 0.011851787567138672, 0.013224601745605469, 0.014597415924072266, 0.015970230102539062, 0.01734304428100586, 0.018715858459472656, 0.020088672637939453, 0.02146148681640625, 0.022834300994873047, 0.024207115173339844, 0.02557992935180664, 0.026952743530273438, 0.028325557708740234, 0.02969837188720703, 0.031071186065673828, 0.032444000244140625, 0.03381681442260742, 0.03518962860107422, 0.036562442779541016, 0.03793525695800781, 0.03930807113647461, 0.040680885314941406, 0.0420536994934082, 0.043426513671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 17.0, 31.0, 68.0, 258.0, 3457.0, 106.0, 42.0, 35.0, 14.0, 9.0, 1.0, 10.0, 4.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0092620849609375, -0.008955836296081543, -0.008649587631225586, -0.008343338966369629, -0.008037090301513672, -0.007730841636657715, -0.007424592971801758, -0.007118344306945801, -0.006812095642089844, -0.006505846977233887, -0.00619959831237793, -0.005893349647521973, -0.005587100982666016, -0.005280852317810059, -0.0049746036529541016, -0.0046683549880981445, -0.0043621063232421875, -0.0040558576583862305, -0.0037496089935302734, -0.0034433603286743164, -0.0031371116638183594, -0.0028308629989624023, -0.0025246143341064453, -0.0022183656692504883, -0.0019121170043945312, -0.0016058683395385742, -0.0012996196746826172, -0.0009933710098266602, -0.0006871223449707031, -0.0003808736801147461, -7.462501525878906e-05, 0.00023162364959716797, 0.000537872314453125, 0.000844120979309082, 0.001150369644165039, 0.001456618309020996, 0.0017628669738769531, 0.00206911563873291, 0.002375364303588867, 0.0026816129684448242, 0.0029878616333007812, 0.0032941102981567383, 0.0036003589630126953, 0.003906607627868652, 0.004212856292724609, 0.004519104957580566, 0.0048253536224365234, 0.0051316022872924805, 0.0054378509521484375, 0.0057440996170043945, 0.0060503482818603516, 0.006356596946716309, 0.006662845611572266, 0.006969094276428223, 0.00727534294128418, 0.007581591606140137, 0.007887840270996094, 0.00819408893585205, 0.008500337600708008, 0.008806586265563965, 0.009112834930419922, 0.009419083595275879, 0.009725332260131836, 0.010031580924987793, 0.01033782958984375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 15.0, 77.0, 211.0, 371.0, 209.0, 83.0, 20.0, 13.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02930133044719696, -0.026735611259937286, -0.024169892072677612, -0.021604172885417938, -0.019038453698158264, -0.01647273451089859, -0.013907015323638916, -0.011341296136379242, -0.008775576949119568, -0.006209857761859894, -0.0036441385746002197, -0.0010784193873405457, 0.0014872997999191284, 0.0040530189871788025, 0.0066187381744384766, 0.00918445736169815, 0.011750176548957825, 0.014315895736217499, 0.016881614923477173, 0.019447334110736847, 0.02201305329799652, 0.024578772485256195, 0.02714449167251587, 0.029710210859775543, 0.03227593004703522, 0.03484164923429489, 0.037407368421554565, 0.03997308760881424, 0.042538806796073914, 0.04510452598333359, 0.04767024517059326, 0.050235964357852936, 0.05280168354511261, 0.055367402732372284, 0.05793312191963196, 0.06049884110689163, 0.0630645602941513, 0.06563027948141098, 0.06819599866867065, 0.07076171785593033, 0.07332743704319, 0.07589315623044968, 0.07845887541770935, 0.08102459460496902, 0.0835903137922287, 0.08615603297948837, 0.08872175216674805, 0.09128747135400772, 0.0938531905412674, 0.09641890972852707, 0.09898462891578674, 0.10155034810304642, 0.10411606729030609, 0.10668178647756577, 0.10924750566482544, 0.11181322485208511, 0.11437894403934479, 0.11694466322660446, 0.11951038241386414, 0.12207610160112381, 0.12464182078838348, 0.12720754742622375, 0.12977325916290283, 0.1323389708995819, 0.13490469753742218]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 8.0, 9.0, 8.0, 18.0, 17.0, 19.0, 26.0, 31.0, 31.0, 39.0, 35.0, 47.0, 49.0, 43.0, 41.0, 41.0, 52.0, 52.0, 44.0, 55.0, 54.0, 34.0, 36.0, 43.0, 28.0, 29.0, 21.0, 20.0, 18.0, 12.0, 9.0, 8.0, 11.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013973116874694824, -0.013431194238364697, -0.012889271602034569, -0.012347348965704441, -0.011805426329374313, -0.011263503693044186, -0.010721581056714058, -0.01017965842038393, -0.009637735784053802, -0.009095813147723675, -0.008553890511393547, -0.00801196787506342, -0.007470045238733292, -0.006928122602403164, -0.006386199966073036, -0.0058442773297429085, -0.005302354693412781, -0.004760432057082653, -0.004218509420752525, -0.0036765867844223976, -0.00313466414809227, -0.002592741511762142, -0.0020508188754320145, -0.0015088962391018867, -0.000966973602771759, -0.0004250509664416313, 0.0001168716698884964, 0.0006587943062186241, 0.0012007169425487518, 0.0017426395788788795, 0.0022845622152090073, 0.002826484851539135, 0.0033684074878692627, 0.00391033012419939, 0.004452252760529518, 0.004994175396859646, 0.0055360980331897736, 0.006078020669519901, 0.006619943305850029, 0.007161865942180157, 0.007703788578510284, 0.008245711214840412, 0.00878763385117054, 0.009329556487500668, 0.009871479123830795, 0.010413401760160923, 0.01095532439649105, 0.011497247032821178, 0.012039169669151306, 0.012581092305481434, 0.013123014941811562, 0.01366493757814169, 0.014206860214471817, 0.014748782850801945, 0.015290705487132072, 0.015832629054784775, 0.016374550759792328, 0.01691647246479988, 0.017458396032452583, 0.018000319600105286, 0.01854224130511284, 0.019084163010120392, 0.019626086577773094, 0.020168010145425797, 0.02070993185043335]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 15.0, 8.0, 29.0, 37.0, 70.0, 77.0, 128.0, 213.0, 340.0, 573.0, 1134.0, 2255.0, 4992.0, 12288.0, 36473.0, 123311.0, 388191.0, 332303.0, 97511.0, 29642.0, 10366.0, 4234.0, 1971.0, 971.0, 536.0, 319.0, 178.0, 119.0, 96.0, 60.0, 27.0, 23.0, 14.0, 15.0, 4.0, 8.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.039703369140625, -0.0383758544921875, -0.03704833984375, -0.0357208251953125, -0.034393310546875, -0.0330657958984375, -0.03173828125, -0.0304107666015625, -0.029083251953125, -0.0277557373046875, -0.02642822265625, -0.0251007080078125, -0.023773193359375, -0.0224456787109375, -0.0211181640625, -0.0197906494140625, -0.018463134765625, -0.0171356201171875, -0.01580810546875, -0.0144805908203125, -0.013153076171875, -0.0118255615234375, -0.010498046875, -0.0091705322265625, -0.007843017578125, -0.0065155029296875, -0.00518798828125, -0.0038604736328125, -0.002532958984375, -0.0012054443359375, 0.0001220703125, 0.0014495849609375, 0.002777099609375, 0.0041046142578125, 0.00543212890625, 0.0067596435546875, 0.008087158203125, 0.0094146728515625, 0.0107421875, 0.0120697021484375, 0.013397216796875, 0.0147247314453125, 0.01605224609375, 0.0173797607421875, 0.018707275390625, 0.0200347900390625, 0.0213623046875, 0.0226898193359375, 0.024017333984375, 0.0253448486328125, 0.02667236328125, 0.0279998779296875, 0.029327392578125, 0.0306549072265625, 0.031982421875, 0.0333099365234375, 0.034637451171875, 0.0359649658203125, 0.03729248046875, 0.0386199951171875, 0.039947509765625, 0.0412750244140625, 0.0426025390625, 0.0439300537109375, 0.045257568359375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 16.0, 25.0, 24.0, 22.0, 27.0, 36.0, 42.0, 48.0, 50.0, 70.0, 64.0, 74.0, 57.0, 56.0, 56.0, 53.0, 50.0, 39.0, 41.0, 25.0, 16.0, 11.0, 24.0, 13.0, 7.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0307464599609375, -0.029855728149414062, -0.028964996337890625, -0.028074264526367188, -0.02718353271484375, -0.026292800903320312, -0.025402069091796875, -0.024511337280273438, -0.02362060546875, -0.022729873657226562, -0.021839141845703125, -0.020948410034179688, -0.02005767822265625, -0.019166946411132812, -0.018276214599609375, -0.017385482788085938, -0.0164947509765625, -0.015604019165039062, -0.014713287353515625, -0.013822555541992188, -0.01293182373046875, -0.012041091918945312, -0.011150360107421875, -0.010259628295898438, -0.009368896484375, -0.008478164672851562, -0.007587432861328125, -0.0066967010498046875, -0.00580596923828125, -0.0049152374267578125, -0.004024505615234375, -0.0031337738037109375, -0.0022430419921875, -0.0013523101806640625, -0.000461578369140625, 0.0004291534423828125, 0.00131988525390625, 0.0022106170654296875, 0.003101348876953125, 0.0039920806884765625, 0.0048828125, 0.0057735443115234375, 0.006664276123046875, 0.0075550079345703125, 0.00844573974609375, 0.009336471557617188, 0.010227203369140625, 0.011117935180664062, 0.0120086669921875, 0.012899398803710938, 0.013790130615234375, 0.014680862426757812, 0.01557159423828125, 0.016462326049804688, 0.017353057861328125, 0.018243789672851562, 0.019134521484375, 0.020025253295898438, 0.020915985107421875, 0.021806716918945312, 0.02269744873046875, 0.023588180541992188, 0.024478912353515625, 0.025369644165039062, 0.0262603759765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 6.0, 9.0, 10.0, 8.0, 22.0, 24.0, 29.0, 32.0, 43.0, 40.0, 78.0, 111.0, 145.0, 240.0, 431.0, 967.0, 2391.0, 8933.0, 45758.0, 337251.0, 554086.0, 77953.0, 14026.0, 3454.0, 1143.0, 515.0, 274.0, 163.0, 99.0, 80.0, 51.0, 42.0, 32.0, 28.0, 16.0, 13.0, 11.0, 4.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.056640625, -0.05498170852661133, -0.053322792053222656, -0.051663875579833984, -0.05000495910644531, -0.04834604263305664, -0.04668712615966797, -0.0450282096862793, -0.043369293212890625, -0.04171037673950195, -0.04005146026611328, -0.03839254379272461, -0.03673362731933594, -0.035074710845947266, -0.033415794372558594, -0.03175687789916992, -0.03009796142578125, -0.028439044952392578, -0.026780128479003906, -0.025121212005615234, -0.023462295532226562, -0.02180337905883789, -0.02014446258544922, -0.018485546112060547, -0.016826629638671875, -0.015167713165283203, -0.013508796691894531, -0.01184988021850586, -0.010190963745117188, -0.008532047271728516, -0.006873130798339844, -0.005214214324951172, -0.0035552978515625, -0.0018963813781738281, -0.00023746490478515625, 0.0014214515686035156, 0.0030803680419921875, 0.004739284515380859, 0.006398200988769531, 0.008057117462158203, 0.009716033935546875, 0.011374950408935547, 0.013033866882324219, 0.01469278335571289, 0.016351699829101562, 0.018010616302490234, 0.019669532775878906, 0.021328449249267578, 0.02298736572265625, 0.024646282196044922, 0.026305198669433594, 0.027964115142822266, 0.029623031616210938, 0.03128194808959961, 0.03294086456298828, 0.03459978103637695, 0.036258697509765625, 0.0379176139831543, 0.03957653045654297, 0.04123544692993164, 0.04289436340332031, 0.044553279876708984, 0.046212196350097656, 0.04787111282348633, 0.049530029296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 5.0, 10.0, 13.0, 15.0, 19.0, 26.0, 20.0, 25.0, 33.0, 27.0, 30.0, 49.0, 36.0, 40.0, 51.0, 42.0, 47.0, 51.0, 51.0, 55.0, 43.0, 26.0, 38.0, 32.0, 33.0, 28.0, 25.0, 20.0, 16.0, 15.0, 14.0, 15.0, 11.0, 7.0, 7.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.079345703125, -0.07697677612304688, -0.07460784912109375, -0.07223892211914062, -0.0698699951171875, -0.06750106811523438, -0.06513214111328125, -0.06276321411132812, -0.060394287109375, -0.058025360107421875, -0.05565643310546875, -0.053287506103515625, -0.0509185791015625, -0.048549652099609375, -0.04618072509765625, -0.043811798095703125, -0.04144287109375, -0.039073944091796875, -0.03670501708984375, -0.034336090087890625, -0.0319671630859375, -0.029598236083984375, -0.02722930908203125, -0.024860382080078125, -0.022491455078125, -0.020122528076171875, -0.01775360107421875, -0.015384674072265625, -0.0130157470703125, -0.010646820068359375, -0.00827789306640625, -0.005908966064453125, -0.0035400390625, -0.001171112060546875, 0.00119781494140625, 0.003566741943359375, 0.0059356689453125, 0.008304595947265625, 0.01067352294921875, 0.013042449951171875, 0.015411376953125, 0.017780303955078125, 0.02014923095703125, 0.022518157958984375, 0.0248870849609375, 0.027256011962890625, 0.02962493896484375, 0.031993865966796875, 0.03436279296875, 0.036731719970703125, 0.03910064697265625, 0.041469573974609375, 0.0438385009765625, 0.046207427978515625, 0.04857635498046875, 0.050945281982421875, 0.053314208984375, 0.055683135986328125, 0.05805206298828125, 0.060420989990234375, 0.0627899169921875, 0.06515884399414062, 0.06752777099609375, 0.06989669799804688, 0.072265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 8.0, 12.0, 14.0, 24.0, 47.0, 65.0, 114.0, 200.0, 328.0, 670.0, 1436.0, 3426.0, 9268.0, 30875.0, 125275.0, 528779.0, 266424.0, 55977.0, 15988.0, 5405.0, 2127.0, 975.0, 432.0, 269.0, 153.0, 92.0, 65.0, 28.0, 28.0, 14.0, 13.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01142120361328125, -0.0110093355178833, -0.010597467422485352, -0.010185599327087402, -0.009773731231689453, -0.009361863136291504, -0.008949995040893555, -0.008538126945495605, -0.008126258850097656, -0.007714390754699707, -0.007302522659301758, -0.006890654563903809, -0.006478786468505859, -0.00606691837310791, -0.005655050277709961, -0.005243182182312012, -0.0048313140869140625, -0.004419445991516113, -0.004007577896118164, -0.003595709800720215, -0.0031838417053222656, -0.0027719736099243164, -0.002360105514526367, -0.001948237419128418, -0.0015363693237304688, -0.0011245012283325195, -0.0007126331329345703, -0.0003007650375366211, 0.00011110305786132812, 0.0005229711532592773, 0.0009348392486572266, 0.0013467073440551758, 0.001758575439453125, 0.0021704435348510742, 0.0025823116302490234, 0.0029941797256469727, 0.003406047821044922, 0.003817915916442871, 0.00422978401184082, 0.0046416521072387695, 0.005053520202636719, 0.005465388298034668, 0.005877256393432617, 0.006289124488830566, 0.006700992584228516, 0.007112860679626465, 0.007524728775024414, 0.007936596870422363, 0.008348464965820312, 0.008760333061218262, 0.009172201156616211, 0.00958406925201416, 0.00999593734741211, 0.010407805442810059, 0.010819673538208008, 0.011231541633605957, 0.011643409729003906, 0.012055277824401855, 0.012467145919799805, 0.012879014015197754, 0.013290882110595703, 0.013702750205993652, 0.014114618301391602, 0.01452648639678955, 0.0149383544921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 9.0, 9.0, 15.0, 21.0, 16.0, 25.0, 26.0, 18.0, 42.0, 53.0, 42.0, 44.0, 73.0, 49.0, 75.0, 71.0, 44.0, 66.0, 50.0, 29.0, 55.0, 34.0, 21.0, 22.0, 27.0, 18.0, 14.0, 7.0, 4.0, 8.0, 4.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.112720489501953e-06, -3.953464329242706e-06, -3.7942081689834595e-06, -3.6349520087242126e-06, -3.475695848464966e-06, -3.316439688205719e-06, -3.157183527946472e-06, -2.9979273676872253e-06, -2.8386712074279785e-06, -2.6794150471687317e-06, -2.520158886909485e-06, -2.360902726650238e-06, -2.201646566390991e-06, -2.0423904061317444e-06, -1.8831342458724976e-06, -1.7238780856132507e-06, -1.564621925354004e-06, -1.405365765094757e-06, -1.2461096048355103e-06, -1.0868534445762634e-06, -9.275972843170166e-07, -7.683411240577698e-07, -6.09084963798523e-07, -4.498288035392761e-07, -2.905726432800293e-07, -1.3131648302078247e-07, 2.7939677238464355e-08, 1.8719583749771118e-07, 3.46451997756958e-07, 5.057081580162048e-07, 6.649643182754517e-07, 8.242204785346985e-07, 9.834766387939453e-07, 1.1427327990531921e-06, 1.301988959312439e-06, 1.4612451195716858e-06, 1.6205012798309326e-06, 1.7797574400901794e-06, 1.9390136003494263e-06, 2.098269760608673e-06, 2.25752592086792e-06, 2.4167820811271667e-06, 2.5760382413864136e-06, 2.7352944016456604e-06, 2.8945505619049072e-06, 3.053806722164154e-06, 3.213062882423401e-06, 3.3723190426826477e-06, 3.5315752029418945e-06, 3.6908313632011414e-06, 3.850087523460388e-06, 4.009343683719635e-06, 4.168599843978882e-06, 4.327856004238129e-06, 4.4871121644973755e-06, 4.646368324756622e-06, 4.805624485015869e-06, 4.964880645275116e-06, 5.124136805534363e-06, 5.28339296579361e-06, 5.4426491260528564e-06, 5.601905286312103e-06, 5.76116144657135e-06, 5.920417606830597e-06, 6.079673767089844e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 11.0, 14.0, 19.0, 25.0, 47.0, 59.0, 136.0, 249.0, 472.0, 1090.0, 2739.0, 7644.0, 25661.0, 105608.0, 442949.0, 351995.0, 79339.0, 20119.0, 6226.0, 2264.0, 953.0, 415.0, 236.0, 98.0, 60.0, 24.0, 19.0, 19.0, 16.0, 11.0, 3.0, 7.0, 5.0, 6.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.015899658203125, -0.015468835830688477, -0.015038013458251953, -0.01460719108581543, -0.014176368713378906, -0.013745546340942383, -0.01331472396850586, -0.012883901596069336, -0.012453079223632812, -0.012022256851196289, -0.011591434478759766, -0.011160612106323242, -0.010729789733886719, -0.010298967361450195, -0.009868144989013672, -0.009437322616577148, -0.009006500244140625, -0.008575677871704102, -0.008144855499267578, -0.007714033126831055, -0.007283210754394531, -0.006852388381958008, -0.006421566009521484, -0.005990743637084961, -0.0055599212646484375, -0.005129098892211914, -0.004698276519775391, -0.004267454147338867, -0.0038366317749023438, -0.0034058094024658203, -0.002974987030029297, -0.0025441646575927734, -0.00211334228515625, -0.0016825199127197266, -0.0012516975402832031, -0.0008208751678466797, -0.00039005279541015625, 4.076957702636719e-05, 0.0004715919494628906, 0.0009024143218994141, 0.0013332366943359375, 0.001764059066772461, 0.0021948814392089844, 0.002625703811645508, 0.0030565261840820312, 0.0034873485565185547, 0.003918170928955078, 0.0043489933013916016, 0.004779815673828125, 0.0052106380462646484, 0.005641460418701172, 0.006072282791137695, 0.006503105163574219, 0.006933927536010742, 0.007364749908447266, 0.007795572280883789, 0.008226394653320312, 0.008657217025756836, 0.00908803939819336, 0.009518861770629883, 0.009949684143066406, 0.01038050651550293, 0.010811328887939453, 0.011242151260375977, 0.0116729736328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 7.0, 11.0, 16.0, 18.0, 22.0, 29.0, 37.0, 57.0, 58.0, 57.0, 69.0, 65.0, 86.0, 78.0, 62.0, 57.0, 52.0, 37.0, 41.0, 26.0, 25.0, 19.0, 16.0, 8.0, 3.0, 5.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0156402587890625, -0.01517331600189209, -0.01470637321472168, -0.01423943042755127, -0.01377248764038086, -0.01330554485321045, -0.012838602066040039, -0.012371659278869629, -0.011904716491699219, -0.011437773704528809, -0.010970830917358398, -0.010503888130187988, -0.010036945343017578, -0.009570002555847168, -0.009103059768676758, -0.008636116981506348, -0.008169174194335938, -0.007702231407165527, -0.007235288619995117, -0.006768345832824707, -0.006301403045654297, -0.005834460258483887, -0.0053675174713134766, -0.004900574684143066, -0.004433631896972656, -0.003966689109802246, -0.003499746322631836, -0.0030328035354614258, -0.0025658607482910156, -0.0020989179611206055, -0.0016319751739501953, -0.0011650323867797852, -0.000698089599609375, -0.00023114681243896484, 0.0002357959747314453, 0.0007027387619018555, 0.0011696815490722656, 0.0016366243362426758, 0.002103567123413086, 0.002570509910583496, 0.0030374526977539062, 0.0035043954849243164, 0.0039713382720947266, 0.004438281059265137, 0.004905223846435547, 0.005372166633605957, 0.005839109420776367, 0.006306052207946777, 0.0067729949951171875, 0.007239937782287598, 0.007706880569458008, 0.008173823356628418, 0.008640766143798828, 0.009107708930969238, 0.009574651718139648, 0.010041594505310059, 0.010508537292480469, 0.010975480079650879, 0.011442422866821289, 0.0119093656539917, 0.01237630844116211, 0.01284325122833252, 0.01331019401550293, 0.01377713680267334, 0.01424407958984375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 19.0, 46.0, 130.0, 301.0, 305.0, 131.0, 44.0, 22.0, 6.0, 2.0, 0.0, 2.0], "bins": [-1.3754898309707642, -1.3509693145751953, -1.326448917388916, -1.3019284009933472, -1.2774080038070679, -1.252887487411499, -1.2283670902252197, -1.2038465738296509, -1.1793261766433716, -1.1548056602478027, -1.1302852630615234, -1.1057647466659546, -1.0812443494796753, -1.0567238330841064, -1.0322034358978271, -1.0076829195022583, -0.983162522315979, -0.9586420655250549, -0.9341216087341309, -0.9096011519432068, -0.8850806951522827, -0.8605602383613586, -0.8360397815704346, -0.8115193247795105, -0.7869988083839417, -0.7624783515930176, -0.7379578948020935, -0.7134374380111694, -0.6889169812202454, -0.6643965244293213, -0.6398760676383972, -0.6153556108474731, -0.5908351540565491, -0.566314697265625, -0.5417942404747009, -0.5172737836837769, -0.4927533268928528, -0.4682328701019287, -0.44371241331100464, -0.41919195652008057, -0.3946714699268341, -0.37015101313591003, -0.34563055634498596, -0.3211100995540619, -0.2965896427631378, -0.27206918597221375, -0.24754871428012848, -0.2230282574892044, -0.19850780069828033, -0.17398734390735626, -0.1494668871164322, -0.12494642287492752, -0.10042596608400345, -0.07590550929307938, -0.05138504505157471, -0.026864588260650635, -0.0023441314697265625, 0.02217632718384266, 0.04669678583741188, 0.07121724635362625, 0.09573770314455032, 0.1202581599354744, 0.14477862417697906, 0.16929908096790314, 0.1938195377588272]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 1.0, 6.0, 7.0, 6.0, 9.0, 16.0, 9.0, 19.0, 14.0, 22.0, 17.0, 29.0, 27.0, 23.0, 20.0, 29.0, 42.0, 34.0, 39.0, 55.0, 47.0, 43.0, 48.0, 43.0, 35.0, 37.0, 35.0, 40.0, 36.0, 14.0, 21.0, 25.0, 22.0, 23.0, 9.0, 16.0, 16.0, 15.0, 17.0, 9.0, 5.0, 5.0, 3.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31455808877944946, -0.30430909991264343, -0.2940601110458374, -0.283811092376709, -0.27356210350990295, -0.2633131146430969, -0.2530641257762909, -0.24281513690948486, -0.23256613314151764, -0.2223171442747116, -0.21206814050674438, -0.20181915163993835, -0.19157016277313232, -0.1813211590051651, -0.17107217013835907, -0.16082316637039185, -0.15057417750358582, -0.14032518863677979, -0.13007618486881256, -0.11982719600200653, -0.1095781996846199, -0.09932920336723328, -0.08908021450042725, -0.07883121818304062, -0.06858222186565399, -0.058333225548267365, -0.048084232956171036, -0.03783524036407471, -0.02758624404668808, -0.017337247729301453, -0.007088255137205124, 0.003160737454891205, 0.013409733772277832, 0.02365872822701931, 0.03390772268176079, 0.04415671527385712, 0.054405711591243744, 0.06465470790863037, 0.0749036967754364, 0.08515269309282303, 0.09540168941020966, 0.10565068572759628, 0.11589968204498291, 0.12614867091178894, 0.13639765977859497, 0.1466466635465622, 0.15689565241336823, 0.16714465618133545, 0.17739364504814148, 0.1876426339149475, 0.19789163768291473, 0.20814062654972076, 0.218389630317688, 0.22863861918449402, 0.23888760805130005, 0.24913659691810608, 0.2593855857849121, 0.26963457465171814, 0.27988356351852417, 0.2901325821876526, 0.3003815710544586, 0.31063055992126465, 0.3208795487880707, 0.3311285376548767, 0.3413775563240051]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 15.0, 23.0, 26.0, 28.0, 62.0, 69.0, 109.0, 147.0, 225.0, 382.0, 639.0, 1173.0, 2410.0, 7451.0, 57127.0, 4076616.0, 36770.0, 6031.0, 2210.0, 1094.0, 622.0, 366.0, 237.0, 123.0, 110.0, 61.0, 39.0, 30.0, 20.0, 15.0, 11.0, 12.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043914794921875, -0.04251718521118164, -0.04111957550048828, -0.03972196578979492, -0.03832435607910156, -0.0369267463684082, -0.035529136657714844, -0.034131526947021484, -0.032733917236328125, -0.031336307525634766, -0.029938697814941406, -0.028541088104248047, -0.027143478393554688, -0.025745868682861328, -0.02434825897216797, -0.02295064926147461, -0.02155303955078125, -0.02015542984008789, -0.01875782012939453, -0.017360210418701172, -0.015962600708007812, -0.014564990997314453, -0.013167381286621094, -0.011769771575927734, -0.010372161865234375, -0.008974552154541016, -0.007576942443847656, -0.006179332733154297, -0.0047817230224609375, -0.003384113311767578, -0.0019865036010742188, -0.0005888938903808594, 0.0008087158203125, 0.0022063255310058594, 0.0036039352416992188, 0.005001544952392578, 0.0063991546630859375, 0.007796764373779297, 0.009194374084472656, 0.010591983795166016, 0.011989593505859375, 0.013387203216552734, 0.014784812927246094, 0.016182422637939453, 0.017580032348632812, 0.018977642059326172, 0.02037525177001953, 0.02177286148071289, 0.02317047119140625, 0.02456808090209961, 0.02596569061279297, 0.027363300323486328, 0.028760910034179688, 0.030158519744873047, 0.031556129455566406, 0.032953739166259766, 0.034351348876953125, 0.035748958587646484, 0.037146568298339844, 0.0385441780090332, 0.03994178771972656, 0.04133939743041992, 0.04273700714111328, 0.04413461685180664, 0.0455322265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 8.0, 11.0, 22.0, 23.0, 26.0, 30.0, 35.0, 33.0, 50.0, 56.0, 60.0, 65.0, 72.0, 64.0, 56.0, 57.0, 50.0, 60.0, 43.0, 42.0, 27.0, 23.0, 20.0, 16.0, 8.0, 11.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.031341552734375, -0.0304412841796875, -0.029541015625, -0.0286407470703125, -0.027740478515625, -0.0268402099609375, -0.02593994140625, -0.0250396728515625, -0.024139404296875, -0.0232391357421875, -0.0223388671875, -0.0214385986328125, -0.020538330078125, -0.0196380615234375, -0.01873779296875, -0.0178375244140625, -0.016937255859375, -0.0160369873046875, -0.01513671875, -0.0142364501953125, -0.013336181640625, -0.0124359130859375, -0.01153564453125, -0.0106353759765625, -0.009735107421875, -0.0088348388671875, -0.0079345703125, -0.0070343017578125, -0.006134033203125, -0.0052337646484375, -0.00433349609375, -0.0034332275390625, -0.002532958984375, -0.0016326904296875, -0.000732421875, 0.0001678466796875, 0.001068115234375, 0.0019683837890625, 0.00286865234375, 0.0037689208984375, 0.004669189453125, 0.0055694580078125, 0.0064697265625, 0.0073699951171875, 0.008270263671875, 0.0091705322265625, 0.01007080078125, 0.0109710693359375, 0.011871337890625, 0.0127716064453125, 0.013671875, 0.0145721435546875, 0.015472412109375, 0.0163726806640625, 0.01727294921875, 0.0181732177734375, 0.019073486328125, 0.0199737548828125, 0.0208740234375, 0.0217742919921875, 0.022674560546875, 0.0235748291015625, 0.02447509765625, 0.0253753662109375, 0.026275634765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 14.0, 16.0, 17.0, 32.0, 65.0, 76.0, 105.0, 133.0, 213.0, 310.0, 497.0, 733.0, 1030.0, 1745.0, 2841.0, 5529.0, 12985.0, 47811.0, 3806906.0, 261896.0, 30201.0, 9799.0, 4506.0, 2405.0, 1493.0, 952.0, 633.0, 442.0, 282.0, 188.0, 133.0, 83.0, 64.0, 36.0, 31.0, 25.0, 15.0, 8.0, 7.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0225067138671875, -0.021726608276367188, -0.020946502685546875, -0.020166397094726562, -0.01938629150390625, -0.018606185913085938, -0.017826080322265625, -0.017045974731445312, -0.016265869140625, -0.015485763549804688, -0.014705657958984375, -0.013925552368164062, -0.01314544677734375, -0.012365341186523438, -0.011585235595703125, -0.010805130004882812, -0.0100250244140625, -0.009244918823242188, -0.008464813232421875, -0.0076847076416015625, -0.00690460205078125, -0.0061244964599609375, -0.005344390869140625, -0.0045642852783203125, -0.0037841796875, -0.0030040740966796875, -0.002223968505859375, -0.0014438629150390625, -0.00066375732421875, 0.0001163482666015625, 0.000896453857421875, 0.0016765594482421875, 0.0024566650390625, 0.0032367706298828125, 0.004016876220703125, 0.0047969818115234375, 0.00557708740234375, 0.0063571929931640625, 0.007137298583984375, 0.007917404174804688, 0.008697509765625, 0.009477615356445312, 0.010257720947265625, 0.011037826538085938, 0.01181793212890625, 0.012598037719726562, 0.013378143310546875, 0.014158248901367188, 0.0149383544921875, 0.015718460083007812, 0.016498565673828125, 0.017278671264648438, 0.01805877685546875, 0.018838882446289062, 0.019618988037109375, 0.020399093627929688, 0.02117919921875, 0.021959304809570312, 0.022739410400390625, 0.023519515991210938, 0.02429962158203125, 0.025079727172851562, 0.025859832763671875, 0.026639938354492188, 0.0274200439453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 12.0, 8.0, 6.0, 21.0, 25.0, 50.0, 104.0, 336.0, 3248.0, 121.0, 43.0, 33.0, 16.0, 13.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00786590576171875, -0.007635653018951416, -0.007405400276184082, -0.007175147533416748, -0.006944894790649414, -0.00671464204788208, -0.006484389305114746, -0.006254136562347412, -0.006023883819580078, -0.005793631076812744, -0.00556337833404541, -0.005333125591278076, -0.005102872848510742, -0.004872620105743408, -0.004642367362976074, -0.00441211462020874, -0.004181861877441406, -0.003951609134674072, -0.0037213563919067383, -0.0034911036491394043, -0.0032608509063720703, -0.0030305981636047363, -0.0028003454208374023, -0.0025700926780700684, -0.0023398399353027344, -0.0021095871925354004, -0.0018793344497680664, -0.0016490817070007324, -0.0014188289642333984, -0.0011885762214660645, -0.0009583234786987305, -0.0007280707359313965, -0.0004978179931640625, -0.0002675652503967285, -3.731250762939453e-05, 0.00019294023513793945, 0.00042319297790527344, 0.0006534457206726074, 0.0008836984634399414, 0.0011139512062072754, 0.0013442039489746094, 0.0015744566917419434, 0.0018047094345092773, 0.0020349621772766113, 0.0022652149200439453, 0.0024954676628112793, 0.0027257204055786133, 0.0029559731483459473, 0.0031862258911132812, 0.0034164786338806152, 0.0036467313766479492, 0.003876984119415283, 0.004107236862182617, 0.004337489604949951, 0.004567742347717285, 0.004797995090484619, 0.005028247833251953, 0.005258500576019287, 0.005488753318786621, 0.005719006061553955, 0.005949258804321289, 0.006179511547088623, 0.006409764289855957, 0.006640017032623291, 0.006870269775390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 31.0, 31.0, 60.0, 117.0, 155.0, 185.0, 142.0, 115.0, 68.0, 44.0, 21.0, 13.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02102694846689701, -0.01969367079436779, -0.01836039498448372, -0.0170271173119545, -0.015693841502070427, -0.014360563829541206, -0.01302728708833456, -0.011694010347127914, -0.010360733605921268, -0.009027456864714622, -0.0076941801235079765, -0.006360902916640043, -0.005027626175433397, -0.0036943494342267513, -0.002361072227358818, -0.001027795486152172, 0.0003054812550544739, 0.0016387581126764417, 0.0029720349702984095, 0.004305311944335699, 0.005638588685542345, 0.006971865426748991, 0.008305142633616924, 0.00963841937482357, 0.010971696116030216, 0.012304972857236862, 0.013638249598443508, 0.014971526339650154, 0.016304804012179375, 0.017638079822063446, 0.018971357494592667, 0.020304635167121887, 0.021637912839651108, 0.02297119051218033, 0.0243044663220644, 0.02563774399459362, 0.02697101980447769, 0.028304297477006912, 0.029637575149536133, 0.030970850959420204, 0.032304126769304276, 0.033637404441833496, 0.03497068211436272, 0.03630395606160164, 0.03763723373413086, 0.03897051140666008, 0.0403037890791893, 0.04163706302642822, 0.04297034442424774, 0.04430362209677696, 0.04563689976930618, 0.046970173716545105, 0.048303451389074326, 0.049636729061603546, 0.05097000673413277, 0.05230328440666199, 0.05363655835390091, 0.05496983602643013, 0.05630311369895935, 0.05763638764619827, 0.05896966531872749, 0.060302942991256714, 0.061636220663785934, 0.06296949833631516, 0.06430277228355408]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 2.0, 11.0, 12.0, 5.0, 18.0, 21.0, 24.0, 24.0, 20.0, 23.0, 27.0, 27.0, 31.0, 36.0, 34.0, 27.0, 42.0, 47.0, 29.0, 31.0, 40.0, 33.0, 35.0, 40.0, 35.0, 36.0, 31.0, 27.0, 30.0, 18.0, 19.0, 26.0, 18.0, 18.0, 20.0, 15.0, 11.0, 11.0, 10.0, 4.0, 8.0, 3.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.011730551719665527, -0.011368915438652039, -0.01100727915763855, -0.010645642876625061, -0.010284006595611572, -0.009922370314598083, -0.009560734033584595, -0.009199097752571106, -0.008837461471557617, -0.008475825190544128, -0.00811418890953064, -0.007752552628517151, -0.007390916347503662, -0.007029280066490173, -0.006667643785476685, -0.006306007504463196, -0.005944371223449707, -0.005582734942436218, -0.0052210986614227295, -0.004859462380409241, -0.004497826099395752, -0.004136189818382263, -0.0037745535373687744, -0.0034129172563552856, -0.003051280975341797, -0.002689644694328308, -0.0023280084133148193, -0.0019663721323013306, -0.0016047358512878418, -0.001243099570274353, -0.0008814632892608643, -0.0005198270082473755, -0.00015819072723388672, 0.00020344555377960205, 0.0005650818347930908, 0.0009267181158065796, 0.0012883543968200684, 0.0016499906778335571, 0.002011626958847046, 0.0023732632398605347, 0.0027348995208740234, 0.003096535801887512, 0.003458172082901001, 0.0038198083639144897, 0.0041814446449279785, 0.004543080925941467, 0.004904717206954956, 0.005266353487968445, 0.005627989768981934, 0.005989626049995422, 0.006351262331008911, 0.0067128986120224, 0.007074534893035889, 0.0074361711740493774, 0.007797807455062866, 0.008159443736076355, 0.008521080017089844, 0.008882716298103333, 0.009244352579116821, 0.00960598886013031, 0.009967625141143799, 0.010329261422157288, 0.010690897703170776, 0.011052533984184265, 0.011414170265197754]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 10.0, 16.0, 16.0, 32.0, 53.0, 59.0, 81.0, 144.0, 235.0, 338.0, 615.0, 1060.0, 2020.0, 4272.0, 10123.0, 27709.0, 89260.0, 318730.0, 406941.0, 125483.0, 37443.0, 12990.0, 5324.0, 2509.0, 1227.0, 719.0, 420.0, 239.0, 161.0, 90.0, 61.0, 54.0, 34.0, 21.0, 12.0, 13.0, 7.0, 4.0, 6.0, 4.0, 1.0, 3.0, 4.0, 3.0], "bins": [-0.048187255859375, -0.04692363739013672, -0.04566001892089844, -0.044396400451660156, -0.043132781982421875, -0.041869163513183594, -0.04060554504394531, -0.03934192657470703, -0.03807830810546875, -0.03681468963623047, -0.03555107116699219, -0.034287452697753906, -0.033023834228515625, -0.031760215759277344, -0.030496597290039062, -0.02923297882080078, -0.0279693603515625, -0.02670574188232422, -0.025442123413085938, -0.024178504943847656, -0.022914886474609375, -0.021651268005371094, -0.020387649536132812, -0.01912403106689453, -0.01786041259765625, -0.01659679412841797, -0.015333175659179688, -0.014069557189941406, -0.012805938720703125, -0.011542320251464844, -0.010278701782226562, -0.009015083312988281, -0.00775146484375, -0.006487846374511719, -0.0052242279052734375, -0.003960609436035156, -0.002696990966796875, -0.0014333724975585938, -0.0001697540283203125, 0.0010938644409179688, 0.00235748291015625, 0.0036211013793945312, 0.0048847198486328125, 0.006148338317871094, 0.007411956787109375, 0.008675575256347656, 0.009939193725585938, 0.011202812194824219, 0.0124664306640625, 0.013730049133300781, 0.014993667602539062, 0.016257286071777344, 0.017520904541015625, 0.018784523010253906, 0.020048141479492188, 0.02131175994873047, 0.02257537841796875, 0.02383899688720703, 0.025102615356445312, 0.026366233825683594, 0.027629852294921875, 0.028893470764160156, 0.030157089233398438, 0.03142070770263672, 0.032684326171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 5.0, 14.0, 18.0, 18.0, 29.0, 25.0, 28.0, 32.0, 45.0, 49.0, 52.0, 56.0, 70.0, 63.0, 58.0, 61.0, 62.0, 58.0, 52.0, 40.0, 34.0, 32.0, 19.0, 23.0, 12.0, 13.0, 9.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0310211181640625, -0.030125141143798828, -0.029229164123535156, -0.028333187103271484, -0.027437210083007812, -0.02654123306274414, -0.02564525604248047, -0.024749279022216797, -0.023853302001953125, -0.022957324981689453, -0.02206134796142578, -0.02116537094116211, -0.020269393920898438, -0.019373416900634766, -0.018477439880371094, -0.017581462860107422, -0.01668548583984375, -0.015789508819580078, -0.014893531799316406, -0.013997554779052734, -0.013101577758789062, -0.01220560073852539, -0.011309623718261719, -0.010413646697998047, -0.009517669677734375, -0.008621692657470703, -0.007725715637207031, -0.006829738616943359, -0.0059337615966796875, -0.005037784576416016, -0.004141807556152344, -0.003245830535888672, -0.002349853515625, -0.0014538764953613281, -0.0005578994750976562, 0.0003380775451660156, 0.0012340545654296875, 0.0021300315856933594, 0.0030260086059570312, 0.003921985626220703, 0.004817962646484375, 0.005713939666748047, 0.006609916687011719, 0.007505893707275391, 0.008401870727539062, 0.009297847747802734, 0.010193824768066406, 0.011089801788330078, 0.01198577880859375, 0.012881755828857422, 0.013777732849121094, 0.014673709869384766, 0.015569686889648438, 0.01646566390991211, 0.01736164093017578, 0.018257617950439453, 0.019153594970703125, 0.020049571990966797, 0.02094554901123047, 0.02184152603149414, 0.022737503051757812, 0.023633480072021484, 0.024529457092285156, 0.025425434112548828, 0.0263214111328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 9.0, 11.0, 7.0, 18.0, 18.0, 22.0, 35.0, 40.0, 32.0, 57.0, 86.0, 88.0, 166.0, 265.0, 500.0, 981.0, 2528.0, 8422.0, 37315.0, 294462.0, 604372.0, 77646.0, 14269.0, 4018.0, 1537.0, 646.0, 350.0, 181.0, 124.0, 85.0, 50.0, 47.0, 33.0, 17.0, 13.0, 28.0, 17.0, 10.0, 6.0, 6.0, 6.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.050323486328125, -0.04871034622192383, -0.047097206115722656, -0.045484066009521484, -0.04387092590332031, -0.04225778579711914, -0.04064464569091797, -0.0390315055847168, -0.037418365478515625, -0.03580522537231445, -0.03419208526611328, -0.03257894515991211, -0.030965805053710938, -0.029352664947509766, -0.027739524841308594, -0.026126384735107422, -0.02451324462890625, -0.022900104522705078, -0.021286964416503906, -0.019673824310302734, -0.018060684204101562, -0.01644754409790039, -0.014834403991699219, -0.013221263885498047, -0.011608123779296875, -0.009994983673095703, -0.008381843566894531, -0.006768703460693359, -0.0051555633544921875, -0.0035424232482910156, -0.0019292831420898438, -0.0003161430358886719, 0.0012969970703125, 0.002910137176513672, 0.004523277282714844, 0.006136417388916016, 0.0077495574951171875, 0.00936269760131836, 0.010975837707519531, 0.012588977813720703, 0.014202117919921875, 0.015815258026123047, 0.01742839813232422, 0.01904153823852539, 0.020654678344726562, 0.022267818450927734, 0.023880958557128906, 0.025494098663330078, 0.02710723876953125, 0.028720378875732422, 0.030333518981933594, 0.031946659088134766, 0.03355979919433594, 0.03517293930053711, 0.03678607940673828, 0.03839921951293945, 0.040012359619140625, 0.0416254997253418, 0.04323863983154297, 0.04485177993774414, 0.04646492004394531, 0.048078060150146484, 0.049691200256347656, 0.05130434036254883, 0.05291748046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 8.0, 6.0, 3.0, 6.0, 14.0, 19.0, 12.0, 10.0, 14.0, 19.0, 21.0, 28.0, 36.0, 36.0, 34.0, 35.0, 42.0, 40.0, 37.0, 33.0, 53.0, 34.0, 45.0, 33.0, 46.0, 32.0, 38.0, 36.0, 27.0, 30.0, 24.0, 20.0, 21.0, 17.0, 16.0, 14.0, 12.0, 9.0, 3.0, 6.0, 5.0, 6.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0631103515625, -0.06099414825439453, -0.05887794494628906, -0.056761741638183594, -0.054645538330078125, -0.052529335021972656, -0.05041313171386719, -0.04829692840576172, -0.04618072509765625, -0.04406452178955078, -0.04194831848144531, -0.039832115173339844, -0.037715911865234375, -0.035599708557128906, -0.03348350524902344, -0.03136730194091797, -0.0292510986328125, -0.02713489532470703, -0.025018692016601562, -0.022902488708496094, -0.020786285400390625, -0.018670082092285156, -0.016553878784179688, -0.014437675476074219, -0.01232147216796875, -0.010205268859863281, -0.008089065551757812, -0.005972862243652344, -0.003856658935546875, -0.0017404556274414062, 0.0003757476806640625, 0.0024919509887695312, 0.004608154296875, 0.006724357604980469, 0.008840560913085938, 0.010956764221191406, 0.013072967529296875, 0.015189170837402344, 0.017305374145507812, 0.01942157745361328, 0.02153778076171875, 0.02365398406982422, 0.025770187377929688, 0.027886390686035156, 0.030002593994140625, 0.032118797302246094, 0.03423500061035156, 0.03635120391845703, 0.0384674072265625, 0.04058361053466797, 0.04269981384277344, 0.044816017150878906, 0.046932220458984375, 0.049048423767089844, 0.05116462707519531, 0.05328083038330078, 0.05539703369140625, 0.05751323699951172, 0.05962944030761719, 0.061745643615722656, 0.06386184692382812, 0.0659780502319336, 0.06809425354003906, 0.07021045684814453, 0.07232666015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 2.0, 7.0, 9.0, 6.0, 14.0, 15.0, 26.0, 33.0, 57.0, 72.0, 124.0, 194.0, 301.0, 603.0, 1224.0, 3045.0, 10320.0, 58582.0, 616208.0, 314831.0, 31727.0, 6791.0, 2192.0, 944.0, 471.0, 260.0, 135.0, 111.0, 66.0, 40.0, 33.0, 31.0, 16.0, 11.0, 10.0, 7.0, 10.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0172119140625, -0.016687870025634766, -0.01616382598876953, -0.015639781951904297, -0.015115737915039062, -0.014591693878173828, -0.014067649841308594, -0.01354360580444336, -0.013019561767578125, -0.01249551773071289, -0.011971473693847656, -0.011447429656982422, -0.010923385620117188, -0.010399341583251953, -0.009875297546386719, -0.009351253509521484, -0.00882720947265625, -0.008303165435791016, -0.007779121398925781, -0.007255077362060547, -0.0067310333251953125, -0.006206989288330078, -0.005682945251464844, -0.005158901214599609, -0.004634857177734375, -0.004110813140869141, -0.0035867691040039062, -0.003062725067138672, -0.0025386810302734375, -0.002014636993408203, -0.0014905929565429688, -0.0009665489196777344, -0.0004425048828125, 8.153915405273438e-05, 0.0006055831909179688, 0.0011296272277832031, 0.0016536712646484375, 0.002177715301513672, 0.0027017593383789062, 0.0032258033752441406, 0.003749847412109375, 0.004273891448974609, 0.004797935485839844, 0.005321979522705078, 0.0058460235595703125, 0.006370067596435547, 0.006894111633300781, 0.007418155670166016, 0.00794219970703125, 0.008466243743896484, 0.008990287780761719, 0.009514331817626953, 0.010038375854492188, 0.010562419891357422, 0.011086463928222656, 0.01161050796508789, 0.012134552001953125, 0.01265859603881836, 0.013182640075683594, 0.013706684112548828, 0.014230728149414062, 0.014754772186279297, 0.015278816223144531, 0.015802860260009766, 0.016326904296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 17.0, 13.0, 21.0, 29.0, 20.0, 17.0, 40.0, 58.0, 55.0, 74.0, 79.0, 66.0, 67.0, 75.0, 44.0, 54.0, 58.0, 41.0, 34.0, 29.0, 21.0, 12.0, 11.0, 10.0, 5.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.609355866909027e-06, -5.4370611906051636e-06, -5.2647665143013e-06, -5.0924718379974365e-06, -4.920177161693573e-06, -4.7478824853897095e-06, -4.575587809085846e-06, -4.403293132781982e-06, -4.230998456478119e-06, -4.058703780174255e-06, -3.886409103870392e-06, -3.7141144275665283e-06, -3.541819751262665e-06, -3.3695250749588013e-06, -3.1972303986549377e-06, -3.0249357223510742e-06, -2.8526410460472107e-06, -2.680346369743347e-06, -2.5080516934394836e-06, -2.33575701713562e-06, -2.1634623408317566e-06, -1.991167664527893e-06, -1.8188729882240295e-06, -1.646578311920166e-06, -1.4742836356163025e-06, -1.301988959312439e-06, -1.1296942830085754e-06, -9.57399606704712e-07, -7.851049304008484e-07, -6.128102540969849e-07, -4.4051557779312134e-07, -2.682209014892578e-07, -9.592622518539429e-08, 7.636845111846924e-08, 2.4866312742233276e-07, 4.209578037261963e-07, 5.932524800300598e-07, 7.655471563339233e-07, 9.378418326377869e-07, 1.1101365089416504e-06, 1.282431185245514e-06, 1.4547258615493774e-06, 1.627020537853241e-06, 1.7993152141571045e-06, 1.971609890460968e-06, 2.1439045667648315e-06, 2.316199243068695e-06, 2.4884939193725586e-06, 2.660788595676422e-06, 2.8330832719802856e-06, 3.005377948284149e-06, 3.1776726245880127e-06, 3.3499673008918762e-06, 3.5222619771957397e-06, 3.6945566534996033e-06, 3.866851329803467e-06, 4.03914600610733e-06, 4.211440682411194e-06, 4.383735358715057e-06, 4.556030035018921e-06, 4.7283247113227844e-06, 4.900619387626648e-06, 5.0729140639305115e-06, 5.245208740234375e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 21.0, 32.0, 52.0, 96.0, 243.0, 557.0, 1821.0, 10734.0, 341802.0, 672520.0, 17079.0, 2424.0, 673.0, 257.0, 119.0, 62.0, 27.0, 17.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0369873046875, -0.035962581634521484, -0.03493785858154297, -0.03391313552856445, -0.03288841247558594, -0.03186368942260742, -0.030838966369628906, -0.02981424331665039, -0.028789520263671875, -0.02776479721069336, -0.026740074157714844, -0.025715351104736328, -0.024690628051757812, -0.023665904998779297, -0.02264118194580078, -0.021616458892822266, -0.02059173583984375, -0.019567012786865234, -0.01854228973388672, -0.017517566680908203, -0.016492843627929688, -0.015468120574951172, -0.014443397521972656, -0.01341867446899414, -0.012393951416015625, -0.01136922836303711, -0.010344505310058594, -0.009319782257080078, -0.008295059204101562, -0.007270336151123047, -0.006245613098144531, -0.005220890045166016, -0.0041961669921875, -0.0031714439392089844, -0.0021467208862304688, -0.0011219978332519531, -9.72747802734375e-05, 0.0009274482727050781, 0.0019521713256835938, 0.0029768943786621094, 0.004001617431640625, 0.005026340484619141, 0.006051063537597656, 0.007075786590576172, 0.008100509643554688, 0.009125232696533203, 0.010149955749511719, 0.011174678802490234, 0.01219940185546875, 0.013224124908447266, 0.014248847961425781, 0.015273571014404297, 0.016298294067382812, 0.017323017120361328, 0.018347740173339844, 0.01937246322631836, 0.020397186279296875, 0.02142190933227539, 0.022446632385253906, 0.023471355438232422, 0.024496078491210938, 0.025520801544189453, 0.02654552459716797, 0.027570247650146484, 0.028594970703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 13.0, 6.0, 16.0, 26.0, 52.0, 68.0, 118.0, 142.0, 142.0, 120.0, 97.0, 71.0, 39.0, 27.0, 20.0, 10.0, 9.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265350341796875, -0.02574014663696289, -0.02494525909423828, -0.024150371551513672, -0.023355484008789062, -0.022560596466064453, -0.021765708923339844, -0.020970821380615234, -0.020175933837890625, -0.019381046295166016, -0.018586158752441406, -0.017791271209716797, -0.016996383666992188, -0.016201496124267578, -0.015406608581542969, -0.01461172103881836, -0.01381683349609375, -0.01302194595336914, -0.012227058410644531, -0.011432170867919922, -0.010637283325195312, -0.009842395782470703, -0.009047508239746094, -0.008252620697021484, -0.007457733154296875, -0.006662845611572266, -0.005867958068847656, -0.005073070526123047, -0.0042781829833984375, -0.003483295440673828, -0.0026884078979492188, -0.0018935203552246094, -0.0010986328125, -0.0003037452697753906, 0.0004911422729492188, 0.0012860298156738281, 0.0020809173583984375, 0.002875804901123047, 0.0036706924438476562, 0.004465579986572266, 0.005260467529296875, 0.006055355072021484, 0.006850242614746094, 0.007645130157470703, 0.008440017700195312, 0.009234905242919922, 0.010029792785644531, 0.01082468032836914, 0.01161956787109375, 0.01241445541381836, 0.013209342956542969, 0.014004230499267578, 0.014799118041992188, 0.015594005584716797, 0.016388893127441406, 0.017183780670166016, 0.017978668212890625, 0.018773555755615234, 0.019568443298339844, 0.020363330841064453, 0.021158218383789062, 0.021953105926513672, 0.02274799346923828, 0.02354288101196289, 0.0243377685546875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 36.0, 228.0, 593.0, 138.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0807645320892334, -2.033801555633545, -1.986838459968567, -1.9398753643035889, -1.8929122686386108, -1.8459492921829224, -1.7989861965179443, -1.7520232200622559, -1.7050601243972778, -1.6580970287322998, -1.6111340522766113, -1.5641709566116333, -1.5172078609466553, -1.4702448844909668, -1.4232817888259888, -1.3763186931610107, -1.3293557167053223, -1.2823926210403442, -1.2354296445846558, -1.1884665489196777, -1.1415034532546997, -1.0945404767990112, -1.0475773811340332, -1.0006144046783447, -0.9536511898040771, -0.9066881537437439, -0.8597250580787659, -0.8127620220184326, -0.7657989859580994, -0.7188359498977661, -0.6718728542327881, -0.6249098181724548, -0.5779467821121216, -0.5309837460517883, -0.4840206801891327, -0.43705761432647705, -0.3900945782661438, -0.34313151240348816, -0.2961684465408325, -0.24920541048049927, -0.20224234461784363, -0.15527929365634918, -0.10831623524427414, -0.0613531768321991, -0.014390125870704651, 0.032572925090789795, 0.07953599095344543, 0.1264990270137787, 0.17346209287643433, 0.22042514383792877, 0.2673881947994232, 0.31435126066207886, 0.3613142967224121, 0.40827736258506775, 0.4552404284477234, 0.5022034645080566, 0.5491665601730347, 0.5961295962333679, 0.643092691898346, 0.6900557279586792, 0.7370187640190125, 0.7839818000793457, 0.8309448957443237, 0.877907931804657, 0.9248709678649902]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 7.0, 7.0, 6.0, 6.0, 14.0, 25.0, 14.0, 32.0, 28.0, 23.0, 33.0, 41.0, 55.0, 50.0, 74.0, 56.0, 54.0, 57.0, 50.0, 54.0, 46.0, 31.0, 35.0, 36.0, 25.0, 29.0, 25.0, 16.0, 22.0, 10.0, 6.0, 3.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38024890422821045, -0.3677985966205597, -0.35534828901290894, -0.3428979814052582, -0.3304476737976074, -0.31799736618995667, -0.3055470585823059, -0.29309675097465515, -0.2806464433670044, -0.26819613575935364, -0.2557458281517029, -0.24329552054405212, -0.23084521293640137, -0.2183949053287506, -0.20594459772109985, -0.1934942901134491, -0.18104399740695953, -0.16859368979930878, -0.15614338219165802, -0.14369307458400726, -0.1312427669763565, -0.11879245936870575, -0.10634215921163559, -0.09389185160398483, -0.08144154399633408, -0.06899123638868332, -0.05654092878103256, -0.044090624898672104, -0.03164031729102135, -0.01919000968337059, -0.006739705801010132, 0.005710601806640625, 0.018160909414291382, 0.03061121702194214, 0.043061524629592896, 0.055511828511953354, 0.06796213984489441, 0.08041244745254517, 0.09286274760961533, 0.10531305521726608, 0.11776336282491684, 0.130213662981987, 0.14266397058963776, 0.1551142781972885, 0.16756458580493927, 0.18001489341259003, 0.19246520102024078, 0.20491550862789154, 0.2173658162355423, 0.22981612384319305, 0.2422664314508438, 0.2547167241573334, 0.26716703176498413, 0.2796173393726349, 0.29206764698028564, 0.3045179545879364, 0.31696826219558716, 0.3294185698032379, 0.34186887741088867, 0.35431918501853943, 0.3667694926261902, 0.37921980023384094, 0.3916701078414917, 0.40412041544914246, 0.4165707230567932]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 12.0, 15.0, 16.0, 16.0, 21.0, 32.0, 31.0, 37.0, 35.0, 61.0, 67.0, 168.0, 412.0, 2288.0, 4152579.0, 36645.0, 1077.0, 262.0, 123.0, 80.0, 51.0, 52.0, 41.0, 22.0, 22.0, 16.0, 18.0, 10.0, 15.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1412353515625, -0.1367969512939453, -0.13235855102539062, -0.12792015075683594, -0.12348175048828125, -0.11904335021972656, -0.11460494995117188, -0.11016654968261719, -0.1057281494140625, -0.10128974914550781, -0.09685134887695312, -0.09241294860839844, -0.08797454833984375, -0.08353614807128906, -0.07909774780273438, -0.07465934753417969, -0.070220947265625, -0.06578254699707031, -0.061344146728515625, -0.05690574645996094, -0.05246734619140625, -0.04802894592285156, -0.043590545654296875, -0.03915214538574219, -0.0347137451171875, -0.030275344848632812, -0.025836944580078125, -0.021398544311523438, -0.01696014404296875, -0.012521743774414062, -0.008083343505859375, -0.0036449432373046875, 0.00079345703125, 0.0052318572998046875, 0.009670257568359375, 0.014108657836914062, 0.01854705810546875, 0.022985458374023438, 0.027423858642578125, 0.03186225891113281, 0.0363006591796875, 0.04073905944824219, 0.045177459716796875, 0.04961585998535156, 0.05405426025390625, 0.05849266052246094, 0.06293106079101562, 0.06736946105957031, 0.071807861328125, 0.07624626159667969, 0.08068466186523438, 0.08512306213378906, 0.08956146240234375, 0.09399986267089844, 0.09843826293945312, 0.10287666320800781, 0.1073150634765625, 0.11175346374511719, 0.11619186401367188, 0.12063026428222656, 0.12506866455078125, 0.12950706481933594, 0.13394546508789062, 0.1383838653564453, 0.142822265625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 9.0, 4.0, 8.0, 6.0, 12.0, 13.0, 25.0, 30.0, 32.0, 21.0, 35.0, 43.0, 43.0, 45.0, 60.0, 59.0, 61.0, 74.0, 65.0, 64.0, 61.0, 44.0, 46.0, 28.0, 33.0, 24.0, 13.0, 17.0, 9.0, 6.0, 0.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0306396484375, -0.029749631881713867, -0.028859615325927734, -0.0279695987701416, -0.02707958221435547, -0.026189565658569336, -0.025299549102783203, -0.02440953254699707, -0.023519515991210938, -0.022629499435424805, -0.021739482879638672, -0.02084946632385254, -0.019959449768066406, -0.019069433212280273, -0.01817941665649414, -0.017289400100708008, -0.016399383544921875, -0.015509366989135742, -0.01461935043334961, -0.013729333877563477, -0.012839317321777344, -0.011949300765991211, -0.011059284210205078, -0.010169267654418945, -0.009279251098632812, -0.00838923454284668, -0.007499217987060547, -0.006609201431274414, -0.005719184875488281, -0.0048291683197021484, -0.003939151763916016, -0.003049135208129883, -0.00215911865234375, -0.0012691020965576172, -0.0003790855407714844, 0.0005109310150146484, 0.0014009475708007812, 0.002290964126586914, 0.003180980682373047, 0.00407099723815918, 0.0049610137939453125, 0.005851030349731445, 0.006741046905517578, 0.007631063461303711, 0.008521080017089844, 0.009411096572875977, 0.01030111312866211, 0.011191129684448242, 0.012081146240234375, 0.012971162796020508, 0.01386117935180664, 0.014751195907592773, 0.015641212463378906, 0.01653122901916504, 0.017421245574951172, 0.018311262130737305, 0.019201278686523438, 0.02009129524230957, 0.020981311798095703, 0.021871328353881836, 0.02276134490966797, 0.0236513614654541, 0.024541378021240234, 0.025431394577026367, 0.0263214111328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 8.0, 15.0, 12.0, 22.0, 28.0, 39.0, 52.0, 59.0, 81.0, 100.0, 161.0, 218.0, 323.0, 578.0, 990.0, 2017.0, 4652.0, 16195.0, 138938.0, 3987156.0, 29786.0, 6895.0, 2730.0, 1211.0, 721.0, 362.0, 284.0, 156.0, 134.0, 85.0, 67.0, 36.0, 33.0, 34.0, 16.0, 13.0, 20.0, 12.0, 8.0, 9.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.031646728515625, -0.030663490295410156, -0.029680252075195312, -0.02869701385498047, -0.027713775634765625, -0.02673053741455078, -0.025747299194335938, -0.024764060974121094, -0.02378082275390625, -0.022797584533691406, -0.021814346313476562, -0.02083110809326172, -0.019847869873046875, -0.01886463165283203, -0.017881393432617188, -0.016898155212402344, -0.0159149169921875, -0.014931678771972656, -0.013948440551757812, -0.012965202331542969, -0.011981964111328125, -0.010998725891113281, -0.010015487670898438, -0.009032249450683594, -0.00804901123046875, -0.007065773010253906, -0.0060825347900390625, -0.005099296569824219, -0.004116058349609375, -0.0031328201293945312, -0.0021495819091796875, -0.0011663436889648438, -0.00018310546875, 0.0008001327514648438, 0.0017833709716796875, 0.0027666091918945312, 0.003749847412109375, 0.004733085632324219, 0.0057163238525390625, 0.006699562072753906, 0.00768280029296875, 0.008666038513183594, 0.009649276733398438, 0.010632514953613281, 0.011615753173828125, 0.012598991394042969, 0.013582229614257812, 0.014565467834472656, 0.0155487060546875, 0.016531944274902344, 0.017515182495117188, 0.01849842071533203, 0.019481658935546875, 0.02046489715576172, 0.021448135375976562, 0.022431373596191406, 0.02341461181640625, 0.024397850036621094, 0.025381088256835938, 0.02636432647705078, 0.027347564697265625, 0.02833080291748047, 0.029314041137695312, 0.030297279357910156, 0.031280517578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 7.0, 13.0, 17.0, 51.0, 165.0, 3686.0, 76.0, 29.0, 14.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00817108154296875, -0.007787346839904785, -0.00740361213684082, -0.0070198774337768555, -0.006636142730712891, -0.006252408027648926, -0.005868673324584961, -0.005484938621520996, -0.005101203918457031, -0.004717469215393066, -0.0043337345123291016, -0.003949999809265137, -0.003566265106201172, -0.003182530403137207, -0.002798795700073242, -0.0024150609970092773, -0.0020313262939453125, -0.0016475915908813477, -0.0012638568878173828, -0.000880122184753418, -0.0004963874816894531, -0.00011265277862548828, 0.00027108192443847656, 0.0006548166275024414, 0.0010385513305664062, 0.001422286033630371, 0.001806020736694336, 0.0021897554397583008, 0.0025734901428222656, 0.0029572248458862305, 0.0033409595489501953, 0.00372469425201416, 0.004108428955078125, 0.00449216365814209, 0.004875898361206055, 0.0052596330642700195, 0.005643367767333984, 0.006027102470397949, 0.006410837173461914, 0.006794571876525879, 0.007178306579589844, 0.007562041282653809, 0.007945775985717773, 0.008329510688781738, 0.008713245391845703, 0.009096980094909668, 0.009480714797973633, 0.009864449501037598, 0.010248184204101562, 0.010631918907165527, 0.011015653610229492, 0.011399388313293457, 0.011783123016357422, 0.012166857719421387, 0.012550592422485352, 0.012934327125549316, 0.013318061828613281, 0.013701796531677246, 0.014085531234741211, 0.014469265937805176, 0.01485300064086914, 0.015236735343933105, 0.01562047004699707, 0.016004204750061035, 0.016387939453125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 7.0, 6.0, 28.0, 38.0, 97.0, 149.0, 230.0, 219.0, 139.0, 57.0, 21.0, 13.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01756390370428562, -0.01601211167871952, -0.014460320584475994, -0.012908529490232468, -0.011356737464666367, -0.00980494637042284, -0.008253155276179314, -0.006701363250613213, -0.005149572156369686, -0.0035977805964648724, -0.0020459892693907022, -0.0004941979423165321, 0.0010575936175882816, 0.0026093851774930954, 0.004161176271736622, 0.005712968297302723, 0.007264759391546249, 0.008816550485789776, 0.010368342511355877, 0.011920133605599403, 0.013471925631165504, 0.015023716725409031, 0.016575507819652557, 0.01812729984521866, 0.01967909187078476, 0.02123088389635086, 0.022782674059271812, 0.024334466084837914, 0.025886258110404015, 0.027438048273324966, 0.028989840298891068, 0.03054163232445717, 0.03209342435002327, 0.03364521637558937, 0.03519700840115547, 0.036748796701431274, 0.038300588726997375, 0.03985238075256348, 0.04140417277812958, 0.04295596480369568, 0.04450775682926178, 0.04605954885482788, 0.04761134088039398, 0.04916313290596008, 0.050714921206235886, 0.05226671323180199, 0.05381850525736809, 0.05537029728293419, 0.05692208558320999, 0.05847387760877609, 0.060025669634342194, 0.061577461659908295, 0.0631292536854744, 0.0646810457110405, 0.066232830286026, 0.0677846223115921, 0.0693364217877388, 0.0708882138133049, 0.072440005838871, 0.0739917978644371, 0.0755435898900032, 0.0770953819155693, 0.07864716649055481, 0.08019895851612091, 0.08175075054168701]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 5.0, 8.0, 8.0, 11.0, 13.0, 8.0, 9.0, 15.0, 19.0, 17.0, 29.0, 24.0, 32.0, 38.0, 35.0, 38.0, 30.0, 45.0, 42.0, 31.0, 39.0, 44.0, 40.0, 47.0, 35.0, 53.0, 37.0, 46.0, 21.0, 29.0, 24.0, 24.0, 25.0, 26.0, 16.0, 18.0, 10.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012302577495574951, -0.011802403256297112, -0.011302229017019272, -0.010802054777741432, -0.010301880538463593, -0.009801706299185753, -0.009301532059907913, -0.008801357820630074, -0.008301183581352234, -0.007801009342074394, -0.0073008351027965546, -0.006800660863518715, -0.006300486624240875, -0.005800312384963036, -0.005300138145685196, -0.004799963906407356, -0.004299789667129517, -0.003799615427851677, -0.0032994411885738373, -0.0027992669492959976, -0.002299092710018158, -0.0017989184707403183, -0.0012987442314624786, -0.000798569992184639, -0.0002983957529067993, 0.00020177848637104034, 0.00070195272564888, 0.0012021269649267197, 0.0017023012042045593, 0.002202475443482399, 0.0027026496827602386, 0.0032028239220380783, 0.003702998161315918, 0.004203172400593758, 0.004703346639871597, 0.005203520879149437, 0.005703695118427277, 0.006203869357705116, 0.006704043596982956, 0.007204217836260796, 0.007704392075538635, 0.008204566314816475, 0.008704740554094315, 0.009204914793372154, 0.009705089032649994, 0.010205263271927834, 0.010705437511205673, 0.011205611750483513, 0.011705785989761353, 0.012205960229039192, 0.012706134468317032, 0.013206308707594872, 0.013706482946872711, 0.01420665718615055, 0.01470683142542839, 0.01520700566470623, 0.01570717990398407, 0.01620735414326191, 0.01670752838253975, 0.01720770262181759, 0.01770787686109543, 0.018208051100373268, 0.018708225339651108, 0.019208399578928947, 0.019708573818206787]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 9.0, 27.0, 32.0, 41.0, 54.0, 76.0, 106.0, 146.0, 266.0, 404.0, 644.0, 1024.0, 1903.0, 3691.0, 10989.0, 114132.0, 792291.0, 103875.0, 10597.0, 3561.0, 1801.0, 1062.0, 610.0, 346.0, 266.0, 174.0, 143.0, 76.0, 40.0, 35.0, 22.0, 21.0, 15.0, 12.0, 9.0, 9.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07007217407226562, -0.06769561767578125, -0.06531906127929688, -0.0629425048828125, -0.060565948486328125, -0.05818939208984375, -0.055812835693359375, -0.053436279296875, -0.051059722900390625, -0.04868316650390625, -0.046306610107421875, -0.0439300537109375, -0.041553497314453125, -0.03917694091796875, -0.036800384521484375, -0.034423828125, -0.032047271728515625, -0.02967071533203125, -0.027294158935546875, -0.0249176025390625, -0.022541046142578125, -0.02016448974609375, -0.017787933349609375, -0.015411376953125, -0.013034820556640625, -0.01065826416015625, -0.008281707763671875, -0.0059051513671875, -0.003528594970703125, -0.00115203857421875, 0.001224517822265625, 0.00360107421875, 0.005977630615234375, 0.00835418701171875, 0.010730743408203125, 0.0131072998046875, 0.015483856201171875, 0.01786041259765625, 0.020236968994140625, 0.022613525390625, 0.024990081787109375, 0.02736663818359375, 0.029743194580078125, 0.0321197509765625, 0.034496307373046875, 0.03687286376953125, 0.039249420166015625, 0.0416259765625, 0.044002532958984375, 0.04637908935546875, 0.048755645751953125, 0.0511322021484375, 0.053508758544921875, 0.05588531494140625, 0.058261871337890625, 0.060638427734375, 0.06301498413085938, 0.06539154052734375, 0.06776809692382812, 0.0701446533203125, 0.07252120971679688, 0.07489776611328125, 0.07727432250976562, 0.07965087890625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 9.0, 6.0, 8.0, 7.0, 11.0, 25.0, 30.0, 32.0, 29.0, 33.0, 38.0, 47.0, 49.0, 53.0, 54.0, 60.0, 61.0, 65.0, 61.0, 68.0, 65.0, 36.0, 32.0, 28.0, 29.0, 17.0, 11.0, 8.0, 11.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03094482421875, -0.030050277709960938, -0.029155731201171875, -0.028261184692382812, -0.02736663818359375, -0.026472091674804688, -0.025577545166015625, -0.024682998657226562, -0.0237884521484375, -0.022893905639648438, -0.021999359130859375, -0.021104812622070312, -0.02021026611328125, -0.019315719604492188, -0.018421173095703125, -0.017526626586914062, -0.016632080078125, -0.015737533569335938, -0.014842987060546875, -0.013948440551757812, -0.01305389404296875, -0.012159347534179688, -0.011264801025390625, -0.010370254516601562, -0.0094757080078125, -0.008581161499023438, -0.007686614990234375, -0.0067920684814453125, -0.00589752197265625, -0.0050029754638671875, -0.004108428955078125, -0.0032138824462890625, -0.0023193359375, -0.0014247894287109375, -0.000530242919921875, 0.0003643035888671875, 0.00125885009765625, 0.0021533966064453125, 0.003047943115234375, 0.0039424896240234375, 0.0048370361328125, 0.0057315826416015625, 0.006626129150390625, 0.0075206756591796875, 0.00841522216796875, 0.009309768676757812, 0.010204315185546875, 0.011098861694335938, 0.011993408203125, 0.012887954711914062, 0.013782501220703125, 0.014677047729492188, 0.01557159423828125, 0.016466140747070312, 0.017360687255859375, 0.018255233764648438, 0.0191497802734375, 0.020044326782226562, 0.020938873291015625, 0.021833419799804688, 0.02272796630859375, 0.023622512817382812, 0.024517059326171875, 0.025411605834960938, 0.02630615234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 6.0, 7.0, 11.0, 31.0, 35.0, 58.0, 72.0, 126.0, 224.0, 357.0, 629.0, 1187.0, 2684.0, 10575.0, 230444.0, 769965.0, 24798.0, 3991.0, 1506.0, 740.0, 394.0, 245.0, 176.0, 89.0, 66.0, 38.0, 34.0, 22.0, 12.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0865478515625, -0.08415603637695312, -0.08176422119140625, -0.07937240600585938, -0.0769805908203125, -0.07458877563476562, -0.07219696044921875, -0.06980514526367188, -0.067413330078125, -0.06502151489257812, -0.06262969970703125, -0.060237884521484375, -0.0578460693359375, -0.055454254150390625, -0.05306243896484375, -0.050670623779296875, -0.04827880859375, -0.045886993408203125, -0.04349517822265625, -0.041103363037109375, -0.0387115478515625, -0.036319732666015625, -0.03392791748046875, -0.031536102294921875, -0.029144287109375, -0.026752471923828125, -0.02436065673828125, -0.021968841552734375, -0.0195770263671875, -0.017185211181640625, -0.01479339599609375, -0.012401580810546875, -0.010009765625, -0.007617950439453125, -0.00522613525390625, -0.002834320068359375, -0.0004425048828125, 0.001949310302734375, 0.00434112548828125, 0.006732940673828125, 0.009124755859375, 0.011516571044921875, 0.01390838623046875, 0.016300201416015625, 0.0186920166015625, 0.021083831787109375, 0.02347564697265625, 0.025867462158203125, 0.02825927734375, 0.030651092529296875, 0.03304290771484375, 0.035434722900390625, 0.0378265380859375, 0.040218353271484375, 0.04261016845703125, 0.045001983642578125, 0.047393798828125, 0.049785614013671875, 0.05217742919921875, 0.054569244384765625, 0.0569610595703125, 0.059352874755859375, 0.06174468994140625, 0.06413650512695312, 0.0665283203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 1.0, 5.0, 8.0, 4.0, 11.0, 8.0, 13.0, 21.0, 22.0, 18.0, 29.0, 32.0, 32.0, 33.0, 43.0, 41.0, 48.0, 33.0, 42.0, 46.0, 41.0, 45.0, 50.0, 50.0, 49.0, 43.0, 35.0, 29.0, 33.0, 20.0, 15.0, 21.0, 9.0, 13.0, 12.0, 15.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.087646484375, -0.08510208129882812, -0.08255767822265625, -0.08001327514648438, -0.0774688720703125, -0.07492446899414062, -0.07238006591796875, -0.06983566284179688, -0.067291259765625, -0.06474685668945312, -0.06220245361328125, -0.059658050537109375, -0.0571136474609375, -0.054569244384765625, -0.05202484130859375, -0.049480438232421875, -0.04693603515625, -0.044391632080078125, -0.04184722900390625, -0.039302825927734375, -0.0367584228515625, -0.034214019775390625, -0.03166961669921875, -0.029125213623046875, -0.026580810546875, -0.024036407470703125, -0.02149200439453125, -0.018947601318359375, -0.0164031982421875, -0.013858795166015625, -0.01131439208984375, -0.008769989013671875, -0.0062255859375, -0.003681182861328125, -0.00113677978515625, 0.001407623291015625, 0.0039520263671875, 0.006496429443359375, 0.00904083251953125, 0.011585235595703125, 0.014129638671875, 0.016674041748046875, 0.01921844482421875, 0.021762847900390625, 0.0243072509765625, 0.026851654052734375, 0.02939605712890625, 0.031940460205078125, 0.03448486328125, 0.037029266357421875, 0.03957366943359375, 0.042118072509765625, 0.0446624755859375, 0.047206878662109375, 0.04975128173828125, 0.052295684814453125, 0.054840087890625, 0.057384490966796875, 0.05992889404296875, 0.062473297119140625, 0.0650177001953125, 0.06756210327148438, 0.07010650634765625, 0.07265090942382812, 0.0751953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 11.0, 14.0, 20.0, 33.0, 58.0, 132.0, 309.0, 923.0, 3739.0, 40650.0, 923616.0, 72260.0, 5009.0, 1135.0, 356.0, 146.0, 54.0, 25.0, 17.0, 14.0, 5.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0231475830078125, -0.022276639938354492, -0.021405696868896484, -0.020534753799438477, -0.01966381072998047, -0.01879286766052246, -0.017921924591064453, -0.017050981521606445, -0.016180038452148438, -0.01530909538269043, -0.014438152313232422, -0.013567209243774414, -0.012696266174316406, -0.011825323104858398, -0.01095438003540039, -0.010083436965942383, -0.009212493896484375, -0.008341550827026367, -0.007470607757568359, -0.0065996646881103516, -0.005728721618652344, -0.004857778549194336, -0.003986835479736328, -0.0031158924102783203, -0.0022449493408203125, -0.0013740062713623047, -0.0005030632019042969, 0.00036787986755371094, 0.0012388229370117188, 0.0021097660064697266, 0.0029807090759277344, 0.003851652145385742, 0.00472259521484375, 0.005593538284301758, 0.006464481353759766, 0.0073354244232177734, 0.008206367492675781, 0.009077310562133789, 0.009948253631591797, 0.010819196701049805, 0.011690139770507812, 0.01256108283996582, 0.013432025909423828, 0.014302968978881836, 0.015173912048339844, 0.01604485511779785, 0.01691579818725586, 0.017786741256713867, 0.018657684326171875, 0.019528627395629883, 0.02039957046508789, 0.0212705135345459, 0.022141456604003906, 0.023012399673461914, 0.023883342742919922, 0.02475428581237793, 0.025625228881835938, 0.026496171951293945, 0.027367115020751953, 0.02823805809020996, 0.02910900115966797, 0.029979944229125977, 0.030850887298583984, 0.03172183036804199, 0.0325927734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 14.0, 7.0, 14.0, 10.0, 17.0, 31.0, 26.0, 40.0, 35.0, 57.0, 42.0, 37.0, 51.0, 43.0, 82.0, 57.0, 52.0, 68.0, 39.0, 53.0, 25.0, 28.0, 39.0, 22.0, 25.0, 12.0, 12.0, 9.0, 13.0, 11.0, 7.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.020069122314453e-06, -5.8766454458236694e-06, -5.733221769332886e-06, -5.589798092842102e-06, -5.446374416351318e-06, -5.302950739860535e-06, -5.159527063369751e-06, -5.016103386878967e-06, -4.872679710388184e-06, -4.7292560338974e-06, -4.585832357406616e-06, -4.4424086809158325e-06, -4.298985004425049e-06, -4.155561327934265e-06, -4.0121376514434814e-06, -3.868713974952698e-06, -3.725290298461914e-06, -3.5818666219711304e-06, -3.4384429454803467e-06, -3.295019268989563e-06, -3.1515955924987793e-06, -3.0081719160079956e-06, -2.864748239517212e-06, -2.7213245630264282e-06, -2.5779008865356445e-06, -2.434477210044861e-06, -2.291053533554077e-06, -2.1476298570632935e-06, -2.0042061805725098e-06, -1.860782504081726e-06, -1.7173588275909424e-06, -1.5739351511001587e-06, -1.430511474609375e-06, -1.2870877981185913e-06, -1.1436641216278076e-06, -1.000240445137024e-06, -8.568167686462402e-07, -7.133930921554565e-07, -5.699694156646729e-07, -4.2654573917388916e-07, -2.8312206268310547e-07, -1.3969838619232178e-07, 3.725290298461914e-09, 1.471489667892456e-07, 2.905726432800293e-07, 4.33996319770813e-07, 5.774199962615967e-07, 7.208436727523804e-07, 8.642673492431641e-07, 1.0076910257339478e-06, 1.1511147022247314e-06, 1.2945383787155151e-06, 1.4379620552062988e-06, 1.5813857316970825e-06, 1.7248094081878662e-06, 1.86823308467865e-06, 2.0116567611694336e-06, 2.1550804376602173e-06, 2.298504114151001e-06, 2.4419277906417847e-06, 2.5853514671325684e-06, 2.728775143623352e-06, 2.8721988201141357e-06, 3.0156224966049194e-06, 3.159046173095703e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 12.0, 13.0, 26.0, 56.0, 163.0, 707.0, 5996.0, 1005928.0, 33496.0, 1629.0, 317.0, 73.0, 38.0, 21.0, 11.0, 5.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.091552734375, -0.08924722671508789, -0.08694171905517578, -0.08463621139526367, -0.08233070373535156, -0.08002519607543945, -0.07771968841552734, -0.07541418075561523, -0.07310867309570312, -0.07080316543579102, -0.0684976577758789, -0.0661921501159668, -0.06388664245605469, -0.06158113479614258, -0.05927562713623047, -0.05697011947631836, -0.05466461181640625, -0.05235910415649414, -0.05005359649658203, -0.04774808883666992, -0.04544258117675781, -0.0431370735168457, -0.040831565856933594, -0.038526058197021484, -0.036220550537109375, -0.033915042877197266, -0.031609535217285156, -0.029304027557373047, -0.026998519897460938, -0.024693012237548828, -0.02238750457763672, -0.02008199691772461, -0.0177764892578125, -0.01547098159790039, -0.013165473937988281, -0.010859966278076172, -0.008554458618164062, -0.006248950958251953, -0.003943443298339844, -0.0016379356384277344, 0.000667572021484375, 0.0029730796813964844, 0.005278587341308594, 0.007584095001220703, 0.009889602661132812, 0.012195110321044922, 0.014500617980957031, 0.01680612564086914, 0.01911163330078125, 0.02141714096069336, 0.02372264862060547, 0.026028156280517578, 0.028333663940429688, 0.030639171600341797, 0.032944679260253906, 0.035250186920166016, 0.037555694580078125, 0.039861202239990234, 0.042166709899902344, 0.04447221755981445, 0.04677772521972656, 0.04908323287963867, 0.05138874053955078, 0.05369424819946289, 0.055999755859375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 14.0, 34.0, 91.0, 264.0, 340.0, 152.0, 40.0, 14.0, 11.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09149169921875, -0.0891571044921875, -0.086822509765625, -0.0844879150390625, -0.0821533203125, -0.0798187255859375, -0.077484130859375, -0.0751495361328125, -0.07281494140625, -0.0704803466796875, -0.068145751953125, -0.0658111572265625, -0.0634765625, -0.0611419677734375, -0.058807373046875, -0.0564727783203125, -0.05413818359375, -0.0518035888671875, -0.049468994140625, -0.0471343994140625, -0.0447998046875, -0.0424652099609375, -0.040130615234375, -0.0377960205078125, -0.03546142578125, -0.0331268310546875, -0.030792236328125, -0.0284576416015625, -0.026123046875, -0.0237884521484375, -0.021453857421875, -0.0191192626953125, -0.01678466796875, -0.0144500732421875, -0.012115478515625, -0.0097808837890625, -0.0074462890625, -0.0051116943359375, -0.002777099609375, -0.0004425048828125, 0.00189208984375, 0.0042266845703125, 0.006561279296875, 0.0088958740234375, 0.01123046875, 0.0135650634765625, 0.015899658203125, 0.0182342529296875, 0.02056884765625, 0.0229034423828125, 0.025238037109375, 0.0275726318359375, 0.0299072265625, 0.0322418212890625, 0.034576416015625, 0.0369110107421875, 0.03924560546875, 0.0415802001953125, 0.043914794921875, 0.0462493896484375, 0.048583984375, 0.0509185791015625, 0.053253173828125, 0.0555877685546875, 0.05792236328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 11.0, 18.0, 62.0, 203.0, 374.0, 242.0, 79.0, 12.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2711992263793945, -1.2451297044754028, -1.2190600633621216, -1.1929905414581299, -1.1669209003448486, -1.140851378440857, -1.1147817373275757, -1.088712215423584, -1.0626425743103027, -1.036573052406311, -1.0105034112930298, -0.9844338297843933, -0.9583642482757568, -0.9322946667671204, -0.9062250852584839, -0.8801555633544922, -0.8540859818458557, -0.8280164003372192, -0.8019468188285828, -0.7758772373199463, -0.7498076558113098, -0.7237380743026733, -0.6976685523986816, -0.6715989112854004, -0.6455293893814087, -0.6194598078727722, -0.5933902263641357, -0.5673206448554993, -0.5412510633468628, -0.5151814818382263, -0.48911193013191223, -0.46304234862327576, -0.43697279691696167, -0.4109032154083252, -0.3848336338996887, -0.35876405239105225, -0.33269447088241577, -0.3066248893737793, -0.2805553376674652, -0.25448575615882874, -0.22841617465019226, -0.2023465931415558, -0.1762770116329193, -0.15020744502544403, -0.12413786351680756, -0.09806828200817108, -0.0719987154006958, -0.045929133892059326, -0.01985955238342285, 0.006210025399923325, 0.0322796031832695, 0.05834917724132538, 0.08441875874996185, 0.11048834025859833, 0.1365579068660736, 0.16262748837471008, 0.18869706988334656, 0.21476665139198303, 0.2408362329006195, 0.2669057846069336, 0.29297536611557007, 0.31904494762420654, 0.345114529132843, 0.3711841106414795, 0.39725369215011597]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 7.0, 7.0, 4.0, 7.0, 11.0, 11.0, 13.0, 10.0, 16.0, 16.0, 21.0, 28.0, 37.0, 47.0, 36.0, 46.0, 45.0, 43.0, 53.0, 46.0, 42.0, 42.0, 49.0, 47.0, 39.0, 34.0, 31.0, 24.0, 32.0, 19.0, 19.0, 24.0, 19.0, 17.0, 10.0, 8.0, 18.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34837424755096436, -0.3365650773048401, -0.3247559070587158, -0.31294673681259155, -0.3011375963687897, -0.2893284261226654, -0.27751925587654114, -0.26571008563041687, -0.253900945186615, -0.24209177494049072, -0.23028261959552765, -0.21847344934940338, -0.2066642940044403, -0.19485512375831604, -0.18304595351219177, -0.1712367832660675, -0.15942761301994324, -0.14761844277381897, -0.1358092874288559, -0.12400011718273163, -0.11219095438718796, -0.10038179159164429, -0.08857262134552002, -0.07676345854997635, -0.06495429575443268, -0.05314513295888901, -0.04133596643805504, -0.02952679991722107, -0.0177176371216774, -0.005908474326133728, 0.0059006959199905396, 0.01770985871553421, 0.02951902151107788, 0.04132818430662155, 0.05313735082745552, 0.06494651734828949, 0.07675568014383316, 0.08856484293937683, 0.1003740131855011, 0.11218317598104477, 0.12399233877658844, 0.1358015090227127, 0.14761066436767578, 0.15941983461380005, 0.17122900485992432, 0.1830381602048874, 0.19484733045101166, 0.20665648579597473, 0.218465656042099, 0.23027482628822327, 0.24208398163318634, 0.2538931369781494, 0.2657023072242737, 0.27751147747039795, 0.2893206477165222, 0.3011298179626465, 0.31293898820877075, 0.324748158454895, 0.3365573287010193, 0.34836649894714355, 0.36017563939094543, 0.3719848096370697, 0.38379397988319397, 0.39560315012931824, 0.4074122905731201]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 7.0, 6.0, 11.0, 8.0, 12.0, 20.0, 20.0, 18.0, 28.0, 37.0, 40.0, 44.0, 82.0, 178.0, 479.0, 1905.0, 14829.0, 4153153.0, 20160.0, 2226.0, 494.0, 182.0, 94.0, 39.0, 27.0, 37.0, 30.0, 24.0, 21.0, 20.0, 8.0, 7.0, 7.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09097576141357422, -0.08789634704589844, -0.08481693267822266, -0.08173751831054688, -0.0786581039428711, -0.07557868957519531, -0.07249927520751953, -0.06941986083984375, -0.06634044647216797, -0.06326103210449219, -0.060181617736816406, -0.057102203369140625, -0.054022789001464844, -0.05094337463378906, -0.04786396026611328, -0.0447845458984375, -0.04170513153076172, -0.03862571716308594, -0.035546302795410156, -0.032466888427734375, -0.029387474060058594, -0.026308059692382812, -0.02322864532470703, -0.02014923095703125, -0.01706981658935547, -0.013990402221679688, -0.010910987854003906, -0.007831573486328125, -0.004752159118652344, -0.0016727447509765625, 0.0014066696166992188, 0.004486083984375, 0.007565498352050781, 0.010644912719726562, 0.013724327087402344, 0.016803741455078125, 0.019883155822753906, 0.022962570190429688, 0.02604198455810547, 0.02912139892578125, 0.03220081329345703, 0.03528022766113281, 0.038359642028808594, 0.041439056396484375, 0.044518470764160156, 0.04759788513183594, 0.05067729949951172, 0.0537567138671875, 0.05683612823486328, 0.05991554260253906, 0.06299495697021484, 0.06607437133789062, 0.0691537857055664, 0.07223320007324219, 0.07531261444091797, 0.07839202880859375, 0.08147144317626953, 0.08455085754394531, 0.0876302719116211, 0.09070968627929688, 0.09378910064697266, 0.09686851501464844, 0.09994792938232422, 0.10302734375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 10.0, 18.0, 10.0, 19.0, 27.0, 38.0, 35.0, 50.0, 42.0, 52.0, 46.0, 59.0, 56.0, 65.0, 75.0, 53.0, 47.0, 71.0, 41.0, 42.0, 33.0, 20.0, 24.0, 10.0, 11.0, 11.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02813720703125, -0.027286052703857422, -0.026434898376464844, -0.025583744049072266, -0.024732589721679688, -0.02388143539428711, -0.02303028106689453, -0.022179126739501953, -0.021327972412109375, -0.020476818084716797, -0.01962566375732422, -0.01877450942993164, -0.017923355102539062, -0.017072200775146484, -0.016221046447753906, -0.015369892120361328, -0.01451873779296875, -0.013667583465576172, -0.012816429138183594, -0.011965274810791016, -0.011114120483398438, -0.01026296615600586, -0.009411811828613281, -0.008560657501220703, -0.007709503173828125, -0.006858348846435547, -0.006007194519042969, -0.005156040191650391, -0.0043048858642578125, -0.0034537315368652344, -0.0026025772094726562, -0.0017514228820800781, -0.0009002685546875, -4.9114227294921875e-05, 0.0008020401000976562, 0.0016531944274902344, 0.0025043487548828125, 0.0033555030822753906, 0.004206657409667969, 0.005057811737060547, 0.005908966064453125, 0.006760120391845703, 0.007611274719238281, 0.00846242904663086, 0.009313583374023438, 0.010164737701416016, 0.011015892028808594, 0.011867046356201172, 0.01271820068359375, 0.013569355010986328, 0.014420509338378906, 0.015271663665771484, 0.016122817993164062, 0.01697397232055664, 0.01782512664794922, 0.018676280975341797, 0.019527435302734375, 0.020378589630126953, 0.02122974395751953, 0.02208089828491211, 0.022932052612304688, 0.023783206939697266, 0.024634361267089844, 0.025485515594482422, 0.026336669921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 6.0, 5.0, 7.0, 11.0, 23.0, 25.0, 29.0, 33.0, 64.0, 88.0, 145.0, 253.0, 525.0, 1435.0, 4412.0, 28767.0, 4099849.0, 49820.0, 5714.0, 1659.0, 650.0, 286.0, 161.0, 92.0, 63.0, 37.0, 41.0, 28.0, 24.0, 7.0, 7.0, 4.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.06915283203125, -0.06720972061157227, -0.06526660919189453, -0.0633234977722168, -0.06138038635253906, -0.05943727493286133, -0.057494163513183594, -0.05555105209350586, -0.053607940673828125, -0.05166482925415039, -0.049721717834472656, -0.04777860641479492, -0.04583549499511719, -0.04389238357543945, -0.04194927215576172, -0.040006160736083984, -0.03806304931640625, -0.036119937896728516, -0.03417682647705078, -0.03223371505737305, -0.030290603637695312, -0.028347492218017578, -0.026404380798339844, -0.02446126937866211, -0.022518157958984375, -0.02057504653930664, -0.018631935119628906, -0.016688823699951172, -0.014745712280273438, -0.012802600860595703, -0.010859489440917969, -0.008916378021240234, -0.0069732666015625, -0.005030155181884766, -0.0030870437622070312, -0.0011439323425292969, 0.0007991790771484375, 0.002742290496826172, 0.004685401916503906, 0.006628513336181641, 0.008571624755859375, 0.01051473617553711, 0.012457847595214844, 0.014400959014892578, 0.016344070434570312, 0.018287181854248047, 0.02023029327392578, 0.022173404693603516, 0.02411651611328125, 0.026059627532958984, 0.02800273895263672, 0.029945850372314453, 0.03188896179199219, 0.03383207321166992, 0.035775184631347656, 0.03771829605102539, 0.039661407470703125, 0.04160451889038086, 0.043547630310058594, 0.04549074172973633, 0.04743385314941406, 0.0493769645690918, 0.05132007598876953, 0.053263187408447266, 0.055206298828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 19.0, 46.0, 366.0, 3489.0, 94.0, 28.0, 12.0, 10.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043487548828125, -0.04240536689758301, -0.041323184967041016, -0.04024100303649902, -0.03915882110595703, -0.03807663917541504, -0.03699445724487305, -0.035912275314331055, -0.03483009338378906, -0.03374791145324707, -0.03266572952270508, -0.031583547592163086, -0.030501365661621094, -0.0294191837310791, -0.02833700180053711, -0.027254819869995117, -0.026172637939453125, -0.025090456008911133, -0.02400827407836914, -0.02292609214782715, -0.021843910217285156, -0.020761728286743164, -0.019679546356201172, -0.01859736442565918, -0.017515182495117188, -0.016433000564575195, -0.015350818634033203, -0.014268636703491211, -0.013186454772949219, -0.012104272842407227, -0.011022090911865234, -0.009939908981323242, -0.00885772705078125, -0.007775545120239258, -0.006693363189697266, -0.0056111812591552734, -0.004528999328613281, -0.003446817398071289, -0.002364635467529297, -0.0012824535369873047, -0.0002002716064453125, 0.0008819103240966797, 0.001964092254638672, 0.003046274185180664, 0.004128456115722656, 0.0052106380462646484, 0.006292819976806641, 0.007375001907348633, 0.008457183837890625, 0.009539365768432617, 0.01062154769897461, 0.011703729629516602, 0.012785911560058594, 0.013868093490600586, 0.014950275421142578, 0.01603245735168457, 0.017114639282226562, 0.018196821212768555, 0.019279003143310547, 0.02036118507385254, 0.02144336700439453, 0.022525548934936523, 0.023607730865478516, 0.024689912796020508, 0.0257720947265625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 11.0, 8.0, 16.0, 26.0, 20.0, 54.0, 61.0, 104.0, 123.0, 127.0, 115.0, 122.0, 79.0, 47.0, 38.0, 18.0, 14.0, 7.0, 4.0, 1.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03876728564500809, -0.0367964506149292, -0.03482561931014061, -0.03285478800535202, -0.030883952975273132, -0.028913119807839394, -0.026942286640405655, -0.024971453472971916, -0.023000620305538177, -0.02102978713810444, -0.0190589539706707, -0.01708812080323696, -0.015117287635803223, -0.013146454468369484, -0.011175621300935745, -0.009204788133502007, -0.007233954966068268, -0.005263121798634529, -0.0032922886312007904, -0.0013214554637670517, 0.000649377703666687, 0.0026202108711004257, 0.004591044038534164, 0.006561877205967903, 0.008532710373401642, 0.01050354354083538, 0.01247437670826912, 0.014445209875702858, 0.016416043043136597, 0.018386876210570335, 0.020357709378004074, 0.022328542545437813, 0.024299368262290955, 0.026270201429724693, 0.028241034597158432, 0.03021186776459217, 0.03218270093202591, 0.0341535359621048, 0.03612436726689339, 0.038095198571681976, 0.040066033601760864, 0.04203686863183975, 0.04400769993662834, 0.04597853124141693, 0.04794936627149582, 0.04992020130157471, 0.051891032606363297, 0.053861863911151886, 0.055832698941230774, 0.05780353397130966, 0.05977436527609825, 0.06174519658088684, 0.06371603161096573, 0.06568686664104462, 0.06765769422054291, 0.0696285292506218, 0.07159936428070068, 0.07357019931077957, 0.07554103434085846, 0.07751186192035675, 0.07948269695043564, 0.08145353198051453, 0.08342435956001282, 0.0853951945900917, 0.0873660296201706]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 7.0, 8.0, 15.0, 11.0, 8.0, 13.0, 21.0, 18.0, 22.0, 20.0, 32.0, 38.0, 39.0, 30.0, 47.0, 44.0, 34.0, 35.0, 42.0, 58.0, 41.0, 40.0, 32.0, 32.0, 35.0, 33.0, 28.0, 38.0, 27.0, 23.0, 24.0, 20.0, 7.0, 18.0, 12.0, 12.0, 9.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0391085147857666, -0.03795212507247925, -0.036795735359191895, -0.03563934564590454, -0.03448295593261719, -0.033326566219329834, -0.03217017650604248, -0.031013786792755127, -0.029857397079467773, -0.02870100736618042, -0.027544617652893066, -0.026388227939605713, -0.02523183822631836, -0.024075448513031006, -0.022919058799743652, -0.0217626690864563, -0.020606279373168945, -0.019449889659881592, -0.01829349994659424, -0.017137110233306885, -0.01598072052001953, -0.014824330806732178, -0.013667941093444824, -0.01251155138015747, -0.011355161666870117, -0.010198771953582764, -0.00904238224029541, -0.007885992527008057, -0.006729602813720703, -0.00557321310043335, -0.004416823387145996, -0.0032604336738586426, -0.002104043960571289, -0.0009476542472839355, 0.00020873546600341797, 0.0013651251792907715, 0.002521514892578125, 0.0036779046058654785, 0.004834294319152832, 0.0059906840324401855, 0.007147073745727539, 0.008303463459014893, 0.009459853172302246, 0.0106162428855896, 0.011772632598876953, 0.012929022312164307, 0.01408541202545166, 0.015241801738739014, 0.016398191452026367, 0.01755458116531372, 0.018710970878601074, 0.019867360591888428, 0.02102375030517578, 0.022180140018463135, 0.02333652973175049, 0.024492919445037842, 0.025649309158325195, 0.02680569887161255, 0.027962088584899902, 0.029118478298187256, 0.03027486801147461, 0.03143125772476196, 0.032587647438049316, 0.03374403715133667, 0.03490042686462402]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 5.0, 15.0, 8.0, 16.0, 25.0, 41.0, 46.0, 71.0, 112.0, 155.0, 274.0, 514.0, 947.0, 1942.0, 4314.0, 11617.0, 35559.0, 132782.0, 433049.0, 310430.0, 79060.0, 22866.0, 8171.0, 3331.0, 1430.0, 674.0, 390.0, 230.0, 136.0, 92.0, 65.0, 56.0, 36.0, 24.0, 12.0, 12.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03411865234375, -0.03310966491699219, -0.032100677490234375, -0.031091690063476562, -0.03008270263671875, -0.029073715209960938, -0.028064727783203125, -0.027055740356445312, -0.0260467529296875, -0.025037765502929688, -0.024028778076171875, -0.023019790649414062, -0.02201080322265625, -0.021001815795898438, -0.019992828369140625, -0.018983840942382812, -0.017974853515625, -0.016965866088867188, -0.015956878662109375, -0.014947891235351562, -0.01393890380859375, -0.012929916381835938, -0.011920928955078125, -0.010911941528320312, -0.0099029541015625, -0.008893966674804688, -0.007884979248046875, -0.0068759918212890625, -0.00586700439453125, -0.0048580169677734375, -0.003849029541015625, -0.0028400421142578125, -0.0018310546875, -0.0008220672607421875, 0.000186920166015625, 0.0011959075927734375, 0.00220489501953125, 0.0032138824462890625, 0.004222869873046875, 0.0052318572998046875, 0.0062408447265625, 0.0072498321533203125, 0.008258819580078125, 0.009267807006835938, 0.01027679443359375, 0.011285781860351562, 0.012294769287109375, 0.013303756713867188, 0.014312744140625, 0.015321731567382812, 0.016330718994140625, 0.017339706420898438, 0.01834869384765625, 0.019357681274414062, 0.020366668701171875, 0.021375656127929688, 0.0223846435546875, 0.023393630981445312, 0.024402618408203125, 0.025411605834960938, 0.02642059326171875, 0.027429580688476562, 0.028438568115234375, 0.029447555541992188, 0.03045654296875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 18.0, 14.0, 18.0, 24.0, 41.0, 34.0, 49.0, 43.0, 48.0, 55.0, 55.0, 57.0, 57.0, 65.0, 47.0, 63.0, 56.0, 50.0, 35.0, 45.0, 19.0, 21.0, 20.0, 7.0, 8.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0281982421875, -0.027346134185791016, -0.02649402618408203, -0.025641918182373047, -0.024789810180664062, -0.023937702178955078, -0.023085594177246094, -0.02223348617553711, -0.021381378173828125, -0.02052927017211914, -0.019677162170410156, -0.018825054168701172, -0.017972946166992188, -0.017120838165283203, -0.01626873016357422, -0.015416622161865234, -0.01456451416015625, -0.013712406158447266, -0.012860298156738281, -0.012008190155029297, -0.011156082153320312, -0.010303974151611328, -0.009451866149902344, -0.00859975814819336, -0.007747650146484375, -0.006895542144775391, -0.006043434143066406, -0.005191326141357422, -0.0043392181396484375, -0.003487110137939453, -0.0026350021362304688, -0.0017828941345214844, -0.0009307861328125, -7.867813110351562e-05, 0.0007734298706054688, 0.0016255378723144531, 0.0024776458740234375, 0.003329753875732422, 0.004181861877441406, 0.005033969879150391, 0.005886077880859375, 0.006738185882568359, 0.007590293884277344, 0.008442401885986328, 0.009294509887695312, 0.010146617889404297, 0.010998725891113281, 0.011850833892822266, 0.01270294189453125, 0.013555049896240234, 0.014407157897949219, 0.015259265899658203, 0.016111373901367188, 0.016963481903076172, 0.017815589904785156, 0.01866769790649414, 0.019519805908203125, 0.02037191390991211, 0.021224021911621094, 0.022076129913330078, 0.022928237915039062, 0.023780345916748047, 0.02463245391845703, 0.025484561920166016, 0.026336669921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 17.0, 12.0, 18.0, 16.0, 40.0, 56.0, 71.0, 115.0, 168.0, 278.0, 531.0, 1169.0, 3159.0, 13167.0, 116263.0, 768382.0, 125352.0, 13858.0, 3309.0, 1173.0, 563.0, 308.0, 164.0, 97.0, 90.0, 44.0, 34.0, 21.0, 20.0, 7.0, 12.0, 7.0, 5.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051025390625, -0.04950284957885742, -0.047980308532714844, -0.046457767486572266, -0.04493522644042969, -0.04341268539428711, -0.04189014434814453, -0.04036760330200195, -0.038845062255859375, -0.0373225212097168, -0.03579998016357422, -0.03427743911743164, -0.03275489807128906, -0.031232357025146484, -0.029709815979003906, -0.028187274932861328, -0.02666473388671875, -0.025142192840576172, -0.023619651794433594, -0.022097110748291016, -0.020574569702148438, -0.01905202865600586, -0.01752948760986328, -0.016006946563720703, -0.014484405517578125, -0.012961864471435547, -0.011439323425292969, -0.00991678237915039, -0.008394241333007812, -0.006871700286865234, -0.005349159240722656, -0.003826618194580078, -0.0023040771484375, -0.0007815361022949219, 0.0007410049438476562, 0.0022635459899902344, 0.0037860870361328125, 0.005308628082275391, 0.006831169128417969, 0.008353710174560547, 0.009876251220703125, 0.011398792266845703, 0.012921333312988281, 0.01444387435913086, 0.015966415405273438, 0.017488956451416016, 0.019011497497558594, 0.020534038543701172, 0.02205657958984375, 0.023579120635986328, 0.025101661682128906, 0.026624202728271484, 0.028146743774414062, 0.02966928482055664, 0.03119182586669922, 0.0327143669128418, 0.034236907958984375, 0.03575944900512695, 0.03728199005126953, 0.03880453109741211, 0.04032707214355469, 0.041849613189697266, 0.043372154235839844, 0.04489469528198242, 0.046417236328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 1.0, 3.0, 5.0, 7.0, 13.0, 10.0, 15.0, 19.0, 25.0, 25.0, 23.0, 22.0, 27.0, 36.0, 29.0, 27.0, 37.0, 47.0, 42.0, 53.0, 32.0, 44.0, 38.0, 58.0, 27.0, 42.0, 32.0, 39.0, 22.0, 29.0, 28.0, 23.0, 25.0, 14.0, 14.0, 18.0, 8.0, 10.0, 9.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07049560546875, -0.06835365295410156, -0.06621170043945312, -0.06406974792480469, -0.06192779541015625, -0.05978584289550781, -0.057643890380859375, -0.05550193786621094, -0.0533599853515625, -0.05121803283691406, -0.049076080322265625, -0.04693412780761719, -0.04479217529296875, -0.04265022277832031, -0.040508270263671875, -0.03836631774902344, -0.036224365234375, -0.03408241271972656, -0.031940460205078125, -0.029798507690429688, -0.02765655517578125, -0.025514602661132812, -0.023372650146484375, -0.021230697631835938, -0.0190887451171875, -0.016946792602539062, -0.014804840087890625, -0.012662887573242188, -0.01052093505859375, -0.008378982543945312, -0.006237030029296875, -0.0040950775146484375, -0.001953125, 0.0001888275146484375, 0.002330780029296875, 0.0044727325439453125, 0.00661468505859375, 0.008756637573242188, 0.010898590087890625, 0.013040542602539062, 0.0151824951171875, 0.017324447631835938, 0.019466400146484375, 0.021608352661132812, 0.02375030517578125, 0.025892257690429688, 0.028034210205078125, 0.030176162719726562, 0.032318115234375, 0.03446006774902344, 0.036602020263671875, 0.03874397277832031, 0.04088592529296875, 0.04302787780761719, 0.045169830322265625, 0.04731178283691406, 0.0494537353515625, 0.05159568786621094, 0.053737640380859375, 0.05587959289550781, 0.05802154541015625, 0.06016349792480469, 0.062305450439453125, 0.06444740295410156, 0.06658935546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 8.0, 5.0, 10.0, 22.0, 22.0, 35.0, 52.0, 83.0, 135.0, 275.0, 512.0, 1175.0, 3347.0, 14014.0, 97241.0, 724565.0, 178475.0, 21048.0, 4739.0, 1434.0, 650.0, 278.0, 151.0, 85.0, 51.0, 37.0, 24.0, 17.0, 12.0, 11.0, 5.0, 7.0, 6.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01035308837890625, -0.010015010833740234, -0.009676933288574219, -0.009338855743408203, -0.009000778198242188, -0.008662700653076172, -0.008324623107910156, -0.00798654556274414, -0.007648468017578125, -0.007310390472412109, -0.006972312927246094, -0.006634235382080078, -0.0062961578369140625, -0.005958080291748047, -0.005620002746582031, -0.005281925201416016, -0.00494384765625, -0.004605770111083984, -0.004267692565917969, -0.003929615020751953, -0.0035915374755859375, -0.003253459930419922, -0.0029153823852539062, -0.0025773048400878906, -0.002239227294921875, -0.0019011497497558594, -0.0015630722045898438, -0.0012249946594238281, -0.0008869171142578125, -0.0005488395690917969, -0.00021076202392578125, 0.00012731552124023438, 0.00046539306640625, 0.0008034706115722656, 0.0011415481567382812, 0.0014796257019042969, 0.0018177032470703125, 0.002155780792236328, 0.0024938583374023438, 0.0028319358825683594, 0.003170013427734375, 0.0035080909729003906, 0.0038461685180664062, 0.004184246063232422, 0.0045223236083984375, 0.004860401153564453, 0.005198478698730469, 0.005536556243896484, 0.0058746337890625, 0.006212711334228516, 0.006550788879394531, 0.006888866424560547, 0.0072269439697265625, 0.007565021514892578, 0.007903099060058594, 0.00824117660522461, 0.008579254150390625, 0.00891733169555664, 0.009255409240722656, 0.009593486785888672, 0.009931564331054688, 0.010269641876220703, 0.010607719421386719, 0.010945796966552734, 0.01128387451171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 16.0, 7.0, 9.0, 11.0, 22.0, 24.0, 27.0, 31.0, 39.0, 44.0, 34.0, 59.0, 43.0, 53.0, 48.0, 53.0, 55.0, 44.0, 35.0, 62.0, 38.0, 45.0, 40.0, 27.0, 29.0, 14.0, 25.0, 7.0, 15.0, 8.0, 9.0, 6.0, 9.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.589557647705078e-06, -4.464760422706604e-06, -4.33996319770813e-06, -4.215165972709656e-06, -4.090368747711182e-06, -3.9655715227127075e-06, -3.840774297714233e-06, -3.7159770727157593e-06, -3.591179847717285e-06, -3.466382622718811e-06, -3.341585397720337e-06, -3.216788172721863e-06, -3.0919909477233887e-06, -2.9671937227249146e-06, -2.8423964977264404e-06, -2.7175992727279663e-06, -2.592802047729492e-06, -2.468004822731018e-06, -2.343207597732544e-06, -2.21841037273407e-06, -2.0936131477355957e-06, -1.9688159227371216e-06, -1.8440186977386475e-06, -1.7192214727401733e-06, -1.5944242477416992e-06, -1.469627022743225e-06, -1.344829797744751e-06, -1.2200325727462769e-06, -1.0952353477478027e-06, -9.704381227493286e-07, -8.456408977508545e-07, -7.208436727523804e-07, -5.960464477539062e-07, -4.7124922275543213e-07, -3.46451997756958e-07, -2.2165477275848389e-07, -9.685754776000977e-08, 2.7939677238464355e-08, 1.5273690223693848e-07, 2.775341272354126e-07, 4.023313522338867e-07, 5.271285772323608e-07, 6.51925802230835e-07, 7.767230272293091e-07, 9.015202522277832e-07, 1.0263174772262573e-06, 1.1511147022247314e-06, 1.2759119272232056e-06, 1.4007091522216797e-06, 1.5255063772201538e-06, 1.650303602218628e-06, 1.775100827217102e-06, 1.8998980522155762e-06, 2.0246952772140503e-06, 2.1494925022125244e-06, 2.2742897272109985e-06, 2.3990869522094727e-06, 2.5238841772079468e-06, 2.648681402206421e-06, 2.773478627204895e-06, 2.898275852203369e-06, 3.0230730772018433e-06, 3.1478703022003174e-06, 3.2726675271987915e-06, 3.3974647521972656e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 8.0, 11.0, 18.0, 23.0, 46.0, 73.0, 124.0, 251.0, 558.0, 1638.0, 7322.0, 75286.0, 826243.0, 123587.0, 10000.0, 2082.0, 663.0, 253.0, 142.0, 90.0, 52.0, 24.0, 19.0, 14.0, 6.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02142333984375, -0.020908117294311523, -0.020392894744873047, -0.01987767219543457, -0.019362449645996094, -0.018847227096557617, -0.01833200454711914, -0.017816781997680664, -0.017301559448242188, -0.01678633689880371, -0.016271114349365234, -0.015755891799926758, -0.015240669250488281, -0.014725446701049805, -0.014210224151611328, -0.013695001602172852, -0.013179779052734375, -0.012664556503295898, -0.012149333953857422, -0.011634111404418945, -0.011118888854980469, -0.010603666305541992, -0.010088443756103516, -0.009573221206665039, -0.009057998657226562, -0.008542776107788086, -0.00802755355834961, -0.007512331008911133, -0.006997108459472656, -0.00648188591003418, -0.005966663360595703, -0.0054514408111572266, -0.00493621826171875, -0.0044209957122802734, -0.003905773162841797, -0.0033905506134033203, -0.0028753280639648438, -0.002360105514526367, -0.0018448829650878906, -0.001329660415649414, -0.0008144378662109375, -0.00029921531677246094, 0.00021600723266601562, 0.0007312297821044922, 0.0012464523315429688, 0.0017616748809814453, 0.002276897430419922, 0.0027921199798583984, 0.003307342529296875, 0.0038225650787353516, 0.004337787628173828, 0.004853010177612305, 0.005368232727050781, 0.005883455276489258, 0.006398677825927734, 0.006913900375366211, 0.0074291229248046875, 0.007944345474243164, 0.00845956802368164, 0.008974790573120117, 0.009490013122558594, 0.01000523567199707, 0.010520458221435547, 0.011035680770874023, 0.0115509033203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 9.0, 10.0, 6.0, 18.0, 22.0, 22.0, 39.0, 53.0, 80.0, 81.0, 88.0, 91.0, 91.0, 79.0, 67.0, 57.0, 56.0, 25.0, 23.0, 19.0, 19.0, 15.0, 4.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0130462646484375, -0.012617707252502441, -0.012189149856567383, -0.011760592460632324, -0.011332035064697266, -0.010903477668762207, -0.010474920272827148, -0.01004636287689209, -0.009617805480957031, -0.009189248085021973, -0.008760690689086914, -0.008332133293151855, -0.007903575897216797, -0.007475018501281738, -0.00704646110534668, -0.006617903709411621, -0.0061893463134765625, -0.005760788917541504, -0.005332231521606445, -0.004903674125671387, -0.004475116729736328, -0.0040465593338012695, -0.003618001937866211, -0.0031894445419311523, -0.0027608871459960938, -0.002332329750061035, -0.0019037723541259766, -0.001475214958190918, -0.0010466575622558594, -0.0006181001663208008, -0.0001895427703857422, 0.0002390146255493164, 0.000667572021484375, 0.0010961294174194336, 0.0015246868133544922, 0.0019532442092895508, 0.0023818016052246094, 0.002810359001159668, 0.0032389163970947266, 0.003667473793029785, 0.004096031188964844, 0.004524588584899902, 0.004953145980834961, 0.0053817033767700195, 0.005810260772705078, 0.006238818168640137, 0.006667375564575195, 0.007095932960510254, 0.0075244903564453125, 0.007953047752380371, 0.00838160514831543, 0.008810162544250488, 0.009238719940185547, 0.009667277336120605, 0.010095834732055664, 0.010524392127990723, 0.010952949523925781, 0.01138150691986084, 0.011810064315795898, 0.012238621711730957, 0.012667179107666016, 0.013095736503601074, 0.013524293899536133, 0.013952851295471191, 0.01438140869140625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 15.0, 49.0, 93.0, 197.0, 302.0, 195.0, 92.0, 34.0, 11.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6209662556648254, -0.6053115129470825, -0.5896567702293396, -0.5740020275115967, -0.5583473443984985, -0.5426926016807556, -0.5270378589630127, -0.5113831162452698, -0.49572837352752686, -0.48007363080978394, -0.464418888092041, -0.4487641751766205, -0.43310943245887756, -0.41745468974113464, -0.4017999768257141, -0.3861452341079712, -0.37049049139022827, -0.35483574867248535, -0.33918100595474243, -0.3235262930393219, -0.307871550321579, -0.29221680760383606, -0.2765620946884155, -0.2609073519706726, -0.2452526092529297, -0.22959786653518677, -0.21394313871860504, -0.19828841090202332, -0.1826336681842804, -0.16697892546653748, -0.15132419764995575, -0.13566946983337402, -0.12001475691795349, -0.10436002165079117, -0.08870528638362885, -0.07305055111646652, -0.0573958158493042, -0.041741080582141876, -0.026086345314979553, -0.01043161004781723, 0.005223125219345093, 0.020877860486507416, 0.03653259575366974, 0.05218733102083206, 0.06784206628799438, 0.08349680155515671, 0.09915153682231903, 0.11480627208948135, 0.13046100735664368, 0.1461157500743866, 0.16177047789096832, 0.17742520570755005, 0.19307994842529297, 0.2087346911430359, 0.22438941895961761, 0.24004414677619934, 0.25569888949394226, 0.2713536322116852, 0.2870083451271057, 0.30266308784484863, 0.31831783056259155, 0.3339725732803345, 0.3496273159980774, 0.3652820289134979, 0.38093677163124084]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 7.0, 12.0, 9.0, 13.0, 12.0, 21.0, 16.0, 23.0, 18.0, 29.0, 35.0, 28.0, 33.0, 30.0, 37.0, 43.0, 52.0, 39.0, 53.0, 43.0, 44.0, 49.0, 39.0, 38.0, 46.0, 40.0, 31.0, 26.0, 19.0, 21.0, 19.0, 11.0, 7.0, 13.0, 9.0, 3.0, 7.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2847708463668823, -0.27509087324142456, -0.2654108703136444, -0.25573089718818665, -0.2460509091615677, -0.23637092113494873, -0.22669094800949097, -0.217010959982872, -0.20733097195625305, -0.1976509839296341, -0.18797099590301514, -0.17829102277755737, -0.16861103475093842, -0.15893104672431946, -0.1492510735988617, -0.13957108557224274, -0.12989109754562378, -0.12021110951900482, -0.11053112894296646, -0.1008511483669281, -0.09117116034030914, -0.08149117231369019, -0.07181119173765182, -0.062131211161613464, -0.05245122313499451, -0.04277123883366585, -0.03309125453233719, -0.02341127023100853, -0.01373128592967987, -0.0040513016283512115, 0.0056286826729774475, 0.015308663249015808, 0.024988651275634766, 0.034668635576963425, 0.044348619878292084, 0.05402860417962074, 0.0637085884809494, 0.07338857650756836, 0.08306855708360672, 0.09274853765964508, 0.10242852568626404, 0.112108513712883, 0.12178849428892136, 0.13146847486495972, 0.14114846289157867, 0.15082845091819763, 0.1605084240436554, 0.17018841207027435, 0.1798684000968933, 0.18954838812351227, 0.19922837615013123, 0.208908349275589, 0.21858833730220795, 0.2282683253288269, 0.23794829845428467, 0.24762828648090363, 0.2573082745075226, 0.26698824763298035, 0.2766682505607605, 0.28634822368621826, 0.296028196811676, 0.3057081997394562, 0.31538817286491394, 0.3250681757926941, 0.33474814891815186]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 12.0, 24.0, 68.0, 207.0, 928.0, 11557.0, 4034856.0, 142296.0, 3501.0, 536.0, 158.0, 73.0, 30.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1728515625, -0.16890335083007812, -0.16495513916015625, -0.16100692749023438, -0.1570587158203125, -0.15311050415039062, -0.14916229248046875, -0.14521408081054688, -0.141265869140625, -0.13731765747070312, -0.13336944580078125, -0.12942123413085938, -0.1254730224609375, -0.12152481079101562, -0.11757659912109375, -0.11362838745117188, -0.10968017578125, -0.10573196411132812, -0.10178375244140625, -0.09783554077148438, -0.0938873291015625, -0.08993911743164062, -0.08599090576171875, -0.08204269409179688, -0.078094482421875, -0.07414627075195312, -0.07019805908203125, -0.06624984741210938, -0.0623016357421875, -0.058353424072265625, -0.05440521240234375, -0.050457000732421875, -0.0465087890625, -0.042560577392578125, -0.03861236572265625, -0.034664154052734375, -0.0307159423828125, -0.026767730712890625, -0.02281951904296875, -0.018871307373046875, -0.014923095703125, -0.010974884033203125, -0.00702667236328125, -0.003078460693359375, 0.0008697509765625, 0.004817962646484375, 0.00876617431640625, 0.012714385986328125, 0.01666259765625, 0.020610809326171875, 0.02455902099609375, 0.028507232666015625, 0.0324554443359375, 0.036403656005859375, 0.04035186767578125, 0.044300079345703125, 0.048248291015625, 0.052196502685546875, 0.05614471435546875, 0.060092926025390625, 0.0640411376953125, 0.06798934936523438, 0.07193756103515625, 0.07588577270507812, 0.079833984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 14.0, 17.0, 33.0, 23.0, 40.0, 47.0, 46.0, 60.0, 52.0, 47.0, 54.0, 67.0, 60.0, 55.0, 68.0, 65.0, 51.0, 31.0, 31.0, 26.0, 22.0, 12.0, 9.0, 11.0, 8.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02685546875, -0.026024818420410156, -0.025194168090820312, -0.02436351776123047, -0.023532867431640625, -0.02270221710205078, -0.021871566772460938, -0.021040916442871094, -0.02021026611328125, -0.019379615783691406, -0.018548965454101562, -0.01771831512451172, -0.016887664794921875, -0.01605701446533203, -0.015226364135742188, -0.014395713806152344, -0.0135650634765625, -0.012734413146972656, -0.011903762817382812, -0.011073112487792969, -0.010242462158203125, -0.009411811828613281, -0.008581161499023438, -0.007750511169433594, -0.00691986083984375, -0.006089210510253906, -0.0052585601806640625, -0.004427909851074219, -0.003597259521484375, -0.0027666091918945312, -0.0019359588623046875, -0.0011053085327148438, -0.000274658203125, 0.0005559921264648438, 0.0013866424560546875, 0.0022172927856445312, 0.003047943115234375, 0.0038785934448242188, 0.0047092437744140625, 0.005539894104003906, 0.00637054443359375, 0.007201194763183594, 0.008031845092773438, 0.008862495422363281, 0.009693145751953125, 0.010523796081542969, 0.011354446411132812, 0.012185096740722656, 0.0130157470703125, 0.013846397399902344, 0.014677047729492188, 0.015507698059082031, 0.016338348388671875, 0.01716899871826172, 0.017999649047851562, 0.018830299377441406, 0.01966094970703125, 0.020491600036621094, 0.021322250366210938, 0.02215290069580078, 0.022983551025390625, 0.02381420135498047, 0.024644851684570312, 0.025475502014160156, 0.02630615234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 6.0, 12.0, 17.0, 8.0, 32.0, 36.0, 65.0, 105.0, 240.0, 887.0, 7617.0, 164874.0, 3988027.0, 29106.0, 2442.0, 405.0, 131.0, 78.0, 57.0, 33.0, 24.0, 17.0, 14.0, 7.0, 4.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0947265625, -0.09203910827636719, -0.08935165405273438, -0.08666419982910156, -0.08397674560546875, -0.08128929138183594, -0.07860183715820312, -0.07591438293457031, -0.0732269287109375, -0.07053947448730469, -0.06785202026367188, -0.06516456604003906, -0.06247711181640625, -0.05978965759277344, -0.057102203369140625, -0.05441474914550781, -0.051727294921875, -0.04903984069824219, -0.046352386474609375, -0.04366493225097656, -0.04097747802734375, -0.03829002380371094, -0.035602569580078125, -0.03291511535644531, -0.0302276611328125, -0.027540206909179688, -0.024852752685546875, -0.022165298461914062, -0.01947784423828125, -0.016790390014648438, -0.014102935791015625, -0.011415481567382812, -0.00872802734375, -0.0060405731201171875, -0.003353118896484375, -0.0006656646728515625, 0.00202178955078125, 0.0047092437744140625, 0.007396697998046875, 0.010084152221679688, 0.0127716064453125, 0.015459060668945312, 0.018146514892578125, 0.020833969116210938, 0.02352142333984375, 0.026208877563476562, 0.028896331787109375, 0.03158378601074219, 0.034271240234375, 0.03695869445800781, 0.039646148681640625, 0.04233360290527344, 0.04502105712890625, 0.04770851135253906, 0.050395965576171875, 0.05308341979980469, 0.0557708740234375, 0.05845832824707031, 0.061145782470703125, 0.06383323669433594, 0.06652069091796875, 0.06920814514160156, 0.07189559936523438, 0.07458305358886719, 0.0772705078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 1.0, 4.0, 11.0, 11.0, 18.0, 18.0, 12.0, 32.0, 40.0, 65.0, 244.0, 1039.0, 1781.0, 469.0, 129.0, 54.0, 29.0, 32.0, 20.0, 15.0, 8.0, 11.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048309326171875, -0.04659318923950195, -0.044877052307128906, -0.04316091537475586, -0.04144477844238281, -0.039728641510009766, -0.03801250457763672, -0.03629636764526367, -0.034580230712890625, -0.03286409378051758, -0.03114795684814453, -0.029431819915771484, -0.027715682983398438, -0.02599954605102539, -0.024283409118652344, -0.022567272186279297, -0.02085113525390625, -0.019134998321533203, -0.017418861389160156, -0.01570272445678711, -0.013986587524414062, -0.012270450592041016, -0.010554313659667969, -0.008838176727294922, -0.007122039794921875, -0.005405902862548828, -0.0036897659301757812, -0.0019736289978027344, -0.0002574920654296875, 0.0014586448669433594, 0.0031747817993164062, 0.004890918731689453, 0.0066070556640625, 0.008323192596435547, 0.010039329528808594, 0.01175546646118164, 0.013471603393554688, 0.015187740325927734, 0.01690387725830078, 0.018620014190673828, 0.020336151123046875, 0.022052288055419922, 0.02376842498779297, 0.025484561920166016, 0.027200698852539062, 0.02891683578491211, 0.030632972717285156, 0.0323491096496582, 0.03406524658203125, 0.0357813835144043, 0.037497520446777344, 0.03921365737915039, 0.04092979431152344, 0.042645931243896484, 0.04436206817626953, 0.04607820510864258, 0.047794342041015625, 0.04951047897338867, 0.05122661590576172, 0.052942752838134766, 0.05465888977050781, 0.05637502670288086, 0.058091163635253906, 0.05980730056762695, 0.0615234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 33.0, 260.0, 478.0, 178.0, 29.0, 9.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40531718730926514, -0.3804280757904053, -0.3555389642715454, -0.33064985275268555, -0.30576077103614807, -0.2808716595172882, -0.25598254799842834, -0.23109345138072968, -0.2062043398618698, -0.18131522834300995, -0.15642613172531128, -0.13153702020645142, -0.10664791613817215, -0.08175881206989288, -0.05686970055103302, -0.03198060393333435, -0.007091492414474487, 0.01779761351644993, 0.042686719447374344, 0.06757582724094391, 0.09246493130922318, 0.11735403537750244, 0.1422431468963623, 0.16713224351406097, 0.19202135503292084, 0.2169104665517807, 0.24179956316947937, 0.26668867468833923, 0.2915777862071991, 0.3164668679237366, 0.34135597944259644, 0.3662450909614563, 0.39113420248031616, 0.416023313999176, 0.4409124255180359, 0.46580153703689575, 0.4906906187534332, 0.5155797004699707, 0.5404688119888306, 0.5653579235076904, 0.5902470350265503, 0.6151361465454102, 0.64002525806427, 0.6649143695831299, 0.6898034811019897, 0.7146925926208496, 0.7395817041397095, 0.7644707560539246, 0.7893599271774292, 0.8142490386962891, 0.8391381502151489, 0.8640272617340088, 0.8889163732528687, 0.9138054847717285, 0.9386945962905884, 0.9635836482048035, 0.9884727597236633, 1.0133618116378784, 1.0382509231567383, 1.0631400346755981, 1.088029146194458, 1.1129182577133179, 1.1378073692321777, 1.1626964807510376, 1.1875855922698975]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 10.0, 9.0, 7.0, 8.0, 14.0, 10.0, 10.0, 18.0, 32.0, 19.0, 34.0, 30.0, 36.0, 26.0, 40.0, 47.0, 58.0, 53.0, 43.0, 48.0, 38.0, 51.0, 42.0, 37.0, 38.0, 35.0, 33.0, 19.0, 21.0, 30.0, 19.0, 13.0, 9.0, 23.0, 6.0, 10.0, 9.0, 9.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16657251119613647, -0.16070255637168884, -0.1548326164484024, -0.14896266162395477, -0.14309272170066833, -0.1372227668762207, -0.13135281205177307, -0.12548287212848663, -0.1196129247546196, -0.11374297738075256, -0.10787303000688553, -0.1020030826330185, -0.09613312780857086, -0.09026318788528442, -0.08439323306083679, -0.07852328568696976, -0.07265333831310272, -0.06678339093923569, -0.06091344356536865, -0.05504349246621132, -0.049173545092344284, -0.04330359771847725, -0.037433646619319916, -0.03156369924545288, -0.025693751871585846, -0.01982380449771881, -0.013953855261206627, -0.008083906024694443, -0.002213958650827408, 0.003655988723039627, 0.00952593982219696, 0.015395887196063995, 0.02126583456993103, 0.027135781943798065, 0.0330057293176651, 0.038875680416822433, 0.04474562779068947, 0.0506155751645565, 0.05648552626371384, 0.06235547363758087, 0.0682254210114479, 0.07409536838531494, 0.07996531575918198, 0.08583526313304901, 0.09170521795749664, 0.09757515788078308, 0.10344511270523071, 0.10931506007909775, 0.11518500745296478, 0.12105495482683182, 0.12692490220069885, 0.13279485702514648, 0.13866479694843292, 0.14453475177288055, 0.150404691696167, 0.15627464652061462, 0.16214460134506226, 0.1680145561695099, 0.17388449609279633, 0.17975445091724396, 0.1856243908405304, 0.19149434566497803, 0.19736430048942566, 0.2032342404127121, 0.20910418033599854]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 3.0, 10.0, 17.0, 17.0, 30.0, 45.0, 79.0, 121.0, 251.0, 617.0, 1665.0, 5816.0, 30988.0, 252803.0, 619317.0, 114968.0, 16293.0, 3464.0, 1114.0, 440.0, 199.0, 93.0, 69.0, 42.0, 16.0, 20.0, 11.0, 8.0, 8.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0556640625, -0.05394172668457031, -0.052219390869140625, -0.05049705505371094, -0.04877471923828125, -0.04705238342285156, -0.045330047607421875, -0.04360771179199219, -0.0418853759765625, -0.04016304016113281, -0.038440704345703125, -0.03671836853027344, -0.03499603271484375, -0.03327369689941406, -0.031551361083984375, -0.029829025268554688, -0.028106689453125, -0.026384353637695312, -0.024662017822265625, -0.022939682006835938, -0.02121734619140625, -0.019495010375976562, -0.017772674560546875, -0.016050338745117188, -0.0143280029296875, -0.012605667114257812, -0.010883331298828125, -0.009160995483398438, -0.00743865966796875, -0.0057163238525390625, -0.003993988037109375, -0.0022716522216796875, -0.00054931640625, 0.0011730194091796875, 0.002895355224609375, 0.0046176910400390625, 0.00634002685546875, 0.008062362670898438, 0.009784698486328125, 0.011507034301757812, 0.0132293701171875, 0.014951705932617188, 0.016674041748046875, 0.018396377563476562, 0.02011871337890625, 0.021841049194335938, 0.023563385009765625, 0.025285720825195312, 0.027008056640625, 0.028730392456054688, 0.030452728271484375, 0.03217506408691406, 0.03389739990234375, 0.03561973571777344, 0.037342071533203125, 0.03906440734863281, 0.0407867431640625, 0.04250907897949219, 0.044231414794921875, 0.04595375061035156, 0.04767608642578125, 0.04939842224121094, 0.051120758056640625, 0.05284309387207031, 0.0545654296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 7.0, 10.0, 26.0, 23.0, 33.0, 25.0, 46.0, 43.0, 66.0, 49.0, 58.0, 62.0, 57.0, 63.0, 59.0, 51.0, 67.0, 49.0, 47.0, 37.0, 21.0, 23.0, 14.0, 12.0, 8.0, 9.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0271148681640625, -0.026281356811523438, -0.025447845458984375, -0.024614334106445312, -0.02378082275390625, -0.022947311401367188, -0.022113800048828125, -0.021280288696289062, -0.02044677734375, -0.019613265991210938, -0.018779754638671875, -0.017946243286132812, -0.01711273193359375, -0.016279220581054688, -0.015445709228515625, -0.014612197875976562, -0.0137786865234375, -0.012945175170898438, -0.012111663818359375, -0.011278152465820312, -0.01044464111328125, -0.009611129760742188, -0.008777618408203125, -0.007944107055664062, -0.007110595703125, -0.0062770843505859375, -0.005443572998046875, -0.0046100616455078125, -0.00377655029296875, -0.0029430389404296875, -0.002109527587890625, -0.0012760162353515625, -0.0004425048828125, 0.0003910064697265625, 0.001224517822265625, 0.0020580291748046875, 0.00289154052734375, 0.0037250518798828125, 0.004558563232421875, 0.0053920745849609375, 0.0062255859375, 0.0070590972900390625, 0.007892608642578125, 0.008726119995117188, 0.00955963134765625, 0.010393142700195312, 0.011226654052734375, 0.012060165405273438, 0.0128936767578125, 0.013727188110351562, 0.014560699462890625, 0.015394210815429688, 0.01622772216796875, 0.017061233520507812, 0.017894744873046875, 0.018728256225585938, 0.019561767578125, 0.020395278930664062, 0.021228790283203125, 0.022062301635742188, 0.02289581298828125, 0.023729324340820312, 0.024562835693359375, 0.025396347045898438, 0.0262298583984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 13.0, 26.0, 22.0, 38.0, 40.0, 53.0, 89.0, 99.0, 174.0, 251.0, 390.0, 636.0, 1112.0, 2684.0, 9797.0, 90057.0, 763897.0, 158704.0, 13685.0, 3311.0, 1401.0, 732.0, 397.0, 278.0, 176.0, 126.0, 90.0, 65.0, 43.0, 38.0, 26.0, 16.0, 16.0, 8.0, 11.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.044677734375, -0.04321765899658203, -0.04175758361816406, -0.040297508239746094, -0.038837432861328125, -0.037377357482910156, -0.03591728210449219, -0.03445720672607422, -0.03299713134765625, -0.03153705596923828, -0.030076980590820312, -0.028616905212402344, -0.027156829833984375, -0.025696754455566406, -0.024236679077148438, -0.02277660369873047, -0.0213165283203125, -0.01985645294189453, -0.018396377563476562, -0.016936302185058594, -0.015476226806640625, -0.014016151428222656, -0.012556076049804688, -0.011096000671386719, -0.00963592529296875, -0.008175849914550781, -0.0067157745361328125, -0.005255699157714844, -0.003795623779296875, -0.0023355484008789062, -0.0008754730224609375, 0.0005846023559570312, 0.002044677734375, 0.0035047531127929688, 0.0049648284912109375, 0.006424903869628906, 0.007884979248046875, 0.009345054626464844, 0.010805130004882812, 0.012265205383300781, 0.01372528076171875, 0.015185356140136719, 0.016645431518554688, 0.018105506896972656, 0.019565582275390625, 0.021025657653808594, 0.022485733032226562, 0.02394580841064453, 0.0254058837890625, 0.02686595916748047, 0.028326034545898438, 0.029786109924316406, 0.031246185302734375, 0.032706260681152344, 0.03416633605957031, 0.03562641143798828, 0.03708648681640625, 0.03854656219482422, 0.04000663757324219, 0.041466712951660156, 0.042926788330078125, 0.044386863708496094, 0.04584693908691406, 0.04730701446533203, 0.04876708984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 1.0, 3.0, 9.0, 7.0, 7.0, 7.0, 14.0, 13.0, 13.0, 23.0, 21.0, 24.0, 17.0, 36.0, 30.0, 35.0, 30.0, 37.0, 44.0, 41.0, 30.0, 34.0, 53.0, 33.0, 43.0, 40.0, 38.0, 38.0, 33.0, 37.0, 22.0, 29.0, 26.0, 11.0, 18.0, 16.0, 18.0, 8.0, 6.0, 7.0, 8.0, 5.0, 6.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0], "bins": [-0.0577392578125, -0.05598640441894531, -0.054233551025390625, -0.05248069763183594, -0.05072784423828125, -0.04897499084472656, -0.047222137451171875, -0.04546928405761719, -0.0437164306640625, -0.04196357727050781, -0.040210723876953125, -0.03845787048339844, -0.03670501708984375, -0.03495216369628906, -0.033199310302734375, -0.03144645690917969, -0.029693603515625, -0.027940750122070312, -0.026187896728515625, -0.024435043334960938, -0.02268218994140625, -0.020929336547851562, -0.019176483154296875, -0.017423629760742188, -0.0156707763671875, -0.013917922973632812, -0.012165069580078125, -0.010412216186523438, -0.00865936279296875, -0.0069065093994140625, -0.005153656005859375, -0.0034008026123046875, -0.00164794921875, 0.0001049041748046875, 0.001857757568359375, 0.0036106109619140625, 0.00536346435546875, 0.0071163177490234375, 0.008869171142578125, 0.010622024536132812, 0.0123748779296875, 0.014127731323242188, 0.015880584716796875, 0.017633438110351562, 0.01938629150390625, 0.021139144897460938, 0.022891998291015625, 0.024644851684570312, 0.026397705078125, 0.028150558471679688, 0.029903411865234375, 0.03165626525878906, 0.03340911865234375, 0.03516197204589844, 0.036914825439453125, 0.03866767883300781, 0.0404205322265625, 0.04217338562011719, 0.043926239013671875, 0.04567909240722656, 0.04743194580078125, 0.04918479919433594, 0.050937652587890625, 0.05269050598144531, 0.054443359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 7.0, 5.0, 11.0, 17.0, 10.0, 20.0, 28.0, 38.0, 51.0, 82.0, 147.0, 269.0, 427.0, 820.0, 1912.0, 5617.0, 22870.0, 294987.0, 668884.0, 39525.0, 7767.0, 2558.0, 1094.0, 514.0, 328.0, 174.0, 103.0, 77.0, 51.0, 36.0, 21.0, 25.0, 20.0, 14.0, 9.0, 9.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0187530517578125, -0.0182037353515625, -0.0176544189453125, -0.0171051025390625, -0.0165557861328125, -0.0160064697265625, -0.0154571533203125, -0.0149078369140625, -0.0143585205078125, -0.0138092041015625, -0.0132598876953125, -0.0127105712890625, -0.0121612548828125, -0.0116119384765625, -0.0110626220703125, -0.0105133056640625, -0.0099639892578125, -0.0094146728515625, -0.0088653564453125, -0.0083160400390625, -0.0077667236328125, -0.0072174072265625, -0.0066680908203125, -0.0061187744140625, -0.0055694580078125, -0.0050201416015625, -0.0044708251953125, -0.0039215087890625, -0.0033721923828125, -0.0028228759765625, -0.0022735595703125, -0.0017242431640625, -0.0011749267578125, -0.0006256103515625, -7.62939453125e-05, 0.0004730224609375, 0.0010223388671875, 0.0015716552734375, 0.0021209716796875, 0.0026702880859375, 0.0032196044921875, 0.0037689208984375, 0.0043182373046875, 0.0048675537109375, 0.0054168701171875, 0.0059661865234375, 0.0065155029296875, 0.0070648193359375, 0.0076141357421875, 0.0081634521484375, 0.0087127685546875, 0.0092620849609375, 0.0098114013671875, 0.0103607177734375, 0.0109100341796875, 0.0114593505859375, 0.0120086669921875, 0.0125579833984375, 0.0131072998046875, 0.0136566162109375, 0.0142059326171875, 0.0147552490234375, 0.0153045654296875, 0.0158538818359375, 0.0164031982421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 10.0, 14.0, 22.0, 27.0, 31.0, 36.0, 50.0, 44.0, 73.0, 59.0, 76.0, 62.0, 100.0, 77.0, 57.0, 69.0, 33.0, 39.0, 30.0, 23.0, 14.0, 21.0, 9.0, 4.0, 8.0, 2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.377696990966797e-06, -6.168149411678314e-06, -5.9586018323898315e-06, -5.749054253101349e-06, -5.539506673812866e-06, -5.3299590945243835e-06, -5.120411515235901e-06, -4.910863935947418e-06, -4.7013163566589355e-06, -4.491768777370453e-06, -4.28222119808197e-06, -4.0726736187934875e-06, -3.863126039505005e-06, -3.6535784602165222e-06, -3.4440308809280396e-06, -3.234483301639557e-06, -3.0249357223510742e-06, -2.8153881430625916e-06, -2.605840563774109e-06, -2.3962929844856262e-06, -2.1867454051971436e-06, -1.977197825908661e-06, -1.7676502466201782e-06, -1.5581026673316956e-06, -1.3485550880432129e-06, -1.1390075087547302e-06, -9.294599294662476e-07, -7.199123501777649e-07, -5.103647708892822e-07, -3.0081719160079956e-07, -9.12696123123169e-08, 1.1827796697616577e-07, 3.2782554626464844e-07, 5.373731255531311e-07, 7.469207048416138e-07, 9.564682841300964e-07, 1.166015863418579e-06, 1.3755634427070618e-06, 1.5851110219955444e-06, 1.794658601284027e-06, 2.0042061805725098e-06, 2.2137537598609924e-06, 2.423301339149475e-06, 2.6328489184379578e-06, 2.8423964977264404e-06, 3.051944077014923e-06, 3.2614916563034058e-06, 3.4710392355918884e-06, 3.680586814880371e-06, 3.890134394168854e-06, 4.0996819734573364e-06, 4.309229552745819e-06, 4.518777132034302e-06, 4.7283247113227844e-06, 4.937872290611267e-06, 5.14741986989975e-06, 5.356967449188232e-06, 5.566515028476715e-06, 5.776062607765198e-06, 5.98561018705368e-06, 6.195157766342163e-06, 6.404705345630646e-06, 6.614252924919128e-06, 6.823800504207611e-06, 7.033348083496094e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 5.0, 10.0, 20.0, 21.0, 29.0, 41.0, 67.0, 110.0, 159.0, 287.0, 668.0, 1759.0, 7424.0, 91895.0, 874062.0, 63109.0, 6022.0, 1573.0, 547.0, 279.0, 162.0, 101.0, 55.0, 43.0, 25.0, 18.0, 13.0, 8.0, 11.0, 2.0, 6.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024383544921875, -0.023654460906982422, -0.022925376892089844, -0.022196292877197266, -0.021467208862304688, -0.02073812484741211, -0.02000904083251953, -0.019279956817626953, -0.018550872802734375, -0.017821788787841797, -0.01709270477294922, -0.01636362075805664, -0.015634536743164062, -0.014905452728271484, -0.014176368713378906, -0.013447284698486328, -0.01271820068359375, -0.011989116668701172, -0.011260032653808594, -0.010530948638916016, -0.009801864624023438, -0.00907278060913086, -0.008343696594238281, -0.007614612579345703, -0.006885528564453125, -0.006156444549560547, -0.005427360534667969, -0.004698276519775391, -0.0039691925048828125, -0.0032401084899902344, -0.0025110244750976562, -0.0017819404602050781, -0.0010528564453125, -0.0003237724304199219, 0.00040531158447265625, 0.0011343955993652344, 0.0018634796142578125, 0.0025925636291503906, 0.0033216476440429688, 0.004050731658935547, 0.004779815673828125, 0.005508899688720703, 0.006237983703613281, 0.006967067718505859, 0.0076961517333984375, 0.008425235748291016, 0.009154319763183594, 0.009883403778076172, 0.01061248779296875, 0.011341571807861328, 0.012070655822753906, 0.012799739837646484, 0.013528823852539062, 0.01425790786743164, 0.014986991882324219, 0.015716075897216797, 0.016445159912109375, 0.017174243927001953, 0.01790332794189453, 0.01863241195678711, 0.019361495971679688, 0.020090579986572266, 0.020819664001464844, 0.021548748016357422, 0.02227783203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 8.0, 7.0, 10.0, 10.0, 22.0, 34.0, 43.0, 34.0, 63.0, 59.0, 78.0, 75.0, 83.0, 80.0, 64.0, 66.0, 53.0, 39.0, 20.0, 22.0, 26.0, 26.0, 10.0, 13.0, 5.0, 8.0, 2.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01523590087890625, -0.0147627592086792, -0.014289617538452148, -0.013816475868225098, -0.013343334197998047, -0.012870192527770996, -0.012397050857543945, -0.011923909187316895, -0.011450767517089844, -0.010977625846862793, -0.010504484176635742, -0.010031342506408691, -0.00955820083618164, -0.00908505916595459, -0.008611917495727539, -0.008138775825500488, -0.0076656341552734375, -0.007192492485046387, -0.006719350814819336, -0.006246209144592285, -0.005773067474365234, -0.005299925804138184, -0.004826784133911133, -0.004353642463684082, -0.0038805007934570312, -0.0034073591232299805, -0.0029342174530029297, -0.002461075782775879, -0.001987934112548828, -0.0015147924423217773, -0.0010416507720947266, -0.0005685091018676758, -9.5367431640625e-05, 0.0003777742385864258, 0.0008509159088134766, 0.0013240575790405273, 0.0017971992492675781, 0.002270340919494629, 0.0027434825897216797, 0.0032166242599487305, 0.0036897659301757812, 0.004162907600402832, 0.004636049270629883, 0.005109190940856934, 0.005582332611083984, 0.006055474281311035, 0.006528615951538086, 0.007001757621765137, 0.0074748992919921875, 0.007948040962219238, 0.008421182632446289, 0.00889432430267334, 0.00936746597290039, 0.009840607643127441, 0.010313749313354492, 0.010786890983581543, 0.011260032653808594, 0.011733174324035645, 0.012206315994262695, 0.012679457664489746, 0.013152599334716797, 0.013625741004943848, 0.014098882675170898, 0.01457202434539795, 0.015045166015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 13.0, 13.0, 46.0, 153.0, 369.0, 302.0, 74.0, 23.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34949028491973877, -0.32884424924850464, -0.3081982135772705, -0.2875521779060364, -0.26690614223480225, -0.24626010656356812, -0.22561407089233398, -0.20496803522109985, -0.18432199954986572, -0.1636759638786316, -0.14302992820739746, -0.12238389253616333, -0.1017378568649292, -0.08109182119369507, -0.06044578552246094, -0.03979974985122681, -0.019153714179992676, 0.001492321491241455, 0.022138357162475586, 0.04278439283370972, 0.06343042850494385, 0.08407646417617798, 0.10472249984741211, 0.12536853551864624, 0.14601457118988037, 0.1666606068611145, 0.18730664253234863, 0.20795267820358276, 0.2285987138748169, 0.24924474954605103, 0.26989078521728516, 0.2905368208885193, 0.31118279695510864, 0.3318288326263428, 0.3524748682975769, 0.37312090396881104, 0.39376693964004517, 0.4144129753112793, 0.4350590109825134, 0.45570504665374756, 0.4763510823249817, 0.4969971179962158, 0.51764315366745, 0.5382891893386841, 0.5589352250099182, 0.5795812606811523, 0.6002272963523865, 0.6208733320236206, 0.6415193676948547, 0.6621654033660889, 0.682811439037323, 0.7034574747085571, 0.7241035103797913, 0.7447495460510254, 0.7653955817222595, 0.7860416173934937, 0.8066876530647278, 0.8273336887359619, 0.847979724407196, 0.8686257600784302, 0.8892717957496643, 0.9099178314208984, 0.9305638670921326, 0.9512099027633667, 0.9718559384346008]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 10.0, 9.0, 10.0, 8.0, 10.0, 20.0, 14.0, 15.0, 12.0, 30.0, 21.0, 31.0, 27.0, 49.0, 43.0, 36.0, 43.0, 57.0, 49.0, 61.0, 48.0, 40.0, 35.0, 42.0, 34.0, 40.0, 19.0, 29.0, 23.0, 21.0, 17.0, 11.0, 15.0, 7.0, 16.0, 4.0, 7.0, 8.0, 6.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.24312418699264526, -0.23563644289970398, -0.2281486988067627, -0.2206609547138214, -0.21317321062088013, -0.20568546652793884, -0.19819772243499756, -0.19070997834205627, -0.183222234249115, -0.1757344901561737, -0.16824674606323242, -0.16075900197029114, -0.15327125787734985, -0.14578351378440857, -0.13829576969146729, -0.130808025598526, -0.12332029640674591, -0.11583255231380463, -0.10834480822086334, -0.10085706412792206, -0.09336932003498077, -0.08588157594203949, -0.0783938392996788, -0.07090609520673752, -0.06341835111379623, -0.05593060702085495, -0.048442862927913666, -0.04095512256026268, -0.033467378467321396, -0.02597963437438011, -0.018491894006729126, -0.011004149913787842, -0.0035164058208465576, 0.003971337340772152, 0.011459080502390862, 0.018946822732686996, 0.02643456682562828, 0.033922310918569565, 0.04141005128622055, 0.048897795379161835, 0.05638553947210312, 0.0638732835650444, 0.07136102765798569, 0.07884876430034637, 0.08633650839328766, 0.09382425248622894, 0.10131199657917023, 0.10879974067211151, 0.1162874847650528, 0.12377522885799408, 0.13126297295093536, 0.13875071704387665, 0.14623846113681793, 0.15372620522975922, 0.1612139344215393, 0.1687016785144806, 0.17618942260742188, 0.18367716670036316, 0.19116491079330444, 0.19865265488624573, 0.206140398979187, 0.2136281430721283, 0.22111588716506958, 0.22860363125801086, 0.23609137535095215]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 20.0, 24.0, 79.0, 159.0, 320.0, 1222.0, 4191573.0, 467.0, 205.0, 97.0, 50.0, 23.0, 10.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.056640625, -2.0089797973632812, -1.9613189697265625, -1.9136581420898438, -1.865997314453125, -1.8183364868164062, -1.7706756591796875, -1.7230148315429688, -1.67535400390625, -1.6276931762695312, -1.5800323486328125, -1.5323715209960938, -1.484710693359375, -1.4370498657226562, -1.3893890380859375, -1.3417282104492188, -1.2940673828125, -1.2464065551757812, -1.1987457275390625, -1.1510848999023438, -1.103424072265625, -1.0557632446289062, -1.0081024169921875, -0.9604415893554688, -0.91278076171875, -0.8651199340820312, -0.8174591064453125, -0.7697982788085938, -0.722137451171875, -0.6744766235351562, -0.6268157958984375, -0.5791549682617188, -0.531494140625, -0.48383331298828125, -0.4361724853515625, -0.38851165771484375, -0.340850830078125, -0.29319000244140625, -0.2455291748046875, -0.19786834716796875, -0.15020751953125, -0.10254669189453125, -0.0548858642578125, -0.00722503662109375, 0.040435791015625, 0.08809661865234375, 0.1357574462890625, 0.18341827392578125, 0.2310791015625, 0.27873992919921875, 0.3264007568359375, 0.37406158447265625, 0.421722412109375, 0.46938323974609375, 0.5170440673828125, 0.5647048950195312, 0.61236572265625, 0.6600265502929688, 0.7076873779296875, 0.7553482055664062, 0.803009033203125, 0.8506698608398438, 0.8983306884765625, 0.9459915161132812, 0.99365234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 7.0, 8.0, 4.0, 19.0, 21.0, 22.0, 30.0, 34.0, 51.0, 57.0, 61.0, 67.0, 70.0, 62.0, 69.0, 75.0, 68.0, 63.0, 41.0, 58.0, 28.0, 23.0, 16.0, 14.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0307769775390625, -0.029887914657592773, -0.028998851776123047, -0.02810978889465332, -0.027220726013183594, -0.026331663131713867, -0.02544260025024414, -0.024553537368774414, -0.023664474487304688, -0.02277541160583496, -0.021886348724365234, -0.020997285842895508, -0.02010822296142578, -0.019219160079956055, -0.018330097198486328, -0.0174410343170166, -0.016551971435546875, -0.01566290855407715, -0.014773845672607422, -0.013884782791137695, -0.012995719909667969, -0.012106657028198242, -0.011217594146728516, -0.010328531265258789, -0.009439468383789062, -0.008550405502319336, -0.007661342620849609, -0.006772279739379883, -0.005883216857910156, -0.00499415397644043, -0.004105091094970703, -0.0032160282135009766, -0.00232696533203125, -0.0014379024505615234, -0.0005488395690917969, 0.0003402233123779297, 0.0012292861938476562, 0.002118349075317383, 0.0030074119567871094, 0.003896474838256836, 0.0047855377197265625, 0.005674600601196289, 0.006563663482666016, 0.007452726364135742, 0.008341789245605469, 0.009230852127075195, 0.010119915008544922, 0.011008977890014648, 0.011898040771484375, 0.012787103652954102, 0.013676166534423828, 0.014565229415893555, 0.015454292297363281, 0.016343355178833008, 0.017232418060302734, 0.01812148094177246, 0.019010543823242188, 0.019899606704711914, 0.02078866958618164, 0.021677732467651367, 0.022566795349121094, 0.02345585823059082, 0.024344921112060547, 0.025233983993530273, 0.026123046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 9.0, 16.0, 19.0, 45.0, 93.0, 269.0, 2088.0, 491835.0, 3694913.0, 4275.0, 390.0, 151.0, 74.0, 51.0, 26.0, 20.0, 9.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.1900625228881836, -0.1855449676513672, -0.18102741241455078, -0.17650985717773438, -0.17199230194091797, -0.16747474670410156, -0.16295719146728516, -0.15843963623046875, -0.15392208099365234, -0.14940452575683594, -0.14488697052001953, -0.14036941528320312, -0.13585186004638672, -0.1313343048095703, -0.1268167495727539, -0.1222991943359375, -0.1177816390991211, -0.11326408386230469, -0.10874652862548828, -0.10422897338867188, -0.09971141815185547, -0.09519386291503906, -0.09067630767822266, -0.08615875244140625, -0.08164119720458984, -0.07712364196777344, -0.07260608673095703, -0.06808853149414062, -0.06357097625732422, -0.05905342102050781, -0.054535865783691406, -0.050018310546875, -0.045500755310058594, -0.04098320007324219, -0.03646564483642578, -0.031948089599609375, -0.02743053436279297, -0.022912979125976562, -0.018395423889160156, -0.01387786865234375, -0.009360313415527344, -0.0048427581787109375, -0.00032520294189453125, 0.004192352294921875, 0.008709907531738281, 0.013227462768554688, 0.017745018005371094, 0.0222625732421875, 0.026780128479003906, 0.03129768371582031, 0.03581523895263672, 0.040332794189453125, 0.04485034942626953, 0.04936790466308594, 0.053885459899902344, 0.05840301513671875, 0.06292057037353516, 0.06743812561035156, 0.07195568084716797, 0.07647323608398438, 0.08099079132080078, 0.08550834655761719, 0.0900259017944336, 0.09454345703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 11.0, 33.0, 48.0, 164.0, 813.0, 2177.0, 556.0, 134.0, 51.0, 29.0, 15.0, 13.0, 8.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044677734375, -0.042484283447265625, -0.04029083251953125, -0.038097381591796875, -0.0359039306640625, -0.033710479736328125, -0.03151702880859375, -0.029323577880859375, -0.027130126953125, -0.024936676025390625, -0.02274322509765625, -0.020549774169921875, -0.0183563232421875, -0.016162872314453125, -0.01396942138671875, -0.011775970458984375, -0.00958251953125, -0.007389068603515625, -0.00519561767578125, -0.003002166748046875, -0.0008087158203125, 0.001384735107421875, 0.00357818603515625, 0.005771636962890625, 0.007965087890625, 0.010158538818359375, 0.01235198974609375, 0.014545440673828125, 0.0167388916015625, 0.018932342529296875, 0.02112579345703125, 0.023319244384765625, 0.0255126953125, 0.027706146240234375, 0.02989959716796875, 0.032093048095703125, 0.0342864990234375, 0.036479949951171875, 0.03867340087890625, 0.040866851806640625, 0.043060302734375, 0.045253753662109375, 0.04744720458984375, 0.049640655517578125, 0.0518341064453125, 0.054027557373046875, 0.05622100830078125, 0.058414459228515625, 0.06060791015625, 0.06280136108398438, 0.06499481201171875, 0.06718826293945312, 0.0693817138671875, 0.07157516479492188, 0.07376861572265625, 0.07596206665039062, 0.078155517578125, 0.08034896850585938, 0.08254241943359375, 0.08473587036132812, 0.0869293212890625, 0.08912277221679688, 0.09131622314453125, 0.09350967407226562, 0.095703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 8.0, 39.0, 124.0, 290.0, 294.0, 153.0, 41.0, 18.0, 11.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2759837508201599, -0.2606286108493805, -0.24527345597743988, -0.22991830110549927, -0.21456316113471985, -0.19920802116394043, -0.18385286629199982, -0.1684977114200592, -0.15314257144927979, -0.13778743147850037, -0.12243227660655975, -0.10707712918519974, -0.09172198176383972, -0.0763668343424797, -0.06101168692111969, -0.045656539499759674, -0.030301392078399658, -0.014946244657039642, 0.00040890276432037354, 0.01576405018568039, 0.031119197607040405, 0.04647434502840042, 0.06182949244976044, 0.07718463987112045, 0.09253978729248047, 0.10789493471384048, 0.1232500821352005, 0.1386052370071411, 0.15396037697792053, 0.16931551694869995, 0.18467067182064056, 0.20002582669258118, 0.2153809666633606, 0.23073610663414001, 0.24609126150608063, 0.26144641637802124, 0.27680155634880066, 0.2921566963195801, 0.3075118660926819, 0.3228670060634613, 0.3382221460342407, 0.35357728600502014, 0.36893242597579956, 0.38428759574890137, 0.3996427357196808, 0.4149978756904602, 0.430353045463562, 0.44570818543434143, 0.46106332540512085, 0.47641846537590027, 0.4917736053466797, 0.5071287751197815, 0.5224839448928833, 0.5378390550613403, 0.5531942248344421, 0.5685493350028992, 0.583904504776001, 0.5992596745491028, 0.6146147847175598, 0.6299699544906616, 0.6453250646591187, 0.6606802344322205, 0.6760354042053223, 0.6913905143737793, 0.7067456841468811]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 2.0, 7.0, 8.0, 5.0, 11.0, 16.0, 16.0, 22.0, 17.0, 19.0, 34.0, 31.0, 38.0, 38.0, 41.0, 43.0, 54.0, 54.0, 54.0, 53.0, 56.0, 52.0, 39.0, 37.0, 31.0, 38.0, 39.0, 31.0, 24.0, 22.0, 14.0, 11.0, 9.0, 5.0, 8.0, 8.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.18403828144073486, -0.17900219559669495, -0.17396612465381622, -0.1689300388097763, -0.16389396786689758, -0.15885788202285767, -0.15382179617881775, -0.14878571033477783, -0.1437496393918991, -0.1387135535478592, -0.13367748260498047, -0.12864139676094055, -0.12360531836748123, -0.11856923997402191, -0.113533154129982, -0.10849707573652267, -0.10346099734306335, -0.09842491894960403, -0.09338884055614471, -0.0883527547121048, -0.08331667631864548, -0.07828059792518616, -0.07324451208114624, -0.06820843368768692, -0.0631723552942276, -0.05813627690076828, -0.05310019478201866, -0.04806411266326904, -0.04302803426980972, -0.0379919558763504, -0.032955873757600784, -0.027919791638851166, -0.022883713245391846, -0.017847632989287376, -0.012811552733182907, -0.007775472477078438, -0.0027393922209739685, 0.002296688035130501, 0.00733276829123497, 0.012368850409984589, 0.01740492880344391, 0.022441009059548378, 0.027477089315652847, 0.032513171434402466, 0.037549249827861786, 0.042585328221321106, 0.047621410340070724, 0.05265749245882034, 0.05769357085227966, 0.06272964924573898, 0.0677657276391983, 0.07280181348323822, 0.07783789187669754, 0.08287397027015686, 0.08791005611419678, 0.0929461345076561, 0.09798221290111542, 0.10301829129457474, 0.10805436968803406, 0.11309045553207397, 0.1181265339255333, 0.12316261231899261, 0.12819869816303253, 0.13323476910591125, 0.13827085494995117]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 9.0, 11.0, 13.0, 21.0, 29.0, 44.0, 68.0, 117.0, 229.0, 564.0, 1546.0, 5489.0, 97630.0, 915539.0, 22037.0, 3305.0, 993.0, 412.0, 189.0, 91.0, 67.0, 37.0, 19.0, 16.0, 16.0, 9.0, 7.0, 10.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.18505859375, -0.1800994873046875, -0.175140380859375, -0.1701812744140625, -0.16522216796875, -0.1602630615234375, -0.155303955078125, -0.1503448486328125, -0.1453857421875, -0.1404266357421875, -0.135467529296875, -0.1305084228515625, -0.12554931640625, -0.1205902099609375, -0.115631103515625, -0.1106719970703125, -0.105712890625, -0.1007537841796875, -0.095794677734375, -0.0908355712890625, -0.08587646484375, -0.0809173583984375, -0.075958251953125, -0.0709991455078125, -0.0660400390625, -0.0610809326171875, -0.056121826171875, -0.0511627197265625, -0.04620361328125, -0.0412445068359375, -0.036285400390625, -0.0313262939453125, -0.0263671875, -0.0214080810546875, -0.016448974609375, -0.0114898681640625, -0.00653076171875, -0.0015716552734375, 0.003387451171875, 0.0083465576171875, 0.0133056640625, 0.0182647705078125, 0.023223876953125, 0.0281829833984375, 0.03314208984375, 0.0381011962890625, 0.043060302734375, 0.0480194091796875, 0.052978515625, 0.0579376220703125, 0.062896728515625, 0.0678558349609375, 0.07281494140625, 0.0777740478515625, 0.082733154296875, 0.0876922607421875, 0.0926513671875, 0.0976104736328125, 0.102569580078125, 0.1075286865234375, 0.11248779296875, 0.1174468994140625, 0.122406005859375, 0.1273651123046875, 0.13232421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 8.0, 11.0, 10.0, 14.0, 25.0, 21.0, 37.0, 61.0, 56.0, 67.0, 70.0, 64.0, 75.0, 57.0, 86.0, 68.0, 54.0, 48.0, 39.0, 37.0, 20.0, 21.0, 12.0, 4.0, 6.0, 4.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.031097412109375, -0.030173540115356445, -0.02924966812133789, -0.028325796127319336, -0.02740192413330078, -0.026478052139282227, -0.025554180145263672, -0.024630308151245117, -0.023706436157226562, -0.022782564163208008, -0.021858692169189453, -0.0209348201751709, -0.020010948181152344, -0.01908707618713379, -0.018163204193115234, -0.01723933219909668, -0.016315460205078125, -0.01539158821105957, -0.014467716217041016, -0.013543844223022461, -0.012619972229003906, -0.011696100234985352, -0.010772228240966797, -0.009848356246948242, -0.008924484252929688, -0.008000612258911133, -0.007076740264892578, -0.0061528682708740234, -0.005228996276855469, -0.004305124282836914, -0.0033812522888183594, -0.0024573802947998047, -0.00153350830078125, -0.0006096363067626953, 0.0003142356872558594, 0.001238107681274414, 0.0021619796752929688, 0.0030858516693115234, 0.004009723663330078, 0.004933595657348633, 0.0058574676513671875, 0.006781339645385742, 0.007705211639404297, 0.008629083633422852, 0.009552955627441406, 0.010476827621459961, 0.011400699615478516, 0.01232457160949707, 0.013248443603515625, 0.01417231559753418, 0.015096187591552734, 0.01602005958557129, 0.016943931579589844, 0.0178678035736084, 0.018791675567626953, 0.019715547561645508, 0.020639419555664062, 0.021563291549682617, 0.022487163543701172, 0.023411035537719727, 0.02433490753173828, 0.025258779525756836, 0.02618265151977539, 0.027106523513793945, 0.0280303955078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 6.0, 5.0, 9.0, 7.0, 15.0, 14.0, 18.0, 37.0, 47.0, 56.0, 84.0, 133.0, 193.0, 360.0, 656.0, 1366.0, 3306.0, 10186.0, 51607.0, 421768.0, 486707.0, 54858.0, 10655.0, 3363.0, 1366.0, 651.0, 382.0, 236.0, 125.0, 108.0, 56.0, 47.0, 26.0, 12.0, 20.0, 9.0, 12.0, 9.0, 8.0, 9.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0543212890625, -0.052813053131103516, -0.05130481719970703, -0.04979658126831055, -0.04828834533691406, -0.04678010940551758, -0.045271873474121094, -0.04376363754272461, -0.042255401611328125, -0.04074716567993164, -0.039238929748535156, -0.03773069381713867, -0.03622245788574219, -0.0347142219543457, -0.03320598602294922, -0.031697750091552734, -0.03018951416015625, -0.028681278228759766, -0.02717304229736328, -0.025664806365966797, -0.024156570434570312, -0.022648334503173828, -0.021140098571777344, -0.01963186264038086, -0.018123626708984375, -0.01661539077758789, -0.015107154846191406, -0.013598918914794922, -0.012090682983398438, -0.010582447052001953, -0.009074211120605469, -0.007565975189208984, -0.0060577392578125, -0.004549503326416016, -0.0030412673950195312, -0.0015330314636230469, -2.47955322265625e-05, 0.0014834403991699219, 0.0029916763305664062, 0.004499912261962891, 0.006008148193359375, 0.007516384124755859, 0.009024620056152344, 0.010532855987548828, 0.012041091918945312, 0.013549327850341797, 0.015057563781738281, 0.016565799713134766, 0.01807403564453125, 0.019582271575927734, 0.02109050750732422, 0.022598743438720703, 0.024106979370117188, 0.025615215301513672, 0.027123451232910156, 0.02863168716430664, 0.030139923095703125, 0.03164815902709961, 0.033156394958496094, 0.03466463088989258, 0.03617286682128906, 0.03768110275268555, 0.03918933868408203, 0.040697574615478516, 0.042205810546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 8.0, 4.0, 5.0, 10.0, 13.0, 24.0, 10.0, 18.0, 25.0, 29.0, 23.0, 38.0, 21.0, 35.0, 32.0, 48.0, 45.0, 45.0, 45.0, 38.0, 47.0, 45.0, 47.0, 37.0, 30.0, 40.0, 42.0, 19.0, 24.0, 30.0, 37.0, 14.0, 17.0, 5.0, 13.0, 16.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.061798095703125, -0.05991315841674805, -0.058028221130371094, -0.05614328384399414, -0.05425834655761719, -0.052373409271240234, -0.05048847198486328, -0.04860353469848633, -0.046718597412109375, -0.04483366012573242, -0.04294872283935547, -0.041063785552978516, -0.03917884826660156, -0.03729391098022461, -0.035408973693847656, -0.0335240364074707, -0.03163909912109375, -0.029754161834716797, -0.027869224548339844, -0.02598428726196289, -0.024099349975585938, -0.022214412689208984, -0.02032947540283203, -0.018444538116455078, -0.016559600830078125, -0.014674663543701172, -0.012789726257324219, -0.010904788970947266, -0.009019851684570312, -0.007134914398193359, -0.005249977111816406, -0.003365039825439453, -0.0014801025390625, 0.0004048347473144531, 0.0022897720336914062, 0.004174709320068359, 0.0060596466064453125, 0.007944583892822266, 0.009829521179199219, 0.011714458465576172, 0.013599395751953125, 0.015484333038330078, 0.01736927032470703, 0.019254207611083984, 0.021139144897460938, 0.02302408218383789, 0.024909019470214844, 0.026793956756591797, 0.02867889404296875, 0.030563831329345703, 0.032448768615722656, 0.03433370590209961, 0.03621864318847656, 0.038103580474853516, 0.03998851776123047, 0.04187345504760742, 0.043758392333984375, 0.04564332962036133, 0.04752826690673828, 0.049413204193115234, 0.05129814147949219, 0.05318307876586914, 0.055068016052246094, 0.05695295333862305, 0.058837890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 5.0, 1.0, 9.0, 3.0, 10.0, 17.0, 9.0, 25.0, 37.0, 57.0, 97.0, 122.0, 218.0, 401.0, 759.0, 1515.0, 3762.0, 10311.0, 52297.0, 874042.0, 83996.0, 12740.0, 4261.0, 1834.0, 896.0, 458.0, 232.0, 158.0, 87.0, 58.0, 33.0, 23.0, 19.0, 14.0, 11.0, 12.0, 3.0, 8.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040008544921875, -0.03865623474121094, -0.037303924560546875, -0.03595161437988281, -0.03459930419921875, -0.03324699401855469, -0.031894683837890625, -0.030542373657226562, -0.0291900634765625, -0.027837753295898438, -0.026485443115234375, -0.025133132934570312, -0.02378082275390625, -0.022428512573242188, -0.021076202392578125, -0.019723892211914062, -0.01837158203125, -0.017019271850585938, -0.015666961669921875, -0.014314651489257812, -0.01296234130859375, -0.011610031127929688, -0.010257720947265625, -0.008905410766601562, -0.0075531005859375, -0.0062007904052734375, -0.004848480224609375, -0.0034961700439453125, -0.00214385986328125, -0.0007915496826171875, 0.000560760498046875, 0.0019130706787109375, 0.003265380859375, 0.0046176910400390625, 0.005970001220703125, 0.0073223114013671875, 0.00867462158203125, 0.010026931762695312, 0.011379241943359375, 0.012731552124023438, 0.0140838623046875, 0.015436172485351562, 0.016788482666015625, 0.018140792846679688, 0.01949310302734375, 0.020845413208007812, 0.022197723388671875, 0.023550033569335938, 0.02490234375, 0.026254653930664062, 0.027606964111328125, 0.028959274291992188, 0.03031158447265625, 0.03166389465332031, 0.033016204833984375, 0.03436851501464844, 0.0357208251953125, 0.03707313537597656, 0.038425445556640625, 0.03977775573730469, 0.04113006591796875, 0.04248237609863281, 0.043834686279296875, 0.04518699645996094, 0.046539306640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 7.0, 19.0, 24.0, 99.0, 157.0, 238.0, 186.0, 138.0, 57.0, 28.0, 19.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.682209014892578e-05, -2.6073306798934937e-05, -2.5324523448944092e-05, -2.4575740098953247e-05, -2.3826956748962402e-05, -2.3078173398971558e-05, -2.2329390048980713e-05, -2.1580606698989868e-05, -2.0831823348999023e-05, -2.008303999900818e-05, -1.9334256649017334e-05, -1.858547329902649e-05, -1.7836689949035645e-05, -1.70879065990448e-05, -1.6339123249053955e-05, -1.559033989906311e-05, -1.4841556549072266e-05, -1.4092773199081421e-05, -1.3343989849090576e-05, -1.2595206499099731e-05, -1.1846423149108887e-05, -1.1097639799118042e-05, -1.0348856449127197e-05, -9.600073099136353e-06, -8.851289749145508e-06, -8.102506399154663e-06, -7.353723049163818e-06, -6.604939699172974e-06, -5.856156349182129e-06, -5.107372999191284e-06, -4.3585896492004395e-06, -3.6098062992095947e-06, -2.86102294921875e-06, -2.1122395992279053e-06, -1.3634562492370605e-06, -6.146728992462158e-07, 1.341104507446289e-07, 8.828938007354736e-07, 1.6316771507263184e-06, 2.380460500717163e-06, 3.129243850708008e-06, 3.8780272006988525e-06, 4.626810550689697e-06, 5.375593900680542e-06, 6.124377250671387e-06, 6.8731606006622314e-06, 7.621943950653076e-06, 8.370727300643921e-06, 9.119510650634766e-06, 9.86829400062561e-06, 1.0617077350616455e-05, 1.13658607006073e-05, 1.2114644050598145e-05, 1.286342740058899e-05, 1.3612210750579834e-05, 1.4360994100570679e-05, 1.5109777450561523e-05, 1.5858560800552368e-05, 1.6607344150543213e-05, 1.7356127500534058e-05, 1.8104910850524902e-05, 1.8853694200515747e-05, 1.9602477550506592e-05, 2.0351260900497437e-05, 2.110004425048828e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 6.0, 7.0, 10.0, 6.0, 28.0, 34.0, 40.0, 60.0, 89.0, 139.0, 301.0, 557.0, 1254.0, 3059.0, 9243.0, 48572.0, 710050.0, 242283.0, 23119.0, 5721.0, 2052.0, 884.0, 418.0, 227.0, 126.0, 79.0, 61.0, 35.0, 22.0, 18.0, 17.0, 12.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034942626953125, -0.03387737274169922, -0.03281211853027344, -0.031746864318847656, -0.030681610107421875, -0.029616355895996094, -0.028551101684570312, -0.02748584747314453, -0.02642059326171875, -0.02535533905029297, -0.024290084838867188, -0.023224830627441406, -0.022159576416015625, -0.021094322204589844, -0.020029067993164062, -0.01896381378173828, -0.0178985595703125, -0.01683330535888672, -0.015768051147460938, -0.014702796936035156, -0.013637542724609375, -0.012572288513183594, -0.011507034301757812, -0.010441780090332031, -0.00937652587890625, -0.008311271667480469, -0.0072460174560546875, -0.006180763244628906, -0.005115509033203125, -0.004050254821777344, -0.0029850006103515625, -0.0019197463989257812, -0.0008544921875, 0.00021076202392578125, 0.0012760162353515625, 0.0023412704467773438, 0.003406524658203125, 0.004471778869628906, 0.0055370330810546875, 0.006602287292480469, 0.00766754150390625, 0.008732795715332031, 0.009798049926757812, 0.010863304138183594, 0.011928558349609375, 0.012993812561035156, 0.014059066772460938, 0.015124320983886719, 0.0161895751953125, 0.01725482940673828, 0.018320083618164062, 0.019385337829589844, 0.020450592041015625, 0.021515846252441406, 0.022581100463867188, 0.02364635467529297, 0.02471160888671875, 0.02577686309814453, 0.026842117309570312, 0.027907371520996094, 0.028972625732421875, 0.030037879943847656, 0.031103134155273438, 0.03216838836669922, 0.033233642578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 6.0, 4.0, 5.0, 11.0, 4.0, 10.0, 18.0, 11.0, 19.0, 32.0, 25.0, 47.0, 61.0, 60.0, 93.0, 89.0, 85.0, 97.0, 72.0, 48.0, 43.0, 46.0, 31.0, 17.0, 10.0, 16.0, 7.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022247314453125, -0.021552562713623047, -0.020857810974121094, -0.02016305923461914, -0.019468307495117188, -0.018773555755615234, -0.01807880401611328, -0.017384052276611328, -0.016689300537109375, -0.015994548797607422, -0.015299797058105469, -0.014605045318603516, -0.013910293579101562, -0.01321554183959961, -0.012520790100097656, -0.011826038360595703, -0.01113128662109375, -0.010436534881591797, -0.009741783142089844, -0.00904703140258789, -0.008352279663085938, -0.007657527923583984, -0.006962776184082031, -0.006268024444580078, -0.005573272705078125, -0.004878520965576172, -0.004183769226074219, -0.0034890174865722656, -0.0027942657470703125, -0.0020995140075683594, -0.0014047622680664062, -0.0007100105285644531, -1.52587890625e-05, 0.0006794929504394531, 0.0013742446899414062, 0.0020689964294433594, 0.0027637481689453125, 0.0034584999084472656, 0.004153251647949219, 0.004848003387451172, 0.005542755126953125, 0.006237506866455078, 0.006932258605957031, 0.007627010345458984, 0.008321762084960938, 0.00901651382446289, 0.009711265563964844, 0.010406017303466797, 0.01110076904296875, 0.011795520782470703, 0.012490272521972656, 0.01318502426147461, 0.013879776000976562, 0.014574527740478516, 0.015269279479980469, 0.015964031219482422, 0.016658782958984375, 0.017353534698486328, 0.01804828643798828, 0.018743038177490234, 0.019437789916992188, 0.02013254165649414, 0.020827293395996094, 0.021522045135498047, 0.022216796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 18.0, 35.0, 76.0, 244.0, 464.0, 134.0, 19.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3096916675567627, -1.2764331102371216, -1.2431745529174805, -1.2099159955978394, -1.1766574382781982, -1.1433990001678467, -1.1101404428482056, -1.0768818855285645, -1.0436233282089233, -1.0103647708892822, -0.9771062135696411, -0.9438477158546448, -0.9105891585350037, -0.8773306012153625, -0.8440721035003662, -0.8108135461807251, -0.777554988861084, -0.7442964315414429, -0.7110378742218018, -0.6777793765068054, -0.6445208191871643, -0.6112622618675232, -0.5780037641525269, -0.5447452068328857, -0.5114866495132446, -0.4782280921936035, -0.4449695646762848, -0.41171103715896606, -0.37845247983932495, -0.34519392251968384, -0.3119353950023651, -0.2786768674850464, -0.24541842937469482, -0.2121598869562149, -0.17890134453773499, -0.14564280211925507, -0.11238425970077515, -0.07912571728229523, -0.04586717486381531, -0.012608632445335388, 0.02064990997314453, 0.05390845239162445, 0.08716699481010437, 0.12042553722858429, 0.1536840796470642, 0.18694262206554413, 0.22020116448402405, 0.2534596920013428, 0.2867182493209839, 0.319976806640625, 0.3532353341579437, 0.38649386167526245, 0.41975241899490356, 0.4530109763145447, 0.4862695038318634, 0.5195280313491821, 0.5527865886688232, 0.5860451459884644, 0.6193037033081055, 0.6525622010231018, 0.6858207583427429, 0.719079315662384, 0.7523378133773804, 0.7855963706970215, 0.8188549280166626]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 6.0, 9.0, 10.0, 10.0, 13.0, 11.0, 18.0, 17.0, 26.0, 34.0, 29.0, 42.0, 45.0, 45.0, 52.0, 54.0, 50.0, 74.0, 63.0, 56.0, 51.0, 43.0, 30.0, 35.0, 29.0, 36.0, 19.0, 12.0, 16.0, 17.0, 10.0, 13.0, 7.0, 5.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2323240041732788, -0.22319872677326202, -0.21407346427440643, -0.20494818687438965, -0.19582292437553406, -0.18669764697551727, -0.1775723695755005, -0.1684471070766449, -0.1593218445777893, -0.15019656717777252, -0.14107130467891693, -0.13194602727890015, -0.12282076478004456, -0.11369548738002777, -0.10457021743059158, -0.0954449474811554, -0.08631967008113861, -0.07719440013170242, -0.06806913018226624, -0.05894385650753975, -0.04981858655810356, -0.040693316608667374, -0.03156804293394089, -0.0224427729845047, -0.013317503035068512, -0.00419223215430975, 0.004933038726449013, 0.01405831053853035, 0.023183580487966537, 0.032308850437402725, 0.04143412411212921, 0.0505593940615654, 0.05968466401100159, 0.06880993396043777, 0.07793520390987396, 0.08706048130989075, 0.09618574380874634, 0.10531102120876312, 0.11443629115819931, 0.1235615611076355, 0.1326868236064911, 0.14181210100650787, 0.15093736350536346, 0.16006264090538025, 0.16918790340423584, 0.17831318080425262, 0.1874384582042694, 0.196563720703125, 0.20568899810314178, 0.21481427550315857, 0.22393953800201416, 0.23306481540203094, 0.24219007790088654, 0.2513153553009033, 0.2604406177997589, 0.2695658802986145, 0.2786911725997925, 0.28781643509864807, 0.29694172739982605, 0.30606698989868164, 0.31519225239753723, 0.3243175148963928, 0.3334428071975708, 0.3425680696964264, 0.351693332195282]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 29.0, 43.0, 74.0, 133.0, 402.0, 3507.0, 4179562.0, 9682.0, 508.0, 146.0, 75.0, 39.0, 28.0, 15.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3583984375, -0.3497810363769531, -0.34116363525390625, -0.3325462341308594, -0.3239288330078125, -0.3153114318847656, -0.30669403076171875, -0.2980766296386719, -0.289459228515625, -0.2808418273925781, -0.27222442626953125, -0.2636070251464844, -0.2549896240234375, -0.24637222290039062, -0.23775482177734375, -0.22913742065429688, -0.22052001953125, -0.21190261840820312, -0.20328521728515625, -0.19466781616210938, -0.1860504150390625, -0.17743301391601562, -0.16881561279296875, -0.16019821166992188, -0.151580810546875, -0.14296340942382812, -0.13434600830078125, -0.12572860717773438, -0.1171112060546875, -0.10849380493164062, -0.09987640380859375, -0.09125900268554688, -0.0826416015625, -0.07402420043945312, -0.06540679931640625, -0.056789398193359375, -0.0481719970703125, -0.039554595947265625, -0.03093719482421875, -0.022319793701171875, -0.013702392578125, -0.005084991455078125, 0.00353240966796875, 0.012149810791015625, 0.0207672119140625, 0.029384613037109375, 0.03800201416015625, 0.046619415283203125, 0.05523681640625, 0.06385421752929688, 0.07247161865234375, 0.08108901977539062, 0.0897064208984375, 0.09832382202148438, 0.10694122314453125, 0.11555862426757812, 0.124176025390625, 0.13279342651367188, 0.14141082763671875, 0.15002822875976562, 0.1586456298828125, 0.16726303100585938, 0.17588043212890625, 0.18449783325195312, 0.193115234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 4.0, 5.0, 14.0, 12.0, 17.0, 20.0, 38.0, 40.0, 54.0, 74.0, 65.0, 78.0, 65.0, 90.0, 75.0, 66.0, 47.0, 66.0, 39.0, 32.0, 28.0, 15.0, 12.0, 9.0, 2.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.031982421875, -0.031069040298461914, -0.030155658721923828, -0.029242277145385742, -0.028328895568847656, -0.02741551399230957, -0.026502132415771484, -0.0255887508392334, -0.024675369262695312, -0.023761987686157227, -0.02284860610961914, -0.021935224533081055, -0.02102184295654297, -0.020108461380004883, -0.019195079803466797, -0.01828169822692871, -0.017368316650390625, -0.01645493507385254, -0.015541553497314453, -0.014628171920776367, -0.013714790344238281, -0.012801408767700195, -0.01188802719116211, -0.010974645614624023, -0.010061264038085938, -0.009147882461547852, -0.008234500885009766, -0.00732111930847168, -0.006407737731933594, -0.005494356155395508, -0.004580974578857422, -0.003667593002319336, -0.00275421142578125, -0.001840829849243164, -0.0009274482727050781, -1.4066696166992188e-05, 0.0008993148803710938, 0.0018126964569091797, 0.0027260780334472656, 0.0036394596099853516, 0.0045528411865234375, 0.0054662227630615234, 0.006379604339599609, 0.007292985916137695, 0.008206367492675781, 0.009119749069213867, 0.010033130645751953, 0.010946512222290039, 0.011859893798828125, 0.012773275375366211, 0.013686656951904297, 0.014600038528442383, 0.015513420104980469, 0.016426801681518555, 0.01734018325805664, 0.018253564834594727, 0.019166946411132812, 0.0200803279876709, 0.020993709564208984, 0.02190709114074707, 0.022820472717285156, 0.023733854293823242, 0.024647235870361328, 0.025560617446899414, 0.0264739990234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 10.0, 15.0, 12.0, 26.0, 37.0, 42.0, 56.0, 88.0, 151.0, 285.0, 642.0, 2473.0, 65412.0, 4096359.0, 25123.0, 2157.0, 692.0, 280.0, 129.0, 85.0, 56.0, 26.0, 32.0, 23.0, 20.0, 12.0, 9.0, 8.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1614990234375, -0.1570596694946289, -0.1526203155517578, -0.14818096160888672, -0.14374160766601562, -0.13930225372314453, -0.13486289978027344, -0.13042354583740234, -0.12598419189453125, -0.12154483795166016, -0.11710548400878906, -0.11266613006591797, -0.10822677612304688, -0.10378742218017578, -0.09934806823730469, -0.0949087142944336, -0.0904693603515625, -0.0860300064086914, -0.08159065246582031, -0.07715129852294922, -0.07271194458007812, -0.06827259063720703, -0.06383323669433594, -0.059393882751464844, -0.05495452880859375, -0.050515174865722656, -0.04607582092285156, -0.04163646697998047, -0.037197113037109375, -0.03275775909423828, -0.028318405151367188, -0.023879051208496094, -0.019439697265625, -0.015000343322753906, -0.010560989379882812, -0.006121635437011719, -0.001682281494140625, 0.0027570724487304688, 0.0071964263916015625, 0.011635780334472656, 0.01607513427734375, 0.020514488220214844, 0.024953842163085938, 0.02939319610595703, 0.033832550048828125, 0.03827190399169922, 0.04271125793457031, 0.047150611877441406, 0.0515899658203125, 0.056029319763183594, 0.06046867370605469, 0.06490802764892578, 0.06934738159179688, 0.07378673553466797, 0.07822608947753906, 0.08266544342041016, 0.08710479736328125, 0.09154415130615234, 0.09598350524902344, 0.10042285919189453, 0.10486221313476562, 0.10930156707763672, 0.11374092102050781, 0.1181802749633789, 0.12261962890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 13.0, 13.0, 14.0, 56.0, 101.0, 279.0, 1250.0, 1686.0, 389.0, 129.0, 49.0, 30.0, 18.0, 15.0, 11.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10205078125, -0.09914016723632812, -0.09622955322265625, -0.09331893920898438, -0.0904083251953125, -0.08749771118164062, -0.08458709716796875, -0.08167648315429688, -0.078765869140625, -0.07585525512695312, -0.07294464111328125, -0.07003402709960938, -0.0671234130859375, -0.06421279907226562, -0.06130218505859375, -0.058391571044921875, -0.05548095703125, -0.052570343017578125, -0.04965972900390625, -0.046749114990234375, -0.0438385009765625, -0.040927886962890625, -0.03801727294921875, -0.035106658935546875, -0.032196044921875, -0.029285430908203125, -0.02637481689453125, -0.023464202880859375, -0.0205535888671875, -0.017642974853515625, -0.01473236083984375, -0.011821746826171875, -0.0089111328125, -0.006000518798828125, -0.00308990478515625, -0.000179290771484375, 0.0027313232421875, 0.005641937255859375, 0.00855255126953125, 0.011463165283203125, 0.014373779296875, 0.017284393310546875, 0.02019500732421875, 0.023105621337890625, 0.0260162353515625, 0.028926849365234375, 0.03183746337890625, 0.034748077392578125, 0.03765869140625, 0.040569305419921875, 0.04347991943359375, 0.046390533447265625, 0.0493011474609375, 0.052211761474609375, 0.05512237548828125, 0.058032989501953125, 0.060943603515625, 0.06385421752929688, 0.06676483154296875, 0.06967544555664062, 0.0725860595703125, 0.07549667358398438, 0.07840728759765625, 0.08131790161132812, 0.084228515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 7.0, 16.0, 11.0, 20.0, 34.0, 65.0, 130.0, 207.0, 186.0, 127.0, 80.0, 42.0, 24.0, 16.0, 11.0, 6.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7711883783340454, -0.7489662170410156, -0.7267439961433411, -0.7045218348503113, -0.6822996139526367, -0.6600774526596069, -0.6378552913665771, -0.6156330704689026, -0.5934109091758728, -0.571188747882843, -0.5489665269851685, -0.5267443656921387, -0.5045221447944641, -0.4822999835014343, -0.46007779240608215, -0.43785560131073, -0.4156334102153778, -0.39341121912002563, -0.37118902802467346, -0.3489668369293213, -0.3267446756362915, -0.30452248454093933, -0.28230029344558716, -0.2600781321525574, -0.237855926156044, -0.21563373506069183, -0.19341155886650085, -0.17118936777114868, -0.1489671766757965, -0.12674500048160553, -0.10452280938625336, -0.08230063319206238, -0.060078442096710205, -0.03785625845193863, -0.015634071081876755, 0.00658811628818512, 0.028810299932956696, 0.05103248357772827, 0.07325467467308044, 0.09547685086727142, 0.1176990419626236, 0.13992123305797577, 0.16214340925216675, 0.18436560034751892, 0.2065877914428711, 0.22880996763706207, 0.25103217363357544, 0.2732543349266052, 0.2954765260219574, 0.31769871711730957, 0.33992090821266174, 0.3621430993080139, 0.3843652606010437, 0.4065874516963959, 0.42880964279174805, 0.45103180408477783, 0.4732540249824524, 0.49547621607780457, 0.5176984071731567, 0.5399205684661865, 0.5621427893638611, 0.5843649506568909, 0.6065871715545654, 0.6288093328475952, 0.651031494140625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 12.0, 9.0, 16.0, 23.0, 25.0, 32.0, 32.0, 47.0, 47.0, 46.0, 62.0, 56.0, 58.0, 54.0, 69.0, 58.0, 55.0, 34.0, 47.0, 34.0, 37.0, 25.0, 21.0, 26.0, 17.0, 9.0, 10.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27511441707611084, -0.2661312222480774, -0.25714802742004395, -0.2481648474931717, -0.23918165266513824, -0.230198472738266, -0.22121527791023254, -0.2122320830821991, -0.20324888825416565, -0.1942656934261322, -0.18528251349925995, -0.1762993186712265, -0.16731612384319305, -0.1583329439163208, -0.14934974908828735, -0.1403665542602539, -0.13138337433338165, -0.1224001869559288, -0.11341699212789536, -0.1044338047504425, -0.09545060992240906, -0.08646742254495621, -0.07748423516750336, -0.06850104033946991, -0.05951785296201706, -0.05053466185927391, -0.04155147075653076, -0.03256828337907791, -0.023585092276334763, -0.014601901173591614, -0.005618713796138763, 0.003364481031894684, 0.012347668409347534, 0.021330859512090683, 0.030314048752188683, 0.03929723799228668, 0.04828042909502983, 0.05726362019777298, 0.06624680757522583, 0.07523000240325928, 0.08421318978071213, 0.09319637715816498, 0.10217957198619843, 0.11116275936365128, 0.12014594674110413, 0.12912914156913757, 0.13811233639717102, 0.14709553122520447, 0.15607871115207672, 0.16506190598011017, 0.17404508590698242, 0.18302828073501587, 0.19201147556304932, 0.20099467039108276, 0.20997785031795502, 0.21896104514598846, 0.22794422507286072, 0.23692741990089417, 0.24591059982776642, 0.25489377975463867, 0.2638769745826721, 0.27286016941070557, 0.281843364238739, 0.29082655906677246, 0.2998097538948059]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 9.0, 8.0, 9.0, 14.0, 14.0, 33.0, 45.0, 75.0, 58.0, 111.0, 159.0, 224.0, 332.0, 516.0, 761.0, 1133.0, 1652.0, 2744.0, 4832.0, 8297.0, 15607.0, 30478.0, 62088.0, 129783.0, 236142.0, 253787.0, 149986.0, 72853.0, 35053.0, 17860.0, 9608.0, 5347.0, 3318.0, 1912.0, 1214.0, 794.0, 541.0, 363.0, 233.0, 178.0, 103.0, 95.0, 53.0, 31.0, 24.0, 20.0, 17.0, 21.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.0247039794921875, -0.023909807205200195, -0.02311563491821289, -0.022321462631225586, -0.02152729034423828, -0.020733118057250977, -0.019938945770263672, -0.019144773483276367, -0.018350601196289062, -0.017556428909301758, -0.016762256622314453, -0.01596808433532715, -0.015173912048339844, -0.014379739761352539, -0.013585567474365234, -0.01279139518737793, -0.011997222900390625, -0.01120305061340332, -0.010408878326416016, -0.009614706039428711, -0.008820533752441406, -0.008026361465454102, -0.007232189178466797, -0.006438016891479492, -0.0056438446044921875, -0.004849672317504883, -0.004055500030517578, -0.0032613277435302734, -0.0024671554565429688, -0.001672983169555664, -0.0008788108825683594, -8.463859558105469e-05, 0.00070953369140625, 0.0015037059783935547, 0.0022978782653808594, 0.003092050552368164, 0.0038862228393554688, 0.0046803951263427734, 0.005474567413330078, 0.006268739700317383, 0.0070629119873046875, 0.007857084274291992, 0.008651256561279297, 0.009445428848266602, 0.010239601135253906, 0.011033773422241211, 0.011827945709228516, 0.01262211799621582, 0.013416290283203125, 0.01421046257019043, 0.015004634857177734, 0.01579880714416504, 0.016592979431152344, 0.01738715171813965, 0.018181324005126953, 0.018975496292114258, 0.019769668579101562, 0.020563840866088867, 0.021358013153076172, 0.022152185440063477, 0.02294635772705078, 0.023740530014038086, 0.02453470230102539, 0.025328874588012695, 0.026123046875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 10.0, 12.0, 17.0, 25.0, 41.0, 36.0, 58.0, 79.0, 59.0, 94.0, 79.0, 86.0, 77.0, 68.0, 62.0, 55.0, 31.0, 29.0, 17.0, 12.0, 14.0, 10.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028656005859375, -0.02762603759765625, -0.0265960693359375, -0.02556610107421875, -0.0245361328125, -0.02350616455078125, -0.0224761962890625, -0.02144622802734375, -0.020416259765625, -0.01938629150390625, -0.0183563232421875, -0.01732635498046875, -0.01629638671875, -0.01526641845703125, -0.0142364501953125, -0.01320648193359375, -0.012176513671875, -0.01114654541015625, -0.0101165771484375, -0.00908660888671875, -0.008056640625, -0.00702667236328125, -0.0059967041015625, -0.00496673583984375, -0.003936767578125, -0.00290679931640625, -0.0018768310546875, -0.00084686279296875, 0.00018310546875, 0.00121307373046875, 0.0022430419921875, 0.00327301025390625, 0.004302978515625, 0.00533294677734375, 0.0063629150390625, 0.00739288330078125, 0.0084228515625, 0.00945281982421875, 0.0104827880859375, 0.01151275634765625, 0.012542724609375, 0.01357269287109375, 0.0146026611328125, 0.01563262939453125, 0.01666259765625, 0.01769256591796875, 0.0187225341796875, 0.01975250244140625, 0.020782470703125, 0.02181243896484375, 0.0228424072265625, 0.02387237548828125, 0.02490234375, 0.02593231201171875, 0.0269622802734375, 0.02799224853515625, 0.029022216796875, 0.03005218505859375, 0.0310821533203125, 0.03211212158203125, 0.03314208984375, 0.03417205810546875, 0.0352020263671875, 0.03623199462890625, 0.037261962890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 11.0, 11.0, 21.0, 39.0, 52.0, 88.0, 118.0, 221.0, 386.0, 740.0, 1491.0, 3743.0, 12278.0, 89615.0, 832490.0, 88275.0, 12161.0, 3672.0, 1460.0, 741.0, 361.0, 218.0, 143.0, 74.0, 52.0, 23.0, 18.0, 12.0, 9.0, 8.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10723876953125, -0.10403728485107422, -0.10083580017089844, -0.09763431549072266, -0.09443283081054688, -0.0912313461303711, -0.08802986145019531, -0.08482837677001953, -0.08162689208984375, -0.07842540740966797, -0.07522392272949219, -0.0720224380493164, -0.06882095336914062, -0.06561946868896484, -0.06241798400878906, -0.05921649932861328, -0.0560150146484375, -0.05281352996826172, -0.04961204528808594, -0.046410560607910156, -0.043209075927734375, -0.040007591247558594, -0.03680610656738281, -0.03360462188720703, -0.03040313720703125, -0.02720165252685547, -0.024000167846679688, -0.020798683166503906, -0.017597198486328125, -0.014395713806152344, -0.011194229125976562, -0.007992744445800781, -0.004791259765625, -0.0015897750854492188, 0.0016117095947265625, 0.004813194274902344, 0.008014678955078125, 0.011216163635253906, 0.014417648315429688, 0.01761913299560547, 0.02082061767578125, 0.02402210235595703, 0.027223587036132812, 0.030425071716308594, 0.033626556396484375, 0.036828041076660156, 0.04002952575683594, 0.04323101043701172, 0.0464324951171875, 0.04963397979736328, 0.05283546447753906, 0.056036949157714844, 0.059238433837890625, 0.062439918518066406, 0.06564140319824219, 0.06884288787841797, 0.07204437255859375, 0.07524585723876953, 0.07844734191894531, 0.0816488265991211, 0.08485031127929688, 0.08805179595947266, 0.09125328063964844, 0.09445476531982422, 0.09765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 8.0, 7.0, 7.0, 7.0, 13.0, 21.0, 14.0, 8.0, 34.0, 28.0, 39.0, 43.0, 50.0, 42.0, 51.0, 58.0, 56.0, 56.0, 50.0, 41.0, 61.0, 48.0, 44.0, 41.0, 22.0, 37.0, 17.0, 19.0, 19.0, 14.0, 11.0, 12.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0926513671875, -0.08984947204589844, -0.08704757690429688, -0.08424568176269531, -0.08144378662109375, -0.07864189147949219, -0.07583999633789062, -0.07303810119628906, -0.0702362060546875, -0.06743431091308594, -0.06463241577148438, -0.06183052062988281, -0.05902862548828125, -0.05622673034667969, -0.053424835205078125, -0.05062294006347656, -0.047821044921875, -0.04501914978027344, -0.042217254638671875, -0.03941535949707031, -0.03661346435546875, -0.03381156921386719, -0.031009674072265625, -0.028207778930664062, -0.0254058837890625, -0.022603988647460938, -0.019802093505859375, -0.017000198364257812, -0.01419830322265625, -0.011396408081054688, -0.008594512939453125, -0.0057926177978515625, -0.00299072265625, -0.0001888275146484375, 0.002613067626953125, 0.0054149627685546875, 0.00821685791015625, 0.011018753051757812, 0.013820648193359375, 0.016622543334960938, 0.0194244384765625, 0.022226333618164062, 0.025028228759765625, 0.027830123901367188, 0.03063201904296875, 0.03343391418457031, 0.036235809326171875, 0.03903770446777344, 0.041839599609375, 0.04464149475097656, 0.047443389892578125, 0.05024528503417969, 0.05304718017578125, 0.05584907531738281, 0.058650970458984375, 0.06145286560058594, 0.0642547607421875, 0.06705665588378906, 0.06985855102539062, 0.07266044616699219, 0.07546234130859375, 0.07826423645019531, 0.08106613159179688, 0.08386802673339844, 0.086669921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 8.0, 18.0, 25.0, 22.0, 33.0, 57.0, 82.0, 111.0, 210.0, 336.0, 527.0, 928.0, 1618.0, 3096.0, 6817.0, 18756.0, 275058.0, 705141.0, 20876.0, 7365.0, 3330.0, 1694.0, 952.0, 517.0, 314.0, 223.0, 131.0, 84.0, 61.0, 46.0, 32.0, 19.0, 16.0, 7.0, 8.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1456298828125, -0.1410846710205078, -0.13653945922851562, -0.13199424743652344, -0.12744903564453125, -0.12290382385253906, -0.11835861206054688, -0.11381340026855469, -0.1092681884765625, -0.10472297668457031, -0.10017776489257812, -0.09563255310058594, -0.09108734130859375, -0.08654212951660156, -0.08199691772460938, -0.07745170593261719, -0.072906494140625, -0.06836128234863281, -0.06381607055664062, -0.05927085876464844, -0.05472564697265625, -0.05018043518066406, -0.045635223388671875, -0.04109001159667969, -0.0365447998046875, -0.03199958801269531, -0.027454376220703125, -0.022909164428710938, -0.01836395263671875, -0.013818740844726562, -0.009273529052734375, -0.0047283172607421875, -0.00018310546875, 0.0043621063232421875, 0.008907318115234375, 0.013452529907226562, 0.01799774169921875, 0.022542953491210938, 0.027088165283203125, 0.03163337707519531, 0.0361785888671875, 0.04072380065917969, 0.045269012451171875, 0.04981422424316406, 0.05435943603515625, 0.05890464782714844, 0.06344985961914062, 0.06799507141113281, 0.072540283203125, 0.07708549499511719, 0.08163070678710938, 0.08617591857910156, 0.09072113037109375, 0.09526634216308594, 0.09981155395507812, 0.10435676574707031, 0.1089019775390625, 0.11344718933105469, 0.11799240112304688, 0.12253761291503906, 0.12708282470703125, 0.13162803649902344, 0.13617324829101562, 0.1407184600830078, 0.145263671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 18.0, 20.0, 55.0, 413.0, 355.0, 46.0, 14.0, 26.0, 14.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51207160949707e-05, -4.261266440153122e-05, -4.0104612708091736e-05, -3.759656101465225e-05, -3.508850932121277e-05, -3.2580457627773285e-05, -3.00724059343338e-05, -2.7564354240894318e-05, -2.5056302547454834e-05, -2.254825085401535e-05, -2.0040199160575867e-05, -1.7532147467136383e-05, -1.50240957736969e-05, -1.2516044080257416e-05, -1.0007992386817932e-05, -7.4999406933784485e-06, -4.991888999938965e-06, -2.483837306499481e-06, 2.421438694000244e-08, 2.532266080379486e-06, 5.04031777381897e-06, 7.548369467258453e-06, 1.0056421160697937e-05, 1.256447285413742e-05, 1.5072524547576904e-05, 1.7580576241016388e-05, 2.008862793445587e-05, 2.2596679627895355e-05, 2.510473132133484e-05, 2.7612783014774323e-05, 3.0120834708213806e-05, 3.262888640165329e-05, 3.5136938095092773e-05, 3.764498978853226e-05, 4.015304148197174e-05, 4.2661093175411224e-05, 4.516914486885071e-05, 4.767719656229019e-05, 5.0185248255729675e-05, 5.269329994916916e-05, 5.520135164260864e-05, 5.7709403336048126e-05, 6.021745502948761e-05, 6.27255067229271e-05, 6.523355841636658e-05, 6.774161010980606e-05, 7.024966180324554e-05, 7.275771349668503e-05, 7.526576519012451e-05, 7.7773816883564e-05, 8.028186857700348e-05, 8.278992027044296e-05, 8.529797196388245e-05, 8.780602365732193e-05, 9.031407535076141e-05, 9.28221270442009e-05, 9.533017873764038e-05, 9.783823043107986e-05, 0.00010034628212451935, 0.00010285433381795883, 0.00010536238551139832, 0.0001078704372048378, 0.00011037848889827728, 0.00011288654059171677, 0.00011539459228515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 2.0, 4.0, 9.0, 12.0, 15.0, 31.0, 48.0, 70.0, 88.0, 171.0, 356.0, 725.0, 1549.0, 3687.0, 11149.0, 64236.0, 933371.0, 22412.0, 6180.0, 2310.0, 1024.0, 486.0, 217.0, 161.0, 70.0, 65.0, 39.0, 19.0, 15.0, 12.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.150177001953125, -0.14398193359375, -0.137786865234375, -0.131591796875, -0.125396728515625, -0.11920166015625, -0.113006591796875, -0.1068115234375, -0.100616455078125, -0.09442138671875, -0.088226318359375, -0.08203125, -0.075836181640625, -0.06964111328125, -0.063446044921875, -0.0572509765625, -0.051055908203125, -0.04486083984375, -0.038665771484375, -0.032470703125, -0.026275634765625, -0.02008056640625, -0.013885498046875, -0.0076904296875, -0.001495361328125, 0.00469970703125, 0.010894775390625, 0.01708984375, 0.023284912109375, 0.02947998046875, 0.035675048828125, 0.0418701171875, 0.048065185546875, 0.05426025390625, 0.060455322265625, 0.066650390625, 0.072845458984375, 0.07904052734375, 0.085235595703125, 0.0914306640625, 0.097625732421875, 0.10382080078125, 0.110015869140625, 0.1162109375, 0.122406005859375, 0.12860107421875, 0.134796142578125, 0.1409912109375, 0.147186279296875, 0.15338134765625, 0.159576416015625, 0.165771484375, 0.171966552734375, 0.17816162109375, 0.184356689453125, 0.1905517578125, 0.196746826171875, 0.20294189453125, 0.209136962890625, 0.21533203125, 0.221527099609375, 0.22772216796875, 0.233917236328125, 0.2401123046875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 11.0, 3.0, 12.0, 9.0, 16.0, 37.0, 183.0, 490.0, 133.0, 22.0, 12.0, 14.0, 11.0, 9.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1834716796875, -0.17843246459960938, -0.17339324951171875, -0.16835403442382812, -0.1633148193359375, -0.15827560424804688, -0.15323638916015625, -0.14819717407226562, -0.143157958984375, -0.13811874389648438, -0.13307952880859375, -0.12804031372070312, -0.1230010986328125, -0.11796188354492188, -0.11292266845703125, -0.10788345336914062, -0.10284423828125, -0.09780502319335938, -0.09276580810546875, -0.08772659301757812, -0.0826873779296875, -0.07764816284179688, -0.07260894775390625, -0.06756973266601562, -0.062530517578125, -0.057491302490234375, -0.05245208740234375, -0.047412872314453125, -0.0423736572265625, -0.037334442138671875, -0.03229522705078125, -0.027256011962890625, -0.022216796875, -0.017177581787109375, -0.01213836669921875, -0.007099151611328125, -0.0020599365234375, 0.002979278564453125, 0.00801849365234375, 0.013057708740234375, 0.018096923828125, 0.023136138916015625, 0.02817535400390625, 0.033214569091796875, 0.0382537841796875, 0.043292999267578125, 0.04833221435546875, 0.053371429443359375, 0.05841064453125, 0.06344985961914062, 0.06848907470703125, 0.07352828979492188, 0.0785675048828125, 0.08360671997070312, 0.08864593505859375, 0.09368515014648438, 0.098724365234375, 0.10376358032226562, 0.10880279541015625, 0.11384201049804688, 0.1188812255859375, 0.12392044067382812, 0.12895965576171875, 0.13399887084960938, 0.1390380859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 12.0, 20.0, 66.0, 120.0, 309.0, 288.0, 107.0, 45.0, 20.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.741485118865967, -2.6500909328460693, -2.558696746826172, -2.4673023223876953, -2.375908136367798, -2.2845139503479004, -2.193119525909424, -2.1017253398895264, -2.010331153869629, -1.9189369678497314, -1.8275426626205444, -1.7361483573913574, -1.64475417137146, -1.5533599853515625, -1.4619656801223755, -1.3705713748931885, -1.279177188873291, -1.1877830028533936, -1.0963886976242065, -1.0049943923950195, -0.9136002063751221, -0.8222059607505798, -0.7308117151260376, -0.6394174695014954, -0.5480232238769531, -0.4566289782524109, -0.36523473262786865, -0.2738404870033264, -0.18244624137878418, -0.09105199575424194, 0.00034224987030029297, 0.09173649549484253, 0.18313097953796387, 0.2745252251625061, 0.36591947078704834, 0.4573137164115906, 0.5487079620361328, 0.640102207660675, 0.7314964532852173, 0.8228906989097595, 0.9142849445343018, 1.0056791305541992, 1.0970734357833862, 1.1884677410125732, 1.2798619270324707, 1.3712561130523682, 1.4626504182815552, 1.5540447235107422, 1.6454389095306396, 1.736833095550537, 1.8282274007797241, 1.9196217060089111, 2.0110158920288086, 2.102410078048706, 2.1938042640686035, 2.28519868850708, 2.3765928745269775, 2.467987060546875, 2.5593814849853516, 2.650775671005249, 2.7421698570251465, 2.833564043045044, 2.9249582290649414, 3.016352653503418, 3.1077468395233154]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 7.0, 4.0, 11.0, 8.0, 11.0, 7.0, 11.0, 15.0, 18.0, 22.0, 21.0, 29.0, 33.0, 19.0, 30.0, 30.0, 33.0, 54.0, 69.0, 83.0, 63.0, 62.0, 40.0, 52.0, 28.0, 29.0, 28.0, 34.0, 22.0, 21.0, 18.0, 16.0, 17.0, 18.0, 16.0, 2.0, 10.0, 3.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4319179654121399, -0.4164727032184601, -0.4010274410247803, -0.38558217883110046, -0.37013691663742065, -0.35469162464141846, -0.33924639225006104, -0.32380110025405884, -0.30835583806037903, -0.2929105758666992, -0.2774653136730194, -0.2620200514793396, -0.2465747743844986, -0.2311295121908188, -0.21568424999713898, -0.20023897290229797, -0.18479372560977936, -0.16934846341609955, -0.15390320122241974, -0.13845792412757874, -0.12301266193389893, -0.10756739974021912, -0.0921221375465393, -0.0766768679022789, -0.06123160570859909, -0.04578633978962898, -0.030341075733304024, -0.014895811676979065, 0.0005494542419910431, 0.01599472016096115, 0.03143998235464096, 0.04688525199890137, 0.06233051419258118, 0.07777577638626099, 0.09322104603052139, 0.1086663082242012, 0.12411157786846161, 0.13955684006214142, 0.15500210225582123, 0.17044737935066223, 0.18589264154434204, 0.20133790373802185, 0.21678316593170166, 0.23222842812538147, 0.24767370522022247, 0.2631189823150635, 0.2785642147064209, 0.2940095067024231, 0.3094547390937805, 0.3249000012874603, 0.34034526348114014, 0.35579052567481995, 0.37123578786849976, 0.38668107986450195, 0.4021263122558594, 0.4175716042518616, 0.4330168664455414, 0.4484621286392212, 0.463907390832901, 0.4793526530265808, 0.4947979152202606, 0.5102431774139404, 0.5256884694099426, 0.5411337018013, 0.5565789937973022]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 6.0, 12.0, 12.0, 15.0, 22.0, 28.0, 23.0, 46.0, 51.0, 55.0, 107.0, 241.0, 420.0, 943.0, 2556.0, 10408.0, 87696.0, 3796659.0, 271579.0, 17471.0, 3661.0, 1125.0, 437.0, 244.0, 138.0, 87.0, 62.0, 42.0, 22.0, 31.0, 21.0, 10.0, 11.0, 14.0, 3.0, 7.0, 2.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11708831787109375, -0.1133880615234375, -0.10968780517578125, -0.105987548828125, -0.10228729248046875, -0.0985870361328125, -0.09488677978515625, -0.0911865234375, -0.08748626708984375, -0.0837860107421875, -0.08008575439453125, -0.076385498046875, -0.07268524169921875, -0.0689849853515625, -0.06528472900390625, -0.06158447265625, -0.05788421630859375, -0.0541839599609375, -0.05048370361328125, -0.046783447265625, -0.04308319091796875, -0.0393829345703125, -0.03568267822265625, -0.031982421875, -0.02828216552734375, -0.0245819091796875, -0.02088165283203125, -0.017181396484375, -0.01348114013671875, -0.0097808837890625, -0.00608062744140625, -0.00238037109375, 0.00131988525390625, 0.0050201416015625, 0.00872039794921875, 0.012420654296875, 0.01612091064453125, 0.0198211669921875, 0.02352142333984375, 0.0272216796875, 0.03092193603515625, 0.0346221923828125, 0.03832244873046875, 0.042022705078125, 0.04572296142578125, 0.0494232177734375, 0.05312347412109375, 0.05682373046875, 0.06052398681640625, 0.0642242431640625, 0.06792449951171875, 0.071624755859375, 0.07532501220703125, 0.0790252685546875, 0.08272552490234375, 0.08642578125, 0.09012603759765625, 0.0938262939453125, 0.09752655029296875, 0.101226806640625, 0.10492706298828125, 0.1086273193359375, 0.11232757568359375, 0.11602783203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 13.0, 11.0, 22.0, 22.0, 28.0, 34.0, 44.0, 50.0, 70.0, 66.0, 63.0, 70.0, 80.0, 68.0, 55.0, 55.0, 45.0, 49.0, 27.0, 20.0, 23.0, 28.0, 17.0, 7.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035675048828125, -0.03464818000793457, -0.03362131118774414, -0.03259444236755371, -0.03156757354736328, -0.03054070472717285, -0.029513835906982422, -0.028486967086791992, -0.027460098266601562, -0.026433229446411133, -0.025406360626220703, -0.024379491806030273, -0.023352622985839844, -0.022325754165649414, -0.021298885345458984, -0.020272016525268555, -0.019245147705078125, -0.018218278884887695, -0.017191410064697266, -0.016164541244506836, -0.015137672424316406, -0.014110803604125977, -0.013083934783935547, -0.012057065963745117, -0.011030197143554688, -0.010003328323364258, -0.008976459503173828, -0.007949590682983398, -0.006922721862792969, -0.005895853042602539, -0.004868984222412109, -0.0038421154022216797, -0.00281524658203125, -0.0017883777618408203, -0.0007615089416503906, 0.00026535987854003906, 0.0012922286987304688, 0.0023190975189208984, 0.003345966339111328, 0.004372835159301758, 0.0053997039794921875, 0.006426572799682617, 0.007453441619873047, 0.008480310440063477, 0.009507179260253906, 0.010534048080444336, 0.011560916900634766, 0.012587785720825195, 0.013614654541015625, 0.014641523361206055, 0.015668392181396484, 0.016695261001586914, 0.017722129821777344, 0.018748998641967773, 0.019775867462158203, 0.020802736282348633, 0.021829605102539062, 0.022856473922729492, 0.023883342742919922, 0.02491021156311035, 0.02593708038330078, 0.02696394920349121, 0.02799081802368164, 0.02901768684387207, 0.0300445556640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 8.0, 20.0, 17.0, 24.0, 26.0, 36.0, 44.0, 72.0, 101.0, 141.0, 198.0, 402.0, 961.0, 3003.0, 15527.0, 397672.0, 3733551.0, 35124.0, 4776.0, 1324.0, 490.0, 218.0, 150.0, 104.0, 79.0, 52.0, 39.0, 30.0, 30.0, 13.0, 12.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2474365234375, -0.24019432067871094, -0.23295211791992188, -0.2257099151611328, -0.21846771240234375, -0.2112255096435547, -0.20398330688476562, -0.19674110412597656, -0.1894989013671875, -0.18225669860839844, -0.17501449584960938, -0.1677722930908203, -0.16053009033203125, -0.1532878875732422, -0.14604568481445312, -0.13880348205566406, -0.131561279296875, -0.12431907653808594, -0.11707687377929688, -0.10983467102050781, -0.10259246826171875, -0.09535026550292969, -0.08810806274414062, -0.08086585998535156, -0.0736236572265625, -0.06638145446777344, -0.059139251708984375, -0.05189704895019531, -0.04465484619140625, -0.03741264343261719, -0.030170440673828125, -0.022928237915039062, -0.01568603515625, -0.008443832397460938, -0.001201629638671875, 0.0060405731201171875, 0.01328277587890625, 0.020524978637695312, 0.027767181396484375, 0.03500938415527344, 0.0422515869140625, 0.04949378967285156, 0.056735992431640625, 0.06397819519042969, 0.07122039794921875, 0.07846260070800781, 0.08570480346679688, 0.09294700622558594, 0.100189208984375, 0.10743141174316406, 0.11467361450195312, 0.12191581726074219, 0.12915802001953125, 0.1364002227783203, 0.14364242553710938, 0.15088462829589844, 0.1581268310546875, 0.16536903381347656, 0.17261123657226562, 0.1798534393310547, 0.18709564208984375, 0.1943378448486328, 0.20158004760742188, 0.20882225036621094, 0.216064453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 6.0, 11.0, 17.0, 41.0, 32.0, 62.0, 119.0, 327.0, 1169.0, 1403.0, 478.0, 164.0, 72.0, 63.0, 31.0, 19.0, 15.0, 9.0, 11.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.126953125, -0.12208747863769531, -0.11722183227539062, -0.11235618591308594, -0.10749053955078125, -0.10262489318847656, -0.09775924682617188, -0.09289360046386719, -0.0880279541015625, -0.08316230773925781, -0.07829666137695312, -0.07343101501464844, -0.06856536865234375, -0.06369972229003906, -0.058834075927734375, -0.05396842956542969, -0.049102783203125, -0.04423713684082031, -0.039371490478515625, -0.03450584411621094, -0.02964019775390625, -0.024774551391601562, -0.019908905029296875, -0.015043258666992188, -0.0101776123046875, -0.0053119659423828125, -0.000446319580078125, 0.0044193267822265625, 0.00928497314453125, 0.014150619506835938, 0.019016265869140625, 0.023881912231445312, 0.02874755859375, 0.03361320495605469, 0.038478851318359375, 0.04334449768066406, 0.04821014404296875, 0.05307579040527344, 0.057941436767578125, 0.06280708312988281, 0.0676727294921875, 0.07253837585449219, 0.07740402221679688, 0.08226966857910156, 0.08713531494140625, 0.09200096130371094, 0.09686660766601562, 0.10173225402832031, 0.106597900390625, 0.11146354675292969, 0.11632919311523438, 0.12119483947753906, 0.12606048583984375, 0.13092613220214844, 0.13579177856445312, 0.1406574249267578, 0.1455230712890625, 0.1503887176513672, 0.15525436401367188, 0.16012001037597656, 0.16498565673828125, 0.16985130310058594, 0.17471694946289062, 0.1795825958251953, 0.1844482421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 10.0, 10.0, 17.0, 33.0, 47.0, 96.0, 141.0, 193.0, 177.0, 106.0, 65.0, 43.0, 21.0, 6.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3531936407089233, -1.3090887069702148, -1.2649837732315063, -1.2208788394927979, -1.1767737865447998, -1.1326688528060913, -1.0885639190673828, -1.0444589853286743, -1.0003540515899658, -0.9562491178512573, -0.912144124507904, -0.8680391907691956, -0.8239341974258423, -0.7798292636871338, -0.7357243299484253, -0.6916193962097168, -0.6475143432617188, -0.6034094095230103, -0.559304416179657, -0.5151994824409485, -0.4710945188999176, -0.4269895553588867, -0.3828846216201782, -0.33877965807914734, -0.29467469453811646, -0.25056973099708557, -0.20646478235721588, -0.1623598337173462, -0.11825487017631531, -0.07414990663528442, -0.030044972896575928, 0.014059990644454956, 0.05816495418548584, 0.10226991027593613, 0.1463748663663864, 0.1904798150062561, 0.234584778547287, 0.27868974208831787, 0.32279467582702637, 0.36689963936805725, 0.41100460290908813, 0.455109566450119, 0.4992145299911499, 0.5433194637298584, 0.5874243974685669, 0.6315293908119202, 0.6756343245506287, 0.7197393178939819, 0.7638442516326904, 0.8079491853713989, 0.8520541787147522, 0.8961591124534607, 0.940264105796814, 0.9843690395355225, 1.028473973274231, 1.0725789070129395, 1.1166839599609375, 1.160788893699646, 1.2048938274383545, 1.2489988803863525, 1.293103814125061, 1.3372087478637695, 1.381313681602478, 1.4254186153411865, 1.469523549079895]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 1.0, 5.0, 11.0, 10.0, 10.0, 14.0, 20.0, 31.0, 19.0, 23.0, 43.0, 28.0, 40.0, 35.0, 40.0, 32.0, 54.0, 50.0, 39.0, 44.0, 45.0, 46.0, 38.0, 40.0, 47.0, 40.0, 25.0, 14.0, 28.0, 17.0, 15.0, 16.0, 9.0, 8.0, 10.0, 7.0, 13.0, 5.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40947502851486206, -0.39656752347946167, -0.3836599886417389, -0.3707524836063385, -0.3578449487686157, -0.34493744373321533, -0.33202993869781494, -0.31912240386009216, -0.3062148690223694, -0.293307363986969, -0.2803998291492462, -0.2674923241138458, -0.25458478927612305, -0.24167728424072266, -0.22876976430416107, -0.2158622443675995, -0.2029547393321991, -0.1900472193956375, -0.17713969945907593, -0.16423219442367554, -0.15132465958595276, -0.13841715455055237, -0.12550963461399078, -0.1126021146774292, -0.09969459474086761, -0.08678707480430603, -0.07387955486774445, -0.06097204238176346, -0.048064522445201874, -0.03515700250864029, -0.022249490022659302, -0.009341970086097717, 0.003565549850463867, 0.016473067924380302, 0.029380585998296738, 0.042288102209568024, 0.05519562214612961, 0.06810314208269119, 0.08101065456867218, 0.09391817450523376, 0.10682569444179535, 0.11973321437835693, 0.13264073431491852, 0.1455482542514801, 0.1584557592868805, 0.17136329412460327, 0.18427079916000366, 0.19717831909656525, 0.21008583903312683, 0.22299335896968842, 0.23590087890625, 0.2488083839416504, 0.26171591877937317, 0.27462342381477356, 0.28753095865249634, 0.30043846368789673, 0.3133459687232971, 0.3262534737586975, 0.3391610085964203, 0.3520685136318207, 0.36497604846954346, 0.37788355350494385, 0.39079105854034424, 0.403698593378067, 0.4166061282157898]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 6.0, 15.0, 12.0, 22.0, 41.0, 64.0, 93.0, 156.0, 242.0, 440.0, 735.0, 1311.0, 2539.0, 5030.0, 10699.0, 24574.0, 64337.0, 216457.0, 456857.0, 171447.0, 53848.0, 20742.0, 9213.0, 4452.0, 2335.0, 1207.0, 621.0, 401.0, 236.0, 148.0, 84.0, 56.0, 43.0, 25.0, 17.0, 11.0, 10.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07733154296875, -0.07470226287841797, -0.07207298278808594, -0.0694437026977539, -0.06681442260742188, -0.06418514251708984, -0.06155586242675781, -0.05892658233642578, -0.05629730224609375, -0.05366802215576172, -0.05103874206542969, -0.048409461975097656, -0.045780181884765625, -0.043150901794433594, -0.04052162170410156, -0.03789234161376953, -0.0352630615234375, -0.03263378143310547, -0.030004501342773438, -0.027375221252441406, -0.024745941162109375, -0.022116661071777344, -0.019487380981445312, -0.01685810089111328, -0.01422882080078125, -0.011599540710449219, -0.008970260620117188, -0.006340980529785156, -0.003711700439453125, -0.0010824203491210938, 0.0015468597412109375, 0.004176139831542969, 0.006805419921875, 0.009434700012207031, 0.012063980102539062, 0.014693260192871094, 0.017322540283203125, 0.019951820373535156, 0.022581100463867188, 0.02521038055419922, 0.02783966064453125, 0.03046894073486328, 0.03309822082519531, 0.035727500915527344, 0.038356781005859375, 0.040986061096191406, 0.04361534118652344, 0.04624462127685547, 0.0488739013671875, 0.05150318145751953, 0.05413246154785156, 0.056761741638183594, 0.059391021728515625, 0.062020301818847656, 0.06464958190917969, 0.06727886199951172, 0.06990814208984375, 0.07253742218017578, 0.07516670227050781, 0.07779598236083984, 0.08042526245117188, 0.0830545425415039, 0.08568382263183594, 0.08831310272216797, 0.0909423828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 13.0, 12.0, 16.0, 19.0, 29.0, 29.0, 38.0, 37.0, 39.0, 59.0, 60.0, 56.0, 71.0, 59.0, 61.0, 58.0, 58.0, 43.0, 51.0, 43.0, 29.0, 28.0, 22.0, 17.0, 19.0, 10.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035308837890625, -0.034107208251953125, -0.03290557861328125, -0.031703948974609375, -0.0305023193359375, -0.029300689697265625, -0.02809906005859375, -0.026897430419921875, -0.02569580078125, -0.024494171142578125, -0.02329254150390625, -0.022090911865234375, -0.0208892822265625, -0.019687652587890625, -0.01848602294921875, -0.017284393310546875, -0.016082763671875, -0.014881134033203125, -0.01367950439453125, -0.012477874755859375, -0.0112762451171875, -0.010074615478515625, -0.00887298583984375, -0.007671356201171875, -0.0064697265625, -0.005268096923828125, -0.00406646728515625, -0.002864837646484375, -0.0016632080078125, -0.000461578369140625, 0.00074005126953125, 0.001941680908203125, 0.003143310546875, 0.004344940185546875, 0.00554656982421875, 0.006748199462890625, 0.0079498291015625, 0.009151458740234375, 0.01035308837890625, 0.011554718017578125, 0.01275634765625, 0.013957977294921875, 0.01515960693359375, 0.016361236572265625, 0.0175628662109375, 0.018764495849609375, 0.01996612548828125, 0.021167755126953125, 0.022369384765625, 0.023571014404296875, 0.02477264404296875, 0.025974273681640625, 0.0271759033203125, 0.028377532958984375, 0.02957916259765625, 0.030780792236328125, 0.031982421875, 0.033184051513671875, 0.03438568115234375, 0.035587310791015625, 0.0367889404296875, 0.037990570068359375, 0.03919219970703125, 0.040393829345703125, 0.041595458984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 9.0, 7.0, 9.0, 10.0, 28.0, 25.0, 39.0, 47.0, 90.0, 93.0, 151.0, 252.0, 325.0, 609.0, 997.0, 1790.0, 3131.0, 6773.0, 17727.0, 64346.0, 580753.0, 297216.0, 47426.0, 14373.0, 5769.0, 2750.0, 1442.0, 813.0, 554.0, 316.0, 236.0, 147.0, 92.0, 67.0, 52.0, 29.0, 18.0, 18.0, 6.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1494140625, -0.1450061798095703, -0.14059829711914062, -0.13619041442871094, -0.13178253173828125, -0.12737464904785156, -0.12296676635742188, -0.11855888366699219, -0.1141510009765625, -0.10974311828613281, -0.10533523559570312, -0.10092735290527344, -0.09651947021484375, -0.09211158752441406, -0.08770370483398438, -0.08329582214355469, -0.078887939453125, -0.07448005676269531, -0.07007217407226562, -0.06566429138183594, -0.06125640869140625, -0.05684852600097656, -0.052440643310546875, -0.04803276062011719, -0.0436248779296875, -0.03921699523925781, -0.034809112548828125, -0.030401229858398438, -0.02599334716796875, -0.021585464477539062, -0.017177581787109375, -0.012769699096679688, -0.00836181640625, -0.0039539337158203125, 0.000453948974609375, 0.0048618316650390625, 0.00926971435546875, 0.013677597045898438, 0.018085479736328125, 0.022493362426757812, 0.0269012451171875, 0.03130912780761719, 0.035717010498046875, 0.04012489318847656, 0.04453277587890625, 0.04894065856933594, 0.053348541259765625, 0.05775642395019531, 0.062164306640625, 0.06657218933105469, 0.07098007202148438, 0.07538795471191406, 0.07979583740234375, 0.08420372009277344, 0.08861160278320312, 0.09301948547363281, 0.0974273681640625, 0.10183525085449219, 0.10624313354492188, 0.11065101623535156, 0.11505889892578125, 0.11946678161621094, 0.12387466430664062, 0.1282825469970703, 0.1326904296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 9.0, 8.0, 8.0, 11.0, 14.0, 19.0, 19.0, 10.0, 30.0, 39.0, 43.0, 39.0, 56.0, 55.0, 64.0, 55.0, 63.0, 58.0, 51.0, 45.0, 51.0, 36.0, 30.0, 26.0, 27.0, 35.0, 20.0, 11.0, 15.0, 13.0, 11.0, 11.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.14784812927246094, -0.14335250854492188, -0.1388568878173828, -0.13436126708984375, -0.1298656463623047, -0.12537002563476562, -0.12087440490722656, -0.1163787841796875, -0.11188316345214844, -0.10738754272460938, -0.10289192199707031, -0.09839630126953125, -0.09390068054199219, -0.08940505981445312, -0.08490943908691406, -0.080413818359375, -0.07591819763183594, -0.07142257690429688, -0.06692695617675781, -0.06243133544921875, -0.05793571472167969, -0.053440093994140625, -0.04894447326660156, -0.0444488525390625, -0.03995323181152344, -0.035457611083984375, -0.030961990356445312, -0.02646636962890625, -0.021970748901367188, -0.017475128173828125, -0.012979507446289062, -0.00848388671875, -0.0039882659912109375, 0.000507354736328125, 0.0050029754638671875, 0.00949859619140625, 0.013994216918945312, 0.018489837646484375, 0.022985458374023438, 0.0274810791015625, 0.03197669982910156, 0.036472320556640625, 0.04096794128417969, 0.04546356201171875, 0.04995918273925781, 0.054454803466796875, 0.05895042419433594, 0.063446044921875, 0.06794166564941406, 0.07243728637695312, 0.07693290710449219, 0.08142852783203125, 0.08592414855957031, 0.09041976928710938, 0.09491539001464844, 0.0994110107421875, 0.10390663146972656, 0.10840225219726562, 0.11289787292480469, 0.11739349365234375, 0.12188911437988281, 0.12638473510742188, 0.13088035583496094, 0.1353759765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 7.0, 2.0, 9.0, 12.0, 26.0, 34.0, 59.0, 70.0, 99.0, 180.0, 299.0, 516.0, 832.0, 1541.0, 2862.0, 5765.0, 12168.0, 30459.0, 122719.0, 740718.0, 84335.0, 24686.0, 10378.0, 5010.0, 2494.0, 1363.0, 773.0, 426.0, 233.0, 152.0, 110.0, 63.0, 47.0, 35.0, 21.0, 16.0, 11.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.09683036804199219, -0.09374618530273438, -0.09066200256347656, -0.08757781982421875, -0.08449363708496094, -0.08140945434570312, -0.07832527160644531, -0.0752410888671875, -0.07215690612792969, -0.06907272338867188, -0.06598854064941406, -0.06290435791015625, -0.05982017517089844, -0.056735992431640625, -0.05365180969238281, -0.050567626953125, -0.04748344421386719, -0.044399261474609375, -0.04131507873535156, -0.03823089599609375, -0.03514671325683594, -0.032062530517578125, -0.028978347778320312, -0.0258941650390625, -0.022809982299804688, -0.019725799560546875, -0.016641616821289062, -0.01355743408203125, -0.010473251342773438, -0.007389068603515625, -0.0043048858642578125, -0.001220703125, 0.0018634796142578125, 0.004947662353515625, 0.008031845092773438, 0.01111602783203125, 0.014200210571289062, 0.017284393310546875, 0.020368576049804688, 0.0234527587890625, 0.026536941528320312, 0.029621124267578125, 0.03270530700683594, 0.03578948974609375, 0.03887367248535156, 0.041957855224609375, 0.04504203796386719, 0.048126220703125, 0.05121040344238281, 0.054294586181640625, 0.05737876892089844, 0.06046295166015625, 0.06354713439941406, 0.06663131713867188, 0.06971549987792969, 0.0727996826171875, 0.07588386535644531, 0.07896804809570312, 0.08205223083496094, 0.08513641357421875, 0.08822059631347656, 0.09130477905273438, 0.09438896179199219, 0.09747314453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 8.0, 13.0, 30.0, 36.0, 104.0, 326.0, 240.0, 66.0, 35.0, 29.0, 27.0, 10.0, 8.0, 1.0, 2.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.314847946166992e-05, -8.05361196398735e-05, -7.792375981807709e-05, -7.531139999628067e-05, -7.269904017448425e-05, -7.008668035268784e-05, -6.747432053089142e-05, -6.4861960709095e-05, -6.224960088729858e-05, -5.963724106550217e-05, -5.702488124370575e-05, -5.441252142190933e-05, -5.1800161600112915e-05, -4.91878017783165e-05, -4.657544195652008e-05, -4.396308213472366e-05, -4.1350722312927246e-05, -3.873836249113083e-05, -3.612600266933441e-05, -3.3513642847537994e-05, -3.090128302574158e-05, -2.828892320394516e-05, -2.5676563382148743e-05, -2.3064203560352325e-05, -2.0451843738555908e-05, -1.783948391675949e-05, -1.5227124094963074e-05, -1.2614764273166656e-05, -1.000240445137024e-05, -7.390044629573822e-06, -4.777684807777405e-06, -2.1653249859809875e-06, 4.470348358154297e-07, 3.059394657611847e-06, 5.671754479408264e-06, 8.284114301204681e-06, 1.0896474123001099e-05, 1.3508833944797516e-05, 1.6121193766593933e-05, 1.873355358839035e-05, 2.1345913410186768e-05, 2.3958273231983185e-05, 2.6570633053779602e-05, 2.918299287557602e-05, 3.1795352697372437e-05, 3.4407712519168854e-05, 3.702007234096527e-05, 3.963243216276169e-05, 4.2244791984558105e-05, 4.485715180635452e-05, 4.746951162815094e-05, 5.008187144994736e-05, 5.2694231271743774e-05, 5.530659109354019e-05, 5.791895091533661e-05, 6.0531310737133026e-05, 6.314367055892944e-05, 6.575603038072586e-05, 6.836839020252228e-05, 7.09807500243187e-05, 7.359310984611511e-05, 7.620546966791153e-05, 7.881782948970795e-05, 8.143018931150436e-05, 8.404254913330078e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 9.0, 11.0, 17.0, 20.0, 23.0, 37.0, 60.0, 114.0, 236.0, 409.0, 762.0, 1669.0, 4009.0, 12528.0, 59437.0, 805746.0, 133047.0, 20254.0, 5814.0, 2165.0, 1008.0, 518.0, 257.0, 156.0, 78.0, 57.0, 30.0, 21.0, 16.0, 18.0, 10.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1361083984375, -0.1319427490234375, -0.127777099609375, -0.1236114501953125, -0.11944580078125, -0.1152801513671875, -0.111114501953125, -0.1069488525390625, -0.102783203125, -0.0986175537109375, -0.094451904296875, -0.0902862548828125, -0.08612060546875, -0.0819549560546875, -0.077789306640625, -0.0736236572265625, -0.0694580078125, -0.0652923583984375, -0.061126708984375, -0.0569610595703125, -0.05279541015625, -0.0486297607421875, -0.044464111328125, -0.0402984619140625, -0.0361328125, -0.0319671630859375, -0.027801513671875, -0.0236358642578125, -0.01947021484375, -0.0153045654296875, -0.011138916015625, -0.0069732666015625, -0.0028076171875, 0.0013580322265625, 0.005523681640625, 0.0096893310546875, 0.01385498046875, 0.0180206298828125, 0.022186279296875, 0.0263519287109375, 0.030517578125, 0.0346832275390625, 0.038848876953125, 0.0430145263671875, 0.04718017578125, 0.0513458251953125, 0.055511474609375, 0.0596771240234375, 0.0638427734375, 0.0680084228515625, 0.072174072265625, 0.0763397216796875, 0.08050537109375, 0.0846710205078125, 0.088836669921875, 0.0930023193359375, 0.09716796875, 0.1013336181640625, 0.105499267578125, 0.1096649169921875, 0.11383056640625, 0.1179962158203125, 0.122161865234375, 0.1263275146484375, 0.1304931640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 7.0, 10.0, 17.0, 27.0, 48.0, 47.0, 85.0, 146.0, 211.0, 133.0, 76.0, 49.0, 44.0, 21.0, 13.0, 14.0, 14.0, 3.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1219482421875, -0.11806106567382812, -0.11417388916015625, -0.11028671264648438, -0.1063995361328125, -0.10251235961914062, -0.09862518310546875, -0.09473800659179688, -0.090850830078125, -0.08696365356445312, -0.08307647705078125, -0.07918930053710938, -0.0753021240234375, -0.07141494750976562, -0.06752777099609375, -0.06364059448242188, -0.05975341796875, -0.055866241455078125, -0.05197906494140625, -0.048091888427734375, -0.0442047119140625, -0.040317535400390625, -0.03643035888671875, -0.032543182373046875, -0.028656005859375, -0.024768829345703125, -0.02088165283203125, -0.016994476318359375, -0.0131072998046875, -0.009220123291015625, -0.00533294677734375, -0.001445770263671875, 0.00244140625, 0.006328582763671875, 0.01021575927734375, 0.014102935791015625, 0.0179901123046875, 0.021877288818359375, 0.02576446533203125, 0.029651641845703125, 0.033538818359375, 0.037425994873046875, 0.04131317138671875, 0.045200347900390625, 0.0490875244140625, 0.052974700927734375, 0.05686187744140625, 0.060749053955078125, 0.06463623046875, 0.06852340698242188, 0.07241058349609375, 0.07629776000976562, 0.0801849365234375, 0.08407211303710938, 0.08795928955078125, 0.09184646606445312, 0.095733642578125, 0.09962081909179688, 0.10350799560546875, 0.10739517211914062, 0.1112823486328125, 0.11516952514648438, 0.11905670166015625, 0.12294387817382812, 0.1268310546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 9.0, 20.0, 39.0, 100.0, 205.0, 310.0, 146.0, 66.0, 43.0, 21.0, 16.0, 7.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.3854055404663086, -3.308715581893921, -3.2320258617401123, -3.1553359031677246, -3.078646183013916, -3.0019562244415283, -2.9252662658691406, -2.848576545715332, -2.7718865871429443, -2.6951966285705566, -2.618506908416748, -2.5418169498443604, -2.4651272296905518, -2.388437271118164, -2.3117475509643555, -2.2350575923919678, -2.15836763381958, -2.0816776752471924, -2.004987955093384, -1.928297996520996, -1.851608157157898, -1.7749183177947998, -1.6982284784317017, -1.6215386390686035, -1.544848918914795, -1.4681590795516968, -1.3914692401885986, -1.314779281616211, -1.2380894422531128, -1.1613996028900146, -1.0847097635269165, -1.0080199241638184, -0.9313299655914307, -0.8546401262283325, -0.7779502272605896, -0.7012603878974915, -0.6245704889297485, -0.5478806495666504, -0.47119081020355225, -0.3945009112358093, -0.3178110718727112, -0.24112120270729065, -0.1644313484430313, -0.08774149417877197, -0.01105162501335144, 0.06563824415206909, 0.14232808351516724, 0.21901798248291016, 0.2957078218460083, 0.37239769101142883, 0.44908756017684937, 0.5257773995399475, 0.6024672985076904, 0.6791571378707886, 0.7558469772338867, 0.8325368762016296, 0.9092267155647278, 0.9859165549278259, 1.0626064538955688, 1.139296293258667, 1.2159861326217651, 1.2926759719848633, 1.369365930557251, 1.4460557699203491, 1.5227456092834473]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 11.0, 16.0, 14.0, 14.0, 18.0, 10.0, 22.0, 20.0, 27.0, 25.0, 37.0, 35.0, 25.0, 36.0, 40.0, 59.0, 66.0, 73.0, 62.0, 48.0, 39.0, 33.0, 32.0, 35.0, 26.0, 29.0, 19.0, 19.0, 19.0, 16.0, 10.0, 11.0, 4.0, 8.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5129777789115906, -0.4952527582645416, -0.4775277376174927, -0.4598027169704437, -0.4420776963233948, -0.42435264587402344, -0.4066276252269745, -0.38890260457992554, -0.3711775839328766, -0.35345256328582764, -0.3357275426387787, -0.31800252199172974, -0.3002774715423584, -0.28255248069763184, -0.2648274302482605, -0.24710240960121155, -0.2293773889541626, -0.21165236830711365, -0.1939273476600647, -0.17620231211185455, -0.1584772914648056, -0.14075227081775665, -0.1230272427201271, -0.10530221462249756, -0.08757719397544861, -0.06985217332839966, -0.05212714523077011, -0.03440212085843086, -0.016677096486091614, 0.0010479241609573364, 0.018772952258586884, 0.03649798035621643, 0.054223060607910156, 0.0719480812549591, 0.08967310935258865, 0.1073981374502182, 0.12512315809726715, 0.1428481787443161, 0.16057321429252625, 0.1782982349395752, 0.19602325558662415, 0.2137482762336731, 0.23147329688072205, 0.2491983324289322, 0.26692336797714233, 0.2846483588218689, 0.30237340927124023, 0.3200984299182892, 0.33782345056533813, 0.3555484712123871, 0.37327349185943604, 0.390998512506485, 0.40872353315353394, 0.4264485836029053, 0.4441736042499542, 0.4618986248970032, 0.4796236455440521, 0.4973486661911011, 0.5150737166404724, 0.532798707485199, 0.5505237579345703, 0.5682487487792969, 0.5859737992286682, 0.6036988496780396, 0.6214238405227661]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 8.0, 15.0, 36.0, 34.0, 49.0, 84.0, 122.0, 214.0, 423.0, 960.0, 2402.0, 7410.0, 33421.0, 704351.0, 3325586.0, 98268.0, 14286.0, 3876.0, 1428.0, 583.0, 293.0, 153.0, 87.0, 54.0, 39.0, 15.0, 20.0, 18.0, 11.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.14453125, -0.14075088500976562, -0.13697052001953125, -0.13319015502929688, -0.1294097900390625, -0.12562942504882812, -0.12184906005859375, -0.11806869506835938, -0.114288330078125, -0.11050796508789062, -0.10672760009765625, -0.10294723510742188, -0.0991668701171875, -0.09538650512695312, -0.09160614013671875, -0.08782577514648438, -0.08404541015625, -0.08026504516601562, -0.07648468017578125, -0.07270431518554688, -0.0689239501953125, -0.06514358520507812, -0.06136322021484375, -0.057582855224609375, -0.053802490234375, -0.050022125244140625, -0.04624176025390625, -0.042461395263671875, -0.0386810302734375, -0.034900665283203125, -0.03112030029296875, -0.027339935302734375, -0.0235595703125, -0.019779205322265625, -0.01599884033203125, -0.012218475341796875, -0.0084381103515625, -0.004657745361328125, -0.00087738037109375, 0.002902984619140625, 0.006683349609375, 0.010463714599609375, 0.01424407958984375, 0.018024444580078125, 0.0218048095703125, 0.025585174560546875, 0.02936553955078125, 0.033145904541015625, 0.03692626953125, 0.040706634521484375, 0.04448699951171875, 0.048267364501953125, 0.0520477294921875, 0.055828094482421875, 0.05960845947265625, 0.06338882446289062, 0.067169189453125, 0.07094955444335938, 0.07472991943359375, 0.07851028442382812, 0.0822906494140625, 0.08607101440429688, 0.08985137939453125, 0.09363174438476562, 0.097412109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 11.0, 10.0, 12.0, 19.0, 24.0, 26.0, 27.0, 40.0, 46.0, 58.0, 67.0, 64.0, 81.0, 64.0, 83.0, 75.0, 60.0, 56.0, 37.0, 36.0, 23.0, 20.0, 15.0, 21.0, 4.0, 8.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048492431640625, -0.047141075134277344, -0.04578971862792969, -0.04443836212158203, -0.043087005615234375, -0.04173564910888672, -0.04038429260253906, -0.039032936096191406, -0.03768157958984375, -0.036330223083496094, -0.03497886657714844, -0.03362751007080078, -0.032276153564453125, -0.03092479705810547, -0.029573440551757812, -0.028222084045410156, -0.0268707275390625, -0.025519371032714844, -0.024168014526367188, -0.02281665802001953, -0.021465301513671875, -0.02011394500732422, -0.018762588500976562, -0.017411231994628906, -0.01605987548828125, -0.014708518981933594, -0.013357162475585938, -0.012005805969238281, -0.010654449462890625, -0.009303092956542969, -0.007951736450195312, -0.006600379943847656, -0.0052490234375, -0.0038976669311523438, -0.0025463104248046875, -0.0011949539184570312, 0.000156402587890625, 0.0015077590942382812, 0.0028591156005859375, 0.004210472106933594, 0.00556182861328125, 0.006913185119628906, 0.008264541625976562, 0.009615898132324219, 0.010967254638671875, 0.012318611145019531, 0.013669967651367188, 0.015021324157714844, 0.0163726806640625, 0.017724037170410156, 0.019075393676757812, 0.02042675018310547, 0.021778106689453125, 0.02312946319580078, 0.024480819702148438, 0.025832176208496094, 0.02718353271484375, 0.028534889221191406, 0.029886245727539062, 0.03123760223388672, 0.032588958740234375, 0.03394031524658203, 0.03529167175292969, 0.036643028259277344, 0.037994384765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 12.0, 14.0, 17.0, 24.0, 47.0, 57.0, 134.0, 191.0, 451.0, 1540.0, 26154.0, 4132763.0, 29811.0, 1594.0, 581.0, 307.0, 173.0, 132.0, 73.0, 47.0, 41.0, 28.0, 19.0, 17.0, 18.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.54833984375, -0.5340995788574219, -0.5198593139648438, -0.5056190490722656, -0.4913787841796875, -0.4771385192871094, -0.46289825439453125, -0.4486579895019531, -0.434417724609375, -0.4201774597167969, -0.40593719482421875, -0.3916969299316406, -0.3774566650390625, -0.3632164001464844, -0.34897613525390625, -0.3347358703613281, -0.32049560546875, -0.3062553405761719, -0.29201507568359375, -0.2777748107910156, -0.2635345458984375, -0.24929428100585938, -0.23505401611328125, -0.22081375122070312, -0.206573486328125, -0.19233322143554688, -0.17809295654296875, -0.16385269165039062, -0.1496124267578125, -0.13537216186523438, -0.12113189697265625, -0.10689163208007812, -0.0926513671875, -0.07841110229492188, -0.06417083740234375, -0.049930572509765625, -0.0356903076171875, -0.021450042724609375, -0.00720977783203125, 0.007030487060546875, 0.021270751953125, 0.035511016845703125, 0.04975128173828125, 0.06399154663085938, 0.0782318115234375, 0.09247207641601562, 0.10671234130859375, 0.12095260620117188, 0.13519287109375, 0.14943313598632812, 0.16367340087890625, 0.17791366577148438, 0.1921539306640625, 0.20639419555664062, 0.22063446044921875, 0.23487472534179688, 0.249114990234375, 0.2633552551269531, 0.27759552001953125, 0.2918357849121094, 0.3060760498046875, 0.3203163146972656, 0.33455657958984375, 0.3487968444824219, 0.363037109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 15.0, 28.0, 71.0, 292.0, 2157.0, 1221.0, 199.0, 59.0, 26.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1842041015625, -0.17178916931152344, -0.15937423706054688, -0.1469593048095703, -0.13454437255859375, -0.12212944030761719, -0.10971450805664062, -0.09729957580566406, -0.0848846435546875, -0.07246971130371094, -0.060054779052734375, -0.04763984680175781, -0.03522491455078125, -0.022809982299804688, -0.010395050048828125, 0.0020198822021484375, 0.014434814453125, 0.026849746704101562, 0.039264678955078125, 0.05167961120605469, 0.06409454345703125, 0.07650947570800781, 0.08892440795898438, 0.10133934020996094, 0.1137542724609375, 0.12616920471191406, 0.13858413696289062, 0.1509990692138672, 0.16341400146484375, 0.1758289337158203, 0.18824386596679688, 0.20065879821777344, 0.21307373046875, 0.22548866271972656, 0.23790359497070312, 0.2503185272216797, 0.26273345947265625, 0.2751483917236328, 0.2875633239746094, 0.29997825622558594, 0.3123931884765625, 0.32480812072753906, 0.3372230529785156, 0.3496379852294922, 0.36205291748046875, 0.3744678497314453, 0.3868827819824219, 0.39929771423339844, 0.411712646484375, 0.42412757873535156, 0.4365425109863281, 0.4489574432373047, 0.46137237548828125, 0.4737873077392578, 0.4862022399902344, 0.49861717224121094, 0.5110321044921875, 0.5234470367431641, 0.5358619689941406, 0.5482769012451172, 0.5606918334960938, 0.5731067657470703, 0.5855216979980469, 0.5979366302490234, 0.6103515625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 8.0, 7.0, 26.0, 85.0, 274.0, 352.0, 149.0, 53.0, 21.0, 11.0, 4.0, 8.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.9749236106872559, -0.8777990937232971, -0.7806745767593384, -0.6835501194000244, -0.5864255428314209, -0.48930105566978455, -0.3921765685081482, -0.29505205154418945, -0.1979275345802307, -0.10080302506685257, -0.0036785155534744263, 0.09344598650932312, 0.19057050347328186, 0.2876950204372406, 0.38481950759887695, 0.4819440245628357, 0.5790685415267944, 0.6761930584907532, 0.7733175754547119, 0.8704420328140259, 0.9675666093826294, 1.0646910667419434, 1.1618156433105469, 1.2589401006698608, 1.3560645580291748, 1.4531890153884888, 1.5503135919570923, 1.6474380493164062, 1.7445626258850098, 1.8416870832443237, 1.9388115406036377, 2.035936117172241, 2.1330606937408447, 2.2301852703094482, 2.3273096084594727, 2.424434185028076, 2.5215587615966797, 2.618683338165283, 2.7158076763153076, 2.812932252883911, 2.9100568294525146, 3.007181406021118, 3.1043057441711426, 3.201430320739746, 3.2985548973083496, 3.395679473876953, 3.4928038120269775, 3.589928388595581, 3.6870527267456055, 3.784177303314209, 3.8813016414642334, 3.978426218032837, 4.075550556182861, 4.172675132751465, 4.269799709320068, 4.366924285888672, 4.464048862457275, 4.561173439025879, 4.658298015594482, 4.755422592163086, 4.852546691894531, 4.949671268463135, 5.046795845031738, 5.143920421600342, 5.241044998168945]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 10.0, 13.0, 10.0, 19.0, 30.0, 34.0, 36.0, 51.0, 58.0, 66.0, 55.0, 67.0, 75.0, 49.0, 66.0, 62.0, 67.0, 43.0, 34.0, 45.0, 32.0, 17.0, 14.0, 4.0, 11.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.022066593170166, -0.9856069087982178, -0.9491471648216248, -0.9126874804496765, -0.8762277364730835, -0.8397680521011353, -0.803308367729187, -0.766848623752594, -0.730388879776001, -0.6939291954040527, -0.6574694514274597, -0.6210097670555115, -0.5845500230789185, -0.5480903387069702, -0.511630654335022, -0.47517091035842896, -0.4387112259864807, -0.4022515118122101, -0.36579179763793945, -0.3293321132659912, -0.2928723692893982, -0.25641268491744995, -0.21995297074317932, -0.1834932565689087, -0.14703354239463806, -0.11057382822036743, -0.0741141214966774, -0.037654414772987366, -0.0011947005987167358, 0.035265013575553894, 0.07172471284866333, 0.10818442702293396, 0.1446441411972046, 0.18110385537147522, 0.21756356954574585, 0.2540232539176941, 0.2904829978942871, 0.32694268226623535, 0.363402396440506, 0.3998621106147766, 0.43632182478904724, 0.47278153896331787, 0.5092412233352661, 0.5457009673118591, 0.5821606516838074, 0.6186203956604004, 0.6550800800323486, 0.6915397644042969, 0.7279995083808899, 0.7644591927528381, 0.8009189367294312, 0.8373786211013794, 0.8738383650779724, 0.9102980494499207, 0.9467577934265137, 0.9832174777984619, 1.0196771621704102, 1.0561368465423584, 1.0925965309143066, 1.1290563344955444, 1.1655160188674927, 1.201975703239441, 1.2384353876113892, 1.274895191192627, 1.3113548755645752]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 14.0, 24.0, 30.0, 34.0, 51.0, 74.0, 139.0, 170.0, 245.0, 371.0, 583.0, 881.0, 1301.0, 2090.0, 3519.0, 5711.0, 9848.0, 17472.0, 32538.0, 62875.0, 125397.0, 219756.0, 243377.0, 153110.0, 78331.0, 40050.0, 21236.0, 11583.0, 6685.0, 4039.0, 2479.0, 1559.0, 989.0, 666.0, 407.0, 257.0, 203.0, 128.0, 87.0, 69.0, 51.0, 42.0, 25.0, 14.0, 10.0, 7.0, 6.0, 7.0, 3.0, 7.0], "bins": [-0.06011962890625, -0.0584568977355957, -0.056794166564941406, -0.05513143539428711, -0.05346870422363281, -0.051805973052978516, -0.05014324188232422, -0.04848051071166992, -0.046817779541015625, -0.04515504837036133, -0.04349231719970703, -0.041829586029052734, -0.04016685485839844, -0.03850412368774414, -0.036841392517089844, -0.03517866134643555, -0.03351593017578125, -0.03185319900512695, -0.030190467834472656, -0.02852773666381836, -0.026865005493164062, -0.025202274322509766, -0.02353954315185547, -0.021876811981201172, -0.020214080810546875, -0.018551349639892578, -0.01688861846923828, -0.015225887298583984, -0.013563156127929688, -0.01190042495727539, -0.010237693786621094, -0.008574962615966797, -0.0069122314453125, -0.005249500274658203, -0.0035867691040039062, -0.0019240379333496094, -0.0002613067626953125, 0.0014014244079589844, 0.0030641555786132812, 0.004726886749267578, 0.006389617919921875, 0.008052349090576172, 0.009715080261230469, 0.011377811431884766, 0.013040542602539062, 0.01470327377319336, 0.016366004943847656, 0.018028736114501953, 0.01969146728515625, 0.021354198455810547, 0.023016929626464844, 0.02467966079711914, 0.026342391967773438, 0.028005123138427734, 0.02966785430908203, 0.03133058547973633, 0.032993316650390625, 0.03465604782104492, 0.03631877899169922, 0.037981510162353516, 0.03964424133300781, 0.04130697250366211, 0.042969703674316406, 0.0446324348449707, 0.046295166015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 7.0, 7.0, 16.0, 17.0, 17.0, 23.0, 24.0, 30.0, 32.0, 38.0, 38.0, 47.0, 38.0, 72.0, 52.0, 42.0, 70.0, 50.0, 52.0, 41.0, 33.0, 32.0, 39.0, 29.0, 34.0, 24.0, 17.0, 8.0, 11.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04779052734375, -0.04621696472167969, -0.044643402099609375, -0.04306983947753906, -0.04149627685546875, -0.03992271423339844, -0.038349151611328125, -0.03677558898925781, -0.0352020263671875, -0.03362846374511719, -0.032054901123046875, -0.030481338500976562, -0.02890777587890625, -0.027334213256835938, -0.025760650634765625, -0.024187088012695312, -0.022613525390625, -0.021039962768554688, -0.019466400146484375, -0.017892837524414062, -0.01631927490234375, -0.014745712280273438, -0.013172149658203125, -0.011598587036132812, -0.0100250244140625, -0.008451461791992188, -0.006877899169921875, -0.0053043365478515625, -0.00373077392578125, -0.0021572113037109375, -0.000583648681640625, 0.0009899139404296875, 0.0025634765625, 0.0041370391845703125, 0.005710601806640625, 0.0072841644287109375, 0.00885772705078125, 0.010431289672851562, 0.012004852294921875, 0.013578414916992188, 0.0151519775390625, 0.016725540161132812, 0.018299102783203125, 0.019872665405273438, 0.02144622802734375, 0.023019790649414062, 0.024593353271484375, 0.026166915893554688, 0.027740478515625, 0.029314041137695312, 0.030887603759765625, 0.03246116638183594, 0.03403472900390625, 0.03560829162597656, 0.037181854248046875, 0.03875541687011719, 0.0403289794921875, 0.04190254211425781, 0.043476104736328125, 0.04504966735839844, 0.04662322998046875, 0.04819679260253906, 0.049770355224609375, 0.05134391784667969, 0.05291748046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 7.0, 7.0, 13.0, 17.0, 13.0, 23.0, 46.0, 53.0, 98.0, 117.0, 232.0, 388.0, 714.0, 1402.0, 3267.0, 9575.0, 40263.0, 287966.0, 615909.0, 66780.0, 13517.0, 4424.0, 1741.0, 851.0, 455.0, 240.0, 149.0, 89.0, 60.0, 43.0, 19.0, 14.0, 15.0, 13.0, 6.0, 5.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15673828125, -0.15096282958984375, -0.1451873779296875, -0.13941192626953125, -0.133636474609375, -0.12786102294921875, -0.1220855712890625, -0.11631011962890625, -0.11053466796875, -0.10475921630859375, -0.0989837646484375, -0.09320831298828125, -0.087432861328125, -0.08165740966796875, -0.0758819580078125, -0.07010650634765625, -0.0643310546875, -0.05855560302734375, -0.0527801513671875, -0.04700469970703125, -0.041229248046875, -0.03545379638671875, -0.0296783447265625, -0.02390289306640625, -0.01812744140625, -0.01235198974609375, -0.0065765380859375, -0.00080108642578125, 0.004974365234375, 0.01074981689453125, 0.0165252685546875, 0.02230072021484375, 0.028076171875, 0.03385162353515625, 0.0396270751953125, 0.04540252685546875, 0.051177978515625, 0.05695343017578125, 0.0627288818359375, 0.06850433349609375, 0.07427978515625, 0.08005523681640625, 0.0858306884765625, 0.09160614013671875, 0.097381591796875, 0.10315704345703125, 0.1089324951171875, 0.11470794677734375, 0.1204833984375, 0.12625885009765625, 0.1320343017578125, 0.13780975341796875, 0.143585205078125, 0.14936065673828125, 0.1551361083984375, 0.16091156005859375, 0.16668701171875, 0.17246246337890625, 0.1782379150390625, 0.18401336669921875, 0.189788818359375, 0.19556427001953125, 0.2013397216796875, 0.20711517333984375, 0.212890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 13.0, 9.0, 19.0, 12.0, 31.0, 28.0, 25.0, 44.0, 54.0, 49.0, 49.0, 63.0, 53.0, 63.0, 55.0, 58.0, 54.0, 52.0, 33.0, 36.0, 37.0, 27.0, 17.0, 29.0, 12.0, 12.0, 6.0, 12.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.3013038635253906, -0.29279327392578125, -0.2842826843261719, -0.2757720947265625, -0.2672615051269531, -0.25875091552734375, -0.2502403259277344, -0.241729736328125, -0.23321914672851562, -0.22470855712890625, -0.21619796752929688, -0.2076873779296875, -0.19917678833007812, -0.19066619873046875, -0.18215560913085938, -0.17364501953125, -0.16513442993164062, -0.15662384033203125, -0.14811325073242188, -0.1396026611328125, -0.13109207153320312, -0.12258148193359375, -0.11407089233398438, -0.105560302734375, -0.09704971313476562, -0.08853912353515625, -0.08002853393554688, -0.0715179443359375, -0.06300735473632812, -0.05449676513671875, -0.045986175537109375, -0.0374755859375, -0.028964996337890625, -0.02045440673828125, -0.011943817138671875, -0.0034332275390625, 0.005077362060546875, 0.01358795166015625, 0.022098541259765625, 0.030609130859375, 0.039119720458984375, 0.04763031005859375, 0.056140899658203125, 0.0646514892578125, 0.07316207885742188, 0.08167266845703125, 0.09018325805664062, 0.09869384765625, 0.10720443725585938, 0.11571502685546875, 0.12422561645507812, 0.1327362060546875, 0.14124679565429688, 0.14975738525390625, 0.15826797485351562, 0.166778564453125, 0.17528915405273438, 0.18379974365234375, 0.19231033325195312, 0.2008209228515625, 0.20933151245117188, 0.21784210205078125, 0.22635269165039062, 0.23486328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 5.0, 15.0, 26.0, 32.0, 33.0, 64.0, 89.0, 127.0, 166.0, 248.0, 337.0, 503.0, 746.0, 1116.0, 1791.0, 2950.0, 4900.0, 8797.0, 16624.0, 34219.0, 83221.0, 266627.0, 454842.0, 92675.0, 37340.0, 17666.0, 9531.0, 5294.0, 2948.0, 1860.0, 1217.0, 786.0, 534.0, 351.0, 264.0, 178.0, 128.0, 83.0, 48.0, 42.0, 26.0, 34.0, 19.0, 15.0, 12.0, 10.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.045928955078125, -0.04449605941772461, -0.04306316375732422, -0.04163026809692383, -0.04019737243652344, -0.03876447677612305, -0.037331581115722656, -0.035898685455322266, -0.034465789794921875, -0.033032894134521484, -0.031599998474121094, -0.030167102813720703, -0.028734207153320312, -0.027301311492919922, -0.02586841583251953, -0.02443552017211914, -0.02300262451171875, -0.02156972885131836, -0.02013683319091797, -0.018703937530517578, -0.017271041870117188, -0.015838146209716797, -0.014405250549316406, -0.012972354888916016, -0.011539459228515625, -0.010106563568115234, -0.008673667907714844, -0.007240772247314453, -0.0058078765869140625, -0.004374980926513672, -0.0029420852661132812, -0.0015091896057128906, -7.62939453125e-05, 0.0013566017150878906, 0.0027894973754882812, 0.004222393035888672, 0.0056552886962890625, 0.007088184356689453, 0.008521080017089844, 0.009953975677490234, 0.011386871337890625, 0.012819766998291016, 0.014252662658691406, 0.015685558319091797, 0.017118453979492188, 0.018551349639892578, 0.01998424530029297, 0.02141714096069336, 0.02285003662109375, 0.02428293228149414, 0.02571582794189453, 0.027148723602294922, 0.028581619262695312, 0.030014514923095703, 0.031447410583496094, 0.032880306243896484, 0.034313201904296875, 0.035746097564697266, 0.037178993225097656, 0.03861188888549805, 0.04004478454589844, 0.04147768020629883, 0.04291057586669922, 0.04434347152709961, 0.0457763671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 15.0, 18.0, 22.0, 34.0, 70.0, 102.0, 174.0, 234.0, 141.0, 63.0, 41.0, 25.0, 20.0, 9.0, 4.0, 3.0, 1.0, 5.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.657838821411133e-05, -6.491877138614655e-05, -6.325915455818176e-05, -6.159953773021698e-05, -5.99399209022522e-05, -5.8280304074287415e-05, -5.662068724632263e-05, -5.496107041835785e-05, -5.3301453590393066e-05, -5.1641836762428284e-05, -4.99822199344635e-05, -4.832260310649872e-05, -4.6662986278533936e-05, -4.500336945056915e-05, -4.334375262260437e-05, -4.168413579463959e-05, -4.0024518966674805e-05, -3.836490213871002e-05, -3.670528531074524e-05, -3.5045668482780457e-05, -3.3386051654815674e-05, -3.172643482685089e-05, -3.006681799888611e-05, -2.8407201170921326e-05, -2.6747584342956543e-05, -2.508796751499176e-05, -2.3428350687026978e-05, -2.1768733859062195e-05, -2.0109117031097412e-05, -1.844950020313263e-05, -1.6789883375167847e-05, -1.5130266547203064e-05, -1.3470649719238281e-05, -1.1811032891273499e-05, -1.0151416063308716e-05, -8.491799235343933e-06, -6.83218240737915e-06, -5.172565579414368e-06, -3.512948751449585e-06, -1.8533319234848022e-06, -1.9371509552001953e-07, 1.4659017324447632e-06, 3.125518560409546e-06, 4.785135388374329e-06, 6.444752216339111e-06, 8.104369044303894e-06, 9.763985872268677e-06, 1.142360270023346e-05, 1.3083219528198242e-05, 1.4742836356163025e-05, 1.6402453184127808e-05, 1.806207001209259e-05, 1.9721686840057373e-05, 2.1381303668022156e-05, 2.304092049598694e-05, 2.470053732395172e-05, 2.6360154151916504e-05, 2.8019770979881287e-05, 2.967938780784607e-05, 3.133900463581085e-05, 3.2998621463775635e-05, 3.465823829174042e-05, 3.63178551197052e-05, 3.797747194766998e-05, 3.9637088775634766e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 7.0, 13.0, 19.0, 12.0, 31.0, 46.0, 72.0, 121.0, 220.0, 396.0, 657.0, 1248.0, 2518.0, 5274.0, 11772.0, 27351.0, 73151.0, 249183.0, 511923.0, 100808.0, 35879.0, 14841.0, 6400.0, 3120.0, 1570.0, 814.0, 441.0, 247.0, 124.0, 97.0, 67.0, 41.0, 24.0, 16.0, 12.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04766845703125, -0.0459747314453125, -0.044281005859375, -0.0425872802734375, -0.0408935546875, -0.0391998291015625, -0.037506103515625, -0.0358123779296875, -0.03411865234375, -0.0324249267578125, -0.030731201171875, -0.0290374755859375, -0.02734375, -0.0256500244140625, -0.023956298828125, -0.0222625732421875, -0.02056884765625, -0.0188751220703125, -0.017181396484375, -0.0154876708984375, -0.0137939453125, -0.0121002197265625, -0.010406494140625, -0.0087127685546875, -0.00701904296875, -0.0053253173828125, -0.003631591796875, -0.0019378662109375, -0.000244140625, 0.0014495849609375, 0.003143310546875, 0.0048370361328125, 0.00653076171875, 0.0082244873046875, 0.009918212890625, 0.0116119384765625, 0.0133056640625, 0.0149993896484375, 0.016693115234375, 0.0183868408203125, 0.02008056640625, 0.0217742919921875, 0.023468017578125, 0.0251617431640625, 0.02685546875, 0.0285491943359375, 0.030242919921875, 0.0319366455078125, 0.03363037109375, 0.0353240966796875, 0.037017822265625, 0.0387115478515625, 0.0404052734375, 0.0420989990234375, 0.043792724609375, 0.0454864501953125, 0.04718017578125, 0.0488739013671875, 0.050567626953125, 0.0522613525390625, 0.053955078125, 0.0556488037109375, 0.057342529296875, 0.0590362548828125, 0.06072998046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 6.0, 5.0, 2.0, 7.0, 10.0, 15.0, 23.0, 18.0, 18.0, 29.0, 34.0, 44.0, 42.0, 64.0, 83.0, 80.0, 83.0, 83.0, 53.0, 60.0, 44.0, 31.0, 27.0, 25.0, 15.0, 13.0, 16.0, 6.0, 4.0, 12.0, 10.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.05828857421875, -0.05665779113769531, -0.055027008056640625, -0.05339622497558594, -0.05176544189453125, -0.05013465881347656, -0.048503875732421875, -0.04687309265136719, -0.0452423095703125, -0.04361152648925781, -0.041980743408203125, -0.04034996032714844, -0.03871917724609375, -0.03708839416503906, -0.035457611083984375, -0.03382682800292969, -0.032196044921875, -0.030565261840820312, -0.028934478759765625, -0.027303695678710938, -0.02567291259765625, -0.024042129516601562, -0.022411346435546875, -0.020780563354492188, -0.0191497802734375, -0.017518997192382812, -0.015888214111328125, -0.014257431030273438, -0.01262664794921875, -0.010995864868164062, -0.009365081787109375, -0.0077342987060546875, -0.006103515625, -0.0044727325439453125, -0.002841949462890625, -0.0012111663818359375, 0.00041961669921875, 0.0020503997802734375, 0.003681182861328125, 0.0053119659423828125, 0.0069427490234375, 0.008573532104492188, 0.010204315185546875, 0.011835098266601562, 0.01346588134765625, 0.015096664428710938, 0.016727447509765625, 0.018358230590820312, 0.019989013671875, 0.021619796752929688, 0.023250579833984375, 0.024881362915039062, 0.02651214599609375, 0.028142929077148438, 0.029773712158203125, 0.03140449523925781, 0.0330352783203125, 0.03466606140136719, 0.036296844482421875, 0.03792762756347656, 0.03955841064453125, 0.04118919372558594, 0.042819976806640625, 0.04445075988769531, 0.04608154296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 8.0, 8.0, 20.0, 63.0, 146.0, 363.0, 222.0, 97.0, 41.0, 13.0, 11.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.823944330215454, -3.7423255443573, -3.6607067584991455, -3.579087972640991, -3.497468948364258, -3.4158501625061035, -3.334231376647949, -3.252612590789795, -3.1709938049316406, -3.0893750190734863, -3.007756233215332, -2.9261374473571777, -2.8445186614990234, -2.76289963722229, -2.6812808513641357, -2.5996620655059814, -2.518043279647827, -2.436424493789673, -2.3548057079315186, -2.2731869220733643, -2.191567897796631, -2.1099491119384766, -2.0283303260803223, -1.946711540222168, -1.8650927543640137, -1.7834739685058594, -1.701855182647705, -1.6202362775802612, -1.538617491722107, -1.4569987058639526, -1.3753798007965088, -1.2937610149383545, -1.212141990661621, -1.1305232048034668, -1.0489044189453125, -0.9672855138778687, -0.8856667280197144, -0.8040479421615601, -0.722429096698761, -0.6408102512359619, -0.5591914653778076, -0.47757264971733093, -0.39595383405685425, -0.31433501839637756, -0.23271620273590088, -0.1510973870754242, -0.06947857141494751, 0.012140274047851562, 0.09375905990600586, 0.17537787556648254, 0.25699669122695923, 0.3386155068874359, 0.4202343225479126, 0.5018531084060669, 0.583471953868866, 0.665090799331665, 0.7467095851898193, 0.8283283710479736, 0.9099472165107727, 0.9915660619735718, 1.073184847831726, 1.1548036336898804, 1.2364225387573242, 1.3180413246154785, 1.3996601104736328]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 8.0, 12.0, 14.0, 8.0, 14.0, 17.0, 18.0, 21.0, 31.0, 25.0, 35.0, 40.0, 55.0, 44.0, 72.0, 104.0, 83.0, 61.0, 34.0, 37.0, 35.0, 42.0, 33.0, 27.0, 18.0, 20.0, 16.0, 10.0, 9.0, 8.0, 13.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.386664867401123, -1.3442174196243286, -1.3017699718475342, -1.2593225240707397, -1.2168750762939453, -1.1744277477264404, -1.131980299949646, -1.0895328521728516, -1.0470854043960571, -1.0046379566192627, -0.9621905088424683, -0.9197431206703186, -0.8772956728935242, -0.8348482251167297, -0.7924008369445801, -0.7499533891677856, -0.7075059413909912, -0.6650584936141968, -0.6226110458374023, -0.5801636576652527, -0.5377162098884583, -0.4952687621116638, -0.4528213441371918, -0.4103739261627197, -0.3679264783859253, -0.32547903060913086, -0.2830316126346588, -0.24058417975902557, -0.19813674688339233, -0.1556893140077591, -0.11324188113212585, -0.07079446315765381, -0.028346896171569824, 0.014100536704063416, 0.056547969579696655, 0.0989954024553299, 0.14144283533096313, 0.18389026820659637, 0.22633770108222961, 0.26878511905670166, 0.3112325668334961, 0.3536800146102905, 0.3961274325847626, 0.4385748505592346, 0.48102229833602905, 0.5234697461128235, 0.5659171342849731, 0.6083645820617676, 0.650812029838562, 0.6932594776153564, 0.7357069253921509, 0.7781543135643005, 0.820601761341095, 0.8630492091178894, 0.9054965972900391, 0.9479440450668335, 0.9903914928436279, 1.0328389406204224, 1.0752863883972168, 1.1177338361740112, 1.1601812839508057, 1.2026286125183105, 1.245076060295105, 1.2875235080718994, 1.3299709558486938]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 16.0, 10.0, 11.0, 24.0, 15.0, 32.0, 42.0, 67.0, 74.0, 103.0, 163.0, 274.0, 426.0, 765.0, 1385.0, 2692.0, 5723.0, 14596.0, 49115.0, 271190.0, 2123486.0, 1491596.0, 175402.0, 35544.0, 11668.0, 4691.0, 2175.0, 1155.0, 647.0, 405.0, 228.0, 168.0, 103.0, 78.0, 59.0, 41.0, 30.0, 18.0, 19.0, 8.0, 5.0, 8.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.08587646484375, -0.0833425521850586, -0.08080863952636719, -0.07827472686767578, -0.07574081420898438, -0.07320690155029297, -0.07067298889160156, -0.06813907623291016, -0.06560516357421875, -0.06307125091552734, -0.06053733825683594, -0.05800342559814453, -0.055469512939453125, -0.05293560028076172, -0.05040168762207031, -0.047867774963378906, -0.0453338623046875, -0.042799949645996094, -0.04026603698730469, -0.03773212432861328, -0.035198211669921875, -0.03266429901123047, -0.030130386352539062, -0.027596473693847656, -0.02506256103515625, -0.022528648376464844, -0.019994735717773438, -0.01746082305908203, -0.014926910400390625, -0.012392997741699219, -0.009859085083007812, -0.007325172424316406, -0.004791259765625, -0.0022573471069335938, 0.0002765655517578125, 0.0028104782104492188, 0.005344390869140625, 0.007878303527832031, 0.010412216186523438, 0.012946128845214844, 0.01548004150390625, 0.018013954162597656, 0.020547866821289062, 0.02308177947998047, 0.025615692138671875, 0.02814960479736328, 0.030683517456054688, 0.033217430114746094, 0.0357513427734375, 0.038285255432128906, 0.04081916809082031, 0.04335308074951172, 0.045886993408203125, 0.04842090606689453, 0.05095481872558594, 0.053488731384277344, 0.05602264404296875, 0.058556556701660156, 0.06109046936035156, 0.06362438201904297, 0.06615829467773438, 0.06869220733642578, 0.07122611999511719, 0.0737600326538086, 0.0762939453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 5.0, 10.0, 14.0, 18.0, 18.0, 18.0, 35.0, 31.0, 46.0, 49.0, 54.0, 70.0, 65.0, 71.0, 72.0, 56.0, 60.0, 61.0, 47.0, 26.0, 24.0, 28.0, 16.0, 16.0, 16.0, 17.0, 12.0, 6.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0616455078125, -0.059569358825683594, -0.05749320983886719, -0.05541706085205078, -0.053340911865234375, -0.05126476287841797, -0.04918861389160156, -0.047112464904785156, -0.04503631591796875, -0.042960166931152344, -0.04088401794433594, -0.03880786895751953, -0.036731719970703125, -0.03465557098388672, -0.03257942199707031, -0.030503273010253906, -0.0284271240234375, -0.026350975036621094, -0.024274826049804688, -0.02219867706298828, -0.020122528076171875, -0.01804637908935547, -0.015970230102539062, -0.013894081115722656, -0.01181793212890625, -0.009741783142089844, -0.0076656341552734375, -0.005589485168457031, -0.003513336181640625, -0.0014371871948242188, 0.0006389617919921875, 0.0027151107788085938, 0.004791259765625, 0.006867408752441406, 0.008943557739257812, 0.011019706726074219, 0.013095855712890625, 0.015172004699707031, 0.017248153686523438, 0.019324302673339844, 0.02140045166015625, 0.023476600646972656, 0.025552749633789062, 0.02762889862060547, 0.029705047607421875, 0.03178119659423828, 0.03385734558105469, 0.035933494567871094, 0.0380096435546875, 0.040085792541503906, 0.04216194152832031, 0.04423809051513672, 0.046314239501953125, 0.04839038848876953, 0.05046653747558594, 0.052542686462402344, 0.05461883544921875, 0.056694984436035156, 0.05877113342285156, 0.06084728240966797, 0.06292343139648438, 0.06499958038330078, 0.06707572937011719, 0.0691518783569336, 0.07122802734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 15.0, 40.0, 81.0, 171.0, 413.0, 1360.0, 38408.0, 4143617.0, 8847.0, 827.0, 301.0, 111.0, 53.0, 19.0, 15.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73046875, -0.7085723876953125, -0.686676025390625, -0.6647796630859375, -0.64288330078125, -0.6209869384765625, -0.599090576171875, -0.5771942138671875, -0.5552978515625, -0.5334014892578125, -0.511505126953125, -0.4896087646484375, -0.46771240234375, -0.4458160400390625, -0.423919677734375, -0.4020233154296875, -0.380126953125, -0.3582305908203125, -0.336334228515625, -0.3144378662109375, -0.29254150390625, -0.2706451416015625, -0.248748779296875, -0.2268524169921875, -0.2049560546875, -0.1830596923828125, -0.161163330078125, -0.1392669677734375, -0.11737060546875, -0.0954742431640625, -0.073577880859375, -0.0516815185546875, -0.02978515625, -0.0078887939453125, 0.014007568359375, 0.0359039306640625, 0.05780029296875, 0.0796966552734375, 0.101593017578125, 0.1234893798828125, 0.1453857421875, 0.1672821044921875, 0.189178466796875, 0.2110748291015625, 0.23297119140625, 0.2548675537109375, 0.276763916015625, 0.2986602783203125, 0.320556640625, 0.3424530029296875, 0.364349365234375, 0.3862457275390625, 0.40814208984375, 0.4300384521484375, 0.451934814453125, 0.4738311767578125, 0.4957275390625, 0.5176239013671875, 0.539520263671875, 0.5614166259765625, 0.58331298828125, 0.6052093505859375, 0.627105712890625, 0.6490020751953125, 0.6708984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 11.0, 20.0, 46.0, 90.0, 161.0, 490.0, 1294.0, 1219.0, 424.0, 159.0, 81.0, 32.0, 18.0, 10.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.446044921875, -0.43728160858154297, -0.42851829528808594, -0.4197549819946289, -0.4109916687011719, -0.40222835540771484, -0.3934650421142578, -0.3847017288208008, -0.37593841552734375, -0.3671751022338867, -0.3584117889404297, -0.34964847564697266, -0.3408851623535156, -0.3321218490600586, -0.32335853576660156, -0.31459522247314453, -0.3058319091796875, -0.29706859588623047, -0.28830528259277344, -0.2795419692993164, -0.2707786560058594, -0.26201534271240234, -0.2532520294189453, -0.24448871612548828, -0.23572540283203125, -0.22696208953857422, -0.2181987762451172, -0.20943546295166016, -0.20067214965820312, -0.1919088363647461, -0.18314552307128906, -0.17438220977783203, -0.165618896484375, -0.15685558319091797, -0.14809226989746094, -0.1393289566040039, -0.13056564331054688, -0.12180233001708984, -0.11303901672363281, -0.10427570343017578, -0.09551239013671875, -0.08674907684326172, -0.07798576354980469, -0.06922245025634766, -0.060459136962890625, -0.051695823669433594, -0.04293251037597656, -0.03416919708251953, -0.0254058837890625, -0.01664257049560547, -0.007879257202148438, 0.0008840560913085938, 0.009647369384765625, 0.018410682678222656, 0.027173995971679688, 0.03593730926513672, 0.04470062255859375, 0.05346393585205078, 0.06222724914550781, 0.07099056243896484, 0.07975387573242188, 0.0885171890258789, 0.09728050231933594, 0.10604381561279297, 0.11480712890625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 16.0, 62.0, 155.0, 297.0, 283.0, 100.0, 59.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.645198345184326, -3.5466935634613037, -3.4481890201568604, -3.349684238433838, -3.2511796951293945, -3.152674913406372, -3.0541701316833496, -2.9556655883789062, -2.857161045074463, -2.7586562633514404, -2.660151720046997, -2.5616469383239746, -2.4631423950195312, -2.364637613296509, -2.2661328315734863, -2.167628288269043, -2.0691235065460205, -1.9706188440322876, -1.8721141815185547, -1.7736093997955322, -1.6751048564910889, -1.5766000747680664, -1.4780954122543335, -1.3795907497406006, -1.2810860872268677, -1.1825814247131348, -1.0840767621994019, -0.9855720400810242, -0.8870673775672913, -0.7885627150535583, -0.6900579929351807, -0.5915533304214478, -0.49304890632629395, -0.39454424381256104, -0.29603955149650574, -0.19753485918045044, -0.09903019666671753, -0.0005255341529846191, 0.09797918796539307, 0.19648385047912598, 0.2949885129928589, 0.3934931755065918, 0.4919978678226471, 0.5905025601387024, 0.6890072226524353, 0.7875118851661682, 0.8860166072845459, 0.9845212697982788, 1.0830259323120117, 1.1815305948257446, 1.2800352573394775, 1.3785400390625, 1.4770445823669434, 1.5755493640899658, 1.6740540266036987, 1.7725586891174316, 1.8710633516311646, 1.9695680141448975, 2.06807279586792, 2.1665773391723633, 2.2650821208953857, 2.363586664199829, 2.4620914459228516, 2.560595989227295, 2.6591007709503174]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 11.0, 9.0, 10.0, 17.0, 26.0, 17.0, 41.0, 45.0, 57.0, 69.0, 71.0, 71.0, 64.0, 67.0, 78.0, 68.0, 49.0, 42.0, 33.0, 28.0, 36.0, 22.0, 18.0, 15.0, 14.0, 10.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7372236251831055, -0.7073788046836853, -0.6775339841842651, -0.6476892232894897, -0.6178444027900696, -0.5879995822906494, -0.558154821395874, -0.5283100008964539, -0.4984651803970337, -0.4686203598976135, -0.43877556920051575, -0.40893077850341797, -0.3790859580039978, -0.34924113750457764, -0.31939634680747986, -0.2895515561103821, -0.2597067356109619, -0.22986193001270294, -0.20001712441444397, -0.170172318816185, -0.14032751321792603, -0.11048270761966705, -0.08063790202140808, -0.05079309642314911, -0.020948290824890137, 0.008896514773368835, 0.03874132037162781, 0.06858612596988678, 0.09843093156814575, 0.12827573716640472, 0.1581205427646637, 0.18796534836292267, 0.21781015396118164, 0.2476549595594406, 0.2774997651576996, 0.30734455585479736, 0.33718937635421753, 0.3670341968536377, 0.3968789875507355, 0.42672377824783325, 0.4565685987472534, 0.4864134192466736, 0.5162582397460938, 0.5461030006408691, 0.5759478211402893, 0.6057926416397095, 0.6356374025344849, 0.665482223033905, 0.6953270435333252, 0.7251718640327454, 0.7550166845321655, 0.7848614454269409, 0.8147062659263611, 0.8445510864257812, 0.8743958473205566, 0.9042406678199768, 0.934085488319397, 0.9639303088188171, 0.9937751293182373, 1.0236198902130127, 1.053464651107788, 1.083309531211853, 1.1131542921066284, 1.1429991722106934, 1.1728439331054688]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 11.0, 10.0, 19.0, 22.0, 31.0, 25.0, 45.0, 68.0, 114.0, 160.0, 212.0, 322.0, 527.0, 818.0, 1373.0, 2199.0, 3764.0, 6692.0, 12141.0, 22963.0, 46382.0, 96682.0, 201550.0, 287158.0, 186095.0, 88563.0, 42768.0, 21346.0, 11285.0, 6131.0, 3454.0, 2073.0, 1223.0, 789.0, 502.0, 337.0, 239.0, 129.0, 111.0, 72.0, 43.0, 35.0, 27.0, 16.0, 9.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.06805419921875, -0.06607818603515625, -0.0641021728515625, -0.06212615966796875, -0.060150146484375, -0.05817413330078125, -0.0561981201171875, -0.05422210693359375, -0.05224609375, -0.05027008056640625, -0.0482940673828125, -0.04631805419921875, -0.044342041015625, -0.04236602783203125, -0.0403900146484375, -0.03841400146484375, -0.03643798828125, -0.03446197509765625, -0.0324859619140625, -0.03050994873046875, -0.028533935546875, -0.02655792236328125, -0.0245819091796875, -0.02260589599609375, -0.0206298828125, -0.01865386962890625, -0.0166778564453125, -0.01470184326171875, -0.012725830078125, -0.01074981689453125, -0.0087738037109375, -0.00679779052734375, -0.00482177734375, -0.00284576416015625, -0.0008697509765625, 0.00110626220703125, 0.003082275390625, 0.00505828857421875, 0.0070343017578125, 0.00901031494140625, 0.010986328125, 0.01296234130859375, 0.0149383544921875, 0.01691436767578125, 0.018890380859375, 0.02086639404296875, 0.0228424072265625, 0.02481842041015625, 0.02679443359375, 0.02877044677734375, 0.0307464599609375, 0.03272247314453125, 0.034698486328125, 0.03667449951171875, 0.0386505126953125, 0.04062652587890625, 0.0426025390625, 0.04457855224609375, 0.0465545654296875, 0.04853057861328125, 0.050506591796875, 0.05248260498046875, 0.0544586181640625, 0.05643463134765625, 0.05841064453125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 9.0, 10.0, 12.0, 20.0, 14.0, 26.0, 27.0, 30.0, 32.0, 43.0, 53.0, 71.0, 63.0, 75.0, 70.0, 70.0, 55.0, 47.0, 50.0, 48.0, 26.0, 26.0, 18.0, 33.0, 19.0, 8.0, 5.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0771484375, -0.07466506958007812, -0.07218170166015625, -0.06969833374023438, -0.0672149658203125, -0.06473159790039062, -0.06224822998046875, -0.059764862060546875, -0.057281494140625, -0.054798126220703125, -0.05231475830078125, -0.049831390380859375, -0.0473480224609375, -0.044864654541015625, -0.04238128662109375, -0.039897918701171875, -0.03741455078125, -0.034931182861328125, -0.03244781494140625, -0.029964447021484375, -0.0274810791015625, -0.024997711181640625, -0.02251434326171875, -0.020030975341796875, -0.017547607421875, -0.015064239501953125, -0.01258087158203125, -0.010097503662109375, -0.0076141357421875, -0.005130767822265625, -0.00264739990234375, -0.000164031982421875, 0.0023193359375, 0.004802703857421875, 0.00728607177734375, 0.009769439697265625, 0.0122528076171875, 0.014736175537109375, 0.01721954345703125, 0.019702911376953125, 0.022186279296875, 0.024669647216796875, 0.02715301513671875, 0.029636383056640625, 0.0321197509765625, 0.034603118896484375, 0.03708648681640625, 0.039569854736328125, 0.04205322265625, 0.044536590576171875, 0.04701995849609375, 0.049503326416015625, 0.0519866943359375, 0.054470062255859375, 0.05695343017578125, 0.059436798095703125, 0.061920166015625, 0.06440353393554688, 0.06688690185546875, 0.06937026977539062, 0.0718536376953125, 0.07433700561523438, 0.07682037353515625, 0.07930374145507812, 0.081787109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 4.0, 13.0, 9.0, 21.0, 28.0, 44.0, 66.0, 102.0, 192.0, 356.0, 703.0, 1938.0, 8005.0, 82030.0, 869028.0, 75197.0, 7527.0, 1742.0, 677.0, 343.0, 202.0, 113.0, 75.0, 36.0, 28.0, 15.0, 11.0, 10.0, 9.0, 6.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.35400390625, -0.3437385559082031, -0.33347320556640625, -0.3232078552246094, -0.3129425048828125, -0.3026771545410156, -0.29241180419921875, -0.2821464538574219, -0.271881103515625, -0.2616157531738281, -0.25135040283203125, -0.24108505249023438, -0.2308197021484375, -0.22055435180664062, -0.21028900146484375, -0.20002365112304688, -0.18975830078125, -0.17949295043945312, -0.16922760009765625, -0.15896224975585938, -0.1486968994140625, -0.13843154907226562, -0.12816619873046875, -0.11790084838867188, -0.107635498046875, -0.09737014770507812, -0.08710479736328125, -0.07683944702148438, -0.0665740966796875, -0.056308746337890625, -0.04604339599609375, -0.035778045654296875, -0.0255126953125, -0.015247344970703125, -0.00498199462890625, 0.005283355712890625, 0.0155487060546875, 0.025814056396484375, 0.03607940673828125, 0.046344757080078125, 0.056610107421875, 0.06687545776367188, 0.07714080810546875, 0.08740615844726562, 0.0976715087890625, 0.10793685913085938, 0.11820220947265625, 0.12846755981445312, 0.13873291015625, 0.14899826049804688, 0.15926361083984375, 0.16952896118164062, 0.1797943115234375, 0.19005966186523438, 0.20032501220703125, 0.21059036254882812, 0.220855712890625, 0.23112106323242188, 0.24138641357421875, 0.2516517639160156, 0.2619171142578125, 0.2721824645996094, 0.28244781494140625, 0.2927131652832031, 0.302978515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 15.0, 17.0, 22.0, 15.0, 25.0, 43.0, 42.0, 42.0, 51.0, 64.0, 67.0, 74.0, 80.0, 75.0, 72.0, 57.0, 46.0, 29.0, 27.0, 20.0, 30.0, 17.0, 11.0, 10.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.435546875, -0.42348480224609375, -0.4114227294921875, -0.39936065673828125, -0.387298583984375, -0.37523651123046875, -0.3631744384765625, -0.35111236572265625, -0.33905029296875, -0.32698822021484375, -0.3149261474609375, -0.30286407470703125, -0.290802001953125, -0.27873992919921875, -0.2666778564453125, -0.25461578369140625, -0.2425537109375, -0.23049163818359375, -0.2184295654296875, -0.20636749267578125, -0.194305419921875, -0.18224334716796875, -0.1701812744140625, -0.15811920166015625, -0.14605712890625, -0.13399505615234375, -0.1219329833984375, -0.10987091064453125, -0.097808837890625, -0.08574676513671875, -0.0736846923828125, -0.06162261962890625, -0.049560546875, -0.03749847412109375, -0.0254364013671875, -0.01337432861328125, -0.001312255859375, 0.01074981689453125, 0.0228118896484375, 0.03487396240234375, 0.04693603515625, 0.05899810791015625, 0.0710601806640625, 0.08312225341796875, 0.095184326171875, 0.10724639892578125, 0.1193084716796875, 0.13137054443359375, 0.1434326171875, 0.15549468994140625, 0.1675567626953125, 0.17961883544921875, 0.191680908203125, 0.20374298095703125, 0.2158050537109375, 0.22786712646484375, 0.23992919921875, 0.25199127197265625, 0.2640533447265625, 0.27611541748046875, 0.288177490234375, 0.30023956298828125, 0.3123016357421875, 0.32436370849609375, 0.33642578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 17.0, 15.0, 18.0, 41.0, 59.0, 96.0, 171.0, 338.0, 678.0, 1706.0, 4749.0, 16022.0, 68154.0, 687955.0, 215845.0, 37412.0, 9700.0, 3123.0, 1236.0, 564.0, 260.0, 118.0, 86.0, 59.0, 29.0, 23.0, 18.0, 15.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11236572265625, -0.10947036743164062, -0.10657501220703125, -0.10367965698242188, -0.1007843017578125, -0.09788894653320312, -0.09499359130859375, -0.09209823608398438, -0.089202880859375, -0.08630752563476562, -0.08341217041015625, -0.08051681518554688, -0.0776214599609375, -0.07472610473632812, -0.07183074951171875, -0.06893539428710938, -0.0660400390625, -0.06314468383789062, -0.06024932861328125, -0.057353973388671875, -0.0544586181640625, -0.051563262939453125, -0.04866790771484375, -0.045772552490234375, -0.042877197265625, -0.039981842041015625, -0.03708648681640625, -0.034191131591796875, -0.0312957763671875, -0.028400421142578125, -0.02550506591796875, -0.022609710693359375, -0.01971435546875, -0.016819000244140625, -0.01392364501953125, -0.011028289794921875, -0.0081329345703125, -0.005237579345703125, -0.00234222412109375, 0.000553131103515625, 0.003448486328125, 0.006343841552734375, 0.00923919677734375, 0.012134552001953125, 0.0150299072265625, 0.017925262451171875, 0.02082061767578125, 0.023715972900390625, 0.026611328125, 0.029506683349609375, 0.03240203857421875, 0.035297393798828125, 0.0381927490234375, 0.041088104248046875, 0.04398345947265625, 0.046878814697265625, 0.049774169921875, 0.052669525146484375, 0.05556488037109375, 0.058460235595703125, 0.0613555908203125, 0.06425094604492188, 0.06714630126953125, 0.07004165649414062, 0.07293701171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 8.0, 12.0, 14.0, 17.0, 9.0, 15.0, 29.0, 27.0, 33.0, 48.0, 53.0, 52.0, 100.0, 84.0, 94.0, 82.0, 60.0, 44.0, 32.0, 28.0, 14.0, 28.0, 27.0, 11.0, 12.0, 13.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1636486053466797e-05, -2.095196396112442e-05, -2.0267441868782043e-05, -1.9582919776439667e-05, -1.889839768409729e-05, -1.8213875591754913e-05, -1.7529353499412537e-05, -1.684483140707016e-05, -1.6160309314727783e-05, -1.5475787222385406e-05, -1.479126513004303e-05, -1.4106743037700653e-05, -1.3422220945358276e-05, -1.27376988530159e-05, -1.2053176760673523e-05, -1.1368654668331146e-05, -1.068413257598877e-05, -9.999610483646393e-06, -9.315088391304016e-06, -8.63056629896164e-06, -7.946044206619263e-06, -7.261522114276886e-06, -6.577000021934509e-06, -5.8924779295921326e-06, -5.207955837249756e-06, -4.523433744907379e-06, -3.8389116525650024e-06, -3.1543895602226257e-06, -2.469867467880249e-06, -1.7853453755378723e-06, -1.1008232831954956e-06, -4.163011908531189e-07, 2.682209014892578e-07, 9.527429938316345e-07, 1.6372650861740112e-06, 2.321787178516388e-06, 3.0063092708587646e-06, 3.6908313632011414e-06, 4.375353455543518e-06, 5.059875547885895e-06, 5.7443976402282715e-06, 6.428919732570648e-06, 7.113441824913025e-06, 7.797963917255402e-06, 8.482486009597778e-06, 9.167008101940155e-06, 9.851530194282532e-06, 1.0536052286624908e-05, 1.1220574378967285e-05, 1.1905096471309662e-05, 1.2589618563652039e-05, 1.3274140655994415e-05, 1.3958662748336792e-05, 1.4643184840679169e-05, 1.5327706933021545e-05, 1.6012229025363922e-05, 1.66967511177063e-05, 1.7381273210048676e-05, 1.8065795302391052e-05, 1.875031739473343e-05, 1.9434839487075806e-05, 2.0119361579418182e-05, 2.080388367176056e-05, 2.1488405764102936e-05, 2.2172927856445312e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 17.0, 30.0, 41.0, 52.0, 66.0, 120.0, 194.0, 380.0, 745.0, 1513.0, 4256.0, 13515.0, 51416.0, 284658.0, 600601.0, 65653.0, 16605.0, 5050.0, 1804.0, 808.0, 402.0, 222.0, 141.0, 72.0, 41.0, 42.0, 26.0, 15.0, 10.0, 6.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08233642578125, -0.07977008819580078, -0.07720375061035156, -0.07463741302490234, -0.07207107543945312, -0.0695047378540039, -0.06693840026855469, -0.06437206268310547, -0.06180572509765625, -0.05923938751220703, -0.05667304992675781, -0.054106712341308594, -0.051540374755859375, -0.048974037170410156, -0.04640769958496094, -0.04384136199951172, -0.0412750244140625, -0.03870868682861328, -0.03614234924316406, -0.033576011657714844, -0.031009674072265625, -0.028443336486816406, -0.025876998901367188, -0.02331066131591797, -0.02074432373046875, -0.01817798614501953, -0.015611648559570312, -0.013045310974121094, -0.010478973388671875, -0.007912635803222656, -0.0053462982177734375, -0.0027799606323242188, -0.000213623046875, 0.0023527145385742188, 0.0049190521240234375, 0.007485389709472656, 0.010051727294921875, 0.012618064880371094, 0.015184402465820312, 0.01775074005126953, 0.02031707763671875, 0.02288341522216797, 0.025449752807617188, 0.028016090393066406, 0.030582427978515625, 0.033148765563964844, 0.03571510314941406, 0.03828144073486328, 0.0408477783203125, 0.04341411590576172, 0.04598045349121094, 0.048546791076660156, 0.051113128662109375, 0.053679466247558594, 0.05624580383300781, 0.05881214141845703, 0.06137847900390625, 0.06394481658935547, 0.06651115417480469, 0.0690774917602539, 0.07164382934570312, 0.07421016693115234, 0.07677650451660156, 0.07934284210205078, 0.0819091796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 12.0, 11.0, 16.0, 13.0, 8.0, 21.0, 19.0, 30.0, 36.0, 33.0, 54.0, 61.0, 95.0, 106.0, 87.0, 76.0, 67.0, 39.0, 30.0, 34.0, 14.0, 24.0, 17.0, 11.0, 18.0, 15.0, 6.0, 9.0, 9.0, 4.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07147216796875, -0.0694742202758789, -0.06747627258300781, -0.06547832489013672, -0.06348037719726562, -0.06148242950439453, -0.05948448181152344, -0.057486534118652344, -0.05548858642578125, -0.053490638732910156, -0.05149269104003906, -0.04949474334716797, -0.047496795654296875, -0.04549884796142578, -0.04350090026855469, -0.041502952575683594, -0.0395050048828125, -0.037507057189941406, -0.03550910949707031, -0.03351116180419922, -0.031513214111328125, -0.02951526641845703, -0.027517318725585938, -0.025519371032714844, -0.02352142333984375, -0.021523475646972656, -0.019525527954101562, -0.01752758026123047, -0.015529632568359375, -0.013531684875488281, -0.011533737182617188, -0.009535789489746094, -0.007537841796875, -0.005539894104003906, -0.0035419464111328125, -0.0015439987182617188, 0.000453948974609375, 0.0024518966674804688, 0.0044498443603515625, 0.006447792053222656, 0.00844573974609375, 0.010443687438964844, 0.012441635131835938, 0.014439582824707031, 0.016437530517578125, 0.01843547821044922, 0.020433425903320312, 0.022431373596191406, 0.0244293212890625, 0.026427268981933594, 0.028425216674804688, 0.03042316436767578, 0.032421112060546875, 0.03441905975341797, 0.03641700744628906, 0.038414955139160156, 0.04041290283203125, 0.042410850524902344, 0.04440879821777344, 0.04640674591064453, 0.048404693603515625, 0.05040264129638672, 0.05240058898925781, 0.054398536682128906, 0.056396484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 10.0, 12.0, 30.0, 84.0, 150.0, 417.0, 176.0, 74.0, 26.0, 11.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.353379726409912, -3.2638556957244873, -3.1743316650390625, -3.0848076343536377, -2.995283603668213, -2.905759334564209, -2.816235303878784, -2.7267112731933594, -2.6371872425079346, -2.5476632118225098, -2.458139181137085, -2.36861515045166, -2.2790908813476562, -2.1895668506622314, -2.1000428199768066, -2.010518789291382, -1.920994758605957, -1.8314707279205322, -1.7419466972351074, -1.652422547340393, -1.5628985166549683, -1.4733744859695435, -1.383850336074829, -1.2943263053894043, -1.2048022747039795, -1.1152782440185547, -1.0257542133331299, -0.9362300634384155, -0.8467060327529907, -0.7571820020675659, -0.6676579117774963, -0.5781338214874268, -0.48861002922058105, -0.39908596873283386, -0.30956190824508667, -0.22003784775733948, -0.13051378726959229, -0.04098972678184509, 0.0485343337059021, 0.13805842399597168, 0.22758245468139648, 0.3171065151691437, 0.40663057565689087, 0.49615463614463806, 0.5856786966323853, 0.6752027273178101, 0.7647268176078796, 0.8542509078979492, 0.943774938583374, 1.0332989692687988, 1.1228229999542236, 1.212347149848938, 1.3018711805343628, 1.3913952112197876, 1.480919361114502, 1.5704433917999268, 1.6599674224853516, 1.7494914531707764, 1.8390154838562012, 1.9285396337509155, 2.018063545227051, 2.1075878143310547, 2.1971118450164795, 2.2866358757019043, 2.376159906387329]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 10.0, 14.0, 16.0, 15.0, 16.0, 16.0, 22.0, 31.0, 28.0, 25.0, 35.0, 38.0, 61.0, 101.0, 151.0, 62.0, 43.0, 39.0, 29.0, 28.0, 32.0, 26.0, 22.0, 14.0, 17.0, 11.0, 9.0, 14.0, 12.0, 5.0, 4.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5542035102844238, -1.50739586353302, -1.4605882167816162, -1.4137805700302124, -1.3669729232788086, -1.3201653957366943, -1.2733577489852905, -1.2265501022338867, -1.179742455482483, -1.132934808731079, -1.0861271619796753, -1.0393195152282715, -0.9925119280815125, -0.9457042813301086, -0.8988966941833496, -0.8520890474319458, -0.805281400680542, -0.7584737539291382, -0.7116661071777344, -0.6648585200309753, -0.6180508732795715, -0.5712432265281677, -0.5244356393814087, -0.4776279926300049, -0.4308203458786011, -0.38401269912719727, -0.33720508217811584, -0.2903974652290344, -0.24358981847763062, -0.196782186627388, -0.14997455477714539, -0.10316693782806396, -0.056359291076660156, -0.009551659226417542, 0.03725597262382507, 0.08406360447406769, 0.1308712363243103, 0.17767886817455292, 0.22448650002479553, 0.27129411697387695, 0.31810176372528076, 0.36490941047668457, 0.411717027425766, 0.4585246443748474, 0.5053322911262512, 0.552139937877655, 0.5989475250244141, 0.6457551717758179, 0.6925628185272217, 0.7393704652786255, 0.7861781120300293, 0.8329856991767883, 0.8797933459281921, 0.926600992679596, 0.973408579826355, 1.0202162265777588, 1.0670238733291626, 1.1138315200805664, 1.1606391668319702, 1.207446813583374, 1.2542543411254883, 1.301061987876892, 1.347869634628296, 1.3946772813796997, 1.4414849281311035]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 3.0, 3.0, 12.0, 19.0, 15.0, 19.0, 32.0, 47.0, 64.0, 91.0, 138.0, 213.0, 326.0, 525.0, 947.0, 1678.0, 3299.0, 7153.0, 19055.0, 79091.0, 613322.0, 2649574.0, 689300.0, 91295.0, 22190.0, 8061.0, 3550.0, 1784.0, 986.0, 567.0, 348.0, 190.0, 133.0, 87.0, 51.0, 37.0, 30.0, 15.0, 12.0, 11.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09063720703125, -0.08766841888427734, -0.08469963073730469, -0.08173084259033203, -0.07876205444335938, -0.07579326629638672, -0.07282447814941406, -0.0698556900024414, -0.06688690185546875, -0.0639181137084961, -0.06094932556152344, -0.05798053741455078, -0.055011749267578125, -0.05204296112060547, -0.04907417297363281, -0.046105384826660156, -0.0431365966796875, -0.040167808532714844, -0.03719902038574219, -0.03423023223876953, -0.031261444091796875, -0.02829265594482422, -0.025323867797851562, -0.022355079650878906, -0.01938629150390625, -0.016417503356933594, -0.013448715209960938, -0.010479927062988281, -0.007511138916015625, -0.004542350769042969, -0.0015735626220703125, 0.0013952255249023438, 0.004364013671875, 0.007332801818847656, 0.010301589965820312, 0.013270378112792969, 0.016239166259765625, 0.01920795440673828, 0.022176742553710938, 0.025145530700683594, 0.02811431884765625, 0.031083106994628906, 0.03405189514160156, 0.03702068328857422, 0.039989471435546875, 0.04295825958251953, 0.04592704772949219, 0.048895835876464844, 0.0518646240234375, 0.054833412170410156, 0.05780220031738281, 0.06077098846435547, 0.06373977661132812, 0.06670856475830078, 0.06967735290527344, 0.0726461410522461, 0.07561492919921875, 0.0785837173461914, 0.08155250549316406, 0.08452129364013672, 0.08749008178710938, 0.09045886993408203, 0.09342765808105469, 0.09639644622802734, 0.099365234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 11.0, 12.0, 18.0, 24.0, 25.0, 33.0, 40.0, 30.0, 60.0, 54.0, 65.0, 58.0, 69.0, 73.0, 62.0, 64.0, 53.0, 37.0, 39.0, 28.0, 17.0, 24.0, 29.0, 13.0, 14.0, 8.0, 8.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.09417724609375, -0.09191226959228516, -0.08964729309082031, -0.08738231658935547, -0.08511734008789062, -0.08285236358642578, -0.08058738708496094, -0.0783224105834961, -0.07605743408203125, -0.0737924575805664, -0.07152748107910156, -0.06926250457763672, -0.06699752807617188, -0.06473255157470703, -0.06246757507324219, -0.060202598571777344, -0.0579376220703125, -0.055672645568847656, -0.05340766906738281, -0.05114269256591797, -0.048877716064453125, -0.04661273956298828, -0.04434776306152344, -0.042082786560058594, -0.03981781005859375, -0.037552833557128906, -0.03528785705566406, -0.03302288055419922, -0.030757904052734375, -0.02849292755126953, -0.026227951049804688, -0.023962974548339844, -0.021697998046875, -0.019433021545410156, -0.017168045043945312, -0.014903068542480469, -0.012638092041015625, -0.010373115539550781, -0.008108139038085938, -0.005843162536621094, -0.00357818603515625, -0.0013132095336914062, 0.0009517669677734375, 0.0032167434692382812, 0.005481719970703125, 0.007746696472167969, 0.010011672973632812, 0.012276649475097656, 0.0145416259765625, 0.016806602478027344, 0.019071578979492188, 0.02133655548095703, 0.023601531982421875, 0.02586650848388672, 0.028131484985351562, 0.030396461486816406, 0.03266143798828125, 0.034926414489746094, 0.03719139099121094, 0.03945636749267578, 0.041721343994140625, 0.04398632049560547, 0.04625129699707031, 0.048516273498535156, 0.05078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 13.0, 20.0, 35.0, 92.0, 264.0, 546.0, 1278.0, 5887.0, 1076354.0, 3099489.0, 7831.0, 1401.0, 568.0, 276.0, 122.0, 43.0, 26.0, 11.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.55126953125, -0.5335159301757812, -0.5157623291015625, -0.49800872802734375, -0.480255126953125, -0.46250152587890625, -0.4447479248046875, -0.42699432373046875, -0.40924072265625, -0.39148712158203125, -0.3737335205078125, -0.35597991943359375, -0.338226318359375, -0.32047271728515625, -0.3027191162109375, -0.28496551513671875, -0.2672119140625, -0.24945831298828125, -0.2317047119140625, -0.21395111083984375, -0.196197509765625, -0.17844390869140625, -0.1606903076171875, -0.14293670654296875, -0.12518310546875, -0.10742950439453125, -0.0896759033203125, -0.07192230224609375, -0.054168701171875, -0.03641510009765625, -0.0186614990234375, -0.00090789794921875, 0.016845703125, 0.03459930419921875, 0.0523529052734375, 0.07010650634765625, 0.087860107421875, 0.10561370849609375, 0.1233673095703125, 0.14112091064453125, 0.15887451171875, 0.17662811279296875, 0.1943817138671875, 0.21213531494140625, 0.229888916015625, 0.24764251708984375, 0.2653961181640625, 0.28314971923828125, 0.3009033203125, 0.31865692138671875, 0.3364105224609375, 0.35416412353515625, 0.371917724609375, 0.38967132568359375, 0.4074249267578125, 0.42517852783203125, 0.44293212890625, 0.46068572998046875, 0.4784393310546875, 0.49619293212890625, 0.513946533203125, 0.5317001342773438, 0.5494537353515625, 0.5672073364257812, 0.5849609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 9.0, 25.0, 38.0, 60.0, 170.0, 476.0, 1430.0, 1217.0, 354.0, 152.0, 67.0, 37.0, 13.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416259765625, -0.40433502197265625, -0.3924102783203125, -0.38048553466796875, -0.368560791015625, -0.35663604736328125, -0.3447113037109375, -0.33278656005859375, -0.32086181640625, -0.30893707275390625, -0.2970123291015625, -0.28508758544921875, -0.273162841796875, -0.26123809814453125, -0.2493133544921875, -0.23738861083984375, -0.2254638671875, -0.21353912353515625, -0.2016143798828125, -0.18968963623046875, -0.177764892578125, -0.16584014892578125, -0.1539154052734375, -0.14199066162109375, -0.13006591796875, -0.11814117431640625, -0.1062164306640625, -0.09429168701171875, -0.082366943359375, -0.07044219970703125, -0.0585174560546875, -0.04659271240234375, -0.03466796875, -0.02274322509765625, -0.0108184814453125, 0.00110626220703125, 0.013031005859375, 0.02495574951171875, 0.0368804931640625, 0.04880523681640625, 0.06072998046875, 0.07265472412109375, 0.0845794677734375, 0.09650421142578125, 0.108428955078125, 0.12035369873046875, 0.1322784423828125, 0.14420318603515625, 0.1561279296875, 0.16805267333984375, 0.1799774169921875, 0.19190216064453125, 0.203826904296875, 0.21575164794921875, 0.2276763916015625, 0.23960113525390625, 0.25152587890625, 0.26345062255859375, 0.2753753662109375, 0.28730010986328125, 0.299224853515625, 0.31114959716796875, 0.3230743408203125, 0.33499908447265625, 0.346923828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 16.0, 25.0, 44.0, 57.0, 137.0, 201.0, 183.0, 154.0, 71.0, 40.0, 20.0, 10.0, 9.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0249059200286865, -1.9553862810134888, -1.8858667612075806, -1.8163471221923828, -1.746827483177185, -1.6773078441619873, -1.607788324356079, -1.5382686853408813, -1.4687490463256836, -1.3992294073104858, -1.3297098875045776, -1.2601902484893799, -1.1906706094741821, -1.1211509704589844, -1.0516314506530762, -0.9821118116378784, -0.9125922918319702, -0.8430727124214172, -0.7735530734062195, -0.7040334939956665, -0.6345138549804688, -0.5649942755699158, -0.4954746961593628, -0.4259550869464874, -0.35643547773361206, -0.2869158685207367, -0.21739627420902252, -0.14787667989730835, -0.07835707068443298, -0.008837461471557617, 0.06068211793899536, 0.13020172715187073, 0.1997213363647461, 0.26924094557762146, 0.3387605547904968, 0.4082801342010498, 0.47779974341392517, 0.5473193526268005, 0.6168389320373535, 0.6863585710525513, 0.7558781504631042, 0.8253977298736572, 0.894917368888855, 0.964436948299408, 1.033956527709961, 1.1034761667251587, 1.1729958057403564, 1.2425153255462646, 1.3120349645614624, 1.3815546035766602, 1.4510741233825684, 1.5205937623977661, 1.5901134014129639, 1.659632921218872, 1.7291525602340698, 1.7986721992492676, 1.8681917190551758, 1.9377113580703735, 2.0072309970855713, 2.0767505168914795, 2.1462700366973877, 2.215789794921875, 2.285309314727783, 2.3548288345336914, 2.4243485927581787]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 5.0, 14.0, 11.0, 14.0, 12.0, 20.0, 9.0, 16.0, 20.0, 37.0, 30.0, 37.0, 36.0, 47.0, 40.0, 48.0, 61.0, 49.0, 46.0, 61.0, 52.0, 31.0, 26.0, 35.0, 29.0, 27.0, 19.0, 27.0, 20.0, 21.0, 17.0, 13.0, 13.0, 11.0, 9.0, 5.0, 7.0, 4.0, 0.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8756514191627502, -0.8485806584358215, -0.8215098977088928, -0.7944391369819641, -0.7673683762550354, -0.7402976155281067, -0.713226854801178, -0.6861560940742493, -0.6590853333473206, -0.6320145726203918, -0.6049438118934631, -0.5778730511665344, -0.5508022904396057, -0.523731529712677, -0.4966607689857483, -0.4695900082588196, -0.4425192177295685, -0.41544845700263977, -0.38837769627571106, -0.36130693554878235, -0.33423617482185364, -0.30716538429260254, -0.28009462356567383, -0.2530238628387451, -0.2259531170129776, -0.1988823562860489, -0.17181159555912018, -0.14474081993103027, -0.11767006665468216, -0.09059929847717285, -0.06352853775024414, -0.03645777702331543, -0.009387016296386719, 0.01768374629318714, 0.044754508882761, 0.07182527333498001, 0.09889603406190872, 0.12596680223941803, 0.15303756296634674, 0.18010832369327545, 0.20717908442020416, 0.23424984514713287, 0.2613206207752228, 0.2883913815021515, 0.3154621422290802, 0.3425329029560089, 0.3696036636829376, 0.39667442440986633, 0.42374518513679504, 0.45081594586372375, 0.47788670659065247, 0.5049574971199036, 0.5320282578468323, 0.559099018573761, 0.5861697793006897, 0.6132405400276184, 0.6403113007545471, 0.6673820614814758, 0.6944528222084045, 0.7215235829353333, 0.748594343662262, 0.7756651043891907, 0.8027358651161194, 0.8298066258430481, 0.8568773865699768]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 3.0, 7.0, 21.0, 21.0, 29.0, 52.0, 99.0, 152.0, 234.0, 449.0, 847.0, 1643.0, 3308.0, 7114.0, 16194.0, 41572.0, 120318.0, 356059.0, 327142.0, 107232.0, 37908.0, 15159.0, 6607.0, 3108.0, 1497.0, 781.0, 429.0, 243.0, 116.0, 86.0, 52.0, 26.0, 12.0, 5.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.121337890625, -0.11728668212890625, -0.1132354736328125, -0.10918426513671875, -0.105133056640625, -0.10108184814453125, -0.0970306396484375, -0.09297943115234375, -0.08892822265625, -0.08487701416015625, -0.0808258056640625, -0.07677459716796875, -0.072723388671875, -0.06867218017578125, -0.0646209716796875, -0.06056976318359375, -0.0565185546875, -0.05246734619140625, -0.0484161376953125, -0.04436492919921875, -0.040313720703125, -0.03626251220703125, -0.0322113037109375, -0.02816009521484375, -0.02410888671875, -0.02005767822265625, -0.0160064697265625, -0.01195526123046875, -0.007904052734375, -0.00385284423828125, 0.0001983642578125, 0.00424957275390625, 0.00830078125, 0.01235198974609375, 0.0164031982421875, 0.02045440673828125, 0.024505615234375, 0.02855682373046875, 0.0326080322265625, 0.03665924072265625, 0.04071044921875, 0.04476165771484375, 0.0488128662109375, 0.05286407470703125, 0.056915283203125, 0.06096649169921875, 0.0650177001953125, 0.06906890869140625, 0.0731201171875, 0.07717132568359375, 0.0812225341796875, 0.08527374267578125, 0.089324951171875, 0.09337615966796875, 0.0974273681640625, 0.10147857666015625, 0.10552978515625, 0.10958099365234375, 0.1136322021484375, 0.11768341064453125, 0.121734619140625, 0.12578582763671875, 0.1298370361328125, 0.13388824462890625, 0.137939453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 4.0, 7.0, 6.0, 11.0, 18.0, 13.0, 13.0, 21.0, 20.0, 30.0, 45.0, 29.0, 52.0, 51.0, 56.0, 51.0, 70.0, 59.0, 55.0, 59.0, 62.0, 39.0, 38.0, 29.0, 31.0, 24.0, 22.0, 25.0, 9.0, 6.0, 13.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.09661865234375, -0.0941934585571289, -0.09176826477050781, -0.08934307098388672, -0.08691787719726562, -0.08449268341064453, -0.08206748962402344, -0.07964229583740234, -0.07721710205078125, -0.07479190826416016, -0.07236671447753906, -0.06994152069091797, -0.06751632690429688, -0.06509113311767578, -0.06266593933105469, -0.060240745544433594, -0.0578155517578125, -0.055390357971191406, -0.05296516418457031, -0.05053997039794922, -0.048114776611328125, -0.04568958282470703, -0.04326438903808594, -0.040839195251464844, -0.03841400146484375, -0.035988807678222656, -0.03356361389160156, -0.03113842010498047, -0.028713226318359375, -0.02628803253173828, -0.023862838745117188, -0.021437644958496094, -0.019012451171875, -0.016587257385253906, -0.014162063598632812, -0.011736869812011719, -0.009311676025390625, -0.006886482238769531, -0.0044612884521484375, -0.0020360946655273438, 0.00038909912109375, 0.0028142929077148438, 0.0052394866943359375, 0.007664680480957031, 0.010089874267578125, 0.012515068054199219, 0.014940261840820312, 0.017365455627441406, 0.0197906494140625, 0.022215843200683594, 0.024641036987304688, 0.02706623077392578, 0.029491424560546875, 0.03191661834716797, 0.03434181213378906, 0.036767005920410156, 0.03919219970703125, 0.041617393493652344, 0.04404258728027344, 0.04646778106689453, 0.048892974853515625, 0.05131816864013672, 0.05374336242675781, 0.056168556213378906, 0.05859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 14.0, 11.0, 11.0, 19.0, 28.0, 38.0, 54.0, 92.0, 148.0, 177.0, 322.0, 565.0, 1125.0, 2443.0, 9012.0, 89222.0, 873583.0, 59760.0, 7369.0, 2148.0, 1033.0, 525.0, 283.0, 207.0, 117.0, 81.0, 49.0, 32.0, 17.0, 22.0, 11.0, 17.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35107421875, -0.33990478515625, -0.3287353515625, -0.31756591796875, -0.306396484375, -0.29522705078125, -0.2840576171875, -0.27288818359375, -0.26171875, -0.25054931640625, -0.2393798828125, -0.22821044921875, -0.217041015625, -0.20587158203125, -0.1947021484375, -0.18353271484375, -0.17236328125, -0.16119384765625, -0.1500244140625, -0.13885498046875, -0.127685546875, -0.11651611328125, -0.1053466796875, -0.09417724609375, -0.0830078125, -0.07183837890625, -0.0606689453125, -0.04949951171875, -0.038330078125, -0.02716064453125, -0.0159912109375, -0.00482177734375, 0.00634765625, 0.01751708984375, 0.0286865234375, 0.03985595703125, 0.051025390625, 0.06219482421875, 0.0733642578125, 0.08453369140625, 0.095703125, 0.10687255859375, 0.1180419921875, 0.12921142578125, 0.140380859375, 0.15155029296875, 0.1627197265625, 0.17388916015625, 0.18505859375, 0.19622802734375, 0.2073974609375, 0.21856689453125, 0.229736328125, 0.24090576171875, 0.2520751953125, 0.26324462890625, 0.2744140625, 0.28558349609375, 0.2967529296875, 0.30792236328125, 0.319091796875, 0.33026123046875, 0.3414306640625, 0.35260009765625, 0.36376953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 14.0, 11.0, 16.0, 21.0, 18.0, 20.0, 29.0, 27.0, 31.0, 31.0, 51.0, 60.0, 53.0, 53.0, 67.0, 40.0, 57.0, 47.0, 49.0, 47.0, 36.0, 32.0, 32.0, 19.0, 22.0, 18.0, 16.0, 13.0, 7.0, 13.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.267333984375, -0.2586631774902344, -0.24999237060546875, -0.24132156372070312, -0.2326507568359375, -0.22397994995117188, -0.21530914306640625, -0.20663833618164062, -0.197967529296875, -0.18929672241210938, -0.18062591552734375, -0.17195510864257812, -0.1632843017578125, -0.15461349487304688, -0.14594268798828125, -0.13727188110351562, -0.12860107421875, -0.11993026733398438, -0.11125946044921875, -0.10258865356445312, -0.0939178466796875, -0.08524703979492188, -0.07657623291015625, -0.06790542602539062, -0.059234619140625, -0.050563812255859375, -0.04189300537109375, -0.033222198486328125, -0.0245513916015625, -0.015880584716796875, -0.00720977783203125, 0.001461029052734375, 0.0101318359375, 0.018802642822265625, 0.02747344970703125, 0.036144256591796875, 0.0448150634765625, 0.053485870361328125, 0.06215667724609375, 0.07082748413085938, 0.079498291015625, 0.08816909790039062, 0.09683990478515625, 0.10551071166992188, 0.1141815185546875, 0.12285232543945312, 0.13152313232421875, 0.14019393920898438, 0.14886474609375, 0.15753555297851562, 0.16620635986328125, 0.17487716674804688, 0.1835479736328125, 0.19221878051757812, 0.20088958740234375, 0.20956039428710938, 0.218231201171875, 0.22690200805664062, 0.23557281494140625, 0.24424362182617188, 0.2529144287109375, 0.2615852355957031, 0.27025604248046875, 0.2789268493652344, 0.28759765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 1.0, 4.0, 14.0, 11.0, 18.0, 19.0, 32.0, 39.0, 52.0, 96.0, 155.0, 268.0, 433.0, 783.0, 1659.0, 3868.0, 11318.0, 48552.0, 654281.0, 273033.0, 38052.0, 9271.0, 3345.0, 1437.0, 718.0, 374.0, 271.0, 157.0, 97.0, 66.0, 49.0, 27.0, 20.0, 11.0, 9.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.0729990005493164, -0.07007026672363281, -0.06714153289794922, -0.06421279907226562, -0.06128406524658203, -0.05835533142089844, -0.055426597595214844, -0.05249786376953125, -0.049569129943847656, -0.04664039611816406, -0.04371166229248047, -0.040782928466796875, -0.03785419464111328, -0.03492546081542969, -0.031996726989746094, -0.0290679931640625, -0.026139259338378906, -0.023210525512695312, -0.02028179168701172, -0.017353057861328125, -0.014424324035644531, -0.011495590209960938, -0.008566856384277344, -0.00563812255859375, -0.0027093887329101562, 0.0002193450927734375, 0.0031480789184570312, 0.006076812744140625, 0.009005546569824219, 0.011934280395507812, 0.014863014221191406, 0.017791748046875, 0.020720481872558594, 0.023649215698242188, 0.02657794952392578, 0.029506683349609375, 0.03243541717529297, 0.03536415100097656, 0.038292884826660156, 0.04122161865234375, 0.044150352478027344, 0.04707908630371094, 0.05000782012939453, 0.052936553955078125, 0.05586528778076172, 0.05879402160644531, 0.061722755432128906, 0.0646514892578125, 0.0675802230834961, 0.07050895690917969, 0.07343769073486328, 0.07636642456054688, 0.07929515838623047, 0.08222389221191406, 0.08515262603759766, 0.08808135986328125, 0.09101009368896484, 0.09393882751464844, 0.09686756134033203, 0.09979629516601562, 0.10272502899169922, 0.10565376281738281, 0.1085824966430664, 0.11151123046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 10.0, 7.0, 7.0, 10.0, 17.0, 25.0, 29.0, 43.0, 59.0, 80.0, 125.0, 152.0, 132.0, 67.0, 62.0, 42.0, 35.0, 23.0, 13.0, 8.0, 7.0, 6.0, 8.0, 7.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-05, -3.4543685615062714e-05, -3.332458436489105e-05, -3.210548311471939e-05, -3.088638186454773e-05, -2.9667280614376068e-05, -2.8448179364204407e-05, -2.7229078114032745e-05, -2.6009976863861084e-05, -2.4790875613689423e-05, -2.357177436351776e-05, -2.23526731133461e-05, -2.113357186317444e-05, -1.9914470613002777e-05, -1.8695369362831116e-05, -1.7476268112659454e-05, -1.6257166862487793e-05, -1.5038065612316132e-05, -1.381896436214447e-05, -1.2599863111972809e-05, -1.1380761861801147e-05, -1.0161660611629486e-05, -8.942559361457825e-06, -7.723458111286163e-06, -6.504356861114502e-06, -5.2852556109428406e-06, -4.066154360771179e-06, -2.847053110599518e-06, -1.6279518604278564e-06, -4.0885061025619507e-07, 8.102506399154663e-07, 2.0293518900871277e-06, 3.248453140258789e-06, 4.4675543904304504e-06, 5.686655640602112e-06, 6.905756890773773e-06, 8.124858140945435e-06, 9.343959391117096e-06, 1.0563060641288757e-05, 1.1782161891460419e-05, 1.300126314163208e-05, 1.4220364391803741e-05, 1.5439465641975403e-05, 1.6658566892147064e-05, 1.7877668142318726e-05, 1.9096769392490387e-05, 2.031587064266205e-05, 2.153497189283371e-05, 2.275407314300537e-05, 2.3973174393177032e-05, 2.5192275643348694e-05, 2.6411376893520355e-05, 2.7630478143692017e-05, 2.8849579393863678e-05, 3.006868064403534e-05, 3.1287781894207e-05, 3.250688314437866e-05, 3.3725984394550323e-05, 3.4945085644721985e-05, 3.6164186894893646e-05, 3.738328814506531e-05, 3.860238939523697e-05, 3.982149064540863e-05, 4.104059189558029e-05, 4.225969314575195e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 10.0, 18.0, 18.0, 37.0, 54.0, 79.0, 139.0, 258.0, 459.0, 917.0, 2313.0, 8147.0, 46542.0, 743498.0, 214740.0, 23034.0, 5023.0, 1651.0, 701.0, 360.0, 213.0, 108.0, 81.0, 39.0, 32.0, 18.0, 17.0, 11.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10821533203125, -0.10501575469970703, -0.10181617736816406, -0.0986166000366211, -0.09541702270507812, -0.09221744537353516, -0.08901786804199219, -0.08581829071044922, -0.08261871337890625, -0.07941913604736328, -0.07621955871582031, -0.07301998138427734, -0.06982040405273438, -0.0666208267211914, -0.06342124938964844, -0.06022167205810547, -0.0570220947265625, -0.05382251739501953, -0.05062294006347656, -0.047423362731933594, -0.044223785400390625, -0.041024208068847656, -0.03782463073730469, -0.03462505340576172, -0.03142547607421875, -0.02822589874267578, -0.025026321411132812, -0.021826744079589844, -0.018627166748046875, -0.015427589416503906, -0.012228012084960938, -0.009028434753417969, -0.005828857421875, -0.0026292800903320312, 0.0005702972412109375, 0.0037698745727539062, 0.006969451904296875, 0.010169029235839844, 0.013368606567382812, 0.01656818389892578, 0.01976776123046875, 0.02296733856201172, 0.026166915893554688, 0.029366493225097656, 0.032566070556640625, 0.035765647888183594, 0.03896522521972656, 0.04216480255126953, 0.0453643798828125, 0.04856395721435547, 0.05176353454589844, 0.054963111877441406, 0.058162689208984375, 0.061362266540527344, 0.06456184387207031, 0.06776142120361328, 0.07096099853515625, 0.07416057586669922, 0.07736015319824219, 0.08055973052978516, 0.08375930786132812, 0.0869588851928711, 0.09015846252441406, 0.09335803985595703, 0.0965576171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 6.0, 6.0, 4.0, 5.0, 14.0, 8.0, 12.0, 9.0, 22.0, 23.0, 27.0, 45.0, 40.0, 45.0, 73.0, 72.0, 89.0, 93.0, 82.0, 55.0, 49.0, 48.0, 32.0, 28.0, 19.0, 18.0, 20.0, 9.0, 13.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06158447265625, -0.05951690673828125, -0.0574493408203125, -0.05538177490234375, -0.053314208984375, -0.05124664306640625, -0.0491790771484375, -0.04711151123046875, -0.0450439453125, -0.04297637939453125, -0.0409088134765625, -0.03884124755859375, -0.036773681640625, -0.03470611572265625, -0.0326385498046875, -0.03057098388671875, -0.02850341796875, -0.02643585205078125, -0.0243682861328125, -0.02230072021484375, -0.020233154296875, -0.01816558837890625, -0.0160980224609375, -0.01403045654296875, -0.011962890625, -0.00989532470703125, -0.0078277587890625, -0.00576019287109375, -0.003692626953125, -0.00162506103515625, 0.0004425048828125, 0.00251007080078125, 0.00457763671875, 0.00664520263671875, 0.0087127685546875, 0.01078033447265625, 0.012847900390625, 0.01491546630859375, 0.0169830322265625, 0.01905059814453125, 0.0211181640625, 0.02318572998046875, 0.0252532958984375, 0.02732086181640625, 0.029388427734375, 0.03145599365234375, 0.0335235595703125, 0.03559112548828125, 0.03765869140625, 0.03972625732421875, 0.0417938232421875, 0.04386138916015625, 0.045928955078125, 0.04799652099609375, 0.0500640869140625, 0.05213165283203125, 0.05419921875, 0.05626678466796875, 0.0583343505859375, 0.06040191650390625, 0.062469482421875, 0.06453704833984375, 0.0666046142578125, 0.06867218017578125, 0.07073974609375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 7.0, 12.0, 17.0, 43.0, 95.0, 146.0, 410.0, 151.0, 67.0, 23.0, 13.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-4.686023712158203, -4.595047950744629, -4.504072189331055, -4.413095951080322, -4.322120189666748, -4.231144428253174, -4.1401686668396, -4.049192428588867, -3.958216667175293, -3.8672409057617188, -3.7762649059295654, -3.685289144515991, -3.594313144683838, -3.5033373832702637, -3.4123616218566895, -3.321385622024536, -3.230409860610962, -3.1394340991973877, -3.0484580993652344, -2.95748233795166, -2.866506338119507, -2.7755305767059326, -2.6845545768737793, -2.593578815460205, -2.502603054046631, -2.4116272926330566, -2.3206512928009033, -2.229675531387329, -2.138699531555176, -2.0477237701416016, -1.9567478895187378, -1.865772008895874, -1.7747962474822998, -1.683820366859436, -1.5928444862365723, -1.501868724822998, -1.4108927249908447, -1.3199169635772705, -1.2289410829544067, -1.137965202331543, -1.0469893217086792, -0.9560134410858154, -0.8650375604629517, -0.7740617394447327, -0.6830858588218689, -0.5921099781990051, -0.5011341571807861, -0.41015827655792236, -0.3191823959350586, -0.22820653021335602, -0.13723066449165344, -0.04625481367111206, 0.04472106695175171, 0.13569694757461548, 0.22667276859283447, 0.31764864921569824, 0.408624529838562, 0.4996004104614258, 0.5905762910842896, 0.6815521121025085, 0.7725279927253723, 0.8635038733482361, 0.9544796943664551, 1.0454555749893188, 1.1364314556121826]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 3.0, 10.0, 6.0, 9.0, 12.0, 17.0, 14.0, 27.0, 22.0, 29.0, 23.0, 30.0, 25.0, 45.0, 47.0, 101.0, 174.0, 91.0, 42.0, 33.0, 31.0, 30.0, 15.0, 12.0, 28.0, 26.0, 22.0, 16.0, 13.0, 13.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.202040195465088, -1.1623573303222656, -1.122674584388733, -1.0829917192459106, -1.043308973312378, -1.0036261081695557, -0.9639433026313782, -0.9242604970932007, -0.8845776915550232, -0.8448948860168457, -0.8052120804786682, -0.7655292749404907, -0.7258464097976685, -0.6861636638641357, -0.6464807987213135, -0.606797993183136, -0.5671151876449585, -0.527432382106781, -0.4877495765686035, -0.44806674122810364, -0.40838393568992615, -0.36870113015174866, -0.3290182948112488, -0.2893354892730713, -0.2496526837348938, -0.2099698781967163, -0.17028705775737762, -0.13060423731803894, -0.09092143177986145, -0.05123862624168396, -0.011555805802345276, 0.028127014636993408, 0.0678098201751709, 0.10749263316392899, 0.14717544615268707, 0.18685826659202576, 0.22654107213020325, 0.26622387766838074, 0.3059067130088806, 0.3455895185470581, 0.3852723240852356, 0.4249551296234131, 0.4646379351615906, 0.5043207406997681, 0.5440036058425903, 0.583686351776123, 0.6233692169189453, 0.6630520224571228, 0.7027348279953003, 0.7424176335334778, 0.7821004390716553, 0.8217832446098328, 0.8614660501480103, 0.9011489152908325, 0.94083172082901, 0.9805145263671875, 1.0201973915100098, 1.059880256652832, 1.0995630025863647, 1.139245867729187, 1.1789286136627197, 1.218611478805542, 1.2582942247390747, 1.297977089881897, 1.3376598358154297]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 11.0, 12.0, 31.0, 33.0, 54.0, 98.0, 144.0, 209.0, 339.0, 484.0, 805.0, 1480.0, 2639.0, 5485.0, 12016.0, 31862.0, 107076.0, 525212.0, 2073262.0, 1119509.0, 224085.0, 54459.0, 18740.0, 7787.0, 3726.0, 1914.0, 1093.0, 652.0, 353.0, 242.0, 162.0, 111.0, 55.0, 54.0, 34.0, 14.0, 12.0, 9.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.113525390625, -0.10994815826416016, -0.10637092590332031, -0.10279369354248047, -0.09921646118164062, -0.09563922882080078, -0.09206199645996094, -0.0884847640991211, -0.08490753173828125, -0.0813302993774414, -0.07775306701660156, -0.07417583465576172, -0.07059860229492188, -0.06702136993408203, -0.06344413757324219, -0.059866905212402344, -0.0562896728515625, -0.052712440490722656, -0.04913520812988281, -0.04555797576904297, -0.041980743408203125, -0.03840351104736328, -0.03482627868652344, -0.031249046325683594, -0.02767181396484375, -0.024094581604003906, -0.020517349243164062, -0.01694011688232422, -0.013362884521484375, -0.009785652160644531, -0.0062084197998046875, -0.0026311874389648438, 0.000946044921875, 0.004523277282714844, 0.008100509643554688, 0.011677742004394531, 0.015254974365234375, 0.01883220672607422, 0.022409439086914062, 0.025986671447753906, 0.02956390380859375, 0.033141136169433594, 0.03671836853027344, 0.04029560089111328, 0.043872833251953125, 0.04745006561279297, 0.05102729797363281, 0.054604530334472656, 0.0581817626953125, 0.061758995056152344, 0.06533622741699219, 0.06891345977783203, 0.07249069213867188, 0.07606792449951172, 0.07964515686035156, 0.0832223892211914, 0.08679962158203125, 0.0903768539428711, 0.09395408630371094, 0.09753131866455078, 0.10110855102539062, 0.10468578338623047, 0.10826301574707031, 0.11184024810791016, 0.11541748046875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 5.0, 9.0, 11.0, 6.0, 8.0, 7.0, 19.0, 16.0, 15.0, 28.0, 23.0, 24.0, 36.0, 28.0, 40.0, 41.0, 53.0, 45.0, 52.0, 46.0, 38.0, 58.0, 47.0, 40.0, 39.0, 48.0, 22.0, 33.0, 23.0, 28.0, 12.0, 23.0, 16.0, 11.0, 12.0, 5.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05657958984375, -0.05472278594970703, -0.05286598205566406, -0.051009178161621094, -0.049152374267578125, -0.047295570373535156, -0.04543876647949219, -0.04358196258544922, -0.04172515869140625, -0.03986835479736328, -0.03801155090332031, -0.036154747009277344, -0.034297943115234375, -0.032441139221191406, -0.030584335327148438, -0.02872753143310547, -0.0268707275390625, -0.02501392364501953, -0.023157119750976562, -0.021300315856933594, -0.019443511962890625, -0.017586708068847656, -0.015729904174804688, -0.013873100280761719, -0.01201629638671875, -0.010159492492675781, -0.008302688598632812, -0.006445884704589844, -0.004589080810546875, -0.0027322769165039062, -0.0008754730224609375, 0.0009813308715820312, 0.002838134765625, 0.004694938659667969, 0.0065517425537109375, 0.008408546447753906, 0.010265350341796875, 0.012122154235839844, 0.013978958129882812, 0.01583576202392578, 0.01769256591796875, 0.01954936981201172, 0.021406173706054688, 0.023262977600097656, 0.025119781494140625, 0.026976585388183594, 0.028833389282226562, 0.03069019317626953, 0.0325469970703125, 0.03440380096435547, 0.03626060485839844, 0.038117408752441406, 0.039974212646484375, 0.041831016540527344, 0.04368782043457031, 0.04554462432861328, 0.04740142822265625, 0.04925823211669922, 0.05111503601074219, 0.052971839904785156, 0.054828643798828125, 0.056685447692871094, 0.05854225158691406, 0.06039905548095703, 0.062255859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 16.0, 31.0, 88.0, 284.0, 1190.0, 49725.0, 4139730.0, 2562.0, 461.0, 135.0, 33.0, 15.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.691070556640625, -1.63507080078125, -1.579071044921875, -1.5230712890625, -1.467071533203125, -1.41107177734375, -1.355072021484375, -1.299072265625, -1.243072509765625, -1.18707275390625, -1.131072998046875, -1.0750732421875, -1.019073486328125, -0.96307373046875, -0.907073974609375, -0.85107421875, -0.795074462890625, -0.73907470703125, -0.683074951171875, -0.6270751953125, -0.571075439453125, -0.51507568359375, -0.459075927734375, -0.403076171875, -0.347076416015625, -0.29107666015625, -0.235076904296875, -0.1790771484375, -0.123077392578125, -0.06707763671875, -0.011077880859375, 0.044921875, 0.100921630859375, 0.15692138671875, 0.212921142578125, 0.2689208984375, 0.324920654296875, 0.38092041015625, 0.436920166015625, 0.492919921875, 0.548919677734375, 0.60491943359375, 0.660919189453125, 0.7169189453125, 0.772918701171875, 0.82891845703125, 0.884918212890625, 0.94091796875, 0.996917724609375, 1.05291748046875, 1.108917236328125, 1.1649169921875, 1.220916748046875, 1.27691650390625, 1.332916259765625, 1.388916015625, 1.444915771484375, 1.50091552734375, 1.556915283203125, 1.6129150390625, 1.668914794921875, 1.72491455078125, 1.780914306640625, 1.8369140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 11.0, 51.0, 130.0, 326.0, 928.0, 1603.0, 625.0, 224.0, 111.0, 32.0, 11.0, 9.0, 5.0, 4.0, 1.0, 4.0], "bins": [-1.1669921875, -1.1451148986816406, -1.1232376098632812, -1.1013603210449219, -1.0794830322265625, -1.0576057434082031, -1.0357284545898438, -1.0138511657714844, -0.991973876953125, -0.9700965881347656, -0.9482192993164062, -0.9263420104980469, -0.9044647216796875, -0.8825874328613281, -0.8607101440429688, -0.8388328552246094, -0.81695556640625, -0.7950782775878906, -0.7732009887695312, -0.7513236999511719, -0.7294464111328125, -0.7075691223144531, -0.6856918334960938, -0.6638145446777344, -0.641937255859375, -0.6200599670410156, -0.5981826782226562, -0.5763053894042969, -0.5544281005859375, -0.5325508117675781, -0.5106735229492188, -0.4887962341308594, -0.4669189453125, -0.4450416564941406, -0.42316436767578125, -0.4012870788574219, -0.3794097900390625, -0.3575325012207031, -0.33565521240234375, -0.3137779235839844, -0.291900634765625, -0.2700233459472656, -0.24814605712890625, -0.22626876831054688, -0.2043914794921875, -0.18251419067382812, -0.16063690185546875, -0.13875961303710938, -0.11688232421875, -0.09500503540039062, -0.07312774658203125, -0.051250457763671875, -0.0293731689453125, -0.007495880126953125, 0.01438140869140625, 0.036258697509765625, 0.058135986328125, 0.08001327514648438, 0.10189056396484375, 0.12376785278320312, 0.1456451416015625, 0.16752243041992188, 0.18939971923828125, 0.21127700805664062, 0.233154296875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 12.0, 19.0, 24.0, 67.0, 151.0, 243.0, 252.0, 122.0, 47.0, 23.0, 16.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.147879600524902, -7.987796306610107, -7.827713489532471, -7.667630195617676, -7.507547378540039, -7.347464084625244, -7.187381267547607, -7.0272979736328125, -6.867215156555176, -6.707131862640381, -6.547049045562744, -6.386965751647949, -6.2268829345703125, -6.066799640655518, -5.906716823577881, -5.746633529663086, -5.586550235748291, -5.426466941833496, -5.266384124755859, -5.1063008308410645, -4.946218013763428, -4.786134719848633, -4.626051902770996, -4.465968608856201, -4.305885314941406, -4.145802021026611, -3.9857192039489746, -3.825636148452759, -3.665553092956543, -3.505469799041748, -3.3453867435455322, -3.1853036880493164, -3.025221347808838, -2.865138292312622, -2.7050552368164062, -2.5449721813201904, -2.3848891258239746, -2.2248058319091797, -2.064722776412964, -1.904639720916748, -1.7445566654205322, -1.5844736099243164, -1.4243905544281006, -1.2643073797225952, -1.1042243242263794, -0.9441412687301636, -0.784058153629303, -0.6239750385284424, -0.46389198303222656, -0.30380889773368835, -0.14372581243515015, 0.01635727286338806, 0.17644035816192627, 0.3365234136581421, 0.4966065287590027, 0.6566896438598633, 0.8167726993560791, 0.9768557548522949, 1.1369388103485107, 1.2970219850540161, 1.457105040550232, 1.6171880960464478, 1.7772712707519531, 1.937354326248169, 2.0974373817443848]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 13.0, 10.0, 13.0, 15.0, 24.0, 42.0, 41.0, 59.0, 51.0, 73.0, 63.0, 83.0, 91.0, 71.0, 48.0, 40.0, 44.0, 29.0, 44.0, 26.0, 24.0, 26.0, 19.0, 13.0, 9.0, 10.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0049943923950195, -1.927647352218628, -1.8503003120422363, -1.7729532718658447, -1.6956062316894531, -1.6182591915130615, -1.54091215133667, -1.4635651111602783, -1.3862180709838867, -1.3088710308074951, -1.2315239906311035, -1.154176950454712, -1.0768299102783203, -0.9994828701019287, -0.9221358299255371, -0.8447887897491455, -0.7674417495727539, -0.6900947093963623, -0.6127476692199707, -0.5354006290435791, -0.4580535888671875, -0.3807065486907959, -0.3033595085144043, -0.2260124683380127, -0.1486654281616211, -0.07131838798522949, 0.006028652191162109, 0.08337569236755371, 0.1607227325439453, 0.23806977272033691, 0.3154168128967285, 0.3927638530731201, 0.4701106548309326, 0.5474576950073242, 0.6248047351837158, 0.7021517753601074, 0.779498815536499, 0.8568458557128906, 0.9341928958892822, 1.0115399360656738, 1.0888869762420654, 1.166234016418457, 1.2435810565948486, 1.3209280967712402, 1.3982751369476318, 1.4756221771240234, 1.552969217300415, 1.6303162574768066, 1.7076632976531982, 1.7850103378295898, 1.8623573780059814, 1.939704418182373, 2.0170514583587646, 2.0943984985351562, 2.171745538711548, 2.2490925788879395, 2.326439619064331, 2.4037866592407227, 2.4811336994171143, 2.558480739593506, 2.6358277797698975, 2.713174819946289, 2.7905218601226807, 2.8678689002990723, 2.945215940475464]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 11.0, 13.0, 17.0, 28.0, 53.0, 71.0, 87.0, 158.0, 317.0, 548.0, 1163.0, 2467.0, 6155.0, 19387.0, 77816.0, 552276.0, 312469.0, 52221.0, 14484.0, 4819.0, 1882.0, 932.0, 492.0, 266.0, 152.0, 88.0, 67.0, 26.0, 21.0, 20.0, 8.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.1461009979248047, -0.13998031616210938, -0.13385963439941406, -0.12773895263671875, -0.12161827087402344, -0.11549758911132812, -0.10937690734863281, -0.1032562255859375, -0.09713554382324219, -0.09101486206054688, -0.08489418029785156, -0.07877349853515625, -0.07265281677246094, -0.06653213500976562, -0.06041145324707031, -0.054290771484375, -0.04817008972167969, -0.042049407958984375, -0.03592872619628906, -0.02980804443359375, -0.023687362670898438, -0.017566680908203125, -0.011445999145507812, -0.0053253173828125, 0.0007953643798828125, 0.006916046142578125, 0.013036727905273438, 0.01915740966796875, 0.025278091430664062, 0.031398773193359375, 0.03751945495605469, 0.04364013671875, 0.04976081848144531, 0.055881500244140625, 0.06200218200683594, 0.06812286376953125, 0.07424354553222656, 0.08036422729492188, 0.08648490905761719, 0.0926055908203125, 0.09872627258300781, 0.10484695434570312, 0.11096763610839844, 0.11708831787109375, 0.12320899963378906, 0.12932968139648438, 0.1354503631591797, 0.141571044921875, 0.1476917266845703, 0.15381240844726562, 0.15993309020996094, 0.16605377197265625, 0.17217445373535156, 0.17829513549804688, 0.1844158172607422, 0.1905364990234375, 0.1966571807861328, 0.20277786254882812, 0.20889854431152344, 0.21501922607421875, 0.22113990783691406, 0.22726058959960938, 0.2333812713623047, 0.239501953125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 16.0, 20.0, 23.0, 25.0, 27.0, 43.0, 39.0, 75.0, 70.0, 81.0, 85.0, 80.0, 65.0, 57.0, 55.0, 45.0, 36.0, 37.0, 18.0, 33.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.135986328125, -0.13156890869140625, -0.1271514892578125, -0.12273406982421875, -0.118316650390625, -0.11389923095703125, -0.1094818115234375, -0.10506439208984375, -0.10064697265625, -0.09622955322265625, -0.0918121337890625, -0.08739471435546875, -0.082977294921875, -0.07855987548828125, -0.0741424560546875, -0.06972503662109375, -0.0653076171875, -0.06089019775390625, -0.0564727783203125, -0.05205535888671875, -0.047637939453125, -0.04322052001953125, -0.0388031005859375, -0.03438568115234375, -0.02996826171875, -0.02555084228515625, -0.0211334228515625, -0.01671600341796875, -0.012298583984375, -0.00788116455078125, -0.0034637451171875, 0.00095367431640625, 0.00537109375, 0.00978851318359375, 0.0142059326171875, 0.01862335205078125, 0.023040771484375, 0.02745819091796875, 0.0318756103515625, 0.03629302978515625, 0.04071044921875, 0.04512786865234375, 0.0495452880859375, 0.05396270751953125, 0.058380126953125, 0.06279754638671875, 0.0672149658203125, 0.07163238525390625, 0.0760498046875, 0.08046722412109375, 0.0848846435546875, 0.08930206298828125, 0.093719482421875, 0.09813690185546875, 0.1025543212890625, 0.10697174072265625, 0.11138916015625, 0.11580657958984375, 0.1202239990234375, 0.12464141845703125, 0.129058837890625, 0.13347625732421875, 0.1378936767578125, 0.14231109619140625, 0.146728515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 12.0, 14.0, 23.0, 22.0, 39.0, 68.0, 96.0, 181.0, 308.0, 739.0, 2111.0, 10513.0, 211690.0, 804713.0, 13761.0, 2511.0, 837.0, 352.0, 199.0, 130.0, 65.0, 55.0, 29.0, 23.0, 13.0, 12.0, 5.0, 9.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.4163475036621094, -0.40447235107421875, -0.3925971984863281, -0.3807220458984375, -0.3688468933105469, -0.35697174072265625, -0.3450965881347656, -0.333221435546875, -0.3213462829589844, -0.30947113037109375, -0.2975959777832031, -0.2857208251953125, -0.2738456726074219, -0.26197052001953125, -0.2500953674316406, -0.23822021484375, -0.22634506225585938, -0.21446990966796875, -0.20259475708007812, -0.1907196044921875, -0.17884445190429688, -0.16696929931640625, -0.15509414672851562, -0.143218994140625, -0.13134384155273438, -0.11946868896484375, -0.10759353637695312, -0.0957183837890625, -0.08384323120117188, -0.07196807861328125, -0.060092926025390625, -0.0482177734375, -0.036342620849609375, -0.02446746826171875, -0.012592315673828125, -0.0007171630859375, 0.011157989501953125, 0.02303314208984375, 0.034908294677734375, 0.046783447265625, 0.058658599853515625, 0.07053375244140625, 0.08240890502929688, 0.0942840576171875, 0.10615921020507812, 0.11803436279296875, 0.12990951538085938, 0.14178466796875, 0.15365982055664062, 0.16553497314453125, 0.17741012573242188, 0.1892852783203125, 0.20116043090820312, 0.21303558349609375, 0.22491073608398438, 0.236785888671875, 0.24866104125976562, 0.26053619384765625, 0.2724113464355469, 0.2842864990234375, 0.2961616516113281, 0.30803680419921875, 0.3199119567871094, 0.331787109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 14.0, 16.0, 14.0, 18.0, 29.0, 27.0, 34.0, 46.0, 51.0, 92.0, 93.0, 110.0, 84.0, 62.0, 60.0, 38.0, 34.0, 25.0, 16.0, 17.0, 18.0, 10.0, 17.0, 15.0, 11.0, 4.0, 4.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.6708984375, -0.6538772583007812, -0.6368560791015625, -0.6198348999023438, -0.602813720703125, -0.5857925415039062, -0.5687713623046875, -0.5517501831054688, -0.53472900390625, -0.5177078247070312, -0.5006866455078125, -0.48366546630859375, -0.466644287109375, -0.44962310791015625, -0.4326019287109375, -0.41558074951171875, -0.3985595703125, -0.38153839111328125, -0.3645172119140625, -0.34749603271484375, -0.330474853515625, -0.31345367431640625, -0.2964324951171875, -0.27941131591796875, -0.26239013671875, -0.24536895751953125, -0.2283477783203125, -0.21132659912109375, -0.194305419921875, -0.17728424072265625, -0.1602630615234375, -0.14324188232421875, -0.126220703125, -0.10919952392578125, -0.0921783447265625, -0.07515716552734375, -0.058135986328125, -0.04111480712890625, -0.0240936279296875, -0.00707244873046875, 0.00994873046875, 0.02696990966796875, 0.0439910888671875, 0.06101226806640625, 0.078033447265625, 0.09505462646484375, 0.1120758056640625, 0.12909698486328125, 0.1461181640625, 0.16313934326171875, 0.1801605224609375, 0.19718170166015625, 0.214202880859375, 0.23122406005859375, 0.2482452392578125, 0.26526641845703125, 0.28228759765625, 0.29930877685546875, 0.3163299560546875, 0.33335113525390625, 0.350372314453125, 0.36739349365234375, 0.3844146728515625, 0.40143585205078125, 0.41845703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 13.0, 15.0, 18.0, 26.0, 37.0, 38.0, 68.0, 116.0, 192.0, 432.0, 1030.0, 3499.0, 23008.0, 969434.0, 43141.0, 5020.0, 1341.0, 479.0, 224.0, 133.0, 86.0, 52.0, 31.0, 20.0, 13.0, 8.0, 16.0, 14.0, 7.0, 4.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12066650390625, -0.1165914535522461, -0.11251640319824219, -0.10844135284423828, -0.10436630249023438, -0.10029125213623047, -0.09621620178222656, -0.09214115142822266, -0.08806610107421875, -0.08399105072021484, -0.07991600036621094, -0.07584095001220703, -0.07176589965820312, -0.06769084930419922, -0.06361579895019531, -0.059540748596191406, -0.0554656982421875, -0.051390647888183594, -0.04731559753417969, -0.04324054718017578, -0.039165496826171875, -0.03509044647216797, -0.031015396118164062, -0.026940345764160156, -0.02286529541015625, -0.018790245056152344, -0.014715194702148438, -0.010640144348144531, -0.006565093994140625, -0.0024900436401367188, 0.0015850067138671875, 0.005660057067871094, 0.009735107421875, 0.013810157775878906, 0.017885208129882812, 0.02196025848388672, 0.026035308837890625, 0.03011035919189453, 0.03418540954589844, 0.038260459899902344, 0.04233551025390625, 0.046410560607910156, 0.05048561096191406, 0.05456066131591797, 0.058635711669921875, 0.06271076202392578, 0.06678581237792969, 0.0708608627319336, 0.0749359130859375, 0.0790109634399414, 0.08308601379394531, 0.08716106414794922, 0.09123611450195312, 0.09531116485595703, 0.09938621520996094, 0.10346126556396484, 0.10753631591796875, 0.11161136627197266, 0.11568641662597656, 0.11976146697998047, 0.12383651733398438, 0.12791156768798828, 0.1319866180419922, 0.1360616683959961, 0.14013671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 24.0, 13.0, 26.0, 38.0, 71.0, 148.0, 229.0, 197.0, 72.0, 43.0, 28.0, 24.0, 14.0, 15.0, 8.0, 8.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.361701965332031e-05, -3.220513463020325e-05, -3.079324960708618e-05, -2.9381364583969116e-05, -2.796947956085205e-05, -2.6557594537734985e-05, -2.514570951461792e-05, -2.3733824491500854e-05, -2.232193946838379e-05, -2.0910054445266724e-05, -1.9498169422149658e-05, -1.8086284399032593e-05, -1.6674399375915527e-05, -1.5262514352798462e-05, -1.3850629329681396e-05, -1.2438744306564331e-05, -1.1026859283447266e-05, -9.6149742603302e-06, -8.203089237213135e-06, -6.791204214096069e-06, -5.379319190979004e-06, -3.9674341678619385e-06, -2.555549144744873e-06, -1.1436641216278076e-06, 2.682209014892578e-07, 1.6801059246063232e-06, 3.0919909477233887e-06, 4.503875970840454e-06, 5.9157609939575195e-06, 7.327646017074585e-06, 8.73953104019165e-06, 1.0151416063308716e-05, 1.1563301086425781e-05, 1.2975186109542847e-05, 1.4387071132659912e-05, 1.5798956155776978e-05, 1.7210841178894043e-05, 1.862272620201111e-05, 2.0034611225128174e-05, 2.144649624824524e-05, 2.2858381271362305e-05, 2.427026629447937e-05, 2.5682151317596436e-05, 2.70940363407135e-05, 2.8505921363830566e-05, 2.9917806386947632e-05, 3.13296914100647e-05, 3.274157643318176e-05, 3.415346145629883e-05, 3.5565346479415894e-05, 3.697723150253296e-05, 3.8389116525650024e-05, 3.980100154876709e-05, 4.1212886571884155e-05, 4.262477159500122e-05, 4.4036656618118286e-05, 4.544854164123535e-05, 4.686042666435242e-05, 4.827231168746948e-05, 4.968419671058655e-05, 5.109608173370361e-05, 5.250796675682068e-05, 5.3919851779937744e-05, 5.533173680305481e-05, 5.6743621826171875e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 12.0, 17.0, 28.0, 41.0, 84.0, 141.0, 268.0, 530.0, 1367.0, 4335.0, 19889.0, 841505.0, 162218.0, 12871.0, 3149.0, 1107.0, 471.0, 232.0, 103.0, 51.0, 42.0, 21.0, 19.0, 12.0, 7.0, 6.0, 3.0, 2.0, 7.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.074462890625, -0.07169246673583984, -0.06892204284667969, -0.06615161895751953, -0.06338119506835938, -0.06061077117919922, -0.05784034729003906, -0.055069923400878906, -0.05229949951171875, -0.049529075622558594, -0.04675865173339844, -0.04398822784423828, -0.041217803955078125, -0.03844738006591797, -0.03567695617675781, -0.032906532287597656, -0.0301361083984375, -0.027365684509277344, -0.024595260620117188, -0.02182483673095703, -0.019054412841796875, -0.01628398895263672, -0.013513565063476562, -0.010743141174316406, -0.00797271728515625, -0.005202293395996094, -0.0024318695068359375, 0.00033855438232421875, 0.003108978271484375, 0.005879402160644531, 0.008649826049804688, 0.011420249938964844, 0.014190673828125, 0.016961097717285156, 0.019731521606445312, 0.02250194549560547, 0.025272369384765625, 0.02804279327392578, 0.030813217163085938, 0.033583641052246094, 0.03635406494140625, 0.039124488830566406, 0.04189491271972656, 0.04466533660888672, 0.047435760498046875, 0.05020618438720703, 0.05297660827636719, 0.055747032165527344, 0.0585174560546875, 0.061287879943847656, 0.06405830383300781, 0.06682872772216797, 0.06959915161132812, 0.07236957550048828, 0.07513999938964844, 0.0779104232788086, 0.08068084716796875, 0.0834512710571289, 0.08622169494628906, 0.08899211883544922, 0.09176254272460938, 0.09453296661376953, 0.09730339050292969, 0.10007381439208984, 0.10284423828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 10.0, 7.0, 21.0, 18.0, 32.0, 50.0, 120.0, 195.0, 202.0, 129.0, 62.0, 37.0, 26.0, 10.0, 10.0, 8.0, 13.0, 6.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07196044921875, -0.06920242309570312, -0.06644439697265625, -0.06368637084960938, -0.0609283447265625, -0.058170318603515625, -0.05541229248046875, -0.052654266357421875, -0.049896240234375, -0.047138214111328125, -0.04438018798828125, -0.041622161865234375, -0.0388641357421875, -0.036106109619140625, -0.03334808349609375, -0.030590057373046875, -0.02783203125, -0.025074005126953125, -0.02231597900390625, -0.019557952880859375, -0.0167999267578125, -0.014041900634765625, -0.01128387451171875, -0.008525848388671875, -0.005767822265625, -0.003009796142578125, -0.00025177001953125, 0.002506256103515625, 0.0052642822265625, 0.008022308349609375, 0.01078033447265625, 0.013538360595703125, 0.01629638671875, 0.019054412841796875, 0.02181243896484375, 0.024570465087890625, 0.0273284912109375, 0.030086517333984375, 0.03284454345703125, 0.035602569580078125, 0.038360595703125, 0.041118621826171875, 0.04387664794921875, 0.046634674072265625, 0.0493927001953125, 0.052150726318359375, 0.05490875244140625, 0.057666778564453125, 0.0604248046875, 0.06318283081054688, 0.06594085693359375, 0.06869888305664062, 0.0714569091796875, 0.07421493530273438, 0.07697296142578125, 0.07973098754882812, 0.082489013671875, 0.08524703979492188, 0.08800506591796875, 0.09076309204101562, 0.0935211181640625, 0.09627914428710938, 0.09903717041015625, 0.10179519653320312, 0.10455322265625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 15.0, 50.0, 586.0, 266.0, 57.0, 16.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.014270782470703, -6.842845916748047, -6.671421527862549, -6.499996662139893, -6.328571796417236, -6.157147407531738, -5.985722541809082, -5.814297676086426, -5.642873287200928, -5.4714484214782715, -5.300024032592773, -5.128599166870117, -4.957174301147461, -4.785749912261963, -4.614325046539307, -4.442900657653809, -4.271475791931152, -4.100050926208496, -3.928626298904419, -3.757201671600342, -3.5857770442962646, -3.4143524169921875, -3.2429275512695312, -3.071502923965454, -2.9000778198242188, -2.7286531925201416, -2.5572283267974854, -2.385803699493408, -2.214379072189331, -2.042954444885254, -1.8715295791625977, -1.7001049518585205, -1.5286803245544434, -1.3572555780410767, -1.1858309507369995, -1.0144062042236328, -0.8429815173149109, -0.671556830406189, -0.5001320838928223, -0.3287074565887451, -0.15728271007537842, 0.0141419917345047, 0.18556669354438782, 0.35699141025543213, 0.528416097164154, 0.699840784072876, 0.8712655305862427, 1.0426901578903198, 1.2141149044036865, 1.3855396509170532, 1.5569642782211304, 1.728389024734497, 1.8998136520385742, 2.0712385177612305, 2.2426631450653076, 2.4140877723693848, 2.585512638092041, 2.756937265396118, 2.9283621311187744, 3.0997867584228516, 3.2712113857269287, 3.442636013031006, 3.614060878753662, 3.7854855060577393, 3.9569101333618164]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 8.0, 10.0, 12.0, 19.0, 22.0, 23.0, 27.0, 29.0, 32.0, 18.0, 49.0, 299.0, 172.0, 27.0, 27.0, 25.0, 22.0, 24.0, 19.0, 12.0, 12.0, 8.0, 8.0, 13.0, 10.0, 8.0, 3.0, 10.0, 2.0, 1.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4504411220550537, -1.4062793254852295, -1.3621174097061157, -1.3179556131362915, -1.2737938165664673, -1.2296319007873535, -1.1854701042175293, -1.141308307647705, -1.0971463918685913, -1.052984595298767, -1.0088226795196533, -0.9646608829498291, -0.9204990267753601, -0.8763371706008911, -0.8321753740310669, -0.7880135178565979, -0.7438517212867737, -0.6996898651123047, -0.6555280685424805, -0.6113662123680115, -0.5672043561935425, -0.5230425596237183, -0.47888070344924927, -0.4347188472747803, -0.39055702090263367, -0.34639519453048706, -0.30223333835601807, -0.25807151198387146, -0.21390967071056366, -0.16974782943725586, -0.12558600306510925, -0.08142414689064026, -0.03726232051849365, 0.0068995170295238495, 0.05106135457754135, 0.09522318840026855, 0.13938502967357635, 0.18354687094688416, 0.22770869731903076, 0.27187055349349976, 0.31603237986564636, 0.36019420623779297, 0.40435606241226196, 0.44851788878440857, 0.4926797151565552, 0.5368415713310242, 0.5810034275054932, 0.6251652240753174, 0.6693270802497864, 0.7134889364242554, 0.7576507329940796, 0.8018125891685486, 0.8459744453430176, 0.8901362419128418, 0.9342980980873108, 0.9784599542617798, 1.022621750831604, 1.0667835474014282, 1.110945463180542, 1.1551072597503662, 1.1992690563201904, 1.2434309720993042, 1.2875927686691284, 1.3317546844482422, 1.3759164810180664]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 18.0, 31.0, 37.0, 46.0, 80.0, 170.0, 310.0, 90.0, 58.0, 50.0, 28.0, 27.0, 16.0, 12.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11920166015625, -0.11260128021240234, -0.10600090026855469, -0.09940052032470703, -0.09280014038085938, -0.08619976043701172, -0.07959938049316406, -0.0729990005493164, -0.06639862060546875, -0.059798240661621094, -0.05319786071777344, -0.04659748077392578, -0.039997100830078125, -0.03339672088623047, -0.026796340942382812, -0.020195960998535156, -0.0135955810546875, -0.006995201110839844, -0.0003948211669921875, 0.006205558776855469, 0.012805938720703125, 0.01940631866455078, 0.026006698608398438, 0.032607078552246094, 0.03920745849609375, 0.045807838439941406, 0.05240821838378906, 0.05900859832763672, 0.06560897827148438, 0.07220935821533203, 0.07880973815917969, 0.08541011810302734, 0.092010498046875, 0.09861087799072266, 0.10521125793457031, 0.11181163787841797, 0.11841201782226562, 0.12501239776611328, 0.13161277770996094, 0.1382131576538086, 0.14481353759765625, 0.1514139175415039, 0.15801429748535156, 0.16461467742919922, 0.17121505737304688, 0.17781543731689453, 0.1844158172607422, 0.19101619720458984, 0.1976165771484375, 0.20421695709228516, 0.2108173370361328, 0.21741771697998047, 0.22401809692382812, 0.23061847686767578, 0.23721885681152344, 0.2438192367553711, 0.25041961669921875, 0.2570199966430664, 0.26362037658691406, 0.2702207565307617, 0.2768211364746094, 0.28342151641845703, 0.2900218963623047, 0.29662227630615234, 0.30322265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 17.0, 14.0, 28.0, 32.0, 76.0, 80.0, 160.0, 451.0, 1436.0, 9012.0, 8354520.0, 19517.0, 2202.0, 540.0, 202.0, 118.0, 53.0, 32.0, 42.0, 10.0, 15.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 1.0], "bins": [-1.5979317426681519, -1.5543206930160522, -1.510709524154663, -1.4670984745025635, -1.4234874248504639, -1.3798762559890747, -1.336265206336975, -1.292654037475586, -1.2490429878234863, -1.2054319381713867, -1.1618207693099976, -1.118209719657898, -1.0745986700057983, -1.0309875011444092, -0.9873764514923096, -0.9437653422355652, -0.9001542925834656, -0.8565431833267212, -0.8129321336746216, -0.7693210244178772, -0.7257099151611328, -0.6820988655090332, -0.6384877562522888, -0.5948766469955444, -0.5512655973434448, -0.5076544880867004, -0.46404340863227844, -0.42043232917785645, -0.37682121992111206, -0.33321014046669006, -0.28959906101226807, -0.24598795175552368, -0.2023768424987793, -0.1587657481431961, -0.11515466123819351, -0.07154357433319092, -0.027932479977607727, 0.015678614377975464, 0.05928969383239746, 0.10290080308914185, 0.14651188254356384, 0.19012297689914703, 0.23373407125473022, 0.2773451507091522, 0.3209562301635742, 0.3645673394203186, 0.4081784188747406, 0.451789528131485, 0.495400607585907, 0.5390117168426514, 0.582622766494751, 0.6262338757514954, 0.6698449850082397, 0.7134560346603394, 0.7570671439170837, 0.8006782531738281, 0.8442893028259277, 0.8879004120826721, 0.9315114617347717, 0.9751225709915161, 1.0187336206436157, 1.0623447895050049, 1.1059558391571045, 1.149566888809204, 1.1931780576705933]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 6.0, 5.0, 7.0, 5.0, 9.0, 8.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7173702120780945, -0.6894587278366089, -0.6615473031997681, -0.6336358785629272, -0.6057243943214417, -0.577812910079956, -0.5499014854431152, -0.5219900608062744, -0.4940785765647888, -0.4661671221256256, -0.4382556676864624, -0.4103442132472992, -0.382432758808136, -0.3545213043689728, -0.32660984992980957, -0.29869839549064636, -0.27078694105148315, -0.24287548661231995, -0.21496403217315674, -0.18705257773399353, -0.15914112329483032, -0.13122966885566711, -0.1033182144165039, -0.0754067599773407, -0.04749530553817749, -0.019583851099014282, 0.008327603340148926, 0.036239057779312134, 0.06415051221847534, 0.09206196665763855, 0.11997342109680176, 0.14788487553596497, 0.1757962703704834, 0.2037077248096466, 0.23161917924880981, 0.259530633687973, 0.28744208812713623, 0.31535354256629944, 0.34326499700546265, 0.37117645144462585, 0.39908790588378906, 0.42699936032295227, 0.4549108147621155, 0.4828222692012787, 0.5107337236404419, 0.5386451482772827, 0.5665566325187683, 0.5944681167602539, 0.6223795413970947, 0.6502909660339355, 0.6782024502754211, 0.7061139345169067, 0.7340253591537476, 0.7619367837905884, 0.789848268032074, 0.8177597522735596, 0.8456711769104004, 0.8735826015472412, 0.9014940857887268, 0.9294055700302124, 0.9573169946670532, 0.985228419303894, 1.0131399631500244, 1.0410513877868652, 1.068962812423706]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 14.0, 12.0, 25.0, 21.0, 42.0, 62.0, 74.0, 113.0, 194.0, 292.0, 503.0, 889.0, 1588.0, 3054.0, 6959.0, 16240.0, 45420.0, 141066.0, 196029.0, 70409.0, 23506.0, 9117.0, 3973.0, 2007.0, 1083.0, 555.0, 330.0, 230.0, 141.0, 86.0, 54.0, 34.0, 26.0, 25.0, 14.0, 14.0, 13.0, 5.0, 5.0, 10.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.92919921875, -0.9035263061523438, -0.8778533935546875, -0.8521804809570312, -0.826507568359375, -0.8008346557617188, -0.7751617431640625, -0.7494888305664062, -0.72381591796875, -0.6981430053710938, -0.6724700927734375, -0.6467971801757812, -0.621124267578125, -0.5954513549804688, -0.5697784423828125, -0.5441055297851562, -0.5184326171875, -0.49275970458984375, -0.4670867919921875, -0.44141387939453125, -0.415740966796875, -0.39006805419921875, -0.3643951416015625, -0.33872222900390625, -0.31304931640625, -0.28737640380859375, -0.2617034912109375, -0.23603057861328125, -0.210357666015625, -0.18468475341796875, -0.1590118408203125, -0.13333892822265625, -0.107666015625, -0.08199310302734375, -0.0563201904296875, -0.03064727783203125, -0.004974365234375, 0.02069854736328125, 0.0463714599609375, 0.07204437255859375, 0.09771728515625, 0.12339019775390625, 0.1490631103515625, 0.17473602294921875, 0.200408935546875, 0.22608184814453125, 0.2517547607421875, 0.27742767333984375, 0.3031005859375, 0.32877349853515625, 0.3544464111328125, 0.38011932373046875, 0.405792236328125, 0.43146514892578125, 0.4571380615234375, 0.48281097412109375, 0.50848388671875, 0.5341567993164062, 0.5598297119140625, 0.5855026245117188, 0.611175537109375, 0.6368484497070312, 0.6625213623046875, 0.6881942749023438, 0.7138671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 10.0, 22.0, 22.0, 23.0, 30.0, 38.0, 61.0, 67.0, 89.0, 81.0, 97.0, 79.0, 83.0, 72.0, 40.0, 36.0, 25.0, 28.0, 21.0, 18.0, 9.0, 7.0, 2.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.13499069213867188, -0.13008880615234375, -0.12518692016601562, -0.1202850341796875, -0.11538314819335938, -0.11048126220703125, -0.10557937622070312, -0.100677490234375, -0.09577560424804688, -0.09087371826171875, -0.08597183227539062, -0.0810699462890625, -0.07616806030273438, -0.07126617431640625, -0.06636428833007812, -0.06146240234375, -0.056560516357421875, -0.05165863037109375, -0.046756744384765625, -0.0418548583984375, -0.036952972412109375, -0.03205108642578125, -0.027149200439453125, -0.022247314453125, -0.017345428466796875, -0.01244354248046875, -0.007541656494140625, -0.0026397705078125, 0.002262115478515625, 0.00716400146484375, 0.012065887451171875, 0.0169677734375, 0.021869659423828125, 0.02677154541015625, 0.031673431396484375, 0.0365753173828125, 0.041477203369140625, 0.04637908935546875, 0.051280975341796875, 0.056182861328125, 0.061084747314453125, 0.06598663330078125, 0.07088851928710938, 0.0757904052734375, 0.08069229125976562, 0.08559417724609375, 0.09049606323242188, 0.09539794921875, 0.10029983520507812, 0.10520172119140625, 0.11010360717773438, 0.1150054931640625, 0.11990737915039062, 0.12480926513671875, 0.12971115112304688, 0.134613037109375, 0.13951492309570312, 0.14441680908203125, 0.14931869506835938, 0.1542205810546875, 0.15912246704101562, 0.16402435302734375, 0.16892623901367188, 0.173828125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 6.0, 11.0, 21.0, 44.0, 86.0, 95.0, 84.0, 37.0, 28.0, 9.0, 16.0, 11.0, 13.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.835953950881958, -0.8033477663993835, -0.7707415819168091, -0.7381354570388794, -0.7055292725563049, -0.6729230880737305, -0.640316903591156, -0.6077107191085815, -0.5751045942306519, -0.5424984097480774, -0.5098922252655029, -0.47728607058525085, -0.4446799159049988, -0.4120737314224243, -0.37946754693984985, -0.3468613624572754, -0.3142551779747009, -0.28164899349212646, -0.2490428388118744, -0.21643665432929993, -0.18383048474788666, -0.1512243151664734, -0.11861813068389893, -0.08601196110248566, -0.05340579152107239, -0.02079961821436882, 0.011806555092334747, 0.04441273212432861, 0.07701890170574188, 0.10962507128715515, 0.14223125576972961, 0.17483742535114288, 0.20744359493255615, 0.24004976451396942, 0.2726559340953827, 0.30526211857795715, 0.33786827325820923, 0.3704744577407837, 0.40308064222335815, 0.4356868267059326, 0.4682929813861847, 0.5008991360664368, 0.5335053205490112, 0.5661115050315857, 0.5987176895141602, 0.6313238143920898, 0.6639300584793091, 0.6965361833572388, 0.7291423678398132, 0.7617485523223877, 0.7943547368049622, 0.8269609212875366, 0.8595670461654663, 0.8921732306480408, 0.9247794151306152, 0.9573855996131897, 0.9899917840957642, 1.0225979089736938, 1.055204153060913, 1.0878102779388428, 1.120416522026062, 1.1530226469039917, 1.185628890991211, 1.2182350158691406, 1.2508411407470703]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 6.0, 12.0, 20.0, 22.0, 72.0, 94.0, 90.0, 58.0, 35.0, 11.0, 12.0, 11.0, 3.0, 7.0, 5.0, 2.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.0994641780853271, -1.0718600749969482, -1.0442558526992798, -1.0166516304016113, -0.9890475273132324, -0.9614433646202087, -0.9338392019271851, -0.9062350392341614, -0.8786308765411377, -0.851026713848114, -0.8234225511550903, -0.7958183884620667, -0.768214225769043, -0.7406100630760193, -0.7130059003829956, -0.6854017376899719, -0.6577975749969482, -0.6301934123039246, -0.6025892496109009, -0.5749850869178772, -0.5473809242248535, -0.5197767615318298, -0.49217259883880615, -0.46456843614578247, -0.4369642734527588, -0.4093601107597351, -0.3817559480667114, -0.35415178537368774, -0.32654762268066406, -0.2989434599876404, -0.2713392972946167, -0.24373513460159302, -0.2161310315132141, -0.18852686882019043, -0.16092270612716675, -0.13331854343414307, -0.10571438074111938, -0.0781102180480957, -0.05050605535507202, -0.02290189266204834, 0.004702270030975342, 0.03230643272399902, 0.059910595417022705, 0.08751475811004639, 0.11511892080307007, 0.14272308349609375, 0.17032724618911743, 0.1979314088821411, 0.2255355715751648, 0.2531397342681885, 0.28074389696121216, 0.30834805965423584, 0.3359522223472595, 0.3635563850402832, 0.3911605477333069, 0.41876471042633057, 0.44636887311935425, 0.47397303581237793, 0.5015771985054016, 0.5291813611984253, 0.556785523891449, 0.5843896865844727, 0.6119938492774963, 0.63959801197052, 0.6672021746635437]}, "eval/loss": 4.234867572784424, "eval/wer": 1.9679492264974217, "eval/runtime": 791.3294, "eval/samples_per_second": 3.339, "eval/steps_per_second": 0.279} \ No newline at end of file