diff --git "a/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" --- "a/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" +++ "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.7853, "train/learning_rate": 5.805515239477504e-07, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6633, "_timestamp": 1646186014, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 21.0, 31.0, 147.0, 519.0, 207.0, 32.0, 21.0, 12.0, 6.0, 4.0, 4.0], "bins": [-485.33099365234375, -476.75994873046875, -468.1888732910156, -459.6178283691406, -451.0467834472656, -442.4757385253906, -433.9046630859375, -425.3336181640625, -416.7625732421875, -408.1915283203125, -399.6204528808594, -391.0494079589844, -382.4783630371094, -373.9073181152344, -365.33624267578125, -356.76519775390625, -348.19415283203125, -339.62310791015625, -331.0520324707031, -322.4809875488281, -313.9099426269531, -305.3388977050781, -296.767822265625, -288.19677734375, -279.6257019042969, -271.0546569824219, -262.48358154296875, -253.91253662109375, -245.34149169921875, -236.7704315185547, -228.19937133789062, -219.62832641601562, -211.0572967529297, -202.48623657226562, -193.91519165039062, -185.34413146972656, -176.77308654785156, -168.2020263671875, -159.6309814453125, -151.05992126464844, -142.48887634277344, -133.91781616210938, -125.34677124023438, -116.77571105957031, -108.20466613769531, -99.63360595703125, -91.06255340576172, -82.49150085449219, -73.92044067382812, -65.3493881225586, -56.77833557128906, -48.207279205322266, -39.636226654052734, -31.065174102783203, -22.494117736816406, -13.923065185546875, -5.352016448974609, 3.2190370559692383, 11.790090560913086, 20.36114501953125, 28.93219757080078, 37.50325012207031, 46.07430648803711, 54.64535903930664, 63.21641159057617]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 5.0, 0.0, 6.0, 4.0, 3.0, 4.0, 8.0, 10.0, 8.0, 15.0, 15.0, 23.0, 15.0, 22.0, 28.0, 21.0, 33.0, 43.0, 50.0, 59.0, 73.0, 74.0, 62.0, 69.0, 55.0, 48.0, 32.0, 32.0, 32.0, 22.0, 16.0, 22.0, 18.0, 14.0, 16.0, 7.0, 13.0, 6.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.59696960449219, -117.4406509399414, -113.28433227539062, -109.12801361083984, -104.97169494628906, -100.81536865234375, -96.65904998779297, -92.50273132324219, -88.3464126586914, -84.19009399414062, -80.03377532958984, -75.87745666503906, -71.72113037109375, -67.5648193359375, -63.40849304199219, -59.252174377441406, -55.095855712890625, -50.939537048339844, -46.78321838378906, -42.626895904541016, -38.470577239990234, -34.31425857543945, -30.15793800354004, -26.001617431640625, -21.845298767089844, -17.688980102539062, -13.532659530639648, -9.37633991241455, -5.220020294189453, -1.0637016296386719, 3.092618942260742, 7.248939514160156, 11.405258178710938, 15.561577796936035, 19.717897415161133, 23.874217987060547, 28.030536651611328, 32.18685531616211, 36.343177795410156, 40.49949645996094, 44.65581512451172, 48.8121337890625, 52.96845245361328, 57.12477493286133, 61.28109359741211, 65.43740844726562, 69.59373474121094, 73.75005340576172, 77.9063720703125, 82.06269073486328, 86.21900939941406, 90.37532806396484, 94.53164672851562, 98.68797302246094, 102.84429168701172, 107.0006103515625, 111.15692901611328, 115.31324768066406, 119.46956634521484, 123.62588500976562, 127.78221130371094, 131.9385223388672, 136.0948486328125, 140.25115966796875, 144.40748596191406]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 7.0, 11.0, 13.0, 8.0, 11.0, 23.0, 19.0, 16.0, 17.0, 40.0, 45.0, 60.0, 86.0, 108.0, 101.0, 73.0, 57.0, 41.0, 43.0, 29.0, 21.0, 22.0, 17.0, 14.0, 19.0, 10.0, 10.0, 14.0, 9.0, 6.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.10400390625, -8.7939453125, -8.48388671875, -8.173828125, -7.86376953125, -7.5537109375, -7.24365234375, -6.93359375, -6.62353515625, -6.3134765625, -6.00341796875, -5.693359375, -5.38330078125, -5.0732421875, -4.76318359375, -4.453125, -4.14306640625, -3.8330078125, -3.52294921875, -3.212890625, -2.90283203125, -2.5927734375, -2.28271484375, -1.97265625, -1.66259765625, -1.3525390625, -1.04248046875, -0.732421875, -0.42236328125, -0.1123046875, 0.19775390625, 0.5078125, 0.81787109375, 1.1279296875, 1.43798828125, 1.748046875, 2.05810546875, 2.3681640625, 2.67822265625, 2.98828125, 3.29833984375, 3.6083984375, 3.91845703125, 4.228515625, 4.53857421875, 4.8486328125, 5.15869140625, 5.46875, 5.77880859375, 6.0888671875, 6.39892578125, 6.708984375, 7.01904296875, 7.3291015625, 7.63916015625, 7.94921875, 8.25927734375, 8.5693359375, 8.87939453125, 9.189453125, 9.49951171875, 9.8095703125, 10.11962890625, 10.4296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 9.0, 11.0, 15.0, 29.0, 44.0, 54.0, 80.0, 105.0, 128.0, 156.0, 270.0, 398.0, 602.0, 878.0, 1353.0, 2231.0, 3736.0, 6684.0, 13309.0, 37672.0, 481680.0, 3393357.0, 195460.0, 27874.0, 11931.0, 6384.0, 3601.0, 2235.0, 1322.0, 900.0, 554.0, 390.0, 257.0, 175.0, 112.0, 85.0, 44.0, 43.0, 22.0, 26.0, 14.0, 14.0, 10.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.3125, -28.34716796875, -27.3818359375, -26.41650390625, -25.451171875, -24.48583984375, -23.5205078125, -22.55517578125, -21.58984375, -20.62451171875, -19.6591796875, -18.69384765625, -17.728515625, -16.76318359375, -15.7978515625, -14.83251953125, -13.8671875, -12.90185546875, -11.9365234375, -10.97119140625, -10.005859375, -9.04052734375, -8.0751953125, -7.10986328125, -6.14453125, -5.17919921875, -4.2138671875, -3.24853515625, -2.283203125, -1.31787109375, -0.3525390625, 0.61279296875, 1.578125, 2.54345703125, 3.5087890625, 4.47412109375, 5.439453125, 6.40478515625, 7.3701171875, 8.33544921875, 9.30078125, 10.26611328125, 11.2314453125, 12.19677734375, 13.162109375, 14.12744140625, 15.0927734375, 16.05810546875, 17.0234375, 17.98876953125, 18.9541015625, 19.91943359375, 20.884765625, 21.85009765625, 22.8154296875, 23.78076171875, 24.74609375, 25.71142578125, 26.6767578125, 27.64208984375, 28.607421875, 29.57275390625, 30.5380859375, 31.50341796875, 32.46875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 6.0, 20.0, 12.0, 18.0, 25.0, 31.0, 49.0, 52.0, 46.0, 88.0, 109.0, 236.0, 401.0, 660.0, 783.0, 593.0, 324.0, 186.0, 89.0, 63.0, 40.0, 42.0, 26.0, 26.0, 15.0, 23.0, 15.0, 18.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.46875, -27.5576171875, -26.646484375, -25.7353515625, -24.82421875, -23.9130859375, -23.001953125, -22.0908203125, -21.1796875, -20.2685546875, -19.357421875, -18.4462890625, -17.53515625, -16.6240234375, -15.712890625, -14.8017578125, -13.890625, -12.9794921875, -12.068359375, -11.1572265625, -10.24609375, -9.3349609375, -8.423828125, -7.5126953125, -6.6015625, -5.6904296875, -4.779296875, -3.8681640625, -2.95703125, -2.0458984375, -1.134765625, -0.2236328125, 0.6875, 1.5986328125, 2.509765625, 3.4208984375, 4.33203125, 5.2431640625, 6.154296875, 7.0654296875, 7.9765625, 8.8876953125, 9.798828125, 10.7099609375, 11.62109375, 12.5322265625, 13.443359375, 14.3544921875, 15.265625, 16.1767578125, 17.087890625, 17.9990234375, 18.91015625, 19.8212890625, 20.732421875, 21.6435546875, 22.5546875, 23.4658203125, 24.376953125, 25.2880859375, 26.19921875, 27.1103515625, 28.021484375, 28.9326171875, 29.84375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 11.0, 17.0, 8.0, 20.0, 26.0, 20.0, 25.0, 53.0, 40.0, 71.0, 119.0, 124.0, 227.0, 391.0, 848.0, 2284.0, 6817.0, 26358.0, 165688.0, 3781773.0, 171036.0, 27069.0, 6961.0, 2279.0, 863.0, 371.0, 221.0, 138.0, 76.0, 59.0, 55.0, 51.0, 41.0, 28.0, 17.0, 22.0, 8.0, 6.0, 6.0, 6.0, 9.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-81.625, -79.0341796875, -76.443359375, -73.8525390625, -71.26171875, -68.6708984375, -66.080078125, -63.4892578125, -60.8984375, -58.3076171875, -55.716796875, -53.1259765625, -50.53515625, -47.9443359375, -45.353515625, -42.7626953125, -40.171875, -37.5810546875, -34.990234375, -32.3994140625, -29.80859375, -27.2177734375, -24.626953125, -22.0361328125, -19.4453125, -16.8544921875, -14.263671875, -11.6728515625, -9.08203125, -6.4912109375, -3.900390625, -1.3095703125, 1.28125, 3.8720703125, 6.462890625, 9.0537109375, 11.64453125, 14.2353515625, 16.826171875, 19.4169921875, 22.0078125, 24.5986328125, 27.189453125, 29.7802734375, 32.37109375, 34.9619140625, 37.552734375, 40.1435546875, 42.734375, 45.3251953125, 47.916015625, 50.5068359375, 53.09765625, 55.6884765625, 58.279296875, 60.8701171875, 63.4609375, 66.0517578125, 68.642578125, 71.2333984375, 73.82421875, 76.4150390625, 79.005859375, 81.5966796875, 84.1875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 9.0, 26.0, 22.0, 56.0, 85.0, 184.0, 248.0, 152.0, 102.0, 46.0, 31.0, 23.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.32012939453125, -82.11811065673828, -77.91609191894531, -73.71407318115234, -69.51205444335938, -65.31004333496094, -61.10802459716797, -56.906005859375, -52.70398712158203, -48.50196838378906, -44.299949645996094, -40.09793472290039, -35.89591598510742, -31.693897247314453, -27.491880416870117, -23.28986358642578, -19.087844848632812, -14.88582706451416, -10.683809280395508, -6.4817914962768555, -2.279773712158203, 1.9222450256347656, 6.124261856079102, 10.326278686523438, 14.528297424316406, 18.730316162109375, 22.93233299255371, 27.134349822998047, 31.336368560791016, 35.538387298583984, 39.74040222167969, 43.942420959472656, 48.144439697265625, 52.346458435058594, 56.54847717285156, 60.750492095947266, 64.9525146484375, 69.15452575683594, 73.3565444946289, 77.55856323242188, 81.76058197021484, 85.96260070800781, 90.16461944580078, 94.36663818359375, 98.56864929199219, 102.77067565917969, 106.97268676757812, 111.1747055053711, 115.37672424316406, 119.57874298095703, 123.78076171875, 127.98278045654297, 132.18479919433594, 136.38681030273438, 140.58883666992188, 144.7908477783203, 148.99285888671875, 153.1948699951172, 157.3968963623047, 161.59890747070312, 165.80093383789062, 170.00294494628906, 174.20497131347656, 178.406982421875, 182.6090087890625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 14.0, 6.0, 13.0, 22.0, 14.0, 21.0, 31.0, 25.0, 24.0, 29.0, 31.0, 31.0, 52.0, 38.0, 40.0, 49.0, 51.0, 47.0, 34.0, 36.0, 34.0, 39.0, 44.0, 37.0, 29.0, 24.0, 26.0, 23.0, 20.0, 18.0, 17.0, 13.0, 17.0, 5.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-98.53227233886719, -95.51553344726562, -92.49879455566406, -89.4820556640625, -86.46531677246094, -83.4485855102539, -80.43184661865234, -77.41510772705078, -74.39836883544922, -71.38162994384766, -68.3648910522461, -65.34815216064453, -62.331417083740234, -59.31467819213867, -56.297943115234375, -53.28120422363281, -50.26446533203125, -47.24772644042969, -44.230987548828125, -41.21425247192383, -38.197513580322266, -35.1807746887207, -32.164039611816406, -29.147300720214844, -26.13056182861328, -23.11382293701172, -20.09708595275879, -17.08034896850586, -14.063610076904297, -11.04687213897705, -8.030134201049805, -5.013397216796875, -1.9966583251953125, 1.0200796127319336, 4.03681755065918, 7.053555488586426, 10.070293426513672, 13.087031364440918, 16.103769302368164, 19.120506286621094, 22.137245178222656, 25.15398406982422, 28.17072105407715, 31.187458038330078, 34.20419692993164, 37.2209358215332, 40.2376708984375, 43.25440979003906, 46.271148681640625, 49.28788757324219, 52.30462646484375, 55.32136154174805, 58.33810043334961, 61.35483932495117, 64.37157440185547, 67.38831329345703, 70.4050521850586, 73.42179107666016, 76.43852996826172, 79.45526885986328, 82.47200012207031, 85.48873901367188, 88.50547790527344, 91.522216796875, 94.53895568847656]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 13.0, 31.0, 28.0, 34.0, 30.0, 57.0, 62.0, 60.0, 75.0, 74.0, 66.0, 60.0, 61.0, 55.0, 27.0, 33.0, 35.0, 20.0, 20.0, 19.0, 13.0, 20.0, 9.0, 8.0, 4.0, 4.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.287841796875, -9.94287109375, -9.597900390625, -9.2529296875, -8.907958984375, -8.56298828125, -8.218017578125, -7.873046875, -7.528076171875, -7.18310546875, -6.838134765625, -6.4931640625, -6.148193359375, -5.80322265625, -5.458251953125, -5.11328125, -4.768310546875, -4.42333984375, -4.078369140625, -3.7333984375, -3.388427734375, -3.04345703125, -2.698486328125, -2.353515625, -2.008544921875, -1.66357421875, -1.318603515625, -0.9736328125, -0.628662109375, -0.28369140625, 0.061279296875, 0.40625, 0.751220703125, 1.09619140625, 1.441162109375, 1.7861328125, 2.131103515625, 2.47607421875, 2.821044921875, 3.166015625, 3.510986328125, 3.85595703125, 4.200927734375, 4.5458984375, 4.890869140625, 5.23583984375, 5.580810546875, 5.92578125, 6.270751953125, 6.61572265625, 6.960693359375, 7.3056640625, 7.650634765625, 7.99560546875, 8.340576171875, 8.685546875, 9.030517578125, 9.37548828125, 9.720458984375, 10.0654296875, 10.410400390625, 10.75537109375, 11.100341796875, 11.4453125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 14.0, 17.0, 42.0, 39.0, 57.0, 94.0, 121.0, 171.0, 277.0, 344.0, 493.0, 667.0, 920.0, 1331.0, 1903.0, 2991.0, 4489.0, 6866.0, 10835.0, 18452.0, 32866.0, 64598.0, 148587.0, 325822.0, 225996.0, 93543.0, 44193.0, 23773.0, 13738.0, 8494.0, 5386.0, 3556.0, 2406.0, 1620.0, 1072.0, 831.0, 534.0, 422.0, 279.0, 183.0, 164.0, 107.0, 76.0, 53.0, 46.0, 20.0, 16.0, 12.0, 13.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.0390625, -1.006317138671875, -0.97357177734375, -0.940826416015625, -0.9080810546875, -0.875335693359375, -0.84259033203125, -0.809844970703125, -0.777099609375, -0.744354248046875, -0.71160888671875, -0.678863525390625, -0.6461181640625, -0.613372802734375, -0.58062744140625, -0.547882080078125, -0.51513671875, -0.482391357421875, -0.44964599609375, -0.416900634765625, -0.3841552734375, -0.351409912109375, -0.31866455078125, -0.285919189453125, -0.253173828125, -0.220428466796875, -0.18768310546875, -0.154937744140625, -0.1221923828125, -0.089447021484375, -0.05670166015625, -0.023956298828125, 0.0087890625, 0.041534423828125, 0.07427978515625, 0.107025146484375, 0.1397705078125, 0.172515869140625, 0.20526123046875, 0.238006591796875, 0.270751953125, 0.303497314453125, 0.33624267578125, 0.368988037109375, 0.4017333984375, 0.434478759765625, 0.46722412109375, 0.499969482421875, 0.53271484375, 0.565460205078125, 0.59820556640625, 0.630950927734375, 0.6636962890625, 0.696441650390625, 0.72918701171875, 0.761932373046875, 0.794677734375, 0.827423095703125, 0.86016845703125, 0.892913818359375, 0.9256591796875, 0.958404541015625, 0.99114990234375, 1.023895263671875, 1.056640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 8.0, 6.0, 10.0, 6.0, 12.0, 8.0, 23.0, 21.0, 16.0, 22.0, 23.0, 20.0, 19.0, 33.0, 26.0, 37.0, 27.0, 40.0, 36.0, 39.0, 39.0, 1056.0, 35.0, 45.0, 40.0, 42.0, 41.0, 32.0, 21.0, 19.0, 20.0, 25.0, 21.0, 15.0, 21.0, 19.0, 18.0, 12.0, 11.0, 10.0, 5.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-5.01171875, -4.8643798828125, -4.717041015625, -4.5697021484375, -4.42236328125, -4.2750244140625, -4.127685546875, -3.9803466796875, -3.8330078125, -3.6856689453125, -3.538330078125, -3.3909912109375, -3.24365234375, -3.0963134765625, -2.948974609375, -2.8016357421875, -2.654296875, -2.5069580078125, -2.359619140625, -2.2122802734375, -2.06494140625, -1.9176025390625, -1.770263671875, -1.6229248046875, -1.4755859375, -1.3282470703125, -1.180908203125, -1.0335693359375, -0.88623046875, -0.7388916015625, -0.591552734375, -0.4442138671875, -0.296875, -0.1495361328125, -0.002197265625, 0.1451416015625, 0.29248046875, 0.4398193359375, 0.587158203125, 0.7344970703125, 0.8818359375, 1.0291748046875, 1.176513671875, 1.3238525390625, 1.47119140625, 1.6185302734375, 1.765869140625, 1.9132080078125, 2.060546875, 2.2078857421875, 2.355224609375, 2.5025634765625, 2.64990234375, 2.7972412109375, 2.944580078125, 3.0919189453125, 3.2392578125, 3.3865966796875, 3.533935546875, 3.6812744140625, 3.82861328125, 3.9759521484375, 4.123291015625, 4.2706298828125, 4.41796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 12.0, 31.0, 55.0, 76.0, 116.0, 174.0, 259.0, 400.0, 579.0, 855.0, 1238.0, 1783.0, 2665.0, 3875.0, 5694.0, 8397.0, 12192.0, 18147.0, 26811.0, 40711.0, 64764.0, 106952.0, 202669.0, 1231618.0, 136620.0, 80462.0, 49767.0, 32694.0, 21568.0, 14531.0, 9897.0, 6739.0, 4687.0, 3225.0, 2187.0, 1521.0, 1016.0, 714.0, 464.0, 328.0, 204.0, 143.0, 93.0, 60.0, 43.0, 23.0, 17.0, 11.0, 7.0, 5.0, 8.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.416015625, -0.402252197265625, -0.38848876953125, -0.374725341796875, -0.3609619140625, -0.347198486328125, -0.33343505859375, -0.319671630859375, -0.305908203125, -0.292144775390625, -0.27838134765625, -0.264617919921875, -0.2508544921875, -0.237091064453125, -0.22332763671875, -0.209564208984375, -0.19580078125, -0.182037353515625, -0.16827392578125, -0.154510498046875, -0.1407470703125, -0.126983642578125, -0.11322021484375, -0.099456787109375, -0.085693359375, -0.071929931640625, -0.05816650390625, -0.044403076171875, -0.0306396484375, -0.016876220703125, -0.00311279296875, 0.010650634765625, 0.0244140625, 0.038177490234375, 0.05194091796875, 0.065704345703125, 0.0794677734375, 0.093231201171875, 0.10699462890625, 0.120758056640625, 0.134521484375, 0.148284912109375, 0.16204833984375, 0.175811767578125, 0.1895751953125, 0.203338623046875, 0.21710205078125, 0.230865478515625, 0.24462890625, 0.258392333984375, 0.27215576171875, 0.285919189453125, 0.2996826171875, 0.313446044921875, 0.32720947265625, 0.340972900390625, 0.354736328125, 0.368499755859375, 0.38226318359375, 0.396026611328125, 0.4097900390625, 0.423553466796875, 0.43731689453125, 0.451080322265625, 0.46484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 7.0, 10.0, 12.0, 15.0, 16.0, 19.0, 20.0, 18.0, 24.0, 32.0, 31.0, 34.0, 40.0, 37.0, 33.0, 36.0, 38.0, 44.0, 46.0, 41.0, 48.0, 37.0, 46.0, 33.0, 37.0, 31.0, 36.0, 28.0, 29.0, 14.0, 17.0, 13.0, 16.0, 5.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0209808349609375, -0.020348072052001953, -0.019715309143066406, -0.01908254623413086, -0.018449783325195312, -0.017817020416259766, -0.01718425750732422, -0.016551494598388672, -0.015918731689453125, -0.015285968780517578, -0.014653205871582031, -0.014020442962646484, -0.013387680053710938, -0.01275491714477539, -0.012122154235839844, -0.011489391326904297, -0.01085662841796875, -0.010223865509033203, -0.009591102600097656, -0.00895833969116211, -0.008325576782226562, -0.007692813873291016, -0.007060050964355469, -0.006427288055419922, -0.005794525146484375, -0.005161762237548828, -0.004528999328613281, -0.0038962364196777344, -0.0032634735107421875, -0.0026307106018066406, -0.0019979476928710938, -0.0013651847839355469, -0.000732421875, -9.965896606445312e-05, 0.0005331039428710938, 0.0011658668518066406, 0.0017986297607421875, 0.0024313926696777344, 0.0030641555786132812, 0.003696918487548828, 0.004329681396484375, 0.004962444305419922, 0.005595207214355469, 0.006227970123291016, 0.0068607330322265625, 0.007493495941162109, 0.008126258850097656, 0.008759021759033203, 0.00939178466796875, 0.010024547576904297, 0.010657310485839844, 0.01129007339477539, 0.011922836303710938, 0.012555599212646484, 0.013188362121582031, 0.013821125030517578, 0.014453887939453125, 0.015086650848388672, 0.01571941375732422, 0.016352176666259766, 0.016984939575195312, 0.01761770248413086, 0.018250465393066406, 0.018883228302001953, 0.0195159912109375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 12.0, 13.0, 6.0, 13.0, 20.0, 21.0, 27.0, 42.0, 54.0, 65.0, 111.0, 159.0, 211.0, 314.0, 496.0, 988.0, 1004028.0, 39967.0, 627.0, 393.0, 287.0, 190.0, 128.0, 92.0, 51.0, 40.0, 48.0, 22.0, 24.0, 16.0, 17.0, 13.0, 10.0, 6.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5166015625, -0.4998321533203125, -0.483062744140625, -0.4662933349609375, -0.44952392578125, -0.4327545166015625, -0.415985107421875, -0.3992156982421875, -0.3824462890625, -0.3656768798828125, -0.348907470703125, -0.3321380615234375, -0.31536865234375, -0.2985992431640625, -0.281829833984375, -0.2650604248046875, -0.248291015625, -0.2315216064453125, -0.214752197265625, -0.1979827880859375, -0.18121337890625, -0.1644439697265625, -0.147674560546875, -0.1309051513671875, -0.1141357421875, -0.0973663330078125, -0.080596923828125, -0.0638275146484375, -0.04705810546875, -0.0302886962890625, -0.013519287109375, 0.0032501220703125, 0.02001953125, 0.0367889404296875, 0.053558349609375, 0.0703277587890625, 0.08709716796875, 0.1038665771484375, 0.120635986328125, 0.1374053955078125, 0.1541748046875, 0.1709442138671875, 0.187713623046875, 0.2044830322265625, 0.22125244140625, 0.2380218505859375, 0.254791259765625, 0.2715606689453125, 0.288330078125, 0.3050994873046875, 0.321868896484375, 0.3386383056640625, 0.35540771484375, 0.3721771240234375, 0.388946533203125, 0.4057159423828125, 0.4224853515625, 0.4392547607421875, 0.456024169921875, 0.4727935791015625, 0.48956298828125, 0.5063323974609375, 0.523101806640625, 0.5398712158203125, 0.556640625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 929.0, 84.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5500984191894531, -0.527895450592041, -0.5056924819946289, -0.4834895431995392, -0.4612865746021271, -0.43908363580703735, -0.41688066720962524, -0.39467769861221313, -0.372474730014801, -0.3502717614173889, -0.3280688226222992, -0.3058658540248871, -0.283662885427475, -0.26145994663238525, -0.23925697803497314, -0.21705400943756104, -0.1948510706424713, -0.1726481169462204, -0.1504451483488083, -0.12824219465255737, -0.10603923350572586, -0.08383627235889435, -0.06163331866264343, -0.03943035006523132, -0.017227396368980408, 0.0049755629152059555, 0.02717852219939232, 0.04938147962093353, 0.07158444076776505, 0.09378740191459656, 0.11599035561084747, 0.13819332420825958, 0.1603962779045105, 0.1825992316007614, 0.20480220019817352, 0.22700515389442444, 0.24920812249183655, 0.27141106128692627, 0.2936140298843384, 0.3158169984817505, 0.3380199670791626, 0.3602229356765747, 0.38242587447166443, 0.40462884306907654, 0.42683181166648865, 0.44903475046157837, 0.4712377190589905, 0.4934406876564026, 0.5156435966491699, 0.537846565246582, 0.5600495338439941, 0.5822525024414062, 0.6044554114341736, 0.6266583800315857, 0.6488613486289978, 0.6710643172264099, 0.693267285823822, 0.7154702544212341, 0.7376732230186462, 0.7598761320114136, 0.7820791006088257, 0.8042820692062378, 0.8264850378036499, 0.848688006401062, 0.8708909749984741]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 7.0, 11.0, 7.0, 17.0, 22.0, 25.0, 39.0, 64.0, 46.0, 39.0, 70.0, 71.0, 54.0, 59.0, 66.0, 57.0, 63.0, 61.0, 56.0, 44.0, 32.0, 26.0, 22.0, 12.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1001366376876831, -0.09781963378190994, -0.09550262987613678, -0.09318562597036362, -0.09086862206459045, -0.08855162560939789, -0.08623462170362473, -0.08391761779785156, -0.0816006138920784, -0.07928360998630524, -0.07696660608053207, -0.07464960217475891, -0.07233260571956635, -0.07001560181379318, -0.06769859790802002, -0.06538159400224686, -0.0630645900964737, -0.06074758619070053, -0.05843058228492737, -0.056113582104444504, -0.05379657819867134, -0.05147957429289818, -0.049162574112415314, -0.04684557020664215, -0.04452856630086899, -0.042211562395095825, -0.03989455848932266, -0.0375775583088398, -0.035260554403066635, -0.03294355049729347, -0.03062654845416546, -0.028309546411037445, -0.025992542505264282, -0.02367553859949112, -0.021358536556363106, -0.019041534513235092, -0.01672453060746193, -0.014407527633011341, -0.012090524658560753, -0.00977352261543274, -0.007456518709659576, -0.005139515735208988, -0.0028225127607584, -0.0005055097863078117, 0.0018114931881427765, 0.004128496162593365, 0.006445499137043953, 0.008762501180171967, 0.01107950508594513, 0.013396508060395718, 0.015713511034846306, 0.01803051307797432, 0.020347516983747482, 0.022664520889520645, 0.02498152293264866, 0.027298524975776672, 0.029615528881549835, 0.031932532787323, 0.03424953669309616, 0.036566536873579025, 0.03888354077935219, 0.04120054468512535, 0.043517544865608215, 0.04583454877138138, 0.04815155267715454]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 12.0, 32.0, 28.0, 34.0, 30.0, 57.0, 62.0, 60.0, 75.0, 74.0, 66.0, 60.0, 61.0, 55.0, 27.0, 33.0, 35.0, 20.0, 20.0, 19.0, 13.0, 20.0, 9.0, 8.0, 4.0, 4.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.287841796875, -9.94287109375, -9.597900390625, -9.2529296875, -8.907958984375, -8.56298828125, -8.218017578125, -7.873046875, -7.528076171875, -7.18310546875, -6.838134765625, -6.4931640625, -6.148193359375, -5.80322265625, -5.458251953125, -5.11328125, -4.768310546875, -4.42333984375, -4.078369140625, -3.7333984375, -3.388427734375, -3.04345703125, -2.698486328125, -2.353515625, -2.008544921875, -1.66357421875, -1.318603515625, -0.9736328125, -0.628662109375, -0.28369140625, 0.061279296875, 0.40625, 0.751220703125, 1.09619140625, 1.441162109375, 1.7861328125, 2.131103515625, 2.47607421875, 2.821044921875, 3.166015625, 3.510986328125, 3.85595703125, 4.200927734375, 4.5458984375, 4.890869140625, 5.23583984375, 5.580810546875, 5.92578125, 6.270751953125, 6.61572265625, 6.960693359375, 7.3056640625, 7.650634765625, 7.99560546875, 8.340576171875, 8.685546875, 9.030517578125, 9.37548828125, 9.720458984375, 10.0654296875, 10.410400390625, 10.75537109375, 11.100341796875, 11.4453125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 9.0, 21.0, 26.0, 27.0, 47.0, 77.0, 84.0, 109.0, 186.0, 245.0, 370.0, 503.0, 849.0, 1229.0, 2019.0, 3340.0, 6277.0, 13250.0, 39339.0, 327918.0, 570727.0, 49799.0, 15466.0, 6798.0, 3676.0, 2077.0, 1313.0, 893.0, 564.0, 398.0, 258.0, 171.0, 150.0, 90.0, 59.0, 55.0, 48.0, 21.0, 17.0, 12.0, 13.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.453125, -30.407470703125, -29.36181640625, -28.316162109375, -27.2705078125, -26.224853515625, -25.17919921875, -24.133544921875, -23.087890625, -22.042236328125, -20.99658203125, -19.950927734375, -18.9052734375, -17.859619140625, -16.81396484375, -15.768310546875, -14.72265625, -13.677001953125, -12.63134765625, -11.585693359375, -10.5400390625, -9.494384765625, -8.44873046875, -7.403076171875, -6.357421875, -5.311767578125, -4.26611328125, -3.220458984375, -2.1748046875, -1.129150390625, -0.08349609375, 0.962158203125, 2.0078125, 3.053466796875, 4.09912109375, 5.144775390625, 6.1904296875, 7.236083984375, 8.28173828125, 9.327392578125, 10.373046875, 11.418701171875, 12.46435546875, 13.510009765625, 14.5556640625, 15.601318359375, 16.64697265625, 17.692626953125, 18.73828125, 19.783935546875, 20.82958984375, 21.875244140625, 22.9208984375, 23.966552734375, 25.01220703125, 26.057861328125, 27.103515625, 28.149169921875, 29.19482421875, 30.240478515625, 31.2861328125, 32.331787109375, 33.37744140625, 34.423095703125, 35.46875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 11.0, 9.0, 21.0, 15.0, 19.0, 26.0, 23.0, 28.0, 29.0, 37.0, 33.0, 37.0, 52.0, 66.0, 84.0, 136.0, 1698.0, 172.0, 80.0, 61.0, 54.0, 42.0, 24.0, 27.0, 42.0, 20.0, 31.0, 25.0, 21.0, 19.0, 11.0, 6.0, 15.0, 10.0, 6.0, 6.0, 5.0, 7.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-29.6875, -28.804443359375, -27.92138671875, -27.038330078125, -26.1552734375, -25.272216796875, -24.38916015625, -23.506103515625, -22.623046875, -21.739990234375, -20.85693359375, -19.973876953125, -19.0908203125, -18.207763671875, -17.32470703125, -16.441650390625, -15.55859375, -14.675537109375, -13.79248046875, -12.909423828125, -12.0263671875, -11.143310546875, -10.26025390625, -9.377197265625, -8.494140625, -7.611083984375, -6.72802734375, -5.844970703125, -4.9619140625, -4.078857421875, -3.19580078125, -2.312744140625, -1.4296875, -0.546630859375, 0.33642578125, 1.219482421875, 2.1025390625, 2.985595703125, 3.86865234375, 4.751708984375, 5.634765625, 6.517822265625, 7.40087890625, 8.283935546875, 9.1669921875, 10.050048828125, 10.93310546875, 11.816162109375, 12.69921875, 13.582275390625, 14.46533203125, 15.348388671875, 16.2314453125, 17.114501953125, 17.99755859375, 18.880615234375, 19.763671875, 20.646728515625, 21.52978515625, 22.412841796875, 23.2958984375, 24.178955078125, 25.06201171875, 25.945068359375, 26.828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 7.0, 5.0, 9.0, 15.0, 5.0, 17.0, 20.0, 21.0, 20.0, 16.0, 34.0, 32.0, 36.0, 59.0, 118.0, 175.0, 519.0, 4826.0, 3073946.0, 63939.0, 1080.0, 300.0, 122.0, 76.0, 55.0, 38.0, 33.0, 25.0, 19.0, 22.0, 20.0, 15.0, 8.0, 12.0, 8.0, 7.0, 5.0, 8.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.5, -123.3515625, -119.203125, -115.0546875, -110.90625, -106.7578125, -102.609375, -98.4609375, -94.3125, -90.1640625, -86.015625, -81.8671875, -77.71875, -73.5703125, -69.421875, -65.2734375, -61.125, -56.9765625, -52.828125, -48.6796875, -44.53125, -40.3828125, -36.234375, -32.0859375, -27.9375, -23.7890625, -19.640625, -15.4921875, -11.34375, -7.1953125, -3.046875, 1.1015625, 5.25, 9.3984375, 13.546875, 17.6953125, 21.84375, 25.9921875, 30.140625, 34.2890625, 38.4375, 42.5859375, 46.734375, 50.8828125, 55.03125, 59.1796875, 63.328125, 67.4765625, 71.625, 75.7734375, 79.921875, 84.0703125, 88.21875, 92.3671875, 96.515625, 100.6640625, 104.8125, 108.9609375, 113.109375, 117.2578125, 121.40625, 125.5546875, 129.703125, 133.8515625, 138.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 971.0, 42.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-937.2486572265625, -917.9788818359375, -898.7090454101562, -879.4392700195312, -860.16943359375, -840.899658203125, -821.6298217773438, -802.3600463867188, -783.0902099609375, -763.8204345703125, -744.5505981445312, -725.2808227539062, -706.010986328125, -686.7412109375, -667.4713745117188, -648.2015991210938, -628.9318237304688, -609.6620483398438, -590.3922119140625, -571.1224365234375, -551.8526000976562, -532.5828247070312, -513.31298828125, -494.043212890625, -474.7734069824219, -455.50360107421875, -436.2337951660156, -416.9639892578125, -397.6942138671875, -378.42437744140625, -359.15460205078125, -339.8847961425781, -320.6149597167969, -301.34515380859375, -282.0753479003906, -262.8055419921875, -243.53575134277344, -224.2659454345703, -204.99615478515625, -185.72634887695312, -166.45654296875, -147.18673706054688, -127.91693878173828, -108.64714050292969, -89.37733459472656, -70.10752868652344, -50.837730407714844, -31.56793212890625, -12.298126220703125, 6.971675872802734, 26.241477966308594, 45.51128005981445, 64.78108215332031, 84.05088806152344, 103.32068634033203, 122.59048461914062, 141.86029052734375, 161.13009643554688, 180.39990234375, 199.66969299316406, 218.9394989013672, 238.2093048095703, 257.4790954589844, 276.7489013671875, 296.0187072753906]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 4.0, 9.0, 7.0, 11.0, 13.0, 17.0, 14.0, 14.0, 22.0, 24.0, 35.0, 25.0, 29.0, 21.0, 31.0, 36.0, 43.0, 38.0, 35.0, 47.0, 31.0, 41.0, 47.0, 41.0, 27.0, 37.0, 32.0, 24.0, 40.0, 38.0, 24.0, 25.0, 13.0, 11.0, 10.0, 13.0, 15.0, 12.0, 6.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.83245086669922, -90.99108123779297, -88.14971923828125, -85.308349609375, -82.46697998046875, -79.62561798095703, -76.78424835205078, -73.94288635253906, -71.10151672363281, -68.26014709472656, -65.41878509521484, -62.577415466308594, -59.73604965209961, -56.894683837890625, -54.053314208984375, -51.21194839477539, -48.370582580566406, -45.52921676635742, -42.68785095214844, -39.84648132324219, -37.0051155090332, -34.16374969482422, -31.3223819732666, -28.481014251708984, -25.6396484375, -22.798282623291016, -19.9569149017334, -17.11554718017578, -14.274181365966797, -11.432814598083496, -8.591447830200195, -5.750080108642578, -2.908721923828125, -0.06735515594482422, 2.7740116119384766, 5.615378379821777, 8.456745147705078, 11.298111915588379, 14.13947868347168, 16.980846405029297, 19.82221221923828, 22.663578033447266, 25.504945755004883, 28.3463134765625, 31.187679290771484, 34.02904510498047, 36.87041473388672, 39.7117805480957, 42.55314636230469, 45.39451217651367, 48.235877990722656, 51.077247619628906, 53.91861343383789, 56.759979248046875, 59.601348876953125, 62.44271469116211, 65.2840805053711, 68.12545013427734, 70.96681213378906, 73.80818176269531, 76.64955139160156, 79.49091339111328, 82.33228302001953, 85.17364501953125, 88.0150146484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 5.0, 6.0, 14.0, 14.0, 12.0, 21.0, 33.0, 36.0, 31.0, 40.0, 53.0, 65.0, 66.0, 76.0, 84.0, 69.0, 61.0, 46.0, 34.0, 38.0, 32.0, 24.0, 21.0, 19.0, 15.0, 21.0, 12.0, 9.0, 1.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1953125, -10.8250732421875, -10.454833984375, -10.0845947265625, -9.71435546875, -9.3441162109375, -8.973876953125, -8.6036376953125, -8.2333984375, -7.8631591796875, -7.492919921875, -7.1226806640625, -6.75244140625, -6.3822021484375, -6.011962890625, -5.6417236328125, -5.271484375, -4.9012451171875, -4.531005859375, -4.1607666015625, -3.79052734375, -3.4202880859375, -3.050048828125, -2.6798095703125, -2.3095703125, -1.9393310546875, -1.569091796875, -1.1988525390625, -0.82861328125, -0.4583740234375, -0.088134765625, 0.2821044921875, 0.65234375, 1.0225830078125, 1.392822265625, 1.7630615234375, 2.13330078125, 2.5035400390625, 2.873779296875, 3.2440185546875, 3.6142578125, 3.9844970703125, 4.354736328125, 4.7249755859375, 5.09521484375, 5.4654541015625, 5.835693359375, 6.2059326171875, 6.576171875, 6.9464111328125, 7.316650390625, 7.6868896484375, 8.05712890625, 8.4273681640625, 8.797607421875, 9.1678466796875, 9.5380859375, 9.9083251953125, 10.278564453125, 10.6488037109375, 11.01904296875, 11.3892822265625, 11.759521484375, 12.1297607421875, 12.5]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 10.0, 15.0, 22.0, 23.0, 41.0, 45.0, 74.0, 99.0, 186.0, 251.0, 462.0, 722.0, 1303.0, 2501.0, 5252.0, 12910.0, 54356.0, 2474029.0, 1576471.0, 41683.0, 12439.0, 5330.0, 2612.0, 1367.0, 757.0, 499.0, 264.0, 178.0, 121.0, 71.0, 46.0, 37.0, 25.0, 18.0, 19.0, 8.0, 13.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.78515625, -37.4453125, -36.10546875, -34.765625, -33.42578125, -32.0859375, -30.74609375, -29.40625, -28.06640625, -26.7265625, -25.38671875, -24.046875, -22.70703125, -21.3671875, -20.02734375, -18.6875, -17.34765625, -16.0078125, -14.66796875, -13.328125, -11.98828125, -10.6484375, -9.30859375, -7.96875, -6.62890625, -5.2890625, -3.94921875, -2.609375, -1.26953125, 0.0703125, 1.41015625, 2.75, 4.08984375, 5.4296875, 6.76953125, 8.109375, 9.44921875, 10.7890625, 12.12890625, 13.46875, 14.80859375, 16.1484375, 17.48828125, 18.828125, 20.16796875, 21.5078125, 22.84765625, 24.1875, 25.52734375, 26.8671875, 28.20703125, 29.546875, 30.88671875, 32.2265625, 33.56640625, 34.90625, 36.24609375, 37.5859375, 38.92578125, 40.265625, 41.60546875, 42.9453125, 44.28515625, 45.625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 5.0, 8.0, 12.0, 12.0, 12.0, 19.0, 17.0, 22.0, 23.0, 27.0, 55.0, 59.0, 88.0, 151.0, 313.0, 528.0, 756.0, 758.0, 417.0, 287.0, 155.0, 65.0, 59.0, 35.0, 30.0, 30.0, 20.0, 14.0, 10.0, 10.0, 8.0, 9.0, 8.0, 9.0, 3.0, 3.0, 5.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-28.828125, -27.924072265625, -27.02001953125, -26.115966796875, -25.2119140625, -24.307861328125, -23.40380859375, -22.499755859375, -21.595703125, -20.691650390625, -19.78759765625, -18.883544921875, -17.9794921875, -17.075439453125, -16.17138671875, -15.267333984375, -14.36328125, -13.459228515625, -12.55517578125, -11.651123046875, -10.7470703125, -9.843017578125, -8.93896484375, -8.034912109375, -7.130859375, -6.226806640625, -5.32275390625, -4.418701171875, -3.5146484375, -2.610595703125, -1.70654296875, -0.802490234375, 0.1015625, 1.005615234375, 1.90966796875, 2.813720703125, 3.7177734375, 4.621826171875, 5.52587890625, 6.429931640625, 7.333984375, 8.238037109375, 9.14208984375, 10.046142578125, 10.9501953125, 11.854248046875, 12.75830078125, 13.662353515625, 14.56640625, 15.470458984375, 16.37451171875, 17.278564453125, 18.1826171875, 19.086669921875, 19.99072265625, 20.894775390625, 21.798828125, 22.702880859375, 23.60693359375, 24.510986328125, 25.4150390625, 26.319091796875, 27.22314453125, 28.127197265625, 29.03125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 9.0, 4.0, 6.0, 10.0, 10.0, 21.0, 34.0, 39.0, 45.0, 67.0, 105.0, 171.0, 263.0, 410.0, 730.0, 1127.0, 1890.0, 3069.0, 5297.0, 9380.0, 17635.0, 36546.0, 97020.0, 940385.0, 2811242.0, 169229.0, 49047.0, 22540.0, 11639.0, 6560.0, 3831.0, 2250.0, 1274.0, 816.0, 539.0, 388.0, 236.0, 146.0, 106.0, 71.0, 45.0, 23.0, 14.0, 4.0, 11.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.953125, -32.65625, -31.359375, -30.0625, -28.765625, -27.46875, -26.171875, -24.875, -23.578125, -22.28125, -20.984375, -19.6875, -18.390625, -17.09375, -15.796875, -14.5, -13.203125, -11.90625, -10.609375, -9.3125, -8.015625, -6.71875, -5.421875, -4.125, -2.828125, -1.53125, -0.234375, 1.0625, 2.359375, 3.65625, 4.953125, 6.25, 7.546875, 8.84375, 10.140625, 11.4375, 12.734375, 14.03125, 15.328125, 16.625, 17.921875, 19.21875, 20.515625, 21.8125, 23.109375, 24.40625, 25.703125, 27.0, 28.296875, 29.59375, 30.890625, 32.1875, 33.484375, 34.78125, 36.078125, 37.375, 38.671875, 39.96875, 41.265625, 42.5625, 43.859375, 45.15625, 46.453125, 47.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 12.0, 16.0, 25.0, 55.0, 83.0, 221.0, 277.0, 155.0, 69.0, 39.0, 21.0, 12.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-302.0759582519531, -296.0727233886719, -290.0694580078125, -284.06622314453125, -278.0629577636719, -272.0597229003906, -266.05645751953125, -260.05322265625, -254.0499725341797, -248.04672241210938, -242.04347229003906, -236.04022216796875, -230.0369873046875, -224.0337371826172, -218.03048706054688, -212.02723693847656, -206.02398681640625, -200.02073669433594, -194.01748657226562, -188.0142364501953, -182.010986328125, -176.00775146484375, -170.00450134277344, -164.00125122070312, -157.9980010986328, -151.9947509765625, -145.9915008544922, -139.98825073242188, -133.98501586914062, -127.98175811767578, -121.978515625, -115.97526550292969, -109.97200775146484, -103.96875762939453, -97.96551513671875, -91.96226501464844, -85.95901489257812, -79.95576477050781, -73.9525146484375, -67.94927215576172, -61.946022033691406, -55.942771911621094, -49.93952560424805, -43.936279296875, -37.93302917480469, -31.929780960083008, -25.926532745361328, -19.92328643798828, -13.920036315917969, -7.916788101196289, -1.9135398864746094, 4.08970832824707, 10.09295654296875, 16.09620475769043, 22.09945297241211, 28.102699279785156, 34.10594940185547, 40.10919952392578, 46.11244583129883, 52.115692138671875, 58.11894226074219, 64.1221923828125, 70.12544250488281, 76.1286849975586, 82.1319351196289]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 12.0, 6.0, 12.0, 12.0, 18.0, 18.0, 25.0, 27.0, 29.0, 21.0, 34.0, 34.0, 38.0, 39.0, 43.0, 37.0, 42.0, 39.0, 34.0, 58.0, 50.0, 51.0, 37.0, 23.0, 19.0, 28.0, 28.0, 24.0, 32.0, 19.0, 16.0, 18.0, 12.0, 10.0, 11.0, 6.0, 13.0, 11.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-99.378662109375, -96.53338623046875, -93.68810272216797, -90.84281921386719, -87.99754333496094, -85.15226745605469, -82.3069839477539, -79.46170043945312, -76.61642456054688, -73.77114868164062, -70.92586517333984, -68.08058166503906, -65.23530578613281, -62.3900260925293, -59.54474639892578, -56.699466705322266, -53.85418701171875, -51.008907318115234, -48.16362762451172, -45.3183479309082, -42.47306823730469, -39.62778854370117, -36.782508850097656, -33.93722915649414, -31.091949462890625, -28.24666976928711, -25.401390075683594, -22.556110382080078, -19.710830688476562, -16.865550994873047, -14.020271301269531, -11.174991607666016, -8.3297119140625, -5.484432220458984, -2.6391525268554688, 0.20612716674804688, 3.0514068603515625, 5.896686553955078, 8.741966247558594, 11.58724594116211, 14.432525634765625, 17.27780532836914, 20.123085021972656, 22.968364715576172, 25.813644409179688, 28.658924102783203, 31.50420379638672, 34.349483489990234, 37.19476318359375, 40.040042877197266, 42.88532257080078, 45.7306022644043, 48.57588195800781, 51.42116165161133, 54.266441345214844, 57.11172103881836, 59.957000732421875, 62.80228042602539, 65.6475601196289, 68.49284362792969, 71.33811950683594, 74.18339538574219, 77.02867889404297, 79.87396240234375, 82.71923828125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 12.0, 9.0, 19.0, 16.0, 26.0, 38.0, 34.0, 39.0, 45.0, 58.0, 58.0, 63.0, 55.0, 43.0, 60.0, 63.0, 47.0, 48.0, 35.0, 41.0, 38.0, 17.0, 15.0, 16.0, 15.0, 16.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.25048828125, -10.8759765625, -10.50146484375, -10.126953125, -9.75244140625, -9.3779296875, -9.00341796875, -8.62890625, -8.25439453125, -7.8798828125, -7.50537109375, -7.130859375, -6.75634765625, -6.3818359375, -6.00732421875, -5.6328125, -5.25830078125, -4.8837890625, -4.50927734375, -4.134765625, -3.76025390625, -3.3857421875, -3.01123046875, -2.63671875, -2.26220703125, -1.8876953125, -1.51318359375, -1.138671875, -0.76416015625, -0.3896484375, -0.01513671875, 0.359375, 0.73388671875, 1.1083984375, 1.48291015625, 1.857421875, 2.23193359375, 2.6064453125, 2.98095703125, 3.35546875, 3.72998046875, 4.1044921875, 4.47900390625, 4.853515625, 5.22802734375, 5.6025390625, 5.97705078125, 6.3515625, 6.72607421875, 7.1005859375, 7.47509765625, 7.849609375, 8.22412109375, 8.5986328125, 8.97314453125, 9.34765625, 9.72216796875, 10.0966796875, 10.47119140625, 10.845703125, 11.22021484375, 11.5947265625, 11.96923828125, 12.34375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 9.0, 13.0, 20.0, 26.0, 30.0, 65.0, 67.0, 98.0, 175.0, 270.0, 421.0, 657.0, 1032.0, 1558.0, 2585.0, 4188.0, 7074.0, 12257.0, 22600.0, 42976.0, 90700.0, 223307.0, 348733.0, 150069.0, 65281.0, 32348.0, 17409.0, 9684.0, 5719.0, 3433.0, 2083.0, 1246.0, 911.0, 525.0, 331.0, 238.0, 134.0, 89.0, 55.0, 39.0, 45.0, 17.0, 24.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2451171875, -1.2065582275390625, -1.167999267578125, -1.1294403076171875, -1.09088134765625, -1.0523223876953125, -1.013763427734375, -0.9752044677734375, -0.9366455078125, -0.8980865478515625, -0.859527587890625, -0.8209686279296875, -0.78240966796875, -0.7438507080078125, -0.705291748046875, -0.6667327880859375, -0.628173828125, -0.5896148681640625, -0.551055908203125, -0.5124969482421875, -0.47393798828125, -0.4353790283203125, -0.396820068359375, -0.3582611083984375, -0.3197021484375, -0.2811431884765625, -0.242584228515625, -0.2040252685546875, -0.16546630859375, -0.1269073486328125, -0.088348388671875, -0.0497894287109375, -0.01123046875, 0.0273284912109375, 0.065887451171875, 0.1044464111328125, 0.14300537109375, 0.1815643310546875, 0.220123291015625, 0.2586822509765625, 0.2972412109375, 0.3358001708984375, 0.374359130859375, 0.4129180908203125, 0.45147705078125, 0.4900360107421875, 0.528594970703125, 0.5671539306640625, 0.605712890625, 0.6442718505859375, 0.682830810546875, 0.7213897705078125, 0.75994873046875, 0.7985076904296875, 0.837066650390625, 0.8756256103515625, 0.9141845703125, 0.9527435302734375, 0.991302490234375, 1.0298614501953125, 1.06842041015625, 1.1069793701171875, 1.145538330078125, 1.1840972900390625, 1.22265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 6.0, 13.0, 10.0, 13.0, 8.0, 12.0, 20.0, 19.0, 22.0, 29.0, 50.0, 27.0, 35.0, 40.0, 47.0, 51.0, 52.0, 35.0, 1064.0, 37.0, 45.0, 48.0, 42.0, 43.0, 39.0, 28.0, 26.0, 23.0, 21.0, 22.0, 15.0, 15.0, 11.0, 14.0, 18.0, 7.0, 5.0, 6.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.86114501953125, -7.6441650390625, -7.42718505859375, -7.210205078125, -6.99322509765625, -6.7762451171875, -6.55926513671875, -6.34228515625, -6.12530517578125, -5.9083251953125, -5.69134521484375, -5.474365234375, -5.25738525390625, -5.0404052734375, -4.82342529296875, -4.6064453125, -4.38946533203125, -4.1724853515625, -3.95550537109375, -3.738525390625, -3.52154541015625, -3.3045654296875, -3.08758544921875, -2.87060546875, -2.65362548828125, -2.4366455078125, -2.21966552734375, -2.002685546875, -1.78570556640625, -1.5687255859375, -1.35174560546875, -1.134765625, -0.91778564453125, -0.7008056640625, -0.48382568359375, -0.266845703125, -0.04986572265625, 0.1671142578125, 0.38409423828125, 0.60107421875, 0.81805419921875, 1.0350341796875, 1.25201416015625, 1.468994140625, 1.68597412109375, 1.9029541015625, 2.11993408203125, 2.3369140625, 2.55389404296875, 2.7708740234375, 2.98785400390625, 3.204833984375, 3.42181396484375, 3.6387939453125, 3.85577392578125, 4.07275390625, 4.28973388671875, 4.5067138671875, 4.72369384765625, 4.940673828125, 5.15765380859375, 5.3746337890625, 5.59161376953125, 5.80859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 8.0, 17.0, 19.0, 16.0, 37.0, 37.0, 37.0, 97.0, 159.0, 256.0, 347.0, 649.0, 956.0, 1532.0, 2323.0, 3495.0, 5331.0, 8102.0, 12556.0, 19505.0, 32014.0, 54838.0, 98969.0, 188949.0, 1299646.0, 158256.0, 83730.0, 47685.0, 28437.0, 17474.0, 10990.0, 7183.0, 4692.0, 3165.0, 1980.0, 1358.0, 820.0, 495.0, 347.0, 245.0, 142.0, 75.0, 61.0, 30.0, 28.0, 16.0, 15.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.5156021118164062, -0.4960479736328125, -0.47649383544921875, -0.456939697265625, -0.43738555908203125, -0.4178314208984375, -0.39827728271484375, -0.37872314453125, -0.35916900634765625, -0.3396148681640625, -0.32006072998046875, -0.300506591796875, -0.28095245361328125, -0.2613983154296875, -0.24184417724609375, -0.2222900390625, -0.20273590087890625, -0.1831817626953125, -0.16362762451171875, -0.144073486328125, -0.12451934814453125, -0.1049652099609375, -0.08541107177734375, -0.06585693359375, -0.04630279541015625, -0.0267486572265625, -0.00719451904296875, 0.012359619140625, 0.03191375732421875, 0.0514678955078125, 0.07102203369140625, 0.090576171875, 0.11013031005859375, 0.1296844482421875, 0.14923858642578125, 0.168792724609375, 0.18834686279296875, 0.2079010009765625, 0.22745513916015625, 0.24700927734375, 0.26656341552734375, 0.2861175537109375, 0.30567169189453125, 0.325225830078125, 0.34477996826171875, 0.3643341064453125, 0.38388824462890625, 0.4034423828125, 0.42299652099609375, 0.4425506591796875, 0.46210479736328125, 0.481658935546875, 0.5012130737304688, 0.5207672119140625, 0.5403213500976562, 0.55987548828125, 0.5794296264648438, 0.5989837646484375, 0.6185379028320312, 0.638092041015625, 0.6576461791992188, 0.6772003173828125, 0.6967544555664062, 0.71630859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 9.0, 11.0, 9.0, 12.0, 15.0, 16.0, 26.0, 37.0, 35.0, 40.0, 37.0, 38.0, 35.0, 53.0, 49.0, 50.0, 49.0, 70.0, 53.0, 51.0, 42.0, 46.0, 25.0, 31.0, 26.0, 13.0, 15.0, 14.0, 16.0, 10.0, 12.0, 7.0, 8.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.016937255859375, -0.016445398330688477, -0.015953540802001953, -0.01546168327331543, -0.014969825744628906, -0.014477968215942383, -0.01398611068725586, -0.013494253158569336, -0.013002395629882812, -0.012510538101196289, -0.012018680572509766, -0.011526823043823242, -0.011034965515136719, -0.010543107986450195, -0.010051250457763672, -0.009559392929077148, -0.009067535400390625, -0.008575677871704102, -0.008083820343017578, -0.007591962814331055, -0.007100105285644531, -0.006608247756958008, -0.006116390228271484, -0.005624532699584961, -0.0051326751708984375, -0.004640817642211914, -0.004148960113525391, -0.003657102584838867, -0.0031652450561523438, -0.0026733875274658203, -0.002181529998779297, -0.0016896724700927734, -0.00119781494140625, -0.0007059574127197266, -0.00021409988403320312, 0.0002777576446533203, 0.0007696151733398438, 0.0012614727020263672, 0.0017533302307128906, 0.002245187759399414, 0.0027370452880859375, 0.003228902816772461, 0.0037207603454589844, 0.004212617874145508, 0.004704475402832031, 0.005196332931518555, 0.005688190460205078, 0.0061800479888916016, 0.006671905517578125, 0.0071637630462646484, 0.007655620574951172, 0.008147478103637695, 0.008639335632324219, 0.009131193161010742, 0.009623050689697266, 0.010114908218383789, 0.010606765747070312, 0.011098623275756836, 0.01159048080444336, 0.012082338333129883, 0.012574195861816406, 0.01306605339050293, 0.013557910919189453, 0.014049768447875977, 0.0145416259765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 0.0, 6.0, 3.0, 12.0, 13.0, 8.0, 25.0, 17.0, 10.0, 26.0, 33.0, 37.0, 29.0, 47.0, 77.0, 82.0, 121.0, 224.0, 502.0, 117316.0, 928720.0, 516.0, 215.0, 112.0, 73.0, 53.0, 38.0, 50.0, 37.0, 36.0, 17.0, 14.0, 15.0, 13.0, 12.0, 13.0, 8.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.513671875, -0.49658203125, -0.4794921875, -0.46240234375, -0.4453125, -0.42822265625, -0.4111328125, -0.39404296875, -0.376953125, -0.35986328125, -0.3427734375, -0.32568359375, -0.30859375, -0.29150390625, -0.2744140625, -0.25732421875, -0.240234375, -0.22314453125, -0.2060546875, -0.18896484375, -0.171875, -0.15478515625, -0.1376953125, -0.12060546875, -0.103515625, -0.08642578125, -0.0693359375, -0.05224609375, -0.03515625, -0.01806640625, -0.0009765625, 0.01611328125, 0.033203125, 0.05029296875, 0.0673828125, 0.08447265625, 0.1015625, 0.11865234375, 0.1357421875, 0.15283203125, 0.169921875, 0.18701171875, 0.2041015625, 0.22119140625, 0.23828125, 0.25537109375, 0.2724609375, 0.28955078125, 0.306640625, 0.32373046875, 0.3408203125, 0.35791015625, 0.375, 0.39208984375, 0.4091796875, 0.42626953125, 0.443359375, 0.46044921875, 0.4775390625, 0.49462890625, 0.51171875, 0.52880859375, 0.5458984375, 0.56298828125, 0.580078125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1012.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007155167404562235, 0.007726811338216066, 0.022608790546655655, 0.03749076649546623, 0.05237274616956711, 0.06725472956895828, 0.08213670551776886, 0.09701868891716003, 0.11190066486597061, 0.1267826408147812, 0.14166462421417236, 0.15654659271240234, 0.17142857611179352, 0.1863105595111847, 0.20119252800941467, 0.21607452630996704, 0.23095649480819702, 0.2458384782075882, 0.26072046160697937, 0.27560243010520935, 0.29048439860343933, 0.3053663969039917, 0.3202483654022217, 0.33513033390045166, 0.35001233220100403, 0.364894300699234, 0.3797762989997864, 0.39465826749801636, 0.40954023599624634, 0.4244222342967987, 0.4393042027950287, 0.45418620109558105, 0.46906813979148865, 0.48395010828971863, 0.498832106590271, 0.513714075088501, 0.528596043586731, 0.5434780120849609, 0.5583599805831909, 0.5732420086860657, 0.5881239771842957, 0.6030059456825256, 0.6178879141807556, 0.6327699422836304, 0.6476519107818604, 0.6625338792800903, 0.6774158477783203, 0.6922978162765503, 0.7071797847747803, 0.7220617532730103, 0.7369437217712402, 0.7518256902694702, 0.766707718372345, 0.781589686870575, 0.7964716553688049, 0.8113536238670349, 0.8262356519699097, 0.8411176204681396, 0.8559995889663696, 0.8708815574645996, 0.8857635855674744, 0.9006455540657043, 0.9155275225639343, 0.9304094910621643, 0.9452914595603943]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 18.0, 19.0, 15.0, 16.0, 28.0, 26.0, 33.0, 30.0, 40.0, 33.0, 46.0, 45.0, 53.0, 47.0, 49.0, 61.0, 47.0, 43.0, 44.0, 58.0, 38.0, 38.0, 29.0, 32.0, 24.0, 10.0, 23.0, 8.0, 12.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05142170190811157, -0.0501592755317688, -0.048896849155426025, -0.04763442650437355, -0.04637200012803078, -0.045109573751688004, -0.04384715110063553, -0.042584724724292755, -0.04132229834794998, -0.04005987197160721, -0.038797445595264435, -0.03753502294421196, -0.036272596567869186, -0.03501017019152641, -0.03374774754047394, -0.032485321164131165, -0.03122289478778839, -0.029960468411445618, -0.028698043897747993, -0.02743561938405037, -0.026173193007707596, -0.024910766631364822, -0.023648342117667198, -0.022385917603969574, -0.0211234912276268, -0.019861064851284027, -0.018598640337586403, -0.01733621582388878, -0.016073789447546005, -0.014811364002525806, -0.013548938557505608, -0.012286513112485409, -0.01102408766746521, -0.009761662222445011, -0.008499236777424812, -0.0072368113324046135, -0.005974385887384415, -0.004711960442364216, -0.003449534997344017, -0.002187109552323818, -0.0009246841073036194, 0.00033774133771657944, 0.0016001667827367783, 0.002862592227756977, 0.004125017672777176, 0.005387443117797375, 0.0066498685628175735, 0.007912294007837772, 0.009174719452857971, 0.01043714489787817, 0.011699570342898369, 0.012961995787918568, 0.014224421232938766, 0.015486846677958965, 0.016749272122979164, 0.01801169663667679, 0.019274123013019562, 0.020536549389362335, 0.02179897390305996, 0.023061398416757584, 0.024323824793100357, 0.02558625116944313, 0.026848675683140755, 0.02811110019683838, 0.029373526573181152]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 12.0, 9.0, 19.0, 16.0, 26.0, 38.0, 34.0, 39.0, 45.0, 58.0, 58.0, 63.0, 55.0, 43.0, 60.0, 63.0, 48.0, 47.0, 35.0, 41.0, 38.0, 17.0, 15.0, 16.0, 15.0, 16.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.25048828125, -10.8759765625, -10.50146484375, -10.126953125, -9.75244140625, -9.3779296875, -9.00341796875, -8.62890625, -8.25439453125, -7.8798828125, -7.50537109375, -7.130859375, -6.75634765625, -6.3818359375, -6.00732421875, -5.6328125, -5.25830078125, -4.8837890625, -4.50927734375, -4.134765625, -3.76025390625, -3.3857421875, -3.01123046875, -2.63671875, -2.26220703125, -1.8876953125, -1.51318359375, -1.138671875, -0.76416015625, -0.3896484375, -0.01513671875, 0.359375, 0.73388671875, 1.1083984375, 1.48291015625, 1.857421875, 2.23193359375, 2.6064453125, 2.98095703125, 3.35546875, 3.72998046875, 4.1044921875, 4.47900390625, 4.853515625, 5.22802734375, 5.6025390625, 5.97705078125, 6.3515625, 6.72607421875, 7.1005859375, 7.47509765625, 7.849609375, 8.22412109375, 8.5986328125, 8.97314453125, 9.34765625, 9.72216796875, 10.0966796875, 10.47119140625, 10.845703125, 11.22021484375, 11.5947265625, 11.96923828125, 12.34375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 5.0, 15.0, 20.0, 29.0, 39.0, 44.0, 65.0, 94.0, 165.0, 197.0, 318.0, 553.0, 1065.0, 1991.0, 4532.0, 12482.0, 44583.0, 266744.0, 596431.0, 85712.0, 20666.0, 6867.0, 2719.0, 1299.0, 712.0, 371.0, 260.0, 153.0, 125.0, 83.0, 51.0, 45.0, 30.0, 19.0, 21.0, 11.0, 10.0, 4.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.2996826171875, -9.958740234375, -9.6177978515625, -9.27685546875, -8.9359130859375, -8.594970703125, -8.2540283203125, -7.9130859375, -7.5721435546875, -7.231201171875, -6.8902587890625, -6.54931640625, -6.2083740234375, -5.867431640625, -5.5264892578125, -5.185546875, -4.8446044921875, -4.503662109375, -4.1627197265625, -3.82177734375, -3.4808349609375, -3.139892578125, -2.7989501953125, -2.4580078125, -2.1170654296875, -1.776123046875, -1.4351806640625, -1.09423828125, -0.7532958984375, -0.412353515625, -0.0714111328125, 0.26953125, 0.6104736328125, 0.951416015625, 1.2923583984375, 1.63330078125, 1.9742431640625, 2.315185546875, 2.6561279296875, 2.9970703125, 3.3380126953125, 3.678955078125, 4.0198974609375, 4.36083984375, 4.7017822265625, 5.042724609375, 5.3836669921875, 5.724609375, 6.0655517578125, 6.406494140625, 6.7474365234375, 7.08837890625, 7.4293212890625, 7.770263671875, 8.1112060546875, 8.4521484375, 8.7930908203125, 9.134033203125, 9.4749755859375, 9.81591796875, 10.1568603515625, 10.497802734375, 10.8387451171875, 11.1796875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 2.0, 5.0, 8.0, 9.0, 9.0, 8.0, 14.0, 13.0, 14.0, 24.0, 15.0, 39.0, 25.0, 41.0, 31.0, 34.0, 47.0, 49.0, 55.0, 64.0, 1865.0, 188.0, 66.0, 53.0, 35.0, 45.0, 29.0, 32.0, 23.0, 36.0, 25.0, 20.0, 18.0, 18.0, 19.0, 13.0, 8.0, 9.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-41.0, -39.8544921875, -38.708984375, -37.5634765625, -36.41796875, -35.2724609375, -34.126953125, -32.9814453125, -31.8359375, -30.6904296875, -29.544921875, -28.3994140625, -27.25390625, -26.1083984375, -24.962890625, -23.8173828125, -22.671875, -21.5263671875, -20.380859375, -19.2353515625, -18.08984375, -16.9443359375, -15.798828125, -14.6533203125, -13.5078125, -12.3623046875, -11.216796875, -10.0712890625, -8.92578125, -7.7802734375, -6.634765625, -5.4892578125, -4.34375, -3.1982421875, -2.052734375, -0.9072265625, 0.23828125, 1.3837890625, 2.529296875, 3.6748046875, 4.8203125, 5.9658203125, 7.111328125, 8.2568359375, 9.40234375, 10.5478515625, 11.693359375, 12.8388671875, 13.984375, 15.1298828125, 16.275390625, 17.4208984375, 18.56640625, 19.7119140625, 20.857421875, 22.0029296875, 23.1484375, 24.2939453125, 25.439453125, 26.5849609375, 27.73046875, 28.8759765625, 30.021484375, 31.1669921875, 32.3125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 11.0, 7.0, 13.0, 16.0, 21.0, 19.0, 20.0, 28.0, 47.0, 38.0, 55.0, 64.0, 104.0, 199.0, 450.0, 1436.0, 28177.0, 3106234.0, 6901.0, 904.0, 335.0, 174.0, 80.0, 63.0, 59.0, 36.0, 46.0, 18.0, 29.0, 15.0, 10.0, 19.0, 9.0, 9.0, 8.0, 5.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7255859375, -68.138671875, -65.5517578125, -62.96484375, -60.3779296875, -57.791015625, -55.2041015625, -52.6171875, -50.0302734375, -47.443359375, -44.8564453125, -42.26953125, -39.6826171875, -37.095703125, -34.5087890625, -31.921875, -29.3349609375, -26.748046875, -24.1611328125, -21.57421875, -18.9873046875, -16.400390625, -13.8134765625, -11.2265625, -8.6396484375, -6.052734375, -3.4658203125, -0.87890625, 1.7080078125, 4.294921875, 6.8818359375, 9.46875, 12.0556640625, 14.642578125, 17.2294921875, 19.81640625, 22.4033203125, 24.990234375, 27.5771484375, 30.1640625, 32.7509765625, 35.337890625, 37.9248046875, 40.51171875, 43.0986328125, 45.685546875, 48.2724609375, 50.859375, 53.4462890625, 56.033203125, 58.6201171875, 61.20703125, 63.7939453125, 66.380859375, 68.9677734375, 71.5546875, 74.1416015625, 76.728515625, 79.3154296875, 81.90234375, 84.4892578125, 87.076171875, 89.6630859375, 92.25]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 164.0, 857.0], "bins": [-921.3816528320312, -906.7872924804688, -892.1929321289062, -877.5985717773438, -863.004150390625, -848.4097900390625, -833.8154296875, -819.2210693359375, -804.626708984375, -790.0323486328125, -775.43798828125, -760.8436279296875, -746.249267578125, -731.6548461914062, -717.0604858398438, -702.4661254882812, -687.8717651367188, -673.2774047851562, -658.6830444335938, -644.0886840820312, -629.4942626953125, -614.89990234375, -600.3055419921875, -585.711181640625, -571.1168212890625, -556.5224609375, -541.9281005859375, -527.333740234375, -512.7393798828125, -498.1449890136719, -483.55059814453125, -468.95623779296875, -454.36187744140625, -439.76751708984375, -425.17315673828125, -410.5787658691406, -395.9844055175781, -381.3900451660156, -366.795654296875, -352.2012939453125, -337.60693359375, -323.0125732421875, -308.418212890625, -293.8238220214844, -279.2294616699219, -264.6351013183594, -250.0407257080078, -235.44635009765625, -220.85198974609375, -206.25762939453125, -191.6632537841797, -177.06887817382812, -162.47451782226562, -147.88015747070312, -133.28578186035156, -118.69141387939453, -104.0970458984375, -89.50267791748047, -74.90830993652344, -60.313941955566406, -45.719573974609375, -31.125205993652344, -16.530838012695312, -1.9364700317382812, 12.657898902893066]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 5.0, 5.0, 14.0, 9.0, 18.0, 11.0, 20.0, 21.0, 20.0, 18.0, 33.0, 33.0, 32.0, 31.0, 44.0, 35.0, 34.0, 33.0, 45.0, 58.0, 41.0, 37.0, 35.0, 37.0, 32.0, 23.0, 33.0, 33.0, 39.0, 21.0, 26.0, 23.0, 22.0, 15.0, 6.0, 7.0, 12.0, 7.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-106.93266296386719, -103.48381042480469, -100.03496551513672, -96.58611297607422, -93.13726806640625, -89.68841552734375, -86.23956298828125, -82.79071807861328, -79.34187316894531, -75.89302062988281, -72.44417572021484, -68.99532318115234, -65.54647827148438, -62.097625732421875, -58.64877700805664, -55.199928283691406, -51.751075744628906, -48.30222702026367, -44.85337829589844, -41.40452575683594, -37.95568084716797, -34.50682830810547, -31.057979583740234, -27.609130859375, -24.160282135009766, -20.71143341064453, -17.262584686279297, -13.81373405456543, -10.364885330200195, -6.916036605834961, -3.4671859741210938, -0.018337249755859375, 3.4305038452148438, 6.879353046417236, 10.328202247619629, 13.77705192565918, 17.225900650024414, 20.67474937438965, 24.123600006103516, 27.57244873046875, 31.021297454833984, 34.47014617919922, 37.91899490356445, 41.36784362792969, 44.81669616699219, 48.265541076660156, 51.714393615722656, 55.16324234008789, 58.612091064453125, 62.06093978881836, 65.5097885131836, 68.9586410522461, 72.40748596191406, 75.85633850097656, 79.30519104003906, 82.75403594970703, 86.202880859375, 89.6517333984375, 93.10057830810547, 96.54943084716797, 99.99827575683594, 103.44712829589844, 106.89598083496094, 110.3448257446289, 113.7936782836914]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 10.0, 11.0, 10.0, 9.0, 16.0, 22.0, 24.0, 32.0, 39.0, 39.0, 40.0, 49.0, 65.0, 63.0, 57.0, 52.0, 61.0, 63.0, 44.0, 41.0, 46.0, 38.0, 33.0, 22.0, 20.0, 10.0, 18.0, 16.0, 7.0, 8.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0390625, -11.6522216796875, -11.265380859375, -10.8785400390625, -10.49169921875, -10.1048583984375, -9.718017578125, -9.3311767578125, -8.9443359375, -8.5574951171875, -8.170654296875, -7.7838134765625, -7.39697265625, -7.0101318359375, -6.623291015625, -6.2364501953125, -5.849609375, -5.4627685546875, -5.075927734375, -4.6890869140625, -4.30224609375, -3.9154052734375, -3.528564453125, -3.1417236328125, -2.7548828125, -2.3680419921875, -1.981201171875, -1.5943603515625, -1.20751953125, -0.8206787109375, -0.433837890625, -0.0469970703125, 0.33984375, 0.7266845703125, 1.113525390625, 1.5003662109375, 1.88720703125, 2.2740478515625, 2.660888671875, 3.0477294921875, 3.4345703125, 3.8214111328125, 4.208251953125, 4.5950927734375, 4.98193359375, 5.3687744140625, 5.755615234375, 6.1424560546875, 6.529296875, 6.9161376953125, 7.302978515625, 7.6898193359375, 8.07666015625, 8.4635009765625, 8.850341796875, 9.2371826171875, 9.6240234375, 10.0108642578125, 10.397705078125, 10.7845458984375, 11.17138671875, 11.5582275390625, 11.945068359375, 12.3319091796875, 12.71875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 11.0, 16.0, 24.0, 32.0, 44.0, 65.0, 131.0, 226.0, 335.0, 572.0, 1241.0, 2543.0, 5728.0, 16076.0, 187857.0, 3871790.0, 84485.0, 13119.0, 5010.0, 2276.0, 1161.0, 621.0, 373.0, 198.0, 111.0, 68.0, 46.0, 34.0, 15.0, 19.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.5, -51.796875, -50.09375, -48.390625, -46.6875, -44.984375, -43.28125, -41.578125, -39.875, -38.171875, -36.46875, -34.765625, -33.0625, -31.359375, -29.65625, -27.953125, -26.25, -24.546875, -22.84375, -21.140625, -19.4375, -17.734375, -16.03125, -14.328125, -12.625, -10.921875, -9.21875, -7.515625, -5.8125, -4.109375, -2.40625, -0.703125, 1.0, 2.703125, 4.40625, 6.109375, 7.8125, 9.515625, 11.21875, 12.921875, 14.625, 16.328125, 18.03125, 19.734375, 21.4375, 23.140625, 24.84375, 26.546875, 28.25, 29.953125, 31.65625, 33.359375, 35.0625, 36.765625, 38.46875, 40.171875, 41.875, 43.578125, 45.28125, 46.984375, 48.6875, 50.390625, 52.09375, 53.796875, 55.5]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 10.0, 15.0, 14.0, 23.0, 21.0, 21.0, 34.0, 29.0, 59.0, 107.0, 222.0, 385.0, 733.0, 882.0, 668.0, 310.0, 170.0, 93.0, 59.0, 33.0, 32.0, 23.0, 14.0, 8.0, 9.0, 8.0, 11.0, 6.0, 8.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.84375, -27.86083984375, -26.8779296875, -25.89501953125, -24.912109375, -23.92919921875, -22.9462890625, -21.96337890625, -20.98046875, -19.99755859375, -19.0146484375, -18.03173828125, -17.048828125, -16.06591796875, -15.0830078125, -14.10009765625, -13.1171875, -12.13427734375, -11.1513671875, -10.16845703125, -9.185546875, -8.20263671875, -7.2197265625, -6.23681640625, -5.25390625, -4.27099609375, -3.2880859375, -2.30517578125, -1.322265625, -0.33935546875, 0.6435546875, 1.62646484375, 2.609375, 3.59228515625, 4.5751953125, 5.55810546875, 6.541015625, 7.52392578125, 8.5068359375, 9.48974609375, 10.47265625, 11.45556640625, 12.4384765625, 13.42138671875, 14.404296875, 15.38720703125, 16.3701171875, 17.35302734375, 18.3359375, 19.31884765625, 20.3017578125, 21.28466796875, 22.267578125, 23.25048828125, 24.2333984375, 25.21630859375, 26.19921875, 27.18212890625, 28.1650390625, 29.14794921875, 30.130859375, 31.11376953125, 32.0966796875, 33.07958984375, 34.0625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 11.0, 3.0, 7.0, 9.0, 16.0, 29.0, 37.0, 50.0, 60.0, 102.0, 115.0, 172.0, 226.0, 340.0, 487.0, 666.0, 1002.0, 1420.0, 2092.0, 3205.0, 4710.0, 7480.0, 12036.0, 20583.0, 40210.0, 113751.0, 1051310.0, 2608134.0, 206224.0, 53991.0, 25447.0, 14428.0, 8786.0, 5526.0, 3690.0, 2435.0, 1655.0, 1115.0, 793.0, 551.0, 369.0, 295.0, 185.0, 166.0, 113.0, 61.0, 47.0, 34.0, 22.0, 21.0, 21.0, 18.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0], "bins": [-35.25, -34.1875, -33.125, -32.0625, -31.0, -29.9375, -28.875, -27.8125, -26.75, -25.6875, -24.625, -23.5625, -22.5, -21.4375, -20.375, -19.3125, -18.25, -17.1875, -16.125, -15.0625, -14.0, -12.9375, -11.875, -10.8125, -9.75, -8.6875, -7.625, -6.5625, -5.5, -4.4375, -3.375, -2.3125, -1.25, -0.1875, 0.875, 1.9375, 3.0, 4.0625, 5.125, 6.1875, 7.25, 8.3125, 9.375, 10.4375, 11.5, 12.5625, 13.625, 14.6875, 15.75, 16.8125, 17.875, 18.9375, 20.0, 21.0625, 22.125, 23.1875, 24.25, 25.3125, 26.375, 27.4375, 28.5, 29.5625, 30.625, 31.6875, 32.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 23.0, 45.0, 60.0, 144.0, 306.0, 215.0, 103.0, 51.0, 24.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-384.76837158203125, -377.0287170410156, -369.2890625, -361.54937744140625, -353.8097229003906, -346.070068359375, -338.3304138183594, -330.59075927734375, -322.85107421875, -315.1114196777344, -307.37176513671875, -299.632080078125, -291.8924255371094, -284.15277099609375, -276.4131164550781, -268.6734619140625, -260.9338073730469, -253.19415283203125, -245.45448303222656, -237.71482849121094, -229.97515869140625, -222.23550415039062, -214.495849609375, -206.75619506835938, -199.0165252685547, -191.27687072753906, -183.53720092773438, -175.79754638671875, -168.05789184570312, -160.31822204589844, -152.5785675048828, -144.83889770507812, -137.09925842285156, -129.35960388183594, -121.61993408203125, -113.88027954101562, -106.14061737060547, -98.40095520019531, -90.66130065917969, -82.92163848876953, -75.18197631835938, -67.44231414794922, -59.70265579223633, -51.96299743652344, -44.22333526611328, -36.483673095703125, -28.744014739990234, -21.004356384277344, -13.264694213867188, -5.525033950805664, 2.2146263122558594, 9.954286575317383, 17.693946838378906, 25.433609008789062, 33.17326736450195, 40.912925720214844, 48.652587890625, 56.392250061035156, 64.13191223144531, 71.87156677246094, 79.6112289428711, 87.35089111328125, 95.09054565429688, 102.83020782470703, 110.56986999511719]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 10.0, 10.0, 15.0, 15.0, 19.0, 17.0, 25.0, 27.0, 20.0, 15.0, 32.0, 41.0, 39.0, 32.0, 32.0, 31.0, 44.0, 33.0, 33.0, 39.0, 41.0, 52.0, 39.0, 43.0, 30.0, 28.0, 30.0, 24.0, 28.0, 22.0, 16.0, 19.0, 14.0, 17.0, 8.0, 8.0, 8.0, 11.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-87.39977264404297, -84.71659851074219, -82.03343200683594, -79.35026550292969, -76.6670913696289, -73.98391723632812, -71.30075073242188, -68.61758422851562, -65.93441009521484, -63.25123977661133, -60.56806945800781, -57.8848991394043, -55.20172882080078, -52.518558502197266, -49.83538818359375, -47.152217864990234, -44.46904754638672, -41.7858772277832, -39.10270690917969, -36.41953659057617, -33.736366271972656, -31.05319595336914, -28.370025634765625, -25.68685531616211, -23.003684997558594, -20.320514678955078, -17.637344360351562, -14.954174041748047, -12.271003723144531, -9.587833404541016, -6.9046630859375, -4.221492767333984, -1.5383148193359375, 1.1448554992675781, 3.8280258178710938, 6.511196136474609, 9.194366455078125, 11.87753677368164, 14.560707092285156, 17.243877410888672, 19.927047729492188, 22.610218048095703, 25.29338836669922, 27.976558685302734, 30.65972900390625, 33.342899322509766, 36.02606964111328, 38.7092399597168, 41.39241027832031, 44.07558059692383, 46.758750915527344, 49.44192123413086, 52.125091552734375, 54.80826187133789, 57.491432189941406, 60.17460250854492, 62.85777282714844, 65.54093933105469, 68.22411346435547, 70.90728759765625, 73.5904541015625, 76.27362060546875, 78.95679473876953, 81.63996887207031, 84.32313537597656]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 2.0, 4.0, 8.0, 6.0, 6.0, 6.0, 18.0, 17.0, 17.0, 15.0, 32.0, 20.0, 36.0, 39.0, 31.0, 50.0, 55.0, 58.0, 65.0, 56.0, 58.0, 40.0, 52.0, 47.0, 36.0, 26.0, 27.0, 34.0, 31.0, 18.0, 12.0, 15.0, 18.0, 7.0, 5.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.0955810546875, -10.730224609375, -10.3648681640625, -9.99951171875, -9.6341552734375, -9.268798828125, -8.9034423828125, -8.5380859375, -8.1727294921875, -7.807373046875, -7.4420166015625, -7.07666015625, -6.7113037109375, -6.345947265625, -5.9805908203125, -5.615234375, -5.2498779296875, -4.884521484375, -4.5191650390625, -4.15380859375, -3.7884521484375, -3.423095703125, -3.0577392578125, -2.6923828125, -2.3270263671875, -1.961669921875, -1.5963134765625, -1.23095703125, -0.8656005859375, -0.500244140625, -0.1348876953125, 0.23046875, 0.5958251953125, 0.961181640625, 1.3265380859375, 1.69189453125, 2.0572509765625, 2.422607421875, 2.7879638671875, 3.1533203125, 3.5186767578125, 3.884033203125, 4.2493896484375, 4.61474609375, 4.9801025390625, 5.345458984375, 5.7108154296875, 6.076171875, 6.4415283203125, 6.806884765625, 7.1722412109375, 7.53759765625, 7.9029541015625, 8.268310546875, 8.6336669921875, 8.9990234375, 9.3643798828125, 9.729736328125, 10.0950927734375, 10.46044921875, 10.8258056640625, 11.191162109375, 11.5565185546875, 11.921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 13.0, 11.0, 9.0, 33.0, 37.0, 47.0, 82.0, 123.0, 185.0, 237.0, 370.0, 495.0, 727.0, 1025.0, 1598.0, 2362.0, 3592.0, 5670.0, 9006.0, 14921.0, 24869.0, 43867.0, 84457.0, 178833.0, 304704.0, 178403.0, 84017.0, 43960.0, 24737.0, 14612.0, 8967.0, 5615.0, 3610.0, 2351.0, 1591.0, 1080.0, 753.0, 503.0, 303.0, 248.0, 176.0, 103.0, 76.0, 56.0, 40.0, 28.0, 25.0, 16.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.119140625, -1.0847015380859375, -1.050262451171875, -1.0158233642578125, -0.98138427734375, -0.9469451904296875, -0.912506103515625, -0.8780670166015625, -0.8436279296875, -0.8091888427734375, -0.774749755859375, -0.7403106689453125, -0.70587158203125, -0.6714324951171875, -0.636993408203125, -0.6025543212890625, -0.568115234375, -0.5336761474609375, -0.499237060546875, -0.4647979736328125, -0.43035888671875, -0.3959197998046875, -0.361480712890625, -0.3270416259765625, -0.2926025390625, -0.2581634521484375, -0.223724365234375, -0.1892852783203125, -0.15484619140625, -0.1204071044921875, -0.085968017578125, -0.0515289306640625, -0.01708984375, 0.0173492431640625, 0.051788330078125, 0.0862274169921875, 0.12066650390625, 0.1551055908203125, 0.189544677734375, 0.2239837646484375, 0.2584228515625, 0.2928619384765625, 0.327301025390625, 0.3617401123046875, 0.39617919921875, 0.4306182861328125, 0.465057373046875, 0.4994964599609375, 0.533935546875, 0.5683746337890625, 0.602813720703125, 0.6372528076171875, 0.67169189453125, 0.7061309814453125, 0.740570068359375, 0.7750091552734375, 0.8094482421875, 0.8438873291015625, 0.878326416015625, 0.9127655029296875, 0.94720458984375, 0.9816436767578125, 1.016082763671875, 1.0505218505859375, 1.0849609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 4.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 12.0, 11.0, 16.0, 21.0, 21.0, 12.0, 27.0, 25.0, 42.0, 28.0, 35.0, 41.0, 32.0, 36.0, 39.0, 47.0, 1079.0, 36.0, 33.0, 36.0, 29.0, 35.0, 33.0, 25.0, 28.0, 26.0, 29.0, 27.0, 19.0, 16.0, 16.0, 10.0, 10.0, 16.0, 6.0, 5.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.86688232421875, -5.6673583984375, -5.46783447265625, -5.268310546875, -5.06878662109375, -4.8692626953125, -4.66973876953125, -4.47021484375, -4.27069091796875, -4.0711669921875, -3.87164306640625, -3.672119140625, -3.47259521484375, -3.2730712890625, -3.07354736328125, -2.8740234375, -2.67449951171875, -2.4749755859375, -2.27545166015625, -2.075927734375, -1.87640380859375, -1.6768798828125, -1.47735595703125, -1.27783203125, -1.07830810546875, -0.8787841796875, -0.67926025390625, -0.479736328125, -0.28021240234375, -0.0806884765625, 0.11883544921875, 0.318359375, 0.51788330078125, 0.7174072265625, 0.91693115234375, 1.116455078125, 1.31597900390625, 1.5155029296875, 1.71502685546875, 1.91455078125, 2.11407470703125, 2.3135986328125, 2.51312255859375, 2.712646484375, 2.91217041015625, 3.1116943359375, 3.31121826171875, 3.5107421875, 3.71026611328125, 3.9097900390625, 4.10931396484375, 4.308837890625, 4.50836181640625, 4.7078857421875, 4.90740966796875, 5.10693359375, 5.30645751953125, 5.5059814453125, 5.70550537109375, 5.905029296875, 6.10455322265625, 6.3040771484375, 6.50360107421875, 6.703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 14.0, 16.0, 30.0, 67.0, 94.0, 143.0, 201.0, 283.0, 424.0, 605.0, 939.0, 1322.0, 2057.0, 3098.0, 4697.0, 6991.0, 10652.0, 16160.0, 24753.0, 39659.0, 67568.0, 119524.0, 317240.0, 1155977.0, 130534.0, 73189.0, 43345.0, 26832.0, 17116.0, 11157.0, 7344.0, 4958.0, 3259.0, 2366.0, 1444.0, 1045.0, 679.0, 435.0, 298.0, 203.0, 135.0, 93.0, 57.0, 35.0, 27.0, 16.0, 13.0, 13.0, 3.0, 5.0, 4.0, 4.0], "bins": [-0.673828125, -0.6546173095703125, -0.635406494140625, -0.6161956787109375, -0.59698486328125, -0.5777740478515625, -0.558563232421875, -0.5393524169921875, -0.5201416015625, -0.5009307861328125, -0.481719970703125, -0.4625091552734375, -0.44329833984375, -0.4240875244140625, -0.404876708984375, -0.3856658935546875, -0.366455078125, -0.3472442626953125, -0.328033447265625, -0.3088226318359375, -0.28961181640625, -0.2704010009765625, -0.251190185546875, -0.2319793701171875, -0.2127685546875, -0.1935577392578125, -0.174346923828125, -0.1551361083984375, -0.13592529296875, -0.1167144775390625, -0.097503662109375, -0.0782928466796875, -0.05908203125, -0.0398712158203125, -0.020660400390625, -0.0014495849609375, 0.01776123046875, 0.0369720458984375, 0.056182861328125, 0.0753936767578125, 0.0946044921875, 0.1138153076171875, 0.133026123046875, 0.1522369384765625, 0.17144775390625, 0.1906585693359375, 0.209869384765625, 0.2290802001953125, 0.248291015625, 0.2675018310546875, 0.286712646484375, 0.3059234619140625, 0.32513427734375, 0.3443450927734375, 0.363555908203125, 0.3827667236328125, 0.4019775390625, 0.4211883544921875, 0.440399169921875, 0.4596099853515625, 0.47882080078125, 0.4980316162109375, 0.517242431640625, 0.5364532470703125, 0.5556640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 6.0, 6.0, 13.0, 8.0, 7.0, 16.0, 15.0, 18.0, 20.0, 19.0, 31.0, 32.0, 41.0, 60.0, 62.0, 95.0, 76.0, 85.0, 59.0, 64.0, 51.0, 35.0, 29.0, 20.0, 31.0, 13.0, 5.0, 16.0, 9.0, 11.0, 11.0, 7.0, 6.0, 4.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.019631385803222656, -0.018968582153320312, -0.01830577850341797, -0.017642974853515625, -0.01698017120361328, -0.016317367553710938, -0.015654563903808594, -0.01499176025390625, -0.014328956604003906, -0.013666152954101562, -0.013003349304199219, -0.012340545654296875, -0.011677742004394531, -0.011014938354492188, -0.010352134704589844, -0.0096893310546875, -0.009026527404785156, -0.008363723754882812, -0.007700920104980469, -0.007038116455078125, -0.006375312805175781, -0.0057125091552734375, -0.005049705505371094, -0.00438690185546875, -0.0037240982055664062, -0.0030612945556640625, -0.0023984909057617188, -0.001735687255859375, -0.0010728836059570312, -0.0004100799560546875, 0.00025272369384765625, 0.00091552734375, 0.0015783309936523438, 0.0022411346435546875, 0.0029039382934570312, 0.003566741943359375, 0.004229545593261719, 0.0048923492431640625, 0.005555152893066406, 0.00621795654296875, 0.006880760192871094, 0.0075435638427734375, 0.008206367492675781, 0.008869171142578125, 0.009531974792480469, 0.010194778442382812, 0.010857582092285156, 0.0115203857421875, 0.012183189392089844, 0.012845993041992188, 0.013508796691894531, 0.014171600341796875, 0.014834403991699219, 0.015497207641601562, 0.016160011291503906, 0.01682281494140625, 0.017485618591308594, 0.018148422241210938, 0.01881122589111328, 0.019474029541015625, 0.02013683319091797, 0.020799636840820312, 0.021462440490722656, 0.022125244140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 6.0, 8.0, 10.0, 10.0, 13.0, 14.0, 6.0, 16.0, 28.0, 26.0, 25.0, 37.0, 69.0, 104.0, 163.0, 594.0, 32613.0, 1012452.0, 1635.0, 275.0, 132.0, 65.0, 46.0, 22.0, 26.0, 29.0, 19.0, 18.0, 20.0, 12.0, 8.0, 9.0, 14.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63818359375, -0.6183624267578125, -0.598541259765625, -0.5787200927734375, -0.55889892578125, -0.5390777587890625, -0.519256591796875, -0.4994354248046875, -0.4796142578125, -0.4597930908203125, -0.439971923828125, -0.4201507568359375, -0.40032958984375, -0.3805084228515625, -0.360687255859375, -0.3408660888671875, -0.321044921875, -0.3012237548828125, -0.281402587890625, -0.2615814208984375, -0.24176025390625, -0.2219390869140625, -0.202117919921875, -0.1822967529296875, -0.1624755859375, -0.1426544189453125, -0.122833251953125, -0.1030120849609375, -0.08319091796875, -0.0633697509765625, -0.043548583984375, -0.0237274169921875, -0.00390625, 0.0159149169921875, 0.035736083984375, 0.0555572509765625, 0.07537841796875, 0.0951995849609375, 0.115020751953125, 0.1348419189453125, 0.1546630859375, 0.1744842529296875, 0.194305419921875, 0.2141265869140625, 0.23394775390625, 0.2537689208984375, 0.273590087890625, 0.2934112548828125, 0.313232421875, 0.3330535888671875, 0.352874755859375, 0.3726959228515625, 0.39251708984375, 0.4123382568359375, 0.432159423828125, 0.4519805908203125, 0.4718017578125, 0.4916229248046875, 0.511444091796875, 0.5312652587890625, 0.55108642578125, 0.5709075927734375, 0.590728759765625, 0.6105499267578125, 0.63037109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [34.0, 851.0, 127.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018961401656270027, -0.007432793267071247, 0.004095815122127533, 0.015624424442648888, 0.027153031900525093, 0.03868164122104645, 0.05021025240421295, 0.06173885613679886, 0.07326746731996536, 0.08479607850313187, 0.09632468223571777, 0.10785329341888428, 0.11938190460205078, 0.13091051578521729, 0.1424391269683838, 0.1539677232503891, 0.1654963344335556, 0.1770249456167221, 0.1885535567998886, 0.20008215308189392, 0.21161076426506042, 0.22313937544822693, 0.23466798663139343, 0.24619659781455994, 0.25772520899772644, 0.26925382018089294, 0.28078243136405945, 0.29231104254722595, 0.30383965373039246, 0.3153682351112366, 0.3268968462944031, 0.3384254574775696, 0.3499540388584137, 0.3614826500415802, 0.3730112612247467, 0.3845398724079132, 0.3960684835910797, 0.40759706497192383, 0.41912567615509033, 0.43065428733825684, 0.44218289852142334, 0.45371150970458984, 0.46524012088775635, 0.47676873207092285, 0.48829734325408936, 0.49982595443725586, 0.5113545656204224, 0.5228831768035889, 0.5344117879867554, 0.5459403991699219, 0.5574690103530884, 0.5689976215362549, 0.5805262327194214, 0.5920548439025879, 0.6035834550857544, 0.6151120662689209, 0.6266406178474426, 0.6381692290306091, 0.6496978402137756, 0.6612264513969421, 0.6727550625801086, 0.6842836737632751, 0.6958122849464417, 0.7073408961296082, 0.7188695073127747]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 7.0, 12.0, 10.0, 6.0, 23.0, 18.0, 12.0, 19.0, 15.0, 24.0, 20.0, 28.0, 40.0, 31.0, 42.0, 41.0, 39.0, 42.0, 35.0, 46.0, 43.0, 36.0, 43.0, 41.0, 42.0, 32.0, 29.0, 25.0, 41.0, 23.0, 19.0, 16.0, 14.0, 20.0, 16.0, 12.0, 8.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.04014807939529419, -0.03895947337150574, -0.037770871073007584, -0.03658226877450943, -0.03539366275072098, -0.034205056726932526, -0.03301645442843437, -0.03182785212993622, -0.030639246106147766, -0.029450641945004463, -0.02826203778386116, -0.027073433622717857, -0.025884829461574554, -0.02469622530043125, -0.02350762113928795, -0.022319016978144646, -0.021130412817001343, -0.01994180865585804, -0.018753204494714737, -0.017564600333571434, -0.01637599617242813, -0.015187392011284828, -0.013998787850141525, -0.012810183688998222, -0.01162157952785492, -0.010432975366711617, -0.009244371205568314, -0.00805576704442501, -0.006867162883281708, -0.005678558722138405, -0.004489954560995102, -0.003301350399851799, -0.002112746238708496, -0.0009241420775651932, 0.00026446208357810974, 0.0014530662447214127, 0.0026416704058647156, 0.0038302745670080185, 0.005018878728151321, 0.006207482889294624, 0.007396087050437927, 0.00858469121158123, 0.009773295372724533, 0.010961899533867836, 0.012150503695011139, 0.013339107856154442, 0.014527712017297745, 0.015716316178441048, 0.01690492033958435, 0.018093524500727654, 0.019282128661870956, 0.02047073282301426, 0.021659336984157562, 0.022847941145300865, 0.024036545306444168, 0.02522514946758747, 0.026413753628730774, 0.027602357789874077, 0.02879096195101738, 0.029979566112160683, 0.031168170273303986, 0.03235677629709244, 0.03354537859559059, 0.034733980894088745, 0.0359225869178772]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 2.0, 4.0, 8.0, 6.0, 6.0, 6.0, 19.0, 16.0, 17.0, 15.0, 32.0, 20.0, 36.0, 39.0, 31.0, 50.0, 55.0, 58.0, 65.0, 56.0, 58.0, 40.0, 52.0, 47.0, 36.0, 26.0, 27.0, 34.0, 31.0, 18.0, 12.0, 15.0, 18.0, 7.0, 5.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.0955810546875, -10.730224609375, -10.3648681640625, -9.99951171875, -9.6341552734375, -9.268798828125, -8.9034423828125, -8.5380859375, -8.1727294921875, -7.807373046875, -7.4420166015625, -7.07666015625, -6.7113037109375, -6.345947265625, -5.9805908203125, -5.615234375, -5.2498779296875, -4.884521484375, -4.5191650390625, -4.15380859375, -3.7884521484375, -3.423095703125, -3.0577392578125, -2.6923828125, -2.3270263671875, -1.961669921875, -1.5963134765625, -1.23095703125, -0.8656005859375, -0.500244140625, -0.1348876953125, 0.23046875, 0.5958251953125, 0.961181640625, 1.3265380859375, 1.69189453125, 2.0572509765625, 2.422607421875, 2.7879638671875, 3.1533203125, 3.5186767578125, 3.884033203125, 4.2493896484375, 4.61474609375, 4.9801025390625, 5.345458984375, 5.7108154296875, 6.076171875, 6.4415283203125, 6.806884765625, 7.1722412109375, 7.53759765625, 7.9029541015625, 8.268310546875, 8.6336669921875, 8.9990234375, 9.3643798828125, 9.729736328125, 10.0950927734375, 10.46044921875, 10.8258056640625, 11.191162109375, 11.5565185546875, 11.921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 12.0, 7.0, 15.0, 20.0, 25.0, 38.0, 43.0, 73.0, 83.0, 123.0, 188.0, 267.0, 372.0, 512.0, 882.0, 1433.0, 2624.0, 5438.0, 13326.0, 42394.0, 190395.0, 606277.0, 130529.0, 32001.0, 10921.0, 4587.0, 2258.0, 1252.0, 783.0, 469.0, 321.0, 231.0, 162.0, 134.0, 78.0, 76.0, 53.0, 34.0, 20.0, 26.0, 17.0, 14.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.4453125, -8.1845703125, -7.923828125, -7.6630859375, -7.40234375, -7.1416015625, -6.880859375, -6.6201171875, -6.359375, -6.0986328125, -5.837890625, -5.5771484375, -5.31640625, -5.0556640625, -4.794921875, -4.5341796875, -4.2734375, -4.0126953125, -3.751953125, -3.4912109375, -3.23046875, -2.9697265625, -2.708984375, -2.4482421875, -2.1875, -1.9267578125, -1.666015625, -1.4052734375, -1.14453125, -0.8837890625, -0.623046875, -0.3623046875, -0.1015625, 0.1591796875, 0.419921875, 0.6806640625, 0.94140625, 1.2021484375, 1.462890625, 1.7236328125, 1.984375, 2.2451171875, 2.505859375, 2.7666015625, 3.02734375, 3.2880859375, 3.548828125, 3.8095703125, 4.0703125, 4.3310546875, 4.591796875, 4.8525390625, 5.11328125, 5.3740234375, 5.634765625, 5.8955078125, 6.15625, 6.4169921875, 6.677734375, 6.9384765625, 7.19921875, 7.4599609375, 7.720703125, 7.9814453125, 8.2421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 5.0, 11.0, 8.0, 15.0, 16.0, 19.0, 31.0, 33.0, 22.0, 30.0, 25.0, 38.0, 30.0, 47.0, 34.0, 42.0, 77.0, 266.0, 1730.0, 94.0, 51.0, 37.0, 44.0, 32.0, 34.0, 37.0, 29.0, 24.0, 28.0, 16.0, 22.0, 15.0, 14.0, 11.0, 15.0, 11.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-35.15625, -34.02734375, -32.8984375, -31.76953125, -30.640625, -29.51171875, -28.3828125, -27.25390625, -26.125, -24.99609375, -23.8671875, -22.73828125, -21.609375, -20.48046875, -19.3515625, -18.22265625, -17.09375, -15.96484375, -14.8359375, -13.70703125, -12.578125, -11.44921875, -10.3203125, -9.19140625, -8.0625, -6.93359375, -5.8046875, -4.67578125, -3.546875, -2.41796875, -1.2890625, -0.16015625, 0.96875, 2.09765625, 3.2265625, 4.35546875, 5.484375, 6.61328125, 7.7421875, 8.87109375, 10.0, 11.12890625, 12.2578125, 13.38671875, 14.515625, 15.64453125, 16.7734375, 17.90234375, 19.03125, 20.16015625, 21.2890625, 22.41796875, 23.546875, 24.67578125, 25.8046875, 26.93359375, 28.0625, 29.19140625, 30.3203125, 31.44921875, 32.578125, 33.70703125, 34.8359375, 35.96484375, 37.09375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 13.0, 19.0, 11.0, 10.0, 22.0, 16.0, 30.0, 41.0, 38.0, 58.0, 70.0, 114.0, 174.0, 331.0, 833.0, 5113.0, 1908376.0, 1223594.0, 5021.0, 756.0, 382.0, 193.0, 94.0, 80.0, 50.0, 40.0, 28.0, 34.0, 33.0, 20.0, 18.0, 7.0, 15.0, 12.0, 5.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-62.84375, -60.93896484375, -59.0341796875, -57.12939453125, -55.224609375, -53.31982421875, -51.4150390625, -49.51025390625, -47.60546875, -45.70068359375, -43.7958984375, -41.89111328125, -39.986328125, -38.08154296875, -36.1767578125, -34.27197265625, -32.3671875, -30.46240234375, -28.5576171875, -26.65283203125, -24.748046875, -22.84326171875, -20.9384765625, -19.03369140625, -17.12890625, -15.22412109375, -13.3193359375, -11.41455078125, -9.509765625, -7.60498046875, -5.7001953125, -3.79541015625, -1.890625, 0.01416015625, 1.9189453125, 3.82373046875, 5.728515625, 7.63330078125, 9.5380859375, 11.44287109375, 13.34765625, 15.25244140625, 17.1572265625, 19.06201171875, 20.966796875, 22.87158203125, 24.7763671875, 26.68115234375, 28.5859375, 30.49072265625, 32.3955078125, 34.30029296875, 36.205078125, 38.10986328125, 40.0146484375, 41.91943359375, 43.82421875, 45.72900390625, 47.6337890625, 49.53857421875, 51.443359375, 53.34814453125, 55.2529296875, 57.15771484375, 59.0625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 20.0, 840.0, 160.0], "bins": [-659.6683959960938, -649.1531982421875, -638.637939453125, -628.1227416992188, -617.6075439453125, -607.09228515625, -596.5770874023438, -586.0618896484375, -575.5466918945312, -565.031494140625, -554.5162353515625, -544.0010375976562, -533.48583984375, -522.9705810546875, -512.4553833007812, -501.940185546875, -491.4249267578125, -480.9096984863281, -470.3945007324219, -459.8792724609375, -449.36407470703125, -438.8488464355469, -428.3336181640625, -417.81842041015625, -407.30322265625, -396.7879943847656, -386.2727966308594, -375.757568359375, -365.24237060546875, -354.7271423339844, -344.2119140625, -333.69671630859375, -323.1814880371094, -312.666259765625, -302.15106201171875, -291.6358337402344, -281.1206359863281, -270.60540771484375, -260.0902099609375, -249.57498168945312, -239.0597686767578, -228.5445556640625, -218.0293426513672, -207.51412963867188, -196.9989013671875, -186.4836883544922, -175.96847534179688, -165.4532470703125, -154.93804931640625, -144.42283630371094, -133.90762329101562, -123.39240264892578, -112.87718200683594, -102.36196899414062, -91.84675598144531, -81.33153533935547, -70.81632232666016, -60.30110549926758, -49.785888671875, -39.27067565917969, -28.75545883178711, -18.24024200439453, -7.725028991699219, 2.790191650390625, 13.305407524108887]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 8.0, 6.0, 11.0, 15.0, 16.0, 16.0, 20.0, 19.0, 17.0, 25.0, 24.0, 30.0, 39.0, 38.0, 34.0, 41.0, 33.0, 39.0, 33.0, 48.0, 49.0, 49.0, 49.0, 46.0, 36.0, 29.0, 28.0, 34.0, 19.0, 27.0, 19.0, 22.0, 11.0, 13.0, 12.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-133.70159912109375, -129.6881866455078, -125.67477416992188, -121.66136169433594, -117.64794921875, -113.63453674316406, -109.62113189697266, -105.60771942138672, -101.59430694580078, -97.58089447021484, -93.5674819946289, -89.55406951904297, -85.54066467285156, -81.52725219726562, -77.51383972167969, -73.50042724609375, -69.48701477050781, -65.47360229492188, -61.46018981933594, -57.446781158447266, -53.43336868286133, -49.41995620727539, -45.40654754638672, -41.39313507080078, -37.379722595214844, -33.366310119628906, -29.3528995513916, -25.339488983154297, -21.32607650756836, -17.312664031982422, -13.299253463745117, -9.285842895507812, -5.2724456787109375, -1.2590341567993164, 2.7543773651123047, 6.767788887023926, 10.781200408935547, 14.794612884521484, 18.80802345275879, 22.821434020996094, 26.83484649658203, 30.84825897216797, 34.861671447753906, 38.87508010864258, 42.888492584228516, 46.90190505981445, 50.915313720703125, 54.92872619628906, 58.942138671875, 62.95555114746094, 66.96896362304688, 70.98237609863281, 74.99578857421875, 79.00920104980469, 83.0226058959961, 87.03601837158203, 91.04943084716797, 95.0628433227539, 99.07625579833984, 103.08966827392578, 107.10307312011719, 111.11648559570312, 115.12989807128906, 119.143310546875, 123.15672302246094]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 6.0, 4.0, 6.0, 7.0, 10.0, 19.0, 13.0, 17.0, 22.0, 23.0, 42.0, 34.0, 28.0, 34.0, 54.0, 49.0, 69.0, 67.0, 53.0, 51.0, 61.0, 44.0, 43.0, 37.0, 18.0, 38.0, 23.0, 31.0, 13.0, 15.0, 17.0, 9.0, 7.0, 4.0, 9.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.96875, -11.582275390625, -11.19580078125, -10.809326171875, -10.4228515625, -10.036376953125, -9.64990234375, -9.263427734375, -8.876953125, -8.490478515625, -8.10400390625, -7.717529296875, -7.3310546875, -6.944580078125, -6.55810546875, -6.171630859375, -5.78515625, -5.398681640625, -5.01220703125, -4.625732421875, -4.2392578125, -3.852783203125, -3.46630859375, -3.079833984375, -2.693359375, -2.306884765625, -1.92041015625, -1.533935546875, -1.1474609375, -0.760986328125, -0.37451171875, 0.011962890625, 0.3984375, 0.784912109375, 1.17138671875, 1.557861328125, 1.9443359375, 2.330810546875, 2.71728515625, 3.103759765625, 3.490234375, 3.876708984375, 4.26318359375, 4.649658203125, 5.0361328125, 5.422607421875, 5.80908203125, 6.195556640625, 6.58203125, 6.968505859375, 7.35498046875, 7.741455078125, 8.1279296875, 8.514404296875, 8.90087890625, 9.287353515625, 9.673828125, 10.060302734375, 10.44677734375, 10.833251953125, 11.2197265625, 11.606201171875, 11.99267578125, 12.379150390625, 12.765625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 3.0, 4.0, 11.0, 12.0, 18.0, 27.0, 24.0, 38.0, 61.0, 111.0, 192.0, 351.0, 771.0, 2086.0, 6530.0, 36187.0, 4021071.0, 112608.0, 9279.0, 2844.0, 1045.0, 425.0, 230.0, 91.0, 72.0, 47.0, 35.0, 22.0, 11.0, 24.0, 5.0, 9.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.0, -68.681640625, -66.36328125, -64.044921875, -61.7265625, -59.408203125, -57.08984375, -54.771484375, -52.453125, -50.134765625, -47.81640625, -45.498046875, -43.1796875, -40.861328125, -38.54296875, -36.224609375, -33.90625, -31.587890625, -29.26953125, -26.951171875, -24.6328125, -22.314453125, -19.99609375, -17.677734375, -15.359375, -13.041015625, -10.72265625, -8.404296875, -6.0859375, -3.767578125, -1.44921875, 0.869140625, 3.1875, 5.505859375, 7.82421875, 10.142578125, 12.4609375, 14.779296875, 17.09765625, 19.416015625, 21.734375, 24.052734375, 26.37109375, 28.689453125, 31.0078125, 33.326171875, 35.64453125, 37.962890625, 40.28125, 42.599609375, 44.91796875, 47.236328125, 49.5546875, 51.873046875, 54.19140625, 56.509765625, 58.828125, 61.146484375, 63.46484375, 65.783203125, 68.1015625, 70.419921875, 72.73828125, 75.056640625, 77.375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 4.0, 3.0, 3.0, 9.0, 8.0, 5.0, 13.0, 15.0, 20.0, 36.0, 37.0, 56.0, 117.0, 217.0, 446.0, 811.0, 926.0, 611.0, 296.0, 171.0, 71.0, 45.0, 25.0, 19.0, 12.0, 12.0, 10.0, 12.0, 7.0, 7.0, 8.0, 4.0, 5.0, 9.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.9375, -27.98095703125, -27.0244140625, -26.06787109375, -25.111328125, -24.15478515625, -23.1982421875, -22.24169921875, -21.28515625, -20.32861328125, -19.3720703125, -18.41552734375, -17.458984375, -16.50244140625, -15.5458984375, -14.58935546875, -13.6328125, -12.67626953125, -11.7197265625, -10.76318359375, -9.806640625, -8.85009765625, -7.8935546875, -6.93701171875, -5.98046875, -5.02392578125, -4.0673828125, -3.11083984375, -2.154296875, -1.19775390625, -0.2412109375, 0.71533203125, 1.671875, 2.62841796875, 3.5849609375, 4.54150390625, 5.498046875, 6.45458984375, 7.4111328125, 8.36767578125, 9.32421875, 10.28076171875, 11.2373046875, 12.19384765625, 13.150390625, 14.10693359375, 15.0634765625, 16.02001953125, 16.9765625, 17.93310546875, 18.8896484375, 19.84619140625, 20.802734375, 21.75927734375, 22.7158203125, 23.67236328125, 24.62890625, 25.58544921875, 26.5419921875, 27.49853515625, 28.455078125, 29.41162109375, 30.3681640625, 31.32470703125, 32.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 11.0, 13.0, 22.0, 33.0, 57.0, 86.0, 155.0, 249.0, 430.0, 736.0, 1313.0, 2326.0, 4302.0, 8370.0, 18175.0, 52113.0, 638659.0, 3298913.0, 115672.0, 27938.0, 11777.0, 5725.0, 3145.0, 1718.0, 969.0, 581.0, 306.0, 177.0, 102.0, 77.0, 47.0, 27.0, 17.0, 13.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-56.5, -54.7998046875, -53.099609375, -51.3994140625, -49.69921875, -47.9990234375, -46.298828125, -44.5986328125, -42.8984375, -41.1982421875, -39.498046875, -37.7978515625, -36.09765625, -34.3974609375, -32.697265625, -30.9970703125, -29.296875, -27.5966796875, -25.896484375, -24.1962890625, -22.49609375, -20.7958984375, -19.095703125, -17.3955078125, -15.6953125, -13.9951171875, -12.294921875, -10.5947265625, -8.89453125, -7.1943359375, -5.494140625, -3.7939453125, -2.09375, -0.3935546875, 1.306640625, 3.0068359375, 4.70703125, 6.4072265625, 8.107421875, 9.8076171875, 11.5078125, 13.2080078125, 14.908203125, 16.6083984375, 18.30859375, 20.0087890625, 21.708984375, 23.4091796875, 25.109375, 26.8095703125, 28.509765625, 30.2099609375, 31.91015625, 33.6103515625, 35.310546875, 37.0107421875, 38.7109375, 40.4111328125, 42.111328125, 43.8115234375, 45.51171875, 47.2119140625, 48.912109375, 50.6123046875, 52.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 12.0, 17.0, 24.0, 41.0, 63.0, 99.0, 176.0, 204.0, 142.0, 90.0, 51.0, 26.0, 24.0, 11.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-244.9332733154297, -239.7628936767578, -234.59251403808594, -229.42213439941406, -224.2517547607422, -219.0813751220703, -213.91099548339844, -208.74063110351562, -203.57025146484375, -198.39987182617188, -193.2294921875, -188.05911254882812, -182.88873291015625, -177.71835327148438, -172.5479736328125, -167.37759399414062, -162.20721435546875, -157.03683471679688, -151.866455078125, -146.69607543945312, -141.52569580078125, -136.35531616210938, -131.1849365234375, -126.01456451416016, -120.84418487548828, -115.6738052368164, -110.50342559814453, -105.33304595947266, -100.16267395019531, -94.99229431152344, -89.82191467285156, -84.65153503417969, -79.48117065429688, -74.310791015625, -69.14041137695312, -63.970035552978516, -58.79965591430664, -53.629276275634766, -48.458900451660156, -43.28852081298828, -38.118141174316406, -32.94776153564453, -27.77738380432129, -22.607006072998047, -17.436626434326172, -12.266246795654297, -7.095869064331055, -1.9254913330078125, 3.2448883056640625, 8.415266990661621, 13.58564567565918, 18.756023406982422, 23.926403045654297, 29.096782684326172, 34.26715850830078, 39.437538146972656, 44.60791778564453, 49.778297424316406, 54.94867706298828, 60.11905288696289, 65.2894287109375, 70.45980834960938, 75.63018798828125, 80.80056762695312, 85.970947265625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 8.0, 7.0, 5.0, 6.0, 20.0, 13.0, 24.0, 18.0, 15.0, 25.0, 23.0, 23.0, 26.0, 32.0, 33.0, 30.0, 41.0, 40.0, 38.0, 43.0, 41.0, 31.0, 39.0, 45.0, 39.0, 44.0, 31.0, 37.0, 27.0, 31.0, 14.0, 21.0, 18.0, 16.0, 19.0, 10.0, 13.0, 8.0, 9.0, 7.0, 6.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.24476623535156, -66.90499877929688, -64.56523132324219, -62.225460052490234, -59.88569259643555, -57.545921325683594, -55.206153869628906, -52.86638641357422, -50.52661895751953, -48.186851501464844, -45.84708023071289, -43.5073127746582, -41.167545318603516, -38.82777404785156, -36.488006591796875, -34.14823913574219, -31.808467864990234, -29.468698501586914, -27.128931045532227, -24.789161682128906, -22.44939422607422, -20.1096248626709, -17.769855499267578, -15.43008804321289, -13.09031867980957, -10.750550270080566, -8.410781860351562, -6.071012496948242, -3.7312440872192383, -1.3914756774902344, 0.9482936859130859, 3.2880611419677734, 5.627830505371094, 7.967598915100098, 10.307367324829102, 12.647136688232422, 14.986905097961426, 17.32667350769043, 19.66644287109375, 22.006210327148438, 24.345979690551758, 26.685749053955078, 29.025516510009766, 31.365285873413086, 33.705055236816406, 36.044822692871094, 38.38459014892578, 40.72435760498047, 43.06412887573242, 45.40389633178711, 47.74366760253906, 50.08343505859375, 52.42320251464844, 54.762969970703125, 57.10274124145508, 59.442508697509766, 61.78227996826172, 64.1220474243164, 66.4618148803711, 68.80158996582031, 71.141357421875, 73.48112487792969, 75.82089233398438, 78.16065979003906, 80.50042724609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 8.0, 6.0, 14.0, 12.0, 12.0, 21.0, 19.0, 25.0, 37.0, 31.0, 35.0, 30.0, 31.0, 49.0, 55.0, 54.0, 46.0, 57.0, 39.0, 48.0, 36.0, 39.0, 35.0, 33.0, 35.0, 32.0, 18.0, 25.0, 18.0, 19.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.899658203125, -10.53369140625, -10.167724609375, -9.8017578125, -9.435791015625, -9.06982421875, -8.703857421875, -8.337890625, -7.971923828125, -7.60595703125, -7.239990234375, -6.8740234375, -6.508056640625, -6.14208984375, -5.776123046875, -5.41015625, -5.044189453125, -4.67822265625, -4.312255859375, -3.9462890625, -3.580322265625, -3.21435546875, -2.848388671875, -2.482421875, -2.116455078125, -1.75048828125, -1.384521484375, -1.0185546875, -0.652587890625, -0.28662109375, 0.079345703125, 0.4453125, 0.811279296875, 1.17724609375, 1.543212890625, 1.9091796875, 2.275146484375, 2.64111328125, 3.007080078125, 3.373046875, 3.739013671875, 4.10498046875, 4.470947265625, 4.8369140625, 5.202880859375, 5.56884765625, 5.934814453125, 6.30078125, 6.666748046875, 7.03271484375, 7.398681640625, 7.7646484375, 8.130615234375, 8.49658203125, 8.862548828125, 9.228515625, 9.594482421875, 9.96044921875, 10.326416015625, 10.6923828125, 11.058349609375, 11.42431640625, 11.790283203125, 12.15625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 15.0, 18.0, 13.0, 29.0, 48.0, 68.0, 104.0, 129.0, 196.0, 268.0, 329.0, 546.0, 796.0, 1149.0, 1507.0, 2400.0, 3448.0, 5343.0, 8116.0, 12790.0, 20371.0, 33655.0, 58089.0, 108637.0, 222712.0, 262609.0, 132377.0, 68256.0, 39022.0, 23346.0, 14478.0, 9293.0, 6023.0, 3916.0, 2655.0, 1831.0, 1149.0, 808.0, 607.0, 405.0, 315.0, 213.0, 136.0, 97.0, 73.0, 51.0, 30.0, 33.0, 24.0, 16.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0784759521484375, -1.042694091796875, -1.0069122314453125, -0.97113037109375, -0.9353485107421875, -0.899566650390625, -0.8637847900390625, -0.8280029296875, -0.7922210693359375, -0.756439208984375, -0.7206573486328125, -0.68487548828125, -0.6490936279296875, -0.613311767578125, -0.5775299072265625, -0.541748046875, -0.5059661865234375, -0.470184326171875, -0.4344024658203125, -0.39862060546875, -0.3628387451171875, -0.327056884765625, -0.2912750244140625, -0.2554931640625, -0.2197113037109375, -0.183929443359375, -0.1481475830078125, -0.11236572265625, -0.0765838623046875, -0.040802001953125, -0.0050201416015625, 0.03076171875, 0.0665435791015625, 0.102325439453125, 0.1381072998046875, 0.17388916015625, 0.2096710205078125, 0.245452880859375, 0.2812347412109375, 0.3170166015625, 0.3527984619140625, 0.388580322265625, 0.4243621826171875, 0.46014404296875, 0.4959259033203125, 0.531707763671875, 0.5674896240234375, 0.603271484375, 0.6390533447265625, 0.674835205078125, 0.7106170654296875, 0.74639892578125, 0.7821807861328125, 0.817962646484375, 0.8537445068359375, 0.8895263671875, 0.9253082275390625, 0.961090087890625, 0.9968719482421875, 1.03265380859375, 1.0684356689453125, 1.104217529296875, 1.1399993896484375, 1.17578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 9.0, 5.0, 4.0, 11.0, 16.0, 16.0, 16.0, 18.0, 31.0, 27.0, 26.0, 22.0, 31.0, 39.0, 24.0, 25.0, 36.0, 31.0, 40.0, 51.0, 1054.0, 42.0, 44.0, 33.0, 38.0, 30.0, 29.0, 33.0, 38.0, 30.0, 30.0, 23.0, 17.0, 17.0, 17.0, 14.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0234375, -5.8134765625, -5.603515625, -5.3935546875, -5.18359375, -4.9736328125, -4.763671875, -4.5537109375, -4.34375, -4.1337890625, -3.923828125, -3.7138671875, -3.50390625, -3.2939453125, -3.083984375, -2.8740234375, -2.6640625, -2.4541015625, -2.244140625, -2.0341796875, -1.82421875, -1.6142578125, -1.404296875, -1.1943359375, -0.984375, -0.7744140625, -0.564453125, -0.3544921875, -0.14453125, 0.0654296875, 0.275390625, 0.4853515625, 0.6953125, 0.9052734375, 1.115234375, 1.3251953125, 1.53515625, 1.7451171875, 1.955078125, 2.1650390625, 2.375, 2.5849609375, 2.794921875, 3.0048828125, 3.21484375, 3.4248046875, 3.634765625, 3.8447265625, 4.0546875, 4.2646484375, 4.474609375, 4.6845703125, 4.89453125, 5.1044921875, 5.314453125, 5.5244140625, 5.734375, 5.9443359375, 6.154296875, 6.3642578125, 6.57421875, 6.7841796875, 6.994140625, 7.2041015625, 7.4140625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 17.0, 16.0, 37.0, 49.0, 87.0, 116.0, 160.0, 279.0, 413.0, 685.0, 995.0, 1577.0, 2530.0, 3840.0, 6088.0, 9694.0, 15455.0, 24680.0, 40913.0, 69615.0, 124625.0, 683999.0, 806968.0, 126088.0, 69611.0, 40639.0, 25077.0, 15711.0, 9997.0, 6267.0, 3951.0, 2468.0, 1559.0, 1033.0, 643.0, 453.0, 270.0, 150.0, 125.0, 89.0, 56.0, 33.0, 20.0, 14.0, 8.0, 9.0, 4.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.767578125, -0.7456512451171875, -0.723724365234375, -0.7017974853515625, -0.67987060546875, -0.6579437255859375, -0.636016845703125, -0.6140899658203125, -0.5921630859375, -0.5702362060546875, -0.548309326171875, -0.5263824462890625, -0.50445556640625, -0.4825286865234375, -0.460601806640625, -0.4386749267578125, -0.416748046875, -0.3948211669921875, -0.372894287109375, -0.3509674072265625, -0.32904052734375, -0.3071136474609375, -0.285186767578125, -0.2632598876953125, -0.2413330078125, -0.2194061279296875, -0.197479248046875, -0.1755523681640625, -0.15362548828125, -0.1316986083984375, -0.109771728515625, -0.0878448486328125, -0.06591796875, -0.0439910888671875, -0.022064208984375, -0.0001373291015625, 0.02178955078125, 0.0437164306640625, 0.065643310546875, 0.0875701904296875, 0.1094970703125, 0.1314239501953125, 0.153350830078125, 0.1752777099609375, 0.19720458984375, 0.2191314697265625, 0.241058349609375, 0.2629852294921875, 0.284912109375, 0.3068389892578125, 0.328765869140625, 0.3506927490234375, 0.37261962890625, 0.3945465087890625, 0.416473388671875, 0.4384002685546875, 0.4603271484375, 0.4822540283203125, 0.504180908203125, 0.5261077880859375, 0.54803466796875, 0.5699615478515625, 0.591888427734375, 0.6138153076171875, 0.6357421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 2.0, 5.0, 10.0, 8.0, 13.0, 10.0, 9.0, 11.0, 18.0, 16.0, 18.0, 25.0, 28.0, 35.0, 39.0, 49.0, 62.0, 67.0, 72.0, 68.0, 72.0, 54.0, 47.0, 31.0, 38.0, 22.0, 25.0, 16.0, 19.0, 19.0, 12.0, 10.0, 13.0, 2.0, 4.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01110076904296875, -0.010750174522399902, -0.010399580001831055, -0.010048985481262207, -0.00969839096069336, -0.009347796440124512, -0.008997201919555664, -0.008646607398986816, -0.008296012878417969, -0.007945418357849121, -0.0075948238372802734, -0.007244229316711426, -0.006893634796142578, -0.0065430402755737305, -0.006192445755004883, -0.005841851234436035, -0.0054912567138671875, -0.00514066219329834, -0.004790067672729492, -0.0044394731521606445, -0.004088878631591797, -0.0037382841110229492, -0.0033876895904541016, -0.003037095069885254, -0.0026865005493164062, -0.0023359060287475586, -0.001985311508178711, -0.0016347169876098633, -0.0012841224670410156, -0.000933527946472168, -0.0005829334259033203, -0.00023233890533447266, 0.000118255615234375, 0.00046885013580322266, 0.0008194446563720703, 0.001170039176940918, 0.0015206336975097656, 0.0018712282180786133, 0.002221822738647461, 0.0025724172592163086, 0.0029230117797851562, 0.003273606300354004, 0.0036242008209228516, 0.003974795341491699, 0.004325389862060547, 0.0046759843826293945, 0.005026578903198242, 0.00537717342376709, 0.0057277679443359375, 0.006078362464904785, 0.006428956985473633, 0.0067795515060424805, 0.007130146026611328, 0.007480740547180176, 0.007831335067749023, 0.008181929588317871, 0.008532524108886719, 0.008883118629455566, 0.009233713150024414, 0.009584307670593262, 0.00993490219116211, 0.010285496711730957, 0.010636091232299805, 0.010986685752868652, 0.0113372802734375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 8.0, 10.0, 10.0, 10.0, 23.0, 27.0, 29.0, 28.0, 52.0, 79.0, 114.0, 154.0, 272.0, 743.0, 6406.0, 884851.0, 151469.0, 2998.0, 514.0, 235.0, 105.0, 101.0, 64.0, 44.0, 39.0, 30.0, 32.0, 23.0, 17.0, 9.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.5537109375, -0.5373573303222656, -0.5210037231445312, -0.5046501159667969, -0.4882965087890625, -0.4719429016113281, -0.45558929443359375, -0.4392356872558594, -0.422882080078125, -0.4065284729003906, -0.39017486572265625, -0.3738212585449219, -0.3574676513671875, -0.3411140441894531, -0.32476043701171875, -0.3084068298339844, -0.29205322265625, -0.2756996154785156, -0.25934600830078125, -0.24299240112304688, -0.2266387939453125, -0.21028518676757812, -0.19393157958984375, -0.17757797241210938, -0.161224365234375, -0.14487075805664062, -0.12851715087890625, -0.11216354370117188, -0.0958099365234375, -0.07945632934570312, -0.06310272216796875, -0.046749114990234375, -0.0303955078125, -0.014041900634765625, 0.00231170654296875, 0.018665313720703125, 0.0350189208984375, 0.051372528076171875, 0.06772613525390625, 0.08407974243164062, 0.100433349609375, 0.11678695678710938, 0.13314056396484375, 0.14949417114257812, 0.1658477783203125, 0.18220138549804688, 0.19855499267578125, 0.21490859985351562, 0.23126220703125, 0.24761581420898438, 0.26396942138671875, 0.2803230285644531, 0.2966766357421875, 0.3130302429199219, 0.32938385009765625, 0.3457374572753906, 0.362091064453125, 0.3784446716308594, 0.39479827880859375, 0.4111518859863281, 0.4275054931640625, 0.4438591003417969, 0.46021270751953125, 0.4765663146972656, 0.492919921875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 14.0, 46.0, 226.0, 550.0, 136.0, 29.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033143263310194016, -0.025342797860503197, -0.017542332410812378, -0.009741868823766708, -0.0019414033740758896, 0.005859062075614929, 0.013659525662660599, 0.021459992974996567, 0.029260456562042236, 0.037060920149087906, 0.044861387461423874, 0.05266185104846954, 0.06046231836080551, 0.06826278567314148, 0.07606324553489685, 0.08386371284723282, 0.09166418015956879, 0.09946464747190475, 0.10726510733366013, 0.1150655746459961, 0.12286604195833206, 0.13066650927066803, 0.1384669691324234, 0.14626744389533997, 0.15406790375709534, 0.1618683636188507, 0.16966883838176727, 0.17746929824352264, 0.18526975810527802, 0.19307023286819458, 0.20087069272994995, 0.20867115259170532, 0.2164716273546219, 0.22427208721637726, 0.23207256197929382, 0.2398730218410492, 0.24767348170280457, 0.25547394156455994, 0.2632744312286377, 0.27107489109039307, 0.27887535095214844, 0.2866758108139038, 0.2944762706756592, 0.30227673053741455, 0.3100772202014923, 0.3178776800632477, 0.32567813992500305, 0.3334785997867584, 0.3412790596485138, 0.34907951951026917, 0.35687997937202454, 0.3646804690361023, 0.37248092889785767, 0.38028138875961304, 0.3880818486213684, 0.3958823084831238, 0.40368279814720154, 0.4114832580089569, 0.4192837178707123, 0.42708420753479004, 0.4348846673965454, 0.4426851272583008, 0.45048558712005615, 0.4582860469818115, 0.4660865068435669]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 8.0, 7.0, 13.0, 11.0, 14.0, 14.0, 17.0, 20.0, 15.0, 11.0, 22.0, 29.0, 25.0, 41.0, 35.0, 35.0, 36.0, 37.0, 45.0, 40.0, 43.0, 39.0, 42.0, 38.0, 34.0, 29.0, 37.0, 30.0, 23.0, 27.0, 32.0, 22.0, 22.0, 15.0, 15.0, 22.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.013226926326751709, -0.01282772421836853, -0.012428522109985352, -0.012029320001602173, -0.011630117893218994, -0.011230915784835815, -0.010831713676452637, -0.010432511568069458, -0.01003330945968628, -0.0096341073513031, -0.009234905242919922, -0.008835703134536743, -0.008436501026153564, -0.008037298917770386, -0.007638096809387207, -0.007238894701004028, -0.00683969259262085, -0.006440490484237671, -0.006041288375854492, -0.0056420862674713135, -0.005242884159088135, -0.004843682050704956, -0.004444479942321777, -0.004045277833938599, -0.00364607572555542, -0.003246873617172241, -0.0028476715087890625, -0.002448469400405884, -0.002049267292022705, -0.0016500651836395264, -0.0012508630752563477, -0.0008516609668731689, -0.00045245885848999023, -5.3256750106811523e-05, 0.0003459453582763672, 0.0007451474666595459, 0.0011443495750427246, 0.0015435516834259033, 0.001942753791809082, 0.0023419559001922607, 0.0027411580085754395, 0.003140360116958618, 0.003539562225341797, 0.003938764333724976, 0.004337966442108154, 0.004737168550491333, 0.005136370658874512, 0.00553557276725769, 0.005934774875640869, 0.006333976984024048, 0.0067331790924072266, 0.007132381200790405, 0.007531583309173584, 0.007930785417556763, 0.008329987525939941, 0.00872918963432312, 0.009128391742706299, 0.009527593851089478, 0.009926795959472656, 0.010325998067855835, 0.010725200176239014, 0.011124402284622192, 0.011523604393005371, 0.01192280650138855, 0.012322008609771729]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 8.0, 6.0, 15.0, 11.0, 12.0, 21.0, 19.0, 25.0, 37.0, 31.0, 35.0, 30.0, 31.0, 49.0, 55.0, 54.0, 46.0, 57.0, 39.0, 48.0, 36.0, 39.0, 35.0, 33.0, 35.0, 32.0, 18.0, 25.0, 18.0, 19.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.899658203125, -10.53369140625, -10.167724609375, -9.8017578125, -9.435791015625, -9.06982421875, -8.703857421875, -8.337890625, -7.971923828125, -7.60595703125, -7.239990234375, -6.8740234375, -6.508056640625, -6.14208984375, -5.776123046875, -5.41015625, -5.044189453125, -4.67822265625, -4.312255859375, -3.9462890625, -3.580322265625, -3.21435546875, -2.848388671875, -2.482421875, -2.116455078125, -1.75048828125, -1.384521484375, -1.0185546875, -0.652587890625, -0.28662109375, 0.079345703125, 0.4453125, 0.811279296875, 1.17724609375, 1.543212890625, 1.9091796875, 2.275146484375, 2.64111328125, 3.007080078125, 3.373046875, 3.739013671875, 4.10498046875, 4.470947265625, 4.8369140625, 5.202880859375, 5.56884765625, 5.934814453125, 6.30078125, 6.666748046875, 7.03271484375, 7.398681640625, 7.7646484375, 8.130615234375, 8.49658203125, 8.862548828125, 9.228515625, 9.594482421875, 9.96044921875, 10.326416015625, 10.6923828125, 11.058349609375, 11.42431640625, 11.790283203125, 12.15625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 13.0, 12.0, 12.0, 23.0, 30.0, 43.0, 59.0, 95.0, 108.0, 187.0, 237.0, 402.0, 593.0, 1053.0, 1863.0, 3594.0, 7412.0, 17179.0, 47684.0, 163485.0, 533642.0, 183643.0, 52206.0, 18566.0, 7611.0, 3629.0, 2009.0, 1122.0, 688.0, 410.0, 290.0, 182.0, 141.0, 95.0, 58.0, 46.0, 29.0, 20.0, 16.0, 18.0, 7.0, 7.0, 4.0, 6.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.06640625, -4.8948974609375, -4.723388671875, -4.5518798828125, -4.38037109375, -4.2088623046875, -4.037353515625, -3.8658447265625, -3.6943359375, -3.5228271484375, -3.351318359375, -3.1798095703125, -3.00830078125, -2.8367919921875, -2.665283203125, -2.4937744140625, -2.322265625, -2.1507568359375, -1.979248046875, -1.8077392578125, -1.63623046875, -1.4647216796875, -1.293212890625, -1.1217041015625, -0.9501953125, -0.7786865234375, -0.607177734375, -0.4356689453125, -0.26416015625, -0.0926513671875, 0.078857421875, 0.2503662109375, 0.421875, 0.5933837890625, 0.764892578125, 0.9364013671875, 1.10791015625, 1.2794189453125, 1.450927734375, 1.6224365234375, 1.7939453125, 1.9654541015625, 2.136962890625, 2.3084716796875, 2.47998046875, 2.6514892578125, 2.822998046875, 2.9945068359375, 3.166015625, 3.3375244140625, 3.509033203125, 3.6805419921875, 3.85205078125, 4.0235595703125, 4.195068359375, 4.3665771484375, 4.5380859375, 4.7095947265625, 4.881103515625, 5.0526123046875, 5.22412109375, 5.3956298828125, 5.567138671875, 5.7386474609375, 5.91015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 7.0, 5.0, 5.0, 12.0, 8.0, 7.0, 15.0, 15.0, 19.0, 29.0, 19.0, 25.0, 25.0, 25.0, 34.0, 32.0, 34.0, 32.0, 44.0, 55.0, 206.0, 1890.0, 70.0, 40.0, 24.0, 44.0, 26.0, 33.0, 33.0, 28.0, 28.0, 16.0, 27.0, 22.0, 16.0, 16.0, 19.0, 10.0, 10.0, 11.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-39.46875, -38.27880859375, -37.0888671875, -35.89892578125, -34.708984375, -33.51904296875, -32.3291015625, -31.13916015625, -29.94921875, -28.75927734375, -27.5693359375, -26.37939453125, -25.189453125, -23.99951171875, -22.8095703125, -21.61962890625, -20.4296875, -19.23974609375, -18.0498046875, -16.85986328125, -15.669921875, -14.47998046875, -13.2900390625, -12.10009765625, -10.91015625, -9.72021484375, -8.5302734375, -7.34033203125, -6.150390625, -4.96044921875, -3.7705078125, -2.58056640625, -1.390625, -0.20068359375, 0.9892578125, 2.17919921875, 3.369140625, 4.55908203125, 5.7490234375, 6.93896484375, 8.12890625, 9.31884765625, 10.5087890625, 11.69873046875, 12.888671875, 14.07861328125, 15.2685546875, 16.45849609375, 17.6484375, 18.83837890625, 20.0283203125, 21.21826171875, 22.408203125, 23.59814453125, 24.7880859375, 25.97802734375, 27.16796875, 28.35791015625, 29.5478515625, 30.73779296875, 31.927734375, 33.11767578125, 34.3076171875, 35.49755859375, 36.6875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 10.0, 6.0, 15.0, 19.0, 14.0, 19.0, 21.0, 29.0, 25.0, 44.0, 55.0, 64.0, 117.0, 132.0, 213.0, 352.0, 664.0, 2958.0, 3031486.0, 106462.0, 1466.0, 528.0, 312.0, 199.0, 110.0, 79.0, 51.0, 40.0, 36.0, 23.0, 28.0, 22.0, 18.0, 15.0, 8.0, 8.0, 7.0, 6.0, 6.0, 7.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.1875, -58.2353515625, -56.283203125, -54.3310546875, -52.37890625, -50.4267578125, -48.474609375, -46.5224609375, -44.5703125, -42.6181640625, -40.666015625, -38.7138671875, -36.76171875, -34.8095703125, -32.857421875, -30.9052734375, -28.953125, -27.0009765625, -25.048828125, -23.0966796875, -21.14453125, -19.1923828125, -17.240234375, -15.2880859375, -13.3359375, -11.3837890625, -9.431640625, -7.4794921875, -5.52734375, -3.5751953125, -1.623046875, 0.3291015625, 2.28125, 4.2333984375, 6.185546875, 8.1376953125, 10.08984375, 12.0419921875, 13.994140625, 15.9462890625, 17.8984375, 19.8505859375, 21.802734375, 23.7548828125, 25.70703125, 27.6591796875, 29.611328125, 31.5634765625, 33.515625, 35.4677734375, 37.419921875, 39.3720703125, 41.32421875, 43.2763671875, 45.228515625, 47.1806640625, 49.1328125, 51.0849609375, 53.037109375, 54.9892578125, 56.94140625, 58.8935546875, 60.845703125, 62.7978515625, 64.75]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 412.0, 606.0, 1.0, 1.0, 2.0], "bins": [-669.5501708984375, -658.401123046875, -647.2520751953125, -636.10302734375, -624.9539794921875, -613.8049926757812, -602.6559448242188, -591.5068969726562, -580.3578491210938, -569.2088012695312, -558.0597534179688, -546.9107055664062, -535.7616577148438, -524.6126708984375, -513.463623046875, -502.3145751953125, -491.16552734375, -480.0164794921875, -468.867431640625, -457.7184143066406, -446.5693664550781, -435.4203186035156, -424.2712707519531, -413.12225341796875, -401.9731750488281, -390.8241271972656, -379.6750793457031, -368.52606201171875, -357.37701416015625, -346.22796630859375, -335.07891845703125, -323.92987060546875, -312.78082275390625, -301.63177490234375, -290.48272705078125, -279.3337097167969, -268.1846618652344, -257.0356140136719, -245.88656616210938, -234.73753356933594, -223.5885009765625, -212.439453125, -201.29042053222656, -190.14137268066406, -178.99234008789062, -167.84329223632812, -156.69424438476562, -145.5452117919922, -134.39617919921875, -123.24713897705078, -112.09809875488281, -100.94905090332031, -89.80001831054688, -78.65097045898438, -67.5019302368164, -56.35289001464844, -45.20384216308594, -34.05480194091797, -22.905759811401367, -11.756717681884766, -0.6076774597167969, 10.541362762451172, 21.690406799316406, 32.839447021484375, 43.988487243652344]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 5.0, 10.0, 6.0, 6.0, 10.0, 14.0, 11.0, 12.0, 24.0, 26.0, 21.0, 26.0, 20.0, 28.0, 31.0, 42.0, 32.0, 34.0, 40.0, 30.0, 36.0, 46.0, 40.0, 35.0, 29.0, 25.0, 32.0, 33.0, 41.0, 32.0, 23.0, 22.0, 21.0, 16.0, 23.0, 12.0, 17.0, 9.0, 17.0, 11.0, 6.0, 10.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-127.93402099609375, -124.18264770507812, -120.43128204345703, -116.67991638183594, -112.92854309082031, -109.17716979980469, -105.4258041381836, -101.6744384765625, -97.92306518554688, -94.17169189453125, -90.42032623291016, -86.66896057128906, -82.91758728027344, -79.16621398925781, -75.41484832763672, -71.66348266601562, -67.912109375, -64.16073608398438, -60.40937042236328, -56.65800094604492, -52.90663146972656, -49.1552619934082, -45.403892517089844, -41.652523040771484, -37.901153564453125, -34.149784088134766, -30.398414611816406, -26.647045135498047, -22.895675659179688, -19.144306182861328, -15.392936706542969, -11.64156723022461, -7.89019775390625, -4.138828277587891, -0.38745880126953125, 3.363910675048828, 7.1152801513671875, 10.866649627685547, 14.618019104003906, 18.369388580322266, 22.120758056640625, 25.872127532958984, 29.623497009277344, 33.3748664855957, 37.12623596191406, 40.87760543823242, 44.62897491455078, 48.38034439086914, 52.1317138671875, 55.88308334350586, 59.63445281982422, 63.38582229614258, 67.13719177246094, 70.88856506347656, 74.63993072509766, 78.39129638671875, 82.14266967773438, 85.89404296875, 89.6454086303711, 93.39677429199219, 97.14814758300781, 100.89952087402344, 104.65088653564453, 108.40225219726562, 112.15362548828125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 6.0, 10.0, 14.0, 9.0, 13.0, 20.0, 11.0, 27.0, 34.0, 35.0, 28.0, 29.0, 37.0, 38.0, 54.0, 54.0, 47.0, 55.0, 42.0, 47.0, 39.0, 41.0, 32.0, 40.0, 30.0, 36.0, 23.0, 18.0, 24.0, 18.0, 14.0, 21.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.3828125, -11.017822265625, -10.65283203125, -10.287841796875, -9.9228515625, -9.557861328125, -9.19287109375, -8.827880859375, -8.462890625, -8.097900390625, -7.73291015625, -7.367919921875, -7.0029296875, -6.637939453125, -6.27294921875, -5.907958984375, -5.54296875, -5.177978515625, -4.81298828125, -4.447998046875, -4.0830078125, -3.718017578125, -3.35302734375, -2.988037109375, -2.623046875, -2.258056640625, -1.89306640625, -1.528076171875, -1.1630859375, -0.798095703125, -0.43310546875, -0.068115234375, 0.296875, 0.661865234375, 1.02685546875, 1.391845703125, 1.7568359375, 2.121826171875, 2.48681640625, 2.851806640625, 3.216796875, 3.581787109375, 3.94677734375, 4.311767578125, 4.6767578125, 5.041748046875, 5.40673828125, 5.771728515625, 6.13671875, 6.501708984375, 6.86669921875, 7.231689453125, 7.5966796875, 7.961669921875, 8.32666015625, 8.691650390625, 9.056640625, 9.421630859375, 9.78662109375, 10.151611328125, 10.5166015625, 10.881591796875, 11.24658203125, 11.611572265625, 11.9765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 9.0, 13.0, 9.0, 21.0, 31.0, 38.0, 44.0, 75.0, 85.0, 130.0, 147.0, 213.0, 336.0, 425.0, 713.0, 936.0, 1508.0, 2239.0, 3688.0, 6241.0, 11755.0, 47183.0, 1004766.0, 2944907.0, 131017.0, 17568.0, 7864.0, 4526.0, 2674.0, 1695.0, 1070.0, 743.0, 475.0, 330.0, 233.0, 158.0, 120.0, 79.0, 63.0, 38.0, 33.0, 23.0, 14.0, 7.0, 16.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-32.84375, -31.85400390625, -30.8642578125, -29.87451171875, -28.884765625, -27.89501953125, -26.9052734375, -25.91552734375, -24.92578125, -23.93603515625, -22.9462890625, -21.95654296875, -20.966796875, -19.97705078125, -18.9873046875, -17.99755859375, -17.0078125, -16.01806640625, -15.0283203125, -14.03857421875, -13.048828125, -12.05908203125, -11.0693359375, -10.07958984375, -9.08984375, -8.10009765625, -7.1103515625, -6.12060546875, -5.130859375, -4.14111328125, -3.1513671875, -2.16162109375, -1.171875, -0.18212890625, 0.8076171875, 1.79736328125, 2.787109375, 3.77685546875, 4.7666015625, 5.75634765625, 6.74609375, 7.73583984375, 8.7255859375, 9.71533203125, 10.705078125, 11.69482421875, 12.6845703125, 13.67431640625, 14.6640625, 15.65380859375, 16.6435546875, 17.63330078125, 18.623046875, 19.61279296875, 20.6025390625, 21.59228515625, 22.58203125, 23.57177734375, 24.5615234375, 25.55126953125, 26.541015625, 27.53076171875, 28.5205078125, 29.51025390625, 30.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 6.0, 10.0, 11.0, 12.0, 10.0, 12.0, 19.0, 32.0, 30.0, 72.0, 126.0, 274.0, 530.0, 929.0, 877.0, 507.0, 245.0, 118.0, 61.0, 36.0, 29.0, 13.0, 16.0, 9.0, 13.0, 10.0, 4.0, 9.0, 6.0, 4.0, 9.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.375, -33.361572265625, -32.34814453125, -31.334716796875, -30.3212890625, -29.307861328125, -28.29443359375, -27.281005859375, -26.267578125, -25.254150390625, -24.24072265625, -23.227294921875, -22.2138671875, -21.200439453125, -20.18701171875, -19.173583984375, -18.16015625, -17.146728515625, -16.13330078125, -15.119873046875, -14.1064453125, -13.093017578125, -12.07958984375, -11.066162109375, -10.052734375, -9.039306640625, -8.02587890625, -7.012451171875, -5.9990234375, -4.985595703125, -3.97216796875, -2.958740234375, -1.9453125, -0.931884765625, 0.08154296875, 1.094970703125, 2.1083984375, 3.121826171875, 4.13525390625, 5.148681640625, 6.162109375, 7.175537109375, 8.18896484375, 9.202392578125, 10.2158203125, 11.229248046875, 12.24267578125, 13.256103515625, 14.26953125, 15.282958984375, 16.29638671875, 17.309814453125, 18.3232421875, 19.336669921875, 20.35009765625, 21.363525390625, 22.376953125, 23.390380859375, 24.40380859375, 25.417236328125, 26.4306640625, 27.444091796875, 28.45751953125, 29.470947265625, 30.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 26.0, 21.0, 42.0, 67.0, 95.0, 143.0, 231.0, 316.0, 466.0, 726.0, 1139.0, 1694.0, 2780.0, 4390.0, 7326.0, 12642.0, 24948.0, 69090.0, 735850.0, 3090272.0, 162153.0, 37933.0, 17192.0, 9504.0, 5550.0, 3464.0, 2169.0, 1379.0, 915.0, 597.0, 370.0, 260.0, 160.0, 110.0, 65.0, 55.0, 45.0, 19.0, 15.0, 12.0, 12.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.03125, -36.6845703125, -35.337890625, -33.9912109375, -32.64453125, -31.2978515625, -29.951171875, -28.6044921875, -27.2578125, -25.9111328125, -24.564453125, -23.2177734375, -21.87109375, -20.5244140625, -19.177734375, -17.8310546875, -16.484375, -15.1376953125, -13.791015625, -12.4443359375, -11.09765625, -9.7509765625, -8.404296875, -7.0576171875, -5.7109375, -4.3642578125, -3.017578125, -1.6708984375, -0.32421875, 1.0224609375, 2.369140625, 3.7158203125, 5.0625, 6.4091796875, 7.755859375, 9.1025390625, 10.44921875, 11.7958984375, 13.142578125, 14.4892578125, 15.8359375, 17.1826171875, 18.529296875, 19.8759765625, 21.22265625, 22.5693359375, 23.916015625, 25.2626953125, 26.609375, 27.9560546875, 29.302734375, 30.6494140625, 31.99609375, 33.3427734375, 34.689453125, 36.0361328125, 37.3828125, 38.7294921875, 40.076171875, 41.4228515625, 42.76953125, 44.1162109375, 45.462890625, 46.8095703125, 48.15625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 21.0, 48.0, 92.0, 255.0, 344.0, 132.0, 51.0, 23.0, 17.0, 7.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.1599578857422, -126.76881408691406, -116.37767028808594, -105.98652648925781, -95.59538269042969, -85.20423889160156, -74.81310272216797, -64.42195892333984, -54.03081512451172, -43.639671325683594, -33.24852752685547, -22.85738754272461, -12.466243743896484, -2.0750999450683594, 8.3160400390625, 18.707183837890625, 29.09832763671875, 39.489471435546875, 49.880615234375, 60.27175521850586, 70.66290283203125, 81.05404663085938, 91.44518280029297, 101.8363265991211, 112.22747039794922, 122.61861419677734, 133.00975036621094, 143.40089416503906, 153.7920379638672, 164.1831817626953, 174.57432556152344, 184.96546936035156, 195.35659790039062, 205.74774169921875, 216.13888549804688, 226.530029296875, 236.92117309570312, 247.31231689453125, 257.7034606933594, 268.0946044921875, 278.4857482910156, 288.87689208984375, 299.2680358886719, 309.6591796875, 320.0503234863281, 330.44146728515625, 340.8326110839844, 351.2237548828125, 361.6148681640625, 372.0060119628906, 382.39715576171875, 392.7882995605469, 403.179443359375, 413.5705871582031, 423.96173095703125, 434.3528747558594, 444.7440185546875, 455.1351623535156, 465.52630615234375, 475.9174499511719, 486.30859375, 496.6997375488281, 507.09088134765625, 517.4819946289062, 527.8731689453125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 10.0, 14.0, 13.0, 20.0, 27.0, 16.0, 27.0, 23.0, 23.0, 25.0, 31.0, 34.0, 37.0, 35.0, 51.0, 42.0, 44.0, 49.0, 43.0, 55.0, 38.0, 41.0, 28.0, 32.0, 31.0, 24.0, 26.0, 31.0, 20.0, 17.0, 17.0, 11.0, 17.0, 6.0, 7.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.45968627929688, -81.68390655517578, -78.90812683105469, -76.13233947753906, -73.35655975341797, -70.58078002929688, -67.80500030517578, -65.02922058105469, -62.25343704223633, -59.477657318115234, -56.701873779296875, -53.92609405517578, -51.15031433105469, -48.37453079223633, -45.598751068115234, -42.822967529296875, -40.04718780517578, -37.27140808105469, -34.49562454223633, -31.719844818115234, -28.944063186645508, -26.16828155517578, -23.392501831054688, -20.61672019958496, -17.840938568115234, -15.065156936645508, -12.289376258850098, -9.513595581054688, -6.737813949584961, -3.9620323181152344, -1.1862525939941406, 1.589529037475586, 4.365318298339844, 7.141099452972412, 9.91688060760498, 12.69266128540039, 15.468442916870117, 18.244224548339844, 21.020004272460938, 23.795785903930664, 26.57156753540039, 29.347349166870117, 32.123130798339844, 34.89891052246094, 37.67469024658203, 40.45047378540039, 43.226253509521484, 46.002037048339844, 48.77781677246094, 51.55359649658203, 54.32938003540039, 57.105159759521484, 59.880943298339844, 62.65672302246094, 65.43250274658203, 68.20828247070312, 70.98406982421875, 73.75984954833984, 76.53562927246094, 79.31141662597656, 82.08719635009766, 84.86297607421875, 87.63875579833984, 90.41453552246094, 93.19031524658203]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 10.0, 6.0, 11.0, 10.0, 16.0, 14.0, 16.0, 32.0, 28.0, 31.0, 45.0, 34.0, 40.0, 36.0, 31.0, 55.0, 41.0, 60.0, 47.0, 52.0, 45.0, 31.0, 36.0, 27.0, 39.0, 34.0, 24.0, 24.0, 21.0, 19.0, 16.0, 12.0, 6.0, 7.0, 6.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.5615234375, -11.177734375, -10.7939453125, -10.41015625, -10.0263671875, -9.642578125, -9.2587890625, -8.875, -8.4912109375, -8.107421875, -7.7236328125, -7.33984375, -6.9560546875, -6.572265625, -6.1884765625, -5.8046875, -5.4208984375, -5.037109375, -4.6533203125, -4.26953125, -3.8857421875, -3.501953125, -3.1181640625, -2.734375, -2.3505859375, -1.966796875, -1.5830078125, -1.19921875, -0.8154296875, -0.431640625, -0.0478515625, 0.3359375, 0.7197265625, 1.103515625, 1.4873046875, 1.87109375, 2.2548828125, 2.638671875, 3.0224609375, 3.40625, 3.7900390625, 4.173828125, 4.5576171875, 4.94140625, 5.3251953125, 5.708984375, 6.0927734375, 6.4765625, 6.8603515625, 7.244140625, 7.6279296875, 8.01171875, 8.3955078125, 8.779296875, 9.1630859375, 9.546875, 9.9306640625, 10.314453125, 10.6982421875, 11.08203125, 11.4658203125, 11.849609375, 12.2333984375, 12.6171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 9.0, 4.0, 8.0, 9.0, 15.0, 34.0, 45.0, 64.0, 87.0, 138.0, 217.0, 265.0, 417.0, 672.0, 955.0, 1425.0, 2226.0, 3324.0, 5263.0, 9029.0, 14632.0, 25552.0, 45476.0, 87416.0, 182913.0, 296389.0, 178301.0, 85298.0, 44912.0, 25034.0, 14708.0, 8532.0, 5386.0, 3397.0, 2124.0, 1389.0, 921.0, 626.0, 422.0, 290.0, 201.0, 134.0, 90.0, 82.0, 40.0, 29.0, 21.0, 14.0, 12.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2529296875, -1.213134765625, -1.17333984375, -1.133544921875, -1.09375, -1.053955078125, -1.01416015625, -0.974365234375, -0.9345703125, -0.894775390625, -0.85498046875, -0.815185546875, -0.775390625, -0.735595703125, -0.69580078125, -0.656005859375, -0.6162109375, -0.576416015625, -0.53662109375, -0.496826171875, -0.45703125, -0.417236328125, -0.37744140625, -0.337646484375, -0.2978515625, -0.258056640625, -0.21826171875, -0.178466796875, -0.138671875, -0.098876953125, -0.05908203125, -0.019287109375, 0.0205078125, 0.060302734375, 0.10009765625, 0.139892578125, 0.1796875, 0.219482421875, 0.25927734375, 0.299072265625, 0.3388671875, 0.378662109375, 0.41845703125, 0.458251953125, 0.498046875, 0.537841796875, 0.57763671875, 0.617431640625, 0.6572265625, 0.697021484375, 0.73681640625, 0.776611328125, 0.81640625, 0.856201171875, 0.89599609375, 0.935791015625, 0.9755859375, 1.015380859375, 1.05517578125, 1.094970703125, 1.134765625, 1.174560546875, 1.21435546875, 1.254150390625, 1.2939453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 11.0, 6.0, 16.0, 14.0, 21.0, 25.0, 18.0, 25.0, 36.0, 30.0, 33.0, 41.0, 35.0, 48.0, 42.0, 34.0, 49.0, 1063.0, 43.0, 35.0, 50.0, 31.0, 34.0, 25.0, 35.0, 20.0, 33.0, 31.0, 31.0, 19.0, 15.0, 5.0, 11.0, 7.0, 9.0, 11.0, 4.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.7265625, -8.49481201171875, -8.2630615234375, -8.03131103515625, -7.799560546875, -7.56781005859375, -7.3360595703125, -7.10430908203125, -6.87255859375, -6.64080810546875, -6.4090576171875, -6.17730712890625, -5.945556640625, -5.71380615234375, -5.4820556640625, -5.25030517578125, -5.0185546875, -4.78680419921875, -4.5550537109375, -4.32330322265625, -4.091552734375, -3.85980224609375, -3.6280517578125, -3.39630126953125, -3.16455078125, -2.93280029296875, -2.7010498046875, -2.46929931640625, -2.237548828125, -2.00579833984375, -1.7740478515625, -1.54229736328125, -1.310546875, -1.07879638671875, -0.8470458984375, -0.61529541015625, -0.383544921875, -0.15179443359375, 0.0799560546875, 0.31170654296875, 0.54345703125, 0.77520751953125, 1.0069580078125, 1.23870849609375, 1.470458984375, 1.70220947265625, 1.9339599609375, 2.16571044921875, 2.3974609375, 2.62921142578125, 2.8609619140625, 3.09271240234375, 3.324462890625, 3.55621337890625, 3.7879638671875, 4.01971435546875, 4.25146484375, 4.48321533203125, 4.7149658203125, 4.94671630859375, 5.178466796875, 5.41021728515625, 5.6419677734375, 5.87371826171875, 6.10546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 11.0, 17.0, 16.0, 21.0, 54.0, 64.0, 132.0, 198.0, 297.0, 435.0, 696.0, 1140.0, 1791.0, 2708.0, 4280.0, 6849.0, 10664.0, 17273.0, 28949.0, 48769.0, 87465.0, 169389.0, 1312293.0, 179893.0, 92804.0, 51473.0, 30167.0, 18515.0, 11451.0, 7153.0, 4303.0, 2769.0, 1811.0, 1175.0, 760.0, 502.0, 298.0, 206.0, 146.0, 71.0, 32.0, 27.0, 18.0, 10.0, 17.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.6426849365234375, -0.619354248046875, -0.5960235595703125, -0.57269287109375, -0.5493621826171875, -0.526031494140625, -0.5027008056640625, -0.4793701171875, -0.4560394287109375, -0.432708740234375, -0.4093780517578125, -0.38604736328125, -0.3627166748046875, -0.339385986328125, -0.3160552978515625, -0.292724609375, -0.2693939208984375, -0.246063232421875, -0.2227325439453125, -0.19940185546875, -0.1760711669921875, -0.152740478515625, -0.1294097900390625, -0.1060791015625, -0.0827484130859375, -0.059417724609375, -0.0360870361328125, -0.01275634765625, 0.0105743408203125, 0.033905029296875, 0.0572357177734375, 0.08056640625, 0.1038970947265625, 0.127227783203125, 0.1505584716796875, 0.17388916015625, 0.1972198486328125, 0.220550537109375, 0.2438812255859375, 0.2672119140625, 0.2905426025390625, 0.313873291015625, 0.3372039794921875, 0.36053466796875, 0.3838653564453125, 0.407196044921875, 0.4305267333984375, 0.453857421875, 0.4771881103515625, 0.500518798828125, 0.5238494873046875, 0.54718017578125, 0.5705108642578125, 0.593841552734375, 0.6171722412109375, 0.6405029296875, 0.6638336181640625, 0.687164306640625, 0.7104949951171875, 0.73382568359375, 0.7571563720703125, 0.780487060546875, 0.8038177490234375, 0.8271484375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 10.0, 6.0, 8.0, 9.0, 16.0, 13.0, 12.0, 20.0, 21.0, 19.0, 33.0, 35.0, 43.0, 44.0, 49.0, 50.0, 84.0, 78.0, 72.0, 71.0, 50.0, 48.0, 28.0, 29.0, 31.0, 20.0, 18.0, 14.0, 12.0, 9.0, 11.0, 8.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0106048583984375, -0.010184049606323242, -0.009763240814208984, -0.009342432022094727, -0.008921623229980469, -0.008500814437866211, -0.008080005645751953, -0.007659196853637695, -0.0072383880615234375, -0.00681757926940918, -0.006396770477294922, -0.005975961685180664, -0.005555152893066406, -0.0051343441009521484, -0.004713535308837891, -0.004292726516723633, -0.003871917724609375, -0.003451108932495117, -0.0030303001403808594, -0.0026094913482666016, -0.0021886825561523438, -0.001767873764038086, -0.0013470649719238281, -0.0009262561798095703, -0.0005054473876953125, -8.463859558105469e-05, 0.0003361701965332031, 0.0007569789886474609, 0.0011777877807617188, 0.0015985965728759766, 0.0020194053649902344, 0.002440214157104492, 0.00286102294921875, 0.003281831741333008, 0.0037026405334472656, 0.0041234493255615234, 0.004544258117675781, 0.004965066909790039, 0.005385875701904297, 0.005806684494018555, 0.0062274932861328125, 0.00664830207824707, 0.007069110870361328, 0.007489919662475586, 0.007910728454589844, 0.008331537246704102, 0.00875234603881836, 0.009173154830932617, 0.009593963623046875, 0.010014772415161133, 0.01043558120727539, 0.010856389999389648, 0.011277198791503906, 0.011698007583618164, 0.012118816375732422, 0.01253962516784668, 0.012960433959960938, 0.013381242752075195, 0.013802051544189453, 0.014222860336303711, 0.014643669128417969, 0.015064477920532227, 0.015485286712646484, 0.015906095504760742, 0.016326904296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 8.0, 16.0, 22.0, 21.0, 19.0, 28.0, 30.0, 40.0, 55.0, 76.0, 125.0, 298.0, 1491.0, 25166.0, 1006211.0, 13133.0, 1069.0, 229.0, 119.0, 76.0, 50.0, 38.0, 28.0, 33.0, 21.0, 20.0, 13.0, 18.0, 12.0, 11.0, 13.0, 12.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4375, -0.4247894287109375, -0.412078857421875, -0.3993682861328125, -0.38665771484375, -0.3739471435546875, -0.361236572265625, -0.3485260009765625, -0.3358154296875, -0.3231048583984375, -0.310394287109375, -0.2976837158203125, -0.28497314453125, -0.2722625732421875, -0.259552001953125, -0.2468414306640625, -0.234130859375, -0.2214202880859375, -0.208709716796875, -0.1959991455078125, -0.18328857421875, -0.1705780029296875, -0.157867431640625, -0.1451568603515625, -0.1324462890625, -0.1197357177734375, -0.107025146484375, -0.0943145751953125, -0.08160400390625, -0.0688934326171875, -0.056182861328125, -0.0434722900390625, -0.03076171875, -0.0180511474609375, -0.005340576171875, 0.0073699951171875, 0.02008056640625, 0.0327911376953125, 0.045501708984375, 0.0582122802734375, 0.0709228515625, 0.0836334228515625, 0.096343994140625, 0.1090545654296875, 0.12176513671875, 0.1344757080078125, 0.147186279296875, 0.1598968505859375, 0.172607421875, 0.1853179931640625, 0.198028564453125, 0.2107391357421875, 0.22344970703125, 0.2361602783203125, 0.248870849609375, 0.2615814208984375, 0.2742919921875, 0.2870025634765625, 0.299713134765625, 0.3124237060546875, 0.32513427734375, 0.3378448486328125, 0.350555419921875, 0.3632659912109375, 0.3759765625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 16.0, 38.0, 94.0, 330.0, 350.0, 103.0, 36.0, 20.0, 11.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035230644047260284, -0.03170756995677948, -0.028184499591588974, -0.02466142736375332, -0.021138355135917664, -0.01761528290808201, -0.014092210680246353, -0.010569138452410698, -0.007046066224575043, -0.0035229939967393875, 7.82310962677002e-08, 0.003523150458931923, 0.007046222686767578, 0.010569294914603233, 0.014092367142438889, 0.017615439370274544, 0.0211385115981102, 0.024661583825945854, 0.02818465605378151, 0.031707726418972015, 0.03523080050945282, 0.038753874599933624, 0.04227694496512413, 0.045800015330314636, 0.04932308942079544, 0.052846163511276245, 0.05636923387646675, 0.05989230424165726, 0.06341537833213806, 0.06693845242261887, 0.07046152651309967, 0.07398459315299988, 0.07750765979290009, 0.08103073388338089, 0.0845538079738617, 0.0880768746137619, 0.0915999487042427, 0.09512302279472351, 0.09864608943462372, 0.10216916352510452, 0.10569223761558533, 0.10921531170606613, 0.11273838579654694, 0.11626145243644714, 0.11978452652692795, 0.12330760061740875, 0.12683066725730896, 0.13035374879837036, 0.13387681543827057, 0.13739988207817078, 0.14092296361923218, 0.14444603025913239, 0.1479690968990326, 0.151492178440094, 0.1550152450799942, 0.1585383266210556, 0.1620613932609558, 0.16558445990085602, 0.16910754144191742, 0.17263060808181763, 0.17615368962287903, 0.17967675626277924, 0.18319982290267944, 0.18672290444374084, 0.19024597108364105]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 14.0, 10.0, 9.0, 20.0, 15.0, 24.0, 18.0, 18.0, 20.0, 20.0, 23.0, 34.0, 23.0, 20.0, 41.0, 38.0, 41.0, 44.0, 45.0, 37.0, 29.0, 38.0, 36.0, 43.0, 40.0, 53.0, 31.0, 34.0, 20.0, 27.0, 19.0, 16.0, 15.0, 15.0, 15.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020763278007507324, -0.020069709047675133, -0.01937614008784294, -0.01868257112801075, -0.01798900216817856, -0.017295433208346367, -0.016601864248514175, -0.015908295288681984, -0.015214726328849792, -0.014521157369017601, -0.01382758840918541, -0.013134019449353218, -0.012440450489521027, -0.011746881529688835, -0.011053312569856644, -0.010359743610024452, -0.00966617465019226, -0.00897260569036007, -0.008279036730527878, -0.007585467770695686, -0.006891898810863495, -0.006198329851031303, -0.005504760891199112, -0.0048111919313669205, -0.004117622971534729, -0.0034240540117025375, -0.002730485051870346, -0.0020369160920381546, -0.0013433471322059631, -0.0006497781723737717, 4.37907874584198e-05, 0.0007373597472906113, 0.0014309287071228027, 0.002124497666954994, 0.0028180666267871857, 0.003511635586619377, 0.004205204546451569, 0.00489877350628376, 0.0055923424661159515, 0.006285911425948143, 0.0069794803857803345, 0.007673049345612526, 0.008366618305444717, 0.009060187265276909, 0.0097537562251091, 0.010447325184941292, 0.011140894144773483, 0.011834463104605675, 0.012528032064437866, 0.013221601024270058, 0.01391516998410225, 0.01460873894393444, 0.015302307903766632, 0.015995876863598824, 0.016689445823431015, 0.017383014783263206, 0.018076583743095398, 0.01877015270292759, 0.01946372166275978, 0.020157290622591972, 0.020850859582424164, 0.021544428542256355, 0.022237997502088547, 0.022931566461920738, 0.02362513542175293]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 10.0, 6.0, 11.0, 10.0, 16.0, 14.0, 16.0, 32.0, 28.0, 31.0, 45.0, 34.0, 39.0, 37.0, 31.0, 55.0, 41.0, 60.0, 47.0, 52.0, 45.0, 31.0, 36.0, 27.0, 39.0, 34.0, 24.0, 25.0, 20.0, 19.0, 16.0, 12.0, 6.0, 7.0, 6.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.5615234375, -11.177734375, -10.7939453125, -10.41015625, -10.0263671875, -9.642578125, -9.2587890625, -8.875, -8.4912109375, -8.107421875, -7.7236328125, -7.33984375, -6.9560546875, -6.572265625, -6.1884765625, -5.8046875, -5.4208984375, -5.037109375, -4.6533203125, -4.26953125, -3.8857421875, -3.501953125, -3.1181640625, -2.734375, -2.3505859375, -1.966796875, -1.5830078125, -1.19921875, -0.8154296875, -0.431640625, -0.0478515625, 0.3359375, 0.7197265625, 1.103515625, 1.4873046875, 1.87109375, 2.2548828125, 2.638671875, 3.0224609375, 3.40625, 3.7900390625, 4.173828125, 4.5576171875, 4.94140625, 5.3251953125, 5.708984375, 6.0927734375, 6.4765625, 6.8603515625, 7.244140625, 7.6279296875, 8.01171875, 8.3955078125, 8.779296875, 9.1630859375, 9.546875, 9.9306640625, 10.314453125, 10.6982421875, 11.08203125, 11.4658203125, 11.849609375, 12.2333984375, 12.6171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 3.0, 8.0, 16.0, 6.0, 12.0, 18.0, 23.0, 38.0, 52.0, 108.0, 150.0, 276.0, 537.0, 1150.0, 2762.0, 7288.0, 21371.0, 71480.0, 297407.0, 480472.0, 115230.0, 32470.0, 10693.0, 3811.0, 1578.0, 719.0, 342.0, 197.0, 89.0, 60.0, 64.0, 32.0, 24.0, 19.0, 7.0, 10.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.181884765625, -5.97705078125, -5.772216796875, -5.5673828125, -5.362548828125, -5.15771484375, -4.952880859375, -4.748046875, -4.543212890625, -4.33837890625, -4.133544921875, -3.9287109375, -3.723876953125, -3.51904296875, -3.314208984375, -3.109375, -2.904541015625, -2.69970703125, -2.494873046875, -2.2900390625, -2.085205078125, -1.88037109375, -1.675537109375, -1.470703125, -1.265869140625, -1.06103515625, -0.856201171875, -0.6513671875, -0.446533203125, -0.24169921875, -0.036865234375, 0.16796875, 0.372802734375, 0.57763671875, 0.782470703125, 0.9873046875, 1.192138671875, 1.39697265625, 1.601806640625, 1.806640625, 2.011474609375, 2.21630859375, 2.421142578125, 2.6259765625, 2.830810546875, 3.03564453125, 3.240478515625, 3.4453125, 3.650146484375, 3.85498046875, 4.059814453125, 4.2646484375, 4.469482421875, 4.67431640625, 4.879150390625, 5.083984375, 5.288818359375, 5.49365234375, 5.698486328125, 5.9033203125, 6.108154296875, 6.31298828125, 6.517822265625, 6.72265625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 4.0, 4.0, 6.0, 5.0, 12.0, 13.0, 13.0, 11.0, 19.0, 18.0, 20.0, 20.0, 31.0, 24.0, 36.0, 35.0, 32.0, 36.0, 40.0, 41.0, 68.0, 1762.0, 315.0, 62.0, 40.0, 23.0, 41.0, 31.0, 33.0, 43.0, 26.0, 34.0, 26.0, 26.0, 18.0, 15.0, 10.0, 9.0, 7.0, 13.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.21875, -39.92626953125, -38.6337890625, -37.34130859375, -36.048828125, -34.75634765625, -33.4638671875, -32.17138671875, -30.87890625, -29.58642578125, -28.2939453125, -27.00146484375, -25.708984375, -24.41650390625, -23.1240234375, -21.83154296875, -20.5390625, -19.24658203125, -17.9541015625, -16.66162109375, -15.369140625, -14.07666015625, -12.7841796875, -11.49169921875, -10.19921875, -8.90673828125, -7.6142578125, -6.32177734375, -5.029296875, -3.73681640625, -2.4443359375, -1.15185546875, 0.140625, 1.43310546875, 2.7255859375, 4.01806640625, 5.310546875, 6.60302734375, 7.8955078125, 9.18798828125, 10.48046875, 11.77294921875, 13.0654296875, 14.35791015625, 15.650390625, 16.94287109375, 18.2353515625, 19.52783203125, 20.8203125, 22.11279296875, 23.4052734375, 24.69775390625, 25.990234375, 27.28271484375, 28.5751953125, 29.86767578125, 31.16015625, 32.45263671875, 33.7451171875, 35.03759765625, 36.330078125, 37.62255859375, 38.9150390625, 40.20751953125, 41.5]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 10.0, 7.0, 10.0, 11.0, 15.0, 19.0, 32.0, 36.0, 45.0, 45.0, 66.0, 91.0, 100.0, 205.0, 274.0, 536.0, 1568.0, 224126.0, 2914490.0, 2316.0, 629.0, 313.0, 189.0, 135.0, 102.0, 74.0, 40.0, 45.0, 21.0, 20.0, 22.0, 18.0, 15.0, 10.0, 15.0, 10.0, 5.0, 6.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.5625, -65.4580078125, -63.353515625, -61.2490234375, -59.14453125, -57.0400390625, -54.935546875, -52.8310546875, -50.7265625, -48.6220703125, -46.517578125, -44.4130859375, -42.30859375, -40.2041015625, -38.099609375, -35.9951171875, -33.890625, -31.7861328125, -29.681640625, -27.5771484375, -25.47265625, -23.3681640625, -21.263671875, -19.1591796875, -17.0546875, -14.9501953125, -12.845703125, -10.7412109375, -8.63671875, -6.5322265625, -4.427734375, -2.3232421875, -0.21875, 1.8857421875, 3.990234375, 6.0947265625, 8.19921875, 10.3037109375, 12.408203125, 14.5126953125, 16.6171875, 18.7216796875, 20.826171875, 22.9306640625, 25.03515625, 27.1396484375, 29.244140625, 31.3486328125, 33.453125, 35.5576171875, 37.662109375, 39.7666015625, 41.87109375, 43.9755859375, 46.080078125, 48.1845703125, 50.2890625, 52.3935546875, 54.498046875, 56.6025390625, 58.70703125, 60.8115234375, 62.916015625, 65.0205078125, 67.125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [47.0, 850.0, 116.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.709879875183105, -4.412458419799805, 2.884963035583496, 10.182385444641113, 17.47980499267578, 24.777225494384766, 32.074649810791016, 39.3720703125, 46.669490814208984, 53.96691131591797, 61.26433563232422, 68.56175231933594, 75.85917663574219, 83.15660095214844, 90.45402526855469, 97.7514419555664, 105.04886627197266, 112.3462905883789, 119.64370727539062, 126.94113159179688, 134.23855590820312, 141.53598022460938, 148.83340454101562, 156.1308135986328, 163.42823791503906, 170.7256622314453, 178.02308654785156, 185.32049560546875, 192.617919921875, 199.91534423828125, 207.2127685546875, 214.51019287109375, 221.8076171875, 229.10504150390625, 236.4024658203125, 243.69989013671875, 250.99729919433594, 258.29473876953125, 265.5921630859375, 272.8895568847656, 280.1869812011719, 287.4844055175781, 294.7818298339844, 302.0792541503906, 309.3766784667969, 316.674072265625, 323.97149658203125, 331.2689208984375, 338.56634521484375, 345.86376953125, 353.16119384765625, 360.4586181640625, 367.75604248046875, 375.053466796875, 382.35089111328125, 389.6482849121094, 396.94573974609375, 404.2431640625, 411.54058837890625, 418.8380126953125, 426.13543701171875, 433.432861328125, 440.73028564453125, 448.0276794433594, 455.3251037597656]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 6.0, 7.0, 8.0, 3.0, 15.0, 13.0, 17.0, 19.0, 17.0, 21.0, 33.0, 21.0, 21.0, 48.0, 38.0, 28.0, 40.0, 34.0, 47.0, 42.0, 46.0, 47.0, 38.0, 43.0, 41.0, 34.0, 38.0, 31.0, 34.0, 27.0, 22.0, 14.0, 13.0, 14.0, 19.0, 4.0, 13.0, 11.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-133.54962158203125, -129.2626953125, -124.97576904296875, -120.6888427734375, -116.40191650390625, -112.114990234375, -107.82806396484375, -103.5411376953125, -99.25421142578125, -94.96728515625, -90.68035888671875, -86.3934326171875, -82.10650634765625, -77.819580078125, -73.53265380859375, -69.2457275390625, -64.95879364013672, -60.67186737060547, -56.38494110107422, -52.09801483154297, -47.81108856201172, -43.52416229248047, -39.23723220825195, -34.9503059387207, -30.663379669189453, -26.376453399658203, -22.089527130126953, -17.80259895324707, -13.51567268371582, -9.22874641418457, -4.9418182373046875, -0.6548919677734375, 3.6320343017578125, 7.918961048126221, 12.205887794494629, 16.492815017700195, 20.779741287231445, 25.066667556762695, 29.353595733642578, 33.64052200317383, 37.92744827270508, 42.21437454223633, 46.50130081176758, 50.788230895996094, 55.075157165527344, 59.362083435058594, 63.649009704589844, 67.9359359741211, 72.22286224365234, 76.5097885131836, 80.79671478271484, 85.0836410522461, 89.37056732177734, 93.6574935913086, 97.94442749023438, 102.23135375976562, 106.51828002929688, 110.80520629882812, 115.09213256835938, 119.37905883789062, 123.66598510742188, 127.95291137695312, 132.23983764648438, 136.52676391601562, 140.81369018554688]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 5.0, 10.0, 10.0, 12.0, 15.0, 17.0, 16.0, 36.0, 25.0, 45.0, 34.0, 29.0, 48.0, 35.0, 47.0, 39.0, 52.0, 64.0, 47.0, 51.0, 33.0, 33.0, 37.0, 31.0, 37.0, 27.0, 25.0, 23.0, 23.0, 15.0, 13.0, 9.0, 6.0, 7.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.692138671875, -11.29833984375, -10.904541015625, -10.5107421875, -10.116943359375, -9.72314453125, -9.329345703125, -8.935546875, -8.541748046875, -8.14794921875, -7.754150390625, -7.3603515625, -6.966552734375, -6.57275390625, -6.178955078125, -5.78515625, -5.391357421875, -4.99755859375, -4.603759765625, -4.2099609375, -3.816162109375, -3.42236328125, -3.028564453125, -2.634765625, -2.240966796875, -1.84716796875, -1.453369140625, -1.0595703125, -0.665771484375, -0.27197265625, 0.121826171875, 0.515625, 0.909423828125, 1.30322265625, 1.697021484375, 2.0908203125, 2.484619140625, 2.87841796875, 3.272216796875, 3.666015625, 4.059814453125, 4.45361328125, 4.847412109375, 5.2412109375, 5.635009765625, 6.02880859375, 6.422607421875, 6.81640625, 7.210205078125, 7.60400390625, 7.997802734375, 8.3916015625, 8.785400390625, 9.17919921875, 9.572998046875, 9.966796875, 10.360595703125, 10.75439453125, 11.148193359375, 11.5419921875, 11.935791015625, 12.32958984375, 12.723388671875, 13.1171875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 13.0, 14.0, 18.0, 20.0, 40.0, 58.0, 63.0, 121.0, 176.0, 245.0, 408.0, 645.0, 1020.0, 1872.0, 3459.0, 7205.0, 18453.0, 302157.0, 3660086.0, 169411.0, 15287.0, 6334.0, 3016.0, 1641.0, 921.0, 552.0, 353.0, 221.0, 143.0, 86.0, 75.0, 35.0, 45.0, 20.0, 15.0, 7.0, 16.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.41064453125, -38.0712890625, -36.73193359375, -35.392578125, -34.05322265625, -32.7138671875, -31.37451171875, -30.03515625, -28.69580078125, -27.3564453125, -26.01708984375, -24.677734375, -23.33837890625, -21.9990234375, -20.65966796875, -19.3203125, -17.98095703125, -16.6416015625, -15.30224609375, -13.962890625, -12.62353515625, -11.2841796875, -9.94482421875, -8.60546875, -7.26611328125, -5.9267578125, -4.58740234375, -3.248046875, -1.90869140625, -0.5693359375, 0.77001953125, 2.109375, 3.44873046875, 4.7880859375, 6.12744140625, 7.466796875, 8.80615234375, 10.1455078125, 11.48486328125, 12.82421875, 14.16357421875, 15.5029296875, 16.84228515625, 18.181640625, 19.52099609375, 20.8603515625, 22.19970703125, 23.5390625, 24.87841796875, 26.2177734375, 27.55712890625, 28.896484375, 30.23583984375, 31.5751953125, 32.91455078125, 34.25390625, 35.59326171875, 36.9326171875, 38.27197265625, 39.611328125, 40.95068359375, 42.2900390625, 43.62939453125, 44.96875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 8.0, 6.0, 6.0, 3.0, 6.0, 5.0, 11.0, 9.0, 17.0, 17.0, 18.0, 38.0, 39.0, 69.0, 136.0, 350.0, 689.0, 1022.0, 805.0, 366.0, 186.0, 91.0, 49.0, 29.0, 25.0, 13.0, 14.0, 4.0, 5.0, 3.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.7685546875, -31.662109375, -30.5556640625, -29.44921875, -28.3427734375, -27.236328125, -26.1298828125, -25.0234375, -23.9169921875, -22.810546875, -21.7041015625, -20.59765625, -19.4912109375, -18.384765625, -17.2783203125, -16.171875, -15.0654296875, -13.958984375, -12.8525390625, -11.74609375, -10.6396484375, -9.533203125, -8.4267578125, -7.3203125, -6.2138671875, -5.107421875, -4.0009765625, -2.89453125, -1.7880859375, -0.681640625, 0.4248046875, 1.53125, 2.6376953125, 3.744140625, 4.8505859375, 5.95703125, 7.0634765625, 8.169921875, 9.2763671875, 10.3828125, 11.4892578125, 12.595703125, 13.7021484375, 14.80859375, 15.9150390625, 17.021484375, 18.1279296875, 19.234375, 20.3408203125, 21.447265625, 22.5537109375, 23.66015625, 24.7666015625, 25.873046875, 26.9794921875, 28.0859375, 29.1923828125, 30.298828125, 31.4052734375, 32.51171875, 33.6181640625, 34.724609375, 35.8310546875, 36.9375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 3.0, 10.0, 13.0, 17.0, 21.0, 28.0, 42.0, 62.0, 76.0, 121.0, 196.0, 249.0, 370.0, 554.0, 797.0, 1192.0, 1786.0, 2772.0, 4311.0, 7119.0, 12531.0, 24062.0, 59384.0, 374635.0, 3268337.0, 325281.0, 56228.0, 22948.0, 11877.0, 6889.0, 4175.0, 2691.0, 1798.0, 1104.0, 840.0, 519.0, 371.0, 255.0, 184.0, 134.0, 77.0, 63.0, 46.0, 27.0, 24.0, 18.0, 5.0, 14.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 4.0], "bins": [-40.78125, -39.56298828125, -38.3447265625, -37.12646484375, -35.908203125, -34.68994140625, -33.4716796875, -32.25341796875, -31.03515625, -29.81689453125, -28.5986328125, -27.38037109375, -26.162109375, -24.94384765625, -23.7255859375, -22.50732421875, -21.2890625, -20.07080078125, -18.8525390625, -17.63427734375, -16.416015625, -15.19775390625, -13.9794921875, -12.76123046875, -11.54296875, -10.32470703125, -9.1064453125, -7.88818359375, -6.669921875, -5.45166015625, -4.2333984375, -3.01513671875, -1.796875, -0.57861328125, 0.6396484375, 1.85791015625, 3.076171875, 4.29443359375, 5.5126953125, 6.73095703125, 7.94921875, 9.16748046875, 10.3857421875, 11.60400390625, 12.822265625, 14.04052734375, 15.2587890625, 16.47705078125, 17.6953125, 18.91357421875, 20.1318359375, 21.35009765625, 22.568359375, 23.78662109375, 25.0048828125, 26.22314453125, 27.44140625, 28.65966796875, 29.8779296875, 31.09619140625, 32.314453125, 33.53271484375, 34.7509765625, 35.96923828125, 37.1875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 13.0, 13.0, 15.0, 21.0, 26.0, 54.0, 76.0, 108.0, 168.0, 184.0, 109.0, 78.0, 38.0, 32.0, 22.0, 8.0, 9.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.85140228271484, -115.04425048828125, -110.23709869384766, -105.42994689941406, -100.62278747558594, -95.81563568115234, -91.00848388671875, -86.20132446289062, -81.39418029785156, -76.58702850341797, -71.77987670898438, -66.97271728515625, -62.165565490722656, -57.35841369628906, -52.55126190185547, -47.74410629272461, -42.93695068359375, -38.129798889160156, -33.3226432800293, -28.515491485595703, -23.708337783813477, -18.90118408203125, -14.094032287597656, -9.286876678466797, -4.479724884033203, 0.32742834091186523, 5.134581565856934, 9.941734313964844, 14.74888801574707, 19.556041717529297, 24.36319351196289, 29.17034912109375, 33.977508544921875, 38.78466033935547, 43.59181594848633, 48.39896774291992, 53.20612335205078, 58.013275146484375, 62.82042694091797, 67.62757873535156, 72.43473815917969, 77.24188995361328, 82.04904174804688, 86.856201171875, 91.6633529663086, 96.47050476074219, 101.27765655517578, 106.08480834960938, 110.89196014404297, 115.69911193847656, 120.50626373291016, 125.31341552734375, 130.12057495117188, 134.927734375, 139.73487854003906, 144.5420379638672, 149.34918212890625, 154.15634155273438, 158.96348571777344, 163.77064514160156, 168.57778930664062, 173.38494873046875, 178.19210815429688, 182.99925231933594, 187.80641174316406]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 8.0, 7.0, 12.0, 15.0, 12.0, 17.0, 23.0, 30.0, 30.0, 26.0, 25.0, 30.0, 32.0, 45.0, 41.0, 44.0, 43.0, 38.0, 41.0, 45.0, 36.0, 48.0, 38.0, 39.0, 37.0, 35.0, 27.0, 26.0, 21.0, 28.0, 11.0, 14.0, 14.0, 12.0, 11.0, 5.0, 7.0, 2.0, 6.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.74385070800781, -74.01144409179688, -71.2790298461914, -68.54662322998047, -65.814208984375, -63.0817985534668, -60.349388122558594, -57.616981506347656, -54.88456726074219, -52.152156829833984, -49.41974639892578, -46.68733596801758, -43.954925537109375, -41.22251510620117, -38.49010467529297, -35.75769805908203, -33.02528762817383, -30.292877197265625, -27.560466766357422, -24.82805633544922, -22.095645904541016, -19.363235473632812, -16.630826950073242, -13.898416519165039, -11.166006088256836, -8.433595657348633, -5.701185703277588, -2.968775749206543, -0.23636531829833984, 2.4960451126098633, 5.22845458984375, 7.960865020751953, 10.693275451660156, 13.42568588256836, 16.158096313476562, 18.890506744384766, 21.62291717529297, 24.355327606201172, 27.087736129760742, 29.820146560668945, 32.55255889892578, 35.284969329833984, 38.01737976074219, 40.74979019165039, 43.482200622558594, 46.2146110534668, 48.947021484375, 51.67942810058594, 54.41183853149414, 57.144248962402344, 59.87665939331055, 62.60906982421875, 65.34147644042969, 68.07389068603516, 70.8062973022461, 73.53871154785156, 76.2711181640625, 79.00352478027344, 81.7359390258789, 84.46834564208984, 87.20075988769531, 89.93316650390625, 92.66558074951172, 95.39798736572266, 98.13040161132812]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 11.0, 8.0, 17.0, 16.0, 24.0, 19.0, 24.0, 27.0, 29.0, 35.0, 43.0, 42.0, 38.0, 45.0, 42.0, 51.0, 40.0, 35.0, 40.0, 32.0, 40.0, 40.0, 39.0, 40.0, 40.0, 25.0, 24.0, 13.0, 12.0, 25.0, 8.0, 13.0, 9.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.888671875, -11.49609375, -11.103515625, -10.7109375, -10.318359375, -9.92578125, -9.533203125, -9.140625, -8.748046875, -8.35546875, -7.962890625, -7.5703125, -7.177734375, -6.78515625, -6.392578125, -6.0, -5.607421875, -5.21484375, -4.822265625, -4.4296875, -4.037109375, -3.64453125, -3.251953125, -2.859375, -2.466796875, -2.07421875, -1.681640625, -1.2890625, -0.896484375, -0.50390625, -0.111328125, 0.28125, 0.673828125, 1.06640625, 1.458984375, 1.8515625, 2.244140625, 2.63671875, 3.029296875, 3.421875, 3.814453125, 4.20703125, 4.599609375, 4.9921875, 5.384765625, 5.77734375, 6.169921875, 6.5625, 6.955078125, 7.34765625, 7.740234375, 8.1328125, 8.525390625, 8.91796875, 9.310546875, 9.703125, 10.095703125, 10.48828125, 10.880859375, 11.2734375, 11.666015625, 12.05859375, 12.451171875, 12.84375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 11.0, 12.0, 26.0, 21.0, 35.0, 46.0, 89.0, 117.0, 184.0, 260.0, 417.0, 611.0, 960.0, 1489.0, 2291.0, 3483.0, 5391.0, 8445.0, 13249.0, 21438.0, 35901.0, 62797.0, 120206.0, 238125.0, 244648.0, 125714.0, 65248.0, 36803.0, 22330.0, 13668.0, 8680.0, 5492.0, 3627.0, 2383.0, 1434.0, 986.0, 660.0, 425.0, 263.0, 183.0, 121.0, 102.0, 56.0, 46.0, 35.0, 9.0, 15.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.52734375, -1.4796600341796875, -1.431976318359375, -1.3842926025390625, -1.33660888671875, -1.2889251708984375, -1.241241455078125, -1.1935577392578125, -1.1458740234375, -1.0981903076171875, -1.050506591796875, -1.0028228759765625, -0.95513916015625, -0.9074554443359375, -0.859771728515625, -0.8120880126953125, -0.764404296875, -0.7167205810546875, -0.669036865234375, -0.6213531494140625, -0.57366943359375, -0.5259857177734375, -0.478302001953125, -0.4306182861328125, -0.3829345703125, -0.3352508544921875, -0.287567138671875, -0.2398834228515625, -0.19219970703125, -0.1445159912109375, -0.096832275390625, -0.0491485595703125, -0.00146484375, 0.0462188720703125, 0.093902587890625, 0.1415863037109375, 0.18927001953125, 0.2369537353515625, 0.284637451171875, 0.3323211669921875, 0.3800048828125, 0.4276885986328125, 0.475372314453125, 0.5230560302734375, 0.57073974609375, 0.6184234619140625, 0.666107177734375, 0.7137908935546875, 0.761474609375, 0.8091583251953125, 0.856842041015625, 0.9045257568359375, 0.95220947265625, 0.9998931884765625, 1.047576904296875, 1.0952606201171875, 1.1429443359375, 1.1906280517578125, 1.238311767578125, 1.2859954833984375, 1.33367919921875, 1.3813629150390625, 1.429046630859375, 1.4767303466796875, 1.5244140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 10.0, 6.0, 7.0, 15.0, 11.0, 12.0, 8.0, 18.0, 29.0, 27.0, 27.0, 26.0, 38.0, 31.0, 27.0, 38.0, 40.0, 36.0, 40.0, 45.0, 1063.0, 36.0, 43.0, 40.0, 31.0, 37.0, 21.0, 25.0, 38.0, 32.0, 24.0, 19.0, 17.0, 11.0, 15.0, 19.0, 14.0, 6.0, 9.0, 2.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.8125, -7.5848388671875, -7.357177734375, -7.1295166015625, -6.90185546875, -6.6741943359375, -6.446533203125, -6.2188720703125, -5.9912109375, -5.7635498046875, -5.535888671875, -5.3082275390625, -5.08056640625, -4.8529052734375, -4.625244140625, -4.3975830078125, -4.169921875, -3.9422607421875, -3.714599609375, -3.4869384765625, -3.25927734375, -3.0316162109375, -2.803955078125, -2.5762939453125, -2.3486328125, -2.1209716796875, -1.893310546875, -1.6656494140625, -1.43798828125, -1.2103271484375, -0.982666015625, -0.7550048828125, -0.52734375, -0.2996826171875, -0.072021484375, 0.1556396484375, 0.38330078125, 0.6109619140625, 0.838623046875, 1.0662841796875, 1.2939453125, 1.5216064453125, 1.749267578125, 1.9769287109375, 2.20458984375, 2.4322509765625, 2.659912109375, 2.8875732421875, 3.115234375, 3.3428955078125, 3.570556640625, 3.7982177734375, 4.02587890625, 4.2535400390625, 4.481201171875, 4.7088623046875, 4.9365234375, 5.1641845703125, 5.391845703125, 5.6195068359375, 5.84716796875, 6.0748291015625, 6.302490234375, 6.5301513671875, 6.7578125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 12.0, 13.0, 20.0, 24.0, 44.0, 73.0, 115.0, 155.0, 196.0, 358.0, 600.0, 903.0, 1483.0, 2206.0, 3641.0, 5753.0, 9301.0, 14710.0, 24215.0, 40801.0, 71404.0, 130713.0, 1146535.0, 356218.0, 121711.0, 66563.0, 38656.0, 23115.0, 14109.0, 8651.0, 5437.0, 3438.0, 2082.0, 1375.0, 915.0, 568.0, 347.0, 211.0, 163.0, 111.0, 64.0, 54.0, 23.0, 13.0, 10.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6920318603515625, -0.667266845703125, -0.6425018310546875, -0.61773681640625, -0.5929718017578125, -0.568206787109375, -0.5434417724609375, -0.5186767578125, -0.4939117431640625, -0.469146728515625, -0.4443817138671875, -0.41961669921875, -0.3948516845703125, -0.370086669921875, -0.3453216552734375, -0.320556640625, -0.2957916259765625, -0.271026611328125, -0.2462615966796875, -0.22149658203125, -0.1967315673828125, -0.171966552734375, -0.1472015380859375, -0.1224365234375, -0.0976715087890625, -0.072906494140625, -0.0481414794921875, -0.02337646484375, 0.0013885498046875, 0.026153564453125, 0.0509185791015625, 0.07568359375, 0.1004486083984375, 0.125213623046875, 0.1499786376953125, 0.17474365234375, 0.1995086669921875, 0.224273681640625, 0.2490386962890625, 0.2738037109375, 0.2985687255859375, 0.323333740234375, 0.3480987548828125, 0.37286376953125, 0.3976287841796875, 0.422393798828125, 0.4471588134765625, 0.471923828125, 0.4966888427734375, 0.521453857421875, 0.5462188720703125, 0.57098388671875, 0.5957489013671875, 0.620513916015625, 0.6452789306640625, 0.6700439453125, 0.6948089599609375, 0.719573974609375, 0.7443389892578125, 0.76910400390625, 0.7938690185546875, 0.818634033203125, 0.8433990478515625, 0.8681640625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 8.0, 4.0, 6.0, 3.0, 5.0, 12.0, 14.0, 20.0, 32.0, 28.0, 90.0, 145.0, 159.0, 158.0, 92.0, 52.0, 32.0, 34.0, 13.0, 17.0, 2.0, 7.0, 10.0, 6.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04541015625, -0.0439763069152832, -0.042542457580566406, -0.04110860824584961, -0.03967475891113281, -0.038240909576416016, -0.03680706024169922, -0.03537321090698242, -0.033939361572265625, -0.03250551223754883, -0.03107166290283203, -0.029637813568115234, -0.028203964233398438, -0.02677011489868164, -0.025336265563964844, -0.023902416229248047, -0.02246856689453125, -0.021034717559814453, -0.019600868225097656, -0.01816701889038086, -0.016733169555664062, -0.015299320220947266, -0.013865470886230469, -0.012431621551513672, -0.010997772216796875, -0.009563922882080078, -0.008130073547363281, -0.006696224212646484, -0.0052623748779296875, -0.0038285255432128906, -0.0023946762084960938, -0.0009608268737792969, 0.0004730224609375, 0.0019068717956542969, 0.0033407211303710938, 0.004774570465087891, 0.0062084197998046875, 0.007642269134521484, 0.009076118469238281, 0.010509967803955078, 0.011943817138671875, 0.013377666473388672, 0.014811515808105469, 0.016245365142822266, 0.017679214477539062, 0.01911306381225586, 0.020546913146972656, 0.021980762481689453, 0.02341461181640625, 0.024848461151123047, 0.026282310485839844, 0.02771615982055664, 0.029150009155273438, 0.030583858489990234, 0.03201770782470703, 0.03345155715942383, 0.034885406494140625, 0.03631925582885742, 0.03775310516357422, 0.039186954498291016, 0.04062080383300781, 0.04205465316772461, 0.043488502502441406, 0.0449223518371582, 0.046356201171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 11.0, 31.0, 30.0, 54.0, 70.0, 106.0, 173.0, 1188.0, 45064.0, 993602.0, 7277.0, 472.0, 146.0, 100.0, 58.0, 34.0, 34.0, 22.0, 15.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1376953125, -1.1024627685546875, -1.067230224609375, -1.0319976806640625, -0.99676513671875, -0.9615325927734375, -0.926300048828125, -0.8910675048828125, -0.8558349609375, -0.8206024169921875, -0.785369873046875, -0.7501373291015625, -0.71490478515625, -0.6796722412109375, -0.644439697265625, -0.6092071533203125, -0.573974609375, -0.5387420654296875, -0.503509521484375, -0.4682769775390625, -0.43304443359375, -0.3978118896484375, -0.362579345703125, -0.3273468017578125, -0.2921142578125, -0.2568817138671875, -0.221649169921875, -0.1864166259765625, -0.15118408203125, -0.1159515380859375, -0.080718994140625, -0.0454864501953125, -0.01025390625, 0.0249786376953125, 0.060211181640625, 0.0954437255859375, 0.13067626953125, 0.1659088134765625, 0.201141357421875, 0.2363739013671875, 0.2716064453125, 0.3068389892578125, 0.342071533203125, 0.3773040771484375, 0.41253662109375, 0.4477691650390625, 0.483001708984375, 0.5182342529296875, 0.553466796875, 0.5886993408203125, 0.623931884765625, 0.6591644287109375, 0.69439697265625, 0.7296295166015625, 0.764862060546875, 0.8000946044921875, 0.8353271484375, 0.8705596923828125, 0.905792236328125, 0.9410247802734375, 0.97625732421875, 1.0114898681640625, 1.046722412109375, 1.0819549560546875, 1.1171875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 15.0, 17.0, 34.0, 69.0, 121.0, 264.0, 240.0, 95.0, 64.0, 26.0, 21.0, 11.0, 8.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11927410215139389, -0.11261456459760666, -0.10595502704381943, -0.09929549694061279, -0.09263595938682556, -0.08597642183303833, -0.0793168842792511, -0.07265734672546387, -0.06599780917167664, -0.059338271617889404, -0.05267873778939247, -0.04601920023560524, -0.03935966640710831, -0.032700128853321075, -0.026040591299533844, -0.01938105747103691, -0.012721523642539978, -0.0060619874857366085, 0.000597548671066761, 0.007257085293531418, 0.0139166209846735, 0.020576156675815582, 0.027235694229602814, 0.03389522805809975, 0.04055476561188698, 0.04721430316567421, 0.05387383699417114, 0.060533374547958374, 0.0671929121017456, 0.07385244965553284, 0.08051198720932007, 0.0871715173125267, 0.09383104741573334, 0.10049058496952057, 0.1071501225233078, 0.11380966007709503, 0.12046919018030167, 0.1271287202835083, 0.13378825783729553, 0.14044779539108276, 0.14710733294487, 0.15376687049865723, 0.16042640805244446, 0.1670859456062317, 0.17374548316001892, 0.18040502071380615, 0.18706455826759338, 0.19372408092021942, 0.20038363337516785, 0.20704317092895508, 0.2137027084827423, 0.22036224603652954, 0.22702178359031677, 0.233681321144104, 0.24034085869789124, 0.24700038135051727, 0.2536599040031433, 0.26031944155693054, 0.2669789791107178, 0.273638516664505, 0.28029805421829224, 0.28695759177207947, 0.2936171293258667, 0.30027666687965393, 0.30693620443344116]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 8.0, 10.0, 11.0, 16.0, 13.0, 14.0, 21.0, 19.0, 26.0, 21.0, 19.0, 35.0, 41.0, 21.0, 31.0, 47.0, 31.0, 39.0, 35.0, 36.0, 39.0, 38.0, 38.0, 33.0, 46.0, 42.0, 29.0, 29.0, 21.0, 26.0, 31.0, 21.0, 17.0, 17.0, 15.0, 10.0, 6.0, 12.0, 8.0, 4.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020572364330291748, -0.019920574501156807, -0.019268784672021866, -0.018616994842886925, -0.017965205013751984, -0.017313415184617043, -0.0166616253554821, -0.01600983552634716, -0.01535804569721222, -0.014706255868077278, -0.014054466038942337, -0.013402676209807396, -0.012750886380672455, -0.012099096551537514, -0.011447306722402573, -0.010795516893267632, -0.01014372706413269, -0.00949193723499775, -0.008840147405862808, -0.008188357576727867, -0.007536567747592926, -0.006884777918457985, -0.006232988089323044, -0.005581198260188103, -0.004929408431053162, -0.0042776186019182205, -0.0036258287727832794, -0.0029740389436483383, -0.002322249114513397, -0.0016704592853784561, -0.001018669456243515, -0.0003668796271085739, 0.0002849102020263672, 0.0009367000311613083, 0.0015884898602962494, 0.0022402796894311905, 0.0028920695185661316, 0.0035438593477010727, 0.004195649176836014, 0.004847439005970955, 0.005499228835105896, 0.006151018664240837, 0.006802808493375778, 0.007454598322510719, 0.00810638815164566, 0.008758177980780602, 0.009409967809915543, 0.010061757639050484, 0.010713547468185425, 0.011365337297320366, 0.012017127126455307, 0.012668916955590248, 0.01332070678472519, 0.01397249661386013, 0.014624286442995071, 0.015276076272130013, 0.015927866101264954, 0.016579655930399895, 0.017231445759534836, 0.017883235588669777, 0.018535025417804718, 0.01918681524693966, 0.0198386050760746, 0.02049039490520954, 0.021142184734344482]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 11.0, 8.0, 17.0, 16.0, 24.0, 19.0, 24.0, 27.0, 29.0, 36.0, 42.0, 42.0, 38.0, 45.0, 42.0, 51.0, 40.0, 35.0, 40.0, 33.0, 39.0, 39.0, 40.0, 40.0, 40.0, 25.0, 24.0, 13.0, 12.0, 25.0, 8.0, 13.0, 9.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.888671875, -11.49609375, -11.103515625, -10.7109375, -10.318359375, -9.92578125, -9.533203125, -9.140625, -8.748046875, -8.35546875, -7.962890625, -7.5703125, -7.177734375, -6.78515625, -6.392578125, -6.0, -5.607421875, -5.21484375, -4.822265625, -4.4296875, -4.037109375, -3.64453125, -3.251953125, -2.859375, -2.466796875, -2.07421875, -1.681640625, -1.2890625, -0.896484375, -0.50390625, -0.111328125, 0.28125, 0.673828125, 1.06640625, 1.458984375, 1.8515625, 2.244140625, 2.63671875, 3.029296875, 3.421875, 3.814453125, 4.20703125, 4.599609375, 4.9921875, 5.384765625, 5.77734375, 6.169921875, 6.5625, 6.955078125, 7.34765625, 7.740234375, 8.1328125, 8.525390625, 8.91796875, 9.310546875, 9.703125, 10.095703125, 10.48828125, 10.880859375, 11.2734375, 11.666015625, 12.05859375, 12.451171875, 12.84375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 6.0, 4.0, 9.0, 13.0, 16.0, 20.0, 33.0, 53.0, 61.0, 72.0, 121.0, 158.0, 219.0, 341.0, 473.0, 695.0, 946.0, 1585.0, 2795.0, 5517.0, 18934.0, 177877.0, 761669.0, 56649.0, 10249.0, 3818.0, 2135.0, 1269.0, 877.0, 563.0, 415.0, 275.0, 185.0, 154.0, 108.0, 66.0, 52.0, 43.0, 17.0, 23.0, 12.0, 15.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.828125, -17.27587890625, -16.7236328125, -16.17138671875, -15.619140625, -15.06689453125, -14.5146484375, -13.96240234375, -13.41015625, -12.85791015625, -12.3056640625, -11.75341796875, -11.201171875, -10.64892578125, -10.0966796875, -9.54443359375, -8.9921875, -8.43994140625, -7.8876953125, -7.33544921875, -6.783203125, -6.23095703125, -5.6787109375, -5.12646484375, -4.57421875, -4.02197265625, -3.4697265625, -2.91748046875, -2.365234375, -1.81298828125, -1.2607421875, -0.70849609375, -0.15625, 0.39599609375, 0.9482421875, 1.50048828125, 2.052734375, 2.60498046875, 3.1572265625, 3.70947265625, 4.26171875, 4.81396484375, 5.3662109375, 5.91845703125, 6.470703125, 7.02294921875, 7.5751953125, 8.12744140625, 8.6796875, 9.23193359375, 9.7841796875, 10.33642578125, 10.888671875, 11.44091796875, 11.9931640625, 12.54541015625, 13.09765625, 13.64990234375, 14.2021484375, 14.75439453125, 15.306640625, 15.85888671875, 16.4111328125, 16.96337890625, 17.515625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 8.0, 17.0, 15.0, 13.0, 12.0, 23.0, 24.0, 27.0, 31.0, 28.0, 33.0, 33.0, 34.0, 41.0, 35.0, 43.0, 103.0, 1950.0, 101.0, 40.0, 46.0, 33.0, 39.0, 40.0, 33.0, 20.0, 25.0, 25.0, 30.0, 18.0, 17.0, 14.0, 9.0, 15.0, 10.0, 6.0, 4.0, 6.0, 5.0, 5.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-38.375, -37.19482421875, -36.0146484375, -34.83447265625, -33.654296875, -32.47412109375, -31.2939453125, -30.11376953125, -28.93359375, -27.75341796875, -26.5732421875, -25.39306640625, -24.212890625, -23.03271484375, -21.8525390625, -20.67236328125, -19.4921875, -18.31201171875, -17.1318359375, -15.95166015625, -14.771484375, -13.59130859375, -12.4111328125, -11.23095703125, -10.05078125, -8.87060546875, -7.6904296875, -6.51025390625, -5.330078125, -4.14990234375, -2.9697265625, -1.78955078125, -0.609375, 0.57080078125, 1.7509765625, 2.93115234375, 4.111328125, 5.29150390625, 6.4716796875, 7.65185546875, 8.83203125, 10.01220703125, 11.1923828125, 12.37255859375, 13.552734375, 14.73291015625, 15.9130859375, 17.09326171875, 18.2734375, 19.45361328125, 20.6337890625, 21.81396484375, 22.994140625, 24.17431640625, 25.3544921875, 26.53466796875, 27.71484375, 28.89501953125, 30.0751953125, 31.25537109375, 32.435546875, 33.61572265625, 34.7958984375, 35.97607421875, 37.15625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 8.0, 7.0, 6.0, 7.0, 13.0, 16.0, 16.0, 25.0, 26.0, 48.0, 56.0, 62.0, 109.0, 162.0, 317.0, 711.0, 2232.0, 11178.0, 3103699.0, 22132.0, 2988.0, 851.0, 384.0, 203.0, 124.0, 78.0, 55.0, 39.0, 31.0, 19.0, 18.0, 24.0, 9.0, 6.0, 12.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.875, -69.3623046875, -66.849609375, -64.3369140625, -61.82421875, -59.3115234375, -56.798828125, -54.2861328125, -51.7734375, -49.2607421875, -46.748046875, -44.2353515625, -41.72265625, -39.2099609375, -36.697265625, -34.1845703125, -31.671875, -29.1591796875, -26.646484375, -24.1337890625, -21.62109375, -19.1083984375, -16.595703125, -14.0830078125, -11.5703125, -9.0576171875, -6.544921875, -4.0322265625, -1.51953125, 0.9931640625, 3.505859375, 6.0185546875, 8.53125, 11.0439453125, 13.556640625, 16.0693359375, 18.58203125, 21.0947265625, 23.607421875, 26.1201171875, 28.6328125, 31.1455078125, 33.658203125, 36.1708984375, 38.68359375, 41.1962890625, 43.708984375, 46.2216796875, 48.734375, 51.2470703125, 53.759765625, 56.2724609375, 58.78515625, 61.2978515625, 63.810546875, 66.3232421875, 68.8359375, 71.3486328125, 73.861328125, 76.3740234375, 78.88671875, 81.3994140625, 83.912109375, 86.4248046875, 88.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 11.0, 26.0, 44.0, 92.0, 108.0, 154.0, 206.0, 161.0, 89.0, 64.0, 23.0, 11.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.517452239990234, -53.011497497558594, -51.50553894042969, -49.99958419799805, -48.493629455566406, -46.9876708984375, -45.48171615600586, -43.97576141357422, -42.46980285644531, -40.96384811401367, -39.457889556884766, -37.951934814453125, -36.44597625732422, -34.94002151489258, -33.43406677246094, -31.928110122680664, -30.42215347290039, -28.916196823120117, -27.410240173339844, -25.904285430908203, -24.39832878112793, -22.892372131347656, -21.386417388916016, -19.880460739135742, -18.37450408935547, -16.868547439575195, -15.362591743469238, -13.856636047363281, -12.350679397583008, -10.844722747802734, -9.338767051696777, -7.83281135559082, -6.326854705810547, -4.820898532867432, -3.3149423599243164, -1.8089861869812012, -0.30303001403808594, 1.2029261589050293, 2.7088823318481445, 4.214838027954102, 5.720794677734375, 7.22675085067749, 8.732707023620605, 10.238662719726562, 11.744619369506836, 13.25057601928711, 14.756531715393066, 16.262487411499023, 17.768444061279297, 19.27440071105957, 20.780357360839844, 22.286312103271484, 23.792268753051758, 25.29822540283203, 26.804180145263672, 28.310136795043945, 29.81609344482422, 31.322050094604492, 32.828006744384766, 34.333961486816406, 35.83992004394531, 37.34587478637695, 38.851829528808594, 40.3577880859375, 41.86374282836914]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 9.0, 14.0, 19.0, 19.0, 10.0, 33.0, 22.0, 32.0, 32.0, 35.0, 38.0, 38.0, 39.0, 41.0, 31.0, 49.0, 62.0, 37.0, 37.0, 41.0, 44.0, 38.0, 31.0, 32.0, 33.0, 29.0, 26.0, 14.0, 28.0, 18.0, 12.0, 11.0, 6.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.0409698486328, -124.08228302001953, -120.12360382080078, -116.1649169921875, -112.20623779296875, -108.24755096435547, -104.28886413574219, -100.33018493652344, -96.37149810791016, -92.41281127929688, -88.45413208007812, -84.49544525146484, -80.53675842285156, -76.57807922363281, -72.61939239501953, -68.66070556640625, -64.7020263671875, -60.743343353271484, -56.78466033935547, -52.82597351074219, -48.86729049682617, -44.908607482910156, -40.949920654296875, -36.99123764038086, -33.032554626464844, -29.073871612548828, -25.11518669128418, -21.15650177001953, -17.197818756103516, -13.2391357421875, -9.280450820922852, -5.321765899658203, -1.3630828857421875, 2.5956010818481445, 6.554285049438477, 10.512969017028809, 14.47165298461914, 18.430335998535156, 22.389020919799805, 26.347705841064453, 30.30638885498047, 34.265071868896484, 38.2237548828125, 42.18244171142578, 46.1411247253418, 50.09980773925781, 54.058494567871094, 58.01717758178711, 61.975860595703125, 65.9345474243164, 69.89322662353516, 73.85191345214844, 77.81059265136719, 81.76927947998047, 85.72796630859375, 89.6866455078125, 93.64533233642578, 97.60401916503906, 101.56269836425781, 105.5213851928711, 109.48007202148438, 113.43875122070312, 117.3974380493164, 121.35612487792969, 125.31480407714844]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 9.0, 5.0, 17.0, 21.0, 19.0, 13.0, 28.0, 29.0, 28.0, 32.0, 51.0, 44.0, 33.0, 43.0, 50.0, 46.0, 41.0, 42.0, 31.0, 42.0, 37.0, 34.0, 46.0, 40.0, 35.0, 32.0, 15.0, 14.0, 14.0, 19.0, 11.0, 15.0, 8.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.609375, -12.2059326171875, -11.802490234375, -11.3990478515625, -10.99560546875, -10.5921630859375, -10.188720703125, -9.7852783203125, -9.3818359375, -8.9783935546875, -8.574951171875, -8.1715087890625, -7.76806640625, -7.3646240234375, -6.961181640625, -6.5577392578125, -6.154296875, -5.7508544921875, -5.347412109375, -4.9439697265625, -4.54052734375, -4.1370849609375, -3.733642578125, -3.3302001953125, -2.9267578125, -2.5233154296875, -2.119873046875, -1.7164306640625, -1.31298828125, -0.9095458984375, -0.506103515625, -0.1026611328125, 0.30078125, 0.7042236328125, 1.107666015625, 1.5111083984375, 1.91455078125, 2.3179931640625, 2.721435546875, 3.1248779296875, 3.5283203125, 3.9317626953125, 4.335205078125, 4.7386474609375, 5.14208984375, 5.5455322265625, 5.948974609375, 6.3524169921875, 6.755859375, 7.1593017578125, 7.562744140625, 7.9661865234375, 8.36962890625, 8.7730712890625, 9.176513671875, 9.5799560546875, 9.9833984375, 10.3868408203125, 10.790283203125, 11.1937255859375, 11.59716796875, 12.0006103515625, 12.404052734375, 12.8074951171875, 13.2109375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 10.0, 2.0, 6.0, 7.0, 13.0, 21.0, 26.0, 28.0, 56.0, 74.0, 152.0, 240.0, 413.0, 655.0, 1126.0, 2000.0, 3791.0, 7390.0, 17567.0, 266943.0, 3569451.0, 290294.0, 18004.0, 7270.0, 3684.0, 2085.0, 1209.0, 698.0, 403.0, 237.0, 154.0, 80.0, 68.0, 34.0, 21.0, 20.0, 17.0, 10.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.625, -41.31396484375, -40.0029296875, -38.69189453125, -37.380859375, -36.06982421875, -34.7587890625, -33.44775390625, -32.13671875, -30.82568359375, -29.5146484375, -28.20361328125, -26.892578125, -25.58154296875, -24.2705078125, -22.95947265625, -21.6484375, -20.33740234375, -19.0263671875, -17.71533203125, -16.404296875, -15.09326171875, -13.7822265625, -12.47119140625, -11.16015625, -9.84912109375, -8.5380859375, -7.22705078125, -5.916015625, -4.60498046875, -3.2939453125, -1.98291015625, -0.671875, 0.63916015625, 1.9501953125, 3.26123046875, 4.572265625, 5.88330078125, 7.1943359375, 8.50537109375, 9.81640625, 11.12744140625, 12.4384765625, 13.74951171875, 15.060546875, 16.37158203125, 17.6826171875, 18.99365234375, 20.3046875, 21.61572265625, 22.9267578125, 24.23779296875, 25.548828125, 26.85986328125, 28.1708984375, 29.48193359375, 30.79296875, 32.10400390625, 33.4150390625, 34.72607421875, 36.037109375, 37.34814453125, 38.6591796875, 39.97021484375, 41.28125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 9.0, 5.0, 6.0, 6.0, 10.0, 8.0, 11.0, 18.0, 33.0, 51.0, 87.0, 177.0, 480.0, 931.0, 1041.0, 581.0, 283.0, 121.0, 61.0, 36.0, 28.0, 12.0, 21.0, 15.0, 3.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.0, -37.75048828125, -36.5009765625, -35.25146484375, -34.001953125, -32.75244140625, -31.5029296875, -30.25341796875, -29.00390625, -27.75439453125, -26.5048828125, -25.25537109375, -24.005859375, -22.75634765625, -21.5068359375, -20.25732421875, -19.0078125, -17.75830078125, -16.5087890625, -15.25927734375, -14.009765625, -12.76025390625, -11.5107421875, -10.26123046875, -9.01171875, -7.76220703125, -6.5126953125, -5.26318359375, -4.013671875, -2.76416015625, -1.5146484375, -0.26513671875, 0.984375, 2.23388671875, 3.4833984375, 4.73291015625, 5.982421875, 7.23193359375, 8.4814453125, 9.73095703125, 10.98046875, 12.22998046875, 13.4794921875, 14.72900390625, 15.978515625, 17.22802734375, 18.4775390625, 19.72705078125, 20.9765625, 22.22607421875, 23.4755859375, 24.72509765625, 25.974609375, 27.22412109375, 28.4736328125, 29.72314453125, 30.97265625, 32.22216796875, 33.4716796875, 34.72119140625, 35.970703125, 37.22021484375, 38.4697265625, 39.71923828125, 40.96875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 11.0, 12.0, 21.0, 35.0, 40.0, 79.0, 111.0, 129.0, 212.0, 322.0, 509.0, 800.0, 1142.0, 1812.0, 2926.0, 4846.0, 8742.0, 17545.0, 45119.0, 307881.0, 3448619.0, 271582.0, 43565.0, 16886.0, 8460.0, 4815.0, 2853.0, 1811.0, 1183.0, 715.0, 455.0, 350.0, 223.0, 174.0, 113.0, 50.0, 30.0, 23.0, 25.0, 18.0, 13.0, 7.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.21875, -39.71875, -38.21875, -36.71875, -35.21875, -33.71875, -32.21875, -30.71875, -29.21875, -27.71875, -26.21875, -24.71875, -23.21875, -21.71875, -20.21875, -18.71875, -17.21875, -15.71875, -14.21875, -12.71875, -11.21875, -9.71875, -8.21875, -6.71875, -5.21875, -3.71875, -2.21875, -0.71875, 0.78125, 2.28125, 3.78125, 5.28125, 6.78125, 8.28125, 9.78125, 11.28125, 12.78125, 14.28125, 15.78125, 17.28125, 18.78125, 20.28125, 21.78125, 23.28125, 24.78125, 26.28125, 27.78125, 29.28125, 30.78125, 32.28125, 33.78125, 35.28125, 36.78125, 38.28125, 39.78125, 41.28125, 42.78125, 44.28125, 45.78125, 47.28125, 48.78125, 50.28125, 51.78125, 53.28125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 8.0, 8.0, 6.0, 7.0, 6.0, 14.0, 17.0, 18.0, 39.0, 44.0, 61.0, 96.0, 119.0, 125.0, 115.0, 85.0, 56.0, 43.0, 30.0, 13.0, 17.0, 18.0, 12.0, 7.0, 8.0, 11.0, 1.0, 5.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-121.70426177978516, -117.93956756591797, -114.17488098144531, -110.41018676757812, -106.64549255371094, -102.88079833984375, -99.11610412597656, -95.3514175415039, -91.58672332763672, -87.82202911376953, -84.05734252929688, -80.29264831542969, -76.5279541015625, -72.76325988769531, -68.99856567382812, -65.23387908935547, -61.46918487548828, -57.704490661621094, -53.93980026245117, -50.17510986328125, -46.41041564941406, -42.645721435546875, -38.88103103637695, -35.11634063720703, -31.351646423339844, -27.58695411682129, -23.822261810302734, -20.05756950378418, -16.292877197265625, -12.52818489074707, -8.763492584228516, -4.998800277709961, -1.2341079711914062, 2.5305843353271484, 6.295276641845703, 10.059968948364258, 13.824661254882812, 17.589353561401367, 21.354045867919922, 25.118738174438477, 28.88343048095703, 32.64812469482422, 36.41281509399414, 40.17750549316406, 43.94219970703125, 47.70689392089844, 51.47158432006836, 55.23627471923828, 59.00096893310547, 62.765663146972656, 66.53034973144531, 70.2950439453125, 74.05973815917969, 77.82443237304688, 81.58912658691406, 85.35381317138672, 89.1185073852539, 92.8832015991211, 96.64788818359375, 100.41258239746094, 104.17727661132812, 107.94197082519531, 111.7066650390625, 115.47135162353516, 119.23604583740234]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 10.0, 10.0, 7.0, 11.0, 13.0, 15.0, 22.0, 20.0, 23.0, 21.0, 30.0, 28.0, 31.0, 29.0, 28.0, 41.0, 50.0, 44.0, 52.0, 35.0, 54.0, 50.0, 46.0, 37.0, 34.0, 31.0, 32.0, 26.0, 34.0, 24.0, 16.0, 18.0, 14.0, 10.0, 10.0, 12.0, 8.0, 9.0, 5.0, 2.0, 0.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.22354125976562, -81.3347396850586, -78.44593048095703, -75.55712890625, -72.66832733154297, -69.77952575683594, -66.89071655273438, -64.00191497802734, -61.11310958862305, -58.22430419921875, -55.33550262451172, -52.44669723510742, -49.557891845703125, -46.669090270996094, -43.7802848815918, -40.8914794921875, -38.00267791748047, -35.11387252807617, -32.22507095336914, -29.336265563964844, -26.44746208190918, -23.558658599853516, -20.66985321044922, -17.781049728393555, -14.89224624633789, -12.003442764282227, -9.114638328552246, -6.225833892822266, -3.3370304107666016, -0.4482269287109375, 2.4405784606933594, 5.329381942749023, 8.218185424804688, 11.106988906860352, 13.995793342590332, 16.884597778320312, 19.773401260375977, 22.66220474243164, 25.551010131835938, 28.4398136138916, 31.328617095947266, 34.21742248535156, 37.106224060058594, 39.99502944946289, 42.88383483886719, 45.77263641357422, 48.661441802978516, 51.55024719238281, 54.439048767089844, 57.32785415649414, 60.21665573120117, 63.10546112060547, 65.9942626953125, 68.88307189941406, 71.7718734741211, 74.66067504882812, 77.54948425292969, 80.43828582763672, 83.32709503173828, 86.21589660644531, 89.10469818115234, 91.99349975585938, 94.88230895996094, 97.77111053466797, 100.659912109375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 9.0, 13.0, 10.0, 16.0, 19.0, 22.0, 24.0, 40.0, 29.0, 35.0, 30.0, 35.0, 36.0, 54.0, 54.0, 44.0, 44.0, 39.0, 42.0, 43.0, 43.0, 36.0, 40.0, 28.0, 30.0, 31.0, 20.0, 14.0, 21.0, 9.0, 12.0, 12.0, 12.0, 12.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.083984375, -13.66015625, -13.236328125, -12.8125, -12.388671875, -11.96484375, -11.541015625, -11.1171875, -10.693359375, -10.26953125, -9.845703125, -9.421875, -8.998046875, -8.57421875, -8.150390625, -7.7265625, -7.302734375, -6.87890625, -6.455078125, -6.03125, -5.607421875, -5.18359375, -4.759765625, -4.3359375, -3.912109375, -3.48828125, -3.064453125, -2.640625, -2.216796875, -1.79296875, -1.369140625, -0.9453125, -0.521484375, -0.09765625, 0.326171875, 0.75, 1.173828125, 1.59765625, 2.021484375, 2.4453125, 2.869140625, 3.29296875, 3.716796875, 4.140625, 4.564453125, 4.98828125, 5.412109375, 5.8359375, 6.259765625, 6.68359375, 7.107421875, 7.53125, 7.955078125, 8.37890625, 8.802734375, 9.2265625, 9.650390625, 10.07421875, 10.498046875, 10.921875, 11.345703125, 11.76953125, 12.193359375, 12.6171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 16.0, 20.0, 21.0, 40.0, 46.0, 75.0, 109.0, 204.0, 306.0, 501.0, 783.0, 1315.0, 2224.0, 3715.0, 6279.0, 10634.0, 18509.0, 32781.0, 62056.0, 130434.0, 288271.0, 254085.0, 111762.0, 54668.0, 29391.0, 16475.0, 9680.0, 5749.0, 3242.0, 2017.0, 1195.0, 746.0, 419.0, 296.0, 152.0, 126.0, 78.0, 36.0, 33.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7900390625, -1.73211669921875, -1.6741943359375, -1.61627197265625, -1.558349609375, -1.50042724609375, -1.4425048828125, -1.38458251953125, -1.32666015625, -1.26873779296875, -1.2108154296875, -1.15289306640625, -1.094970703125, -1.03704833984375, -0.9791259765625, -0.92120361328125, -0.86328125, -0.80535888671875, -0.7474365234375, -0.68951416015625, -0.631591796875, -0.57366943359375, -0.5157470703125, -0.45782470703125, -0.39990234375, -0.34197998046875, -0.2840576171875, -0.22613525390625, -0.168212890625, -0.11029052734375, -0.0523681640625, 0.00555419921875, 0.0634765625, 0.12139892578125, 0.1793212890625, 0.23724365234375, 0.295166015625, 0.35308837890625, 0.4110107421875, 0.46893310546875, 0.52685546875, 0.58477783203125, 0.6427001953125, 0.70062255859375, 0.758544921875, 0.81646728515625, 0.8743896484375, 0.93231201171875, 0.990234375, 1.04815673828125, 1.1060791015625, 1.16400146484375, 1.221923828125, 1.27984619140625, 1.3377685546875, 1.39569091796875, 1.45361328125, 1.51153564453125, 1.5694580078125, 1.62738037109375, 1.685302734375, 1.74322509765625, 1.8011474609375, 1.85906982421875, 1.9169921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 6.0, 8.0, 10.0, 9.0, 11.0, 17.0, 22.0, 26.0, 22.0, 28.0, 26.0, 25.0, 34.0, 30.0, 32.0, 26.0, 44.0, 43.0, 36.0, 1065.0, 35.0, 50.0, 45.0, 34.0, 43.0, 24.0, 30.0, 24.0, 26.0, 40.0, 21.0, 14.0, 19.0, 20.0, 12.0, 7.0, 15.0, 9.0, 7.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.0390625, -7.792236328125, -7.54541015625, -7.298583984375, -7.0517578125, -6.804931640625, -6.55810546875, -6.311279296875, -6.064453125, -5.817626953125, -5.57080078125, -5.323974609375, -5.0771484375, -4.830322265625, -4.58349609375, -4.336669921875, -4.08984375, -3.843017578125, -3.59619140625, -3.349365234375, -3.1025390625, -2.855712890625, -2.60888671875, -2.362060546875, -2.115234375, -1.868408203125, -1.62158203125, -1.374755859375, -1.1279296875, -0.881103515625, -0.63427734375, -0.387451171875, -0.140625, 0.106201171875, 0.35302734375, 0.599853515625, 0.8466796875, 1.093505859375, 1.34033203125, 1.587158203125, 1.833984375, 2.080810546875, 2.32763671875, 2.574462890625, 2.8212890625, 3.068115234375, 3.31494140625, 3.561767578125, 3.80859375, 4.055419921875, 4.30224609375, 4.549072265625, 4.7958984375, 5.042724609375, 5.28955078125, 5.536376953125, 5.783203125, 6.030029296875, 6.27685546875, 6.523681640625, 6.7705078125, 7.017333984375, 7.26416015625, 7.510986328125, 7.7578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 18.0, 16.0, 37.0, 66.0, 96.0, 152.0, 210.0, 326.0, 446.0, 727.0, 1000.0, 1507.0, 2221.0, 3435.0, 5141.0, 7787.0, 11880.0, 17991.0, 28046.0, 45058.0, 75261.0, 132252.0, 1183360.0, 276062.0, 119283.0, 68693.0, 41181.0, 25713.0, 16424.0, 10920.0, 7192.0, 4871.0, 3214.0, 2218.0, 1410.0, 996.0, 612.0, 429.0, 320.0, 174.0, 117.0, 89.0, 60.0, 41.0, 23.0, 12.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7437820434570312, -0.7204742431640625, -0.6971664428710938, -0.673858642578125, -0.6505508422851562, -0.6272430419921875, -0.6039352416992188, -0.58062744140625, -0.5573196411132812, -0.5340118408203125, -0.5107040405273438, -0.487396240234375, -0.46408843994140625, -0.4407806396484375, -0.41747283935546875, -0.3941650390625, -0.37085723876953125, -0.3475494384765625, -0.32424163818359375, -0.300933837890625, -0.27762603759765625, -0.2543182373046875, -0.23101043701171875, -0.20770263671875, -0.18439483642578125, -0.1610870361328125, -0.13777923583984375, -0.114471435546875, -0.09116363525390625, -0.0678558349609375, -0.04454803466796875, -0.021240234375, 0.00206756591796875, 0.0253753662109375, 0.04868316650390625, 0.071990966796875, 0.09529876708984375, 0.1186065673828125, 0.14191436767578125, 0.16522216796875, 0.18852996826171875, 0.2118377685546875, 0.23514556884765625, 0.258453369140625, 0.28176116943359375, 0.3050689697265625, 0.32837677001953125, 0.3516845703125, 0.37499237060546875, 0.3983001708984375, 0.42160797119140625, 0.444915771484375, 0.46822357177734375, 0.4915313720703125, 0.5148391723632812, 0.53814697265625, 0.5614547729492188, 0.5847625732421875, 0.6080703735351562, 0.631378173828125, 0.6546859741210938, 0.6779937744140625, 0.7013015747070312, 0.724609375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 10.0, 11.0, 18.0, 20.0, 25.0, 43.0, 59.0, 72.0, 131.0, 190.0, 122.0, 77.0, 68.0, 41.0, 36.0, 24.0, 12.0, 9.0, 4.0, 1.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.031502723693847656, -0.030504226684570312, -0.02950572967529297, -0.028507232666015625, -0.02750873565673828, -0.026510238647460938, -0.025511741638183594, -0.02451324462890625, -0.023514747619628906, -0.022516250610351562, -0.02151775360107422, -0.020519256591796875, -0.01952075958251953, -0.018522262573242188, -0.017523765563964844, -0.0165252685546875, -0.015526771545410156, -0.014528274536132812, -0.013529777526855469, -0.012531280517578125, -0.011532783508300781, -0.010534286499023438, -0.009535789489746094, -0.00853729248046875, -0.007538795471191406, -0.0065402984619140625, -0.005541801452636719, -0.004543304443359375, -0.0035448074340820312, -0.0025463104248046875, -0.0015478134155273438, -0.00054931640625, 0.00044918060302734375, 0.0014476776123046875, 0.0024461746215820312, 0.003444671630859375, 0.004443168640136719, 0.0054416656494140625, 0.006440162658691406, 0.00743865966796875, 0.008437156677246094, 0.009435653686523438, 0.010434150695800781, 0.011432647705078125, 0.012431144714355469, 0.013429641723632812, 0.014428138732910156, 0.0154266357421875, 0.016425132751464844, 0.017423629760742188, 0.01842212677001953, 0.019420623779296875, 0.02041912078857422, 0.021417617797851562, 0.022416114807128906, 0.02341461181640625, 0.024413108825683594, 0.025411605834960938, 0.02641010284423828, 0.027408599853515625, 0.02840709686279297, 0.029405593872070312, 0.030404090881347656, 0.031402587890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 5.0, 14.0, 18.0, 21.0, 32.0, 33.0, 46.0, 67.0, 106.0, 123.0, 199.0, 347.0, 800.0, 3335.0, 25974.0, 921342.0, 87163.0, 6444.0, 1329.0, 438.0, 206.0, 123.0, 95.0, 62.0, 53.0, 29.0, 23.0, 25.0, 18.0, 13.0, 9.0, 5.0, 11.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49320220947265625, -0.4771270751953125, -0.46105194091796875, -0.444976806640625, -0.42890167236328125, -0.4128265380859375, -0.39675140380859375, -0.38067626953125, -0.36460113525390625, -0.3485260009765625, -0.33245086669921875, -0.316375732421875, -0.30030059814453125, -0.2842254638671875, -0.26815032958984375, -0.2520751953125, -0.23600006103515625, -0.2199249267578125, -0.20384979248046875, -0.187774658203125, -0.17169952392578125, -0.1556243896484375, -0.13954925537109375, -0.12347412109375, -0.10739898681640625, -0.0913238525390625, -0.07524871826171875, -0.059173583984375, -0.04309844970703125, -0.0270233154296875, -0.01094818115234375, 0.005126953125, 0.02120208740234375, 0.0372772216796875, 0.05335235595703125, 0.069427490234375, 0.08550262451171875, 0.1015777587890625, 0.11765289306640625, 0.13372802734375, 0.14980316162109375, 0.1658782958984375, 0.18195343017578125, 0.198028564453125, 0.21410369873046875, 0.2301788330078125, 0.24625396728515625, 0.2623291015625, 0.27840423583984375, 0.2944793701171875, 0.31055450439453125, 0.326629638671875, 0.34270477294921875, 0.3587799072265625, 0.37485504150390625, 0.39093017578125, 0.40700531005859375, 0.4230804443359375, 0.43915557861328125, 0.455230712890625, 0.47130584716796875, 0.4873809814453125, 0.5034561157226562, 0.51953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 16.0, 66.0, 250.0, 454.0, 128.0, 52.0, 16.0, 12.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2257242053747177, -0.21600471436977386, -0.20628522336483002, -0.19656573235988617, -0.18684624135494232, -0.17712675034999847, -0.16740724444389343, -0.15768775343894958, -0.14796826243400574, -0.1382487714290619, -0.12852928042411804, -0.1188097894191742, -0.10909029841423035, -0.0993708074092865, -0.08965130895376205, -0.0799318179488182, -0.07021233439445496, -0.06049284338951111, -0.05077335238456726, -0.041053857654333115, -0.03133436664938927, -0.02161487564444542, -0.011895380914211273, -0.0021758899092674255, 0.007543601095676422, 0.01726309210062027, 0.026982584968209267, 0.036702077835798264, 0.04642156884074211, 0.05614105984568596, 0.0658605545759201, 0.07558004558086395, 0.0852995216846466, 0.09501901268959045, 0.1047385036945343, 0.11445799469947815, 0.124177485704422, 0.13389697670936584, 0.1436164677143097, 0.15333595871925354, 0.1630554497241974, 0.17277494072914124, 0.18249443173408508, 0.19221392273902893, 0.20193341374397278, 0.21165290474891663, 0.22137239575386047, 0.23109188675880432, 0.24081139266490936, 0.2505308985710144, 0.26025038957595825, 0.2699698805809021, 0.27968937158584595, 0.2894088625907898, 0.29912835359573364, 0.3088478446006775, 0.31856733560562134, 0.3282868266105652, 0.33800631761550903, 0.3477258086204529, 0.35744529962539673, 0.3671647906303406, 0.3768842816352844, 0.38660377264022827, 0.3963232636451721]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 21.0, 13.0, 20.0, 18.0, 16.0, 21.0, 34.0, 33.0, 26.0, 31.0, 31.0, 39.0, 48.0, 46.0, 39.0, 32.0, 43.0, 32.0, 36.0, 37.0, 41.0, 30.0, 26.0, 20.0, 37.0, 29.0, 28.0, 23.0, 21.0, 16.0, 13.0, 11.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01572597026824951, -0.015226421877741814, -0.014726873487234116, -0.014227325096726418, -0.01372777670621872, -0.013228228315711021, -0.012728679925203323, -0.012229131534695625, -0.011729583144187927, -0.01123003475368023, -0.010730486363172531, -0.010230937972664833, -0.009731389582157135, -0.009231841191649437, -0.008732292801141739, -0.00823274441063404, -0.007733196020126343, -0.007233647629618645, -0.006734099239110947, -0.006234550848603249, -0.0057350024580955505, -0.0052354540675878525, -0.004735905677080154, -0.004236357286572456, -0.0037368088960647583, -0.0032372605055570602, -0.002737712115049362, -0.002238163724541664, -0.001738615334033966, -0.001239066943526268, -0.00073951855301857, -0.0002399701625108719, 0.00025957822799682617, 0.0007591266185045242, 0.0012586750090122223, 0.0017582233995199203, 0.0022577717900276184, 0.0027573201805353165, 0.0032568685710430145, 0.0037564169615507126, 0.004255965352058411, 0.004755513742566109, 0.005255062133073807, 0.005754610523581505, 0.006254158914089203, 0.006753707304596901, 0.007253255695104599, 0.007752804085612297, 0.008252352476119995, 0.008751900866627693, 0.009251449257135391, 0.00975099764764309, 0.010250546038150787, 0.010750094428658485, 0.011249642819166183, 0.011749191209673882, 0.01224873960018158, 0.012748287990689278, 0.013247836381196976, 0.013747384771704674, 0.014246933162212372, 0.01474648155272007, 0.015246029943227768, 0.015745578333735466, 0.016245126724243164]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 9.0, 13.0, 11.0, 15.0, 20.0, 21.0, 25.0, 40.0, 31.0, 34.0, 28.0, 35.0, 36.0, 54.0, 55.0, 44.0, 44.0, 38.0, 44.0, 42.0, 43.0, 35.0, 40.0, 30.0, 28.0, 32.0, 19.0, 15.0, 20.0, 9.0, 13.0, 12.0, 11.0, 12.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5, -14.076171875, -13.65234375, -13.228515625, -12.8046875, -12.380859375, -11.95703125, -11.533203125, -11.109375, -10.685546875, -10.26171875, -9.837890625, -9.4140625, -8.990234375, -8.56640625, -8.142578125, -7.71875, -7.294921875, -6.87109375, -6.447265625, -6.0234375, -5.599609375, -5.17578125, -4.751953125, -4.328125, -3.904296875, -3.48046875, -3.056640625, -2.6328125, -2.208984375, -1.78515625, -1.361328125, -0.9375, -0.513671875, -0.08984375, 0.333984375, 0.7578125, 1.181640625, 1.60546875, 2.029296875, 2.453125, 2.876953125, 3.30078125, 3.724609375, 4.1484375, 4.572265625, 4.99609375, 5.419921875, 5.84375, 6.267578125, 6.69140625, 7.115234375, 7.5390625, 7.962890625, 8.38671875, 8.810546875, 9.234375, 9.658203125, 10.08203125, 10.505859375, 10.9296875, 11.353515625, 11.77734375, 12.201171875, 12.625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 8.0, 12.0, 11.0, 15.0, 16.0, 28.0, 41.0, 54.0, 70.0, 106.0, 209.0, 316.0, 566.0, 1085.0, 2319.0, 5073.0, 12701.0, 36259.0, 129081.0, 522457.0, 246274.0, 58576.0, 19358.0, 7454.0, 3147.0, 1481.0, 746.0, 416.0, 219.0, 145.0, 78.0, 50.0, 37.0, 37.0, 35.0, 15.0, 17.0, 13.0, 7.0, 8.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5625, -8.3157958984375, -8.069091796875, -7.8223876953125, -7.57568359375, -7.3289794921875, -7.082275390625, -6.8355712890625, -6.5888671875, -6.3421630859375, -6.095458984375, -5.8487548828125, -5.60205078125, -5.3553466796875, -5.108642578125, -4.8619384765625, -4.615234375, -4.3685302734375, -4.121826171875, -3.8751220703125, -3.62841796875, -3.3817138671875, -3.135009765625, -2.8883056640625, -2.6416015625, -2.3948974609375, -2.148193359375, -1.9014892578125, -1.65478515625, -1.4080810546875, -1.161376953125, -0.9146728515625, -0.66796875, -0.4212646484375, -0.174560546875, 0.0721435546875, 0.31884765625, 0.5655517578125, 0.812255859375, 1.0589599609375, 1.3056640625, 1.5523681640625, 1.799072265625, 2.0457763671875, 2.29248046875, 2.5391845703125, 2.785888671875, 3.0325927734375, 3.279296875, 3.5260009765625, 3.772705078125, 4.0194091796875, 4.26611328125, 4.5128173828125, 4.759521484375, 5.0062255859375, 5.2529296875, 5.4996337890625, 5.746337890625, 5.9930419921875, 6.23974609375, 6.4864501953125, 6.733154296875, 6.9798583984375, 7.2265625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 6.0, 8.0, 13.0, 10.0, 10.0, 11.0, 18.0, 25.0, 27.0, 27.0, 33.0, 25.0, 44.0, 37.0, 48.0, 32.0, 37.0, 53.0, 150.0, 1888.0, 108.0, 40.0, 38.0, 31.0, 33.0, 43.0, 31.0, 28.0, 31.0, 29.0, 22.0, 16.0, 16.0, 13.0, 10.0, 9.0, 7.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.4375, -41.08642578125, -39.7353515625, -38.38427734375, -37.033203125, -35.68212890625, -34.3310546875, -32.97998046875, -31.62890625, -30.27783203125, -28.9267578125, -27.57568359375, -26.224609375, -24.87353515625, -23.5224609375, -22.17138671875, -20.8203125, -19.46923828125, -18.1181640625, -16.76708984375, -15.416015625, -14.06494140625, -12.7138671875, -11.36279296875, -10.01171875, -8.66064453125, -7.3095703125, -5.95849609375, -4.607421875, -3.25634765625, -1.9052734375, -0.55419921875, 0.796875, 2.14794921875, 3.4990234375, 4.85009765625, 6.201171875, 7.55224609375, 8.9033203125, 10.25439453125, 11.60546875, 12.95654296875, 14.3076171875, 15.65869140625, 17.009765625, 18.36083984375, 19.7119140625, 21.06298828125, 22.4140625, 23.76513671875, 25.1162109375, 26.46728515625, 27.818359375, 29.16943359375, 30.5205078125, 31.87158203125, 33.22265625, 34.57373046875, 35.9248046875, 37.27587890625, 38.626953125, 39.97802734375, 41.3291015625, 42.68017578125, 44.03125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 6.0, 10.0, 16.0, 18.0, 11.0, 25.0, 28.0, 37.0, 56.0, 58.0, 93.0, 111.0, 125.0, 186.0, 355.0, 794.0, 5153.0, 3109949.0, 25971.0, 1271.0, 417.0, 217.0, 199.0, 114.0, 98.0, 72.0, 61.0, 50.0, 37.0, 29.0, 29.0, 11.0, 10.0, 14.0, 10.0, 7.0, 8.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-89.5, -86.841796875, -84.18359375, -81.525390625, -78.8671875, -76.208984375, -73.55078125, -70.892578125, -68.234375, -65.576171875, -62.91796875, -60.259765625, -57.6015625, -54.943359375, -52.28515625, -49.626953125, -46.96875, -44.310546875, -41.65234375, -38.994140625, -36.3359375, -33.677734375, -31.01953125, -28.361328125, -25.703125, -23.044921875, -20.38671875, -17.728515625, -15.0703125, -12.412109375, -9.75390625, -7.095703125, -4.4375, -1.779296875, 0.87890625, 3.537109375, 6.1953125, 8.853515625, 11.51171875, 14.169921875, 16.828125, 19.486328125, 22.14453125, 24.802734375, 27.4609375, 30.119140625, 32.77734375, 35.435546875, 38.09375, 40.751953125, 43.41015625, 46.068359375, 48.7265625, 51.384765625, 54.04296875, 56.701171875, 59.359375, 62.017578125, 64.67578125, 67.333984375, 69.9921875, 72.650390625, 75.30859375, 77.966796875, 80.625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 535.0, 480.0], "bins": [-804.3517456054688, -791.5792236328125, -778.806640625, -766.0341186523438, -753.2615966796875, -740.489013671875, -727.7164916992188, -714.9439697265625, -702.1714477539062, -689.39892578125, -676.6263427734375, -663.8538208007812, -651.081298828125, -638.3087158203125, -625.5361938476562, -612.763671875, -599.9910888671875, -587.2185668945312, -574.4459838867188, -561.6734619140625, -548.9009399414062, -536.12841796875, -523.3558349609375, -510.58331298828125, -497.810791015625, -485.0382385253906, -472.2657165527344, -459.4931640625, -446.72064208984375, -433.9480895996094, -421.175537109375, -408.40301513671875, -395.6304626464844, -382.85791015625, -370.08538818359375, -357.3128356933594, -344.5403137207031, -331.76776123046875, -318.9952392578125, -306.2226867675781, -293.45013427734375, -280.6775817871094, -267.9050598144531, -255.13250732421875, -242.35997009277344, -229.58743286132812, -216.8148956298828, -204.0423583984375, -191.2698211669922, -178.49728393554688, -165.72474670410156, -152.95220947265625, -140.17965698242188, -127.40711975097656, -114.63458251953125, -101.8620376586914, -89.08950805664062, -76.31697082519531, -63.54442596435547, -50.771888732910156, -37.99934768676758, -25.226806640625, -12.454269409179688, 0.31827545166015625, 13.090814590454102]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 3.0, 3.0, 9.0, 7.0, 8.0, 10.0, 8.0, 12.0, 8.0, 19.0, 12.0, 23.0, 13.0, 25.0, 29.0, 31.0, 34.0, 39.0, 38.0, 30.0, 38.0, 37.0, 37.0, 52.0, 49.0, 47.0, 31.0, 45.0, 39.0, 32.0, 27.0, 32.0, 26.0, 23.0, 19.0, 18.0, 12.0, 15.0, 12.0, 11.0, 13.0, 6.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-108.20925903320312, -104.6911392211914, -101.17302703857422, -97.6549072265625, -94.13679504394531, -90.6186752319336, -87.10055541992188, -83.58244323730469, -80.0643310546875, -76.54621124267578, -73.0280990600586, -69.50997924804688, -65.99186706542969, -62.47374725341797, -58.955631256103516, -55.43751525878906, -51.919395446777344, -48.40127944946289, -44.88316345214844, -41.36504364013672, -37.84693145751953, -34.32881164550781, -30.81069564819336, -27.292579650878906, -23.774463653564453, -20.25634765625, -16.738231658935547, -13.220113754272461, -9.701997756958008, -6.183881759643555, -2.6657638549804688, 0.8523521423339844, 4.370460510253906, 7.888576984405518, 11.406693458557129, 14.924810409545898, 18.44292640686035, 21.961042404174805, 25.47916030883789, 28.997276306152344, 32.5153923034668, 36.03350830078125, 39.5516242980957, 43.069740295410156, 46.587860107421875, 50.10597229003906, 53.62409210205078, 57.142208099365234, 60.66032409667969, 64.1784439086914, 67.6965560913086, 71.21467590332031, 74.7327880859375, 78.25090789794922, 81.76902770996094, 85.28713989257812, 88.80525207519531, 92.32337188720703, 95.84148406982422, 99.35960388183594, 102.87771606445312, 106.39583587646484, 109.91395568847656, 113.43206787109375, 116.95018768310547]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 10.0, 10.0, 15.0, 8.0, 19.0, 22.0, 25.0, 39.0, 27.0, 43.0, 31.0, 30.0, 38.0, 42.0, 54.0, 52.0, 48.0, 36.0, 44.0, 43.0, 37.0, 46.0, 41.0, 28.0, 23.0, 26.0, 25.0, 17.0, 20.0, 9.0, 13.0, 16.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.578125, -14.15380859375, -13.7294921875, -13.30517578125, -12.880859375, -12.45654296875, -12.0322265625, -11.60791015625, -11.18359375, -10.75927734375, -10.3349609375, -9.91064453125, -9.486328125, -9.06201171875, -8.6376953125, -8.21337890625, -7.7890625, -7.36474609375, -6.9404296875, -6.51611328125, -6.091796875, -5.66748046875, -5.2431640625, -4.81884765625, -4.39453125, -3.97021484375, -3.5458984375, -3.12158203125, -2.697265625, -2.27294921875, -1.8486328125, -1.42431640625, -1.0, -0.57568359375, -0.1513671875, 0.27294921875, 0.697265625, 1.12158203125, 1.5458984375, 1.97021484375, 2.39453125, 2.81884765625, 3.2431640625, 3.66748046875, 4.091796875, 4.51611328125, 4.9404296875, 5.36474609375, 5.7890625, 6.21337890625, 6.6376953125, 7.06201171875, 7.486328125, 7.91064453125, 8.3349609375, 8.75927734375, 9.18359375, 9.60791015625, 10.0322265625, 10.45654296875, 10.880859375, 11.30517578125, 11.7294921875, 12.15380859375, 12.578125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 12.0, 15.0, 12.0, 16.0, 19.0, 27.0, 48.0, 65.0, 102.0, 134.0, 239.0, 396.0, 758.0, 1507.0, 3345.0, 8351.0, 38971.0, 3227112.0, 881874.0, 19818.0, 6058.0, 2613.0, 1215.0, 631.0, 332.0, 196.0, 115.0, 77.0, 52.0, 41.0, 27.0, 13.0, 11.0, 13.0, 17.0, 8.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.375, -58.5908203125, -56.806640625, -55.0224609375, -53.23828125, -51.4541015625, -49.669921875, -47.8857421875, -46.1015625, -44.3173828125, -42.533203125, -40.7490234375, -38.96484375, -37.1806640625, -35.396484375, -33.6123046875, -31.828125, -30.0439453125, -28.259765625, -26.4755859375, -24.69140625, -22.9072265625, -21.123046875, -19.3388671875, -17.5546875, -15.7705078125, -13.986328125, -12.2021484375, -10.41796875, -8.6337890625, -6.849609375, -5.0654296875, -3.28125, -1.4970703125, 0.287109375, 2.0712890625, 3.85546875, 5.6396484375, 7.423828125, 9.2080078125, 10.9921875, 12.7763671875, 14.560546875, 16.3447265625, 18.12890625, 19.9130859375, 21.697265625, 23.4814453125, 25.265625, 27.0498046875, 28.833984375, 30.6181640625, 32.40234375, 34.1865234375, 35.970703125, 37.7548828125, 39.5390625, 41.3232421875, 43.107421875, 44.8916015625, 46.67578125, 48.4599609375, 50.244140625, 52.0283203125, 53.8125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 4.0, 5.0, 9.0, 7.0, 9.0, 7.0, 12.0, 11.0, 17.0, 17.0, 25.0, 28.0, 49.0, 79.0, 178.0, 327.0, 641.0, 879.0, 764.0, 422.0, 222.0, 129.0, 69.0, 26.0, 21.0, 18.0, 14.0, 14.0, 12.0, 5.0, 5.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.40625, -34.38671875, -33.3671875, -32.34765625, -31.328125, -30.30859375, -29.2890625, -28.26953125, -27.25, -26.23046875, -25.2109375, -24.19140625, -23.171875, -22.15234375, -21.1328125, -20.11328125, -19.09375, -18.07421875, -17.0546875, -16.03515625, -15.015625, -13.99609375, -12.9765625, -11.95703125, -10.9375, -9.91796875, -8.8984375, -7.87890625, -6.859375, -5.83984375, -4.8203125, -3.80078125, -2.78125, -1.76171875, -0.7421875, 0.27734375, 1.296875, 2.31640625, 3.3359375, 4.35546875, 5.375, 6.39453125, 7.4140625, 8.43359375, 9.453125, 10.47265625, 11.4921875, 12.51171875, 13.53125, 14.55078125, 15.5703125, 16.58984375, 17.609375, 18.62890625, 19.6484375, 20.66796875, 21.6875, 22.70703125, 23.7265625, 24.74609375, 25.765625, 26.78515625, 27.8046875, 28.82421875, 29.84375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 9.0, 7.0, 7.0, 23.0, 35.0, 75.0, 149.0, 247.0, 449.0, 839.0, 1760.0, 3441.0, 7470.0, 17801.0, 57515.0, 1956658.0, 2057528.0, 57897.0, 17732.0, 7434.0, 3519.0, 1732.0, 886.0, 478.0, 250.0, 129.0, 66.0, 57.0, 22.0, 19.0, 5.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.65625, -59.45458984375, -57.2529296875, -55.05126953125, -52.849609375, -50.64794921875, -48.4462890625, -46.24462890625, -44.04296875, -41.84130859375, -39.6396484375, -37.43798828125, -35.236328125, -33.03466796875, -30.8330078125, -28.63134765625, -26.4296875, -24.22802734375, -22.0263671875, -19.82470703125, -17.623046875, -15.42138671875, -13.2197265625, -11.01806640625, -8.81640625, -6.61474609375, -4.4130859375, -2.21142578125, -0.009765625, 2.19189453125, 4.3935546875, 6.59521484375, 8.796875, 10.99853515625, 13.2001953125, 15.40185546875, 17.603515625, 19.80517578125, 22.0068359375, 24.20849609375, 26.41015625, 28.61181640625, 30.8134765625, 33.01513671875, 35.216796875, 37.41845703125, 39.6201171875, 41.82177734375, 44.0234375, 46.22509765625, 48.4267578125, 50.62841796875, 52.830078125, 55.03173828125, 57.2333984375, 59.43505859375, 61.63671875, 63.83837890625, 66.0400390625, 68.24169921875, 70.443359375, 72.64501953125, 74.8466796875, 77.04833984375, 79.25]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 6.0, 12.0, 17.0, 23.0, 51.0, 63.0, 101.0, 167.0, 157.0, 135.0, 75.0, 51.0, 37.0, 22.0, 14.0, 14.0, 10.0, 11.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.67414855957031, -104.3000717163086, -98.92598724365234, -93.55191040039062, -88.17782592773438, -82.80374908447266, -77.42967224121094, -72.05558776855469, -66.68151092529297, -61.307430267333984, -55.933349609375, -50.55927276611328, -45.1851921081543, -39.81111145019531, -34.437034606933594, -29.06295394897461, -23.688873291015625, -18.31479263305664, -12.940713882446289, -7.5666351318359375, -2.192554473876953, 3.1815261840820312, 8.55560302734375, 13.929683685302734, 19.30376434326172, 24.677845001220703, 30.051923751831055, 35.426002502441406, 40.80008316040039, 46.174163818359375, 51.548240661621094, 56.92232131958008, 62.296417236328125, 67.67049407958984, 73.0445785522461, 78.41865539550781, 83.79273986816406, 89.16681671142578, 94.5408935546875, 99.91497802734375, 105.28905487060547, 110.66313171386719, 116.03721618652344, 121.41129302978516, 126.78536987304688, 132.15945434570312, 137.53353881835938, 142.90760803222656, 148.2816925048828, 153.65577697753906, 159.02984619140625, 164.4039306640625, 169.77801513671875, 175.152099609375, 180.5261688232422, 185.90025329589844, 191.27432250976562, 196.64840698242188, 202.02247619628906, 207.3965606689453, 212.77064514160156, 218.14471435546875, 223.518798828125, 228.89288330078125, 234.2669677734375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 7.0, 8.0, 20.0, 21.0, 14.0, 21.0, 17.0, 11.0, 26.0, 28.0, 30.0, 30.0, 30.0, 42.0, 45.0, 39.0, 52.0, 43.0, 41.0, 33.0, 38.0, 35.0, 41.0, 32.0, 33.0, 33.0, 35.0, 24.0, 18.0, 16.0, 17.0, 20.0, 12.0, 13.0, 15.0, 13.0, 4.0, 9.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-88.70303344726562, -85.9404525756836, -83.17787170410156, -80.41529846191406, -77.65271759033203, -74.89013671875, -72.12755584716797, -69.36497497558594, -66.60240173339844, -63.839820861816406, -61.07724380493164, -58.31466293334961, -55.552085876464844, -52.78950500488281, -50.02692413330078, -47.26434326171875, -44.50176239013672, -41.73918151855469, -38.97660446166992, -36.21402359008789, -33.451446533203125, -30.688865661621094, -27.926284790039062, -25.163705825805664, -22.401126861572266, -19.638547897338867, -16.87596893310547, -14.113388061523438, -11.350809097290039, -8.58823013305664, -5.825649261474609, -3.063070297241211, -0.30049896240234375, 2.462080478668213, 5.2246599197387695, 7.987239837646484, 10.749818801879883, 13.512397766113281, 16.274978637695312, 19.03755760192871, 21.80013656616211, 24.562715530395508, 27.325294494628906, 30.087875366210938, 32.85045623779297, 35.613033294677734, 38.375614166259766, 41.13819122314453, 43.90077209472656, 46.663352966308594, 49.42593002319336, 52.18851089477539, 54.951087951660156, 57.71366882324219, 60.47624969482422, 63.23883056640625, 66.00140380859375, 68.76398468017578, 71.52656555175781, 74.28913879394531, 77.05171966552734, 79.81430053710938, 82.5768814086914, 85.33946228027344, 88.10204315185547]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 14.0, 8.0, 18.0, 18.0, 11.0, 23.0, 21.0, 31.0, 37.0, 44.0, 26.0, 40.0, 31.0, 40.0, 58.0, 47.0, 47.0, 40.0, 44.0, 36.0, 31.0, 39.0, 36.0, 28.0, 27.0, 28.0, 27.0, 25.0, 19.0, 13.0, 15.0, 8.0, 12.0, 6.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.9375, -13.5235595703125, -13.109619140625, -12.6956787109375, -12.28173828125, -11.8677978515625, -11.453857421875, -11.0399169921875, -10.6259765625, -10.2120361328125, -9.798095703125, -9.3841552734375, -8.97021484375, -8.5562744140625, -8.142333984375, -7.7283935546875, -7.314453125, -6.9005126953125, -6.486572265625, -6.0726318359375, -5.65869140625, -5.2447509765625, -4.830810546875, -4.4168701171875, -4.0029296875, -3.5889892578125, -3.175048828125, -2.7611083984375, -2.34716796875, -1.9332275390625, -1.519287109375, -1.1053466796875, -0.69140625, -0.2774658203125, 0.136474609375, 0.5504150390625, 0.96435546875, 1.3782958984375, 1.792236328125, 2.2061767578125, 2.6201171875, 3.0340576171875, 3.447998046875, 3.8619384765625, 4.27587890625, 4.6898193359375, 5.103759765625, 5.5177001953125, 5.931640625, 6.3455810546875, 6.759521484375, 7.1734619140625, 7.58740234375, 8.0013427734375, 8.415283203125, 8.8292236328125, 9.2431640625, 9.6571044921875, 10.071044921875, 10.4849853515625, 10.89892578125, 11.3128662109375, 11.726806640625, 12.1407470703125, 12.5546875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 5.0, 6.0, 16.0, 18.0, 27.0, 46.0, 68.0, 106.0, 169.0, 265.0, 363.0, 569.0, 782.0, 1159.0, 1752.0, 2398.0, 3775.0, 5636.0, 8416.0, 13411.0, 20949.0, 33847.0, 56956.0, 101411.0, 190447.0, 249411.0, 150500.0, 80700.0, 46652.0, 27766.0, 17628.0, 11219.0, 7398.0, 4822.0, 3235.0, 2176.0, 1470.0, 953.0, 671.0, 410.0, 270.0, 230.0, 150.0, 93.0, 57.0, 46.0, 48.0, 28.0, 12.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.44549560546875, -1.4007568359375, -1.35601806640625, -1.311279296875, -1.26654052734375, -1.2218017578125, -1.17706298828125, -1.13232421875, -1.08758544921875, -1.0428466796875, -0.99810791015625, -0.953369140625, -0.90863037109375, -0.8638916015625, -0.81915283203125, -0.7744140625, -0.72967529296875, -0.6849365234375, -0.64019775390625, -0.595458984375, -0.55072021484375, -0.5059814453125, -0.46124267578125, -0.41650390625, -0.37176513671875, -0.3270263671875, -0.28228759765625, -0.237548828125, -0.19281005859375, -0.1480712890625, -0.10333251953125, -0.05859375, -0.01385498046875, 0.0308837890625, 0.07562255859375, 0.120361328125, 0.16510009765625, 0.2098388671875, 0.25457763671875, 0.29931640625, 0.34405517578125, 0.3887939453125, 0.43353271484375, 0.478271484375, 0.52301025390625, 0.5677490234375, 0.61248779296875, 0.6572265625, 0.70196533203125, 0.7467041015625, 0.79144287109375, 0.836181640625, 0.88092041015625, 0.9256591796875, 0.97039794921875, 1.01513671875, 1.05987548828125, 1.1046142578125, 1.14935302734375, 1.194091796875, 1.23883056640625, 1.2835693359375, 1.32830810546875, 1.373046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 15.0, 8.0, 6.0, 11.0, 9.0, 19.0, 16.0, 15.0, 18.0, 37.0, 34.0, 42.0, 40.0, 46.0, 39.0, 46.0, 46.0, 1059.0, 32.0, 55.0, 34.0, 38.0, 36.0, 42.0, 37.0, 30.0, 37.0, 30.0, 24.0, 23.0, 15.0, 21.0, 13.0, 10.0, 12.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -7.994384765625, -7.70751953125, -7.420654296875, -7.1337890625, -6.846923828125, -6.56005859375, -6.273193359375, -5.986328125, -5.699462890625, -5.41259765625, -5.125732421875, -4.8388671875, -4.552001953125, -4.26513671875, -3.978271484375, -3.69140625, -3.404541015625, -3.11767578125, -2.830810546875, -2.5439453125, -2.257080078125, -1.97021484375, -1.683349609375, -1.396484375, -1.109619140625, -0.82275390625, -0.535888671875, -0.2490234375, 0.037841796875, 0.32470703125, 0.611572265625, 0.8984375, 1.185302734375, 1.47216796875, 1.759033203125, 2.0458984375, 2.332763671875, 2.61962890625, 2.906494140625, 3.193359375, 3.480224609375, 3.76708984375, 4.053955078125, 4.3408203125, 4.627685546875, 4.91455078125, 5.201416015625, 5.48828125, 5.775146484375, 6.06201171875, 6.348876953125, 6.6357421875, 6.922607421875, 7.20947265625, 7.496337890625, 7.783203125, 8.070068359375, 8.35693359375, 8.643798828125, 8.9306640625, 9.217529296875, 9.50439453125, 9.791259765625, 10.078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 10.0, 6.0, 11.0, 26.0, 23.0, 34.0, 51.0, 95.0, 141.0, 208.0, 353.0, 531.0, 779.0, 1158.0, 1703.0, 2637.0, 4079.0, 6391.0, 9630.0, 15220.0, 23818.0, 39471.0, 67695.0, 122264.0, 325804.0, 1158663.0, 131262.0, 72534.0, 42149.0, 25421.0, 15888.0, 10039.0, 6544.0, 4345.0, 2797.0, 1869.0, 1224.0, 773.0, 498.0, 325.0, 210.0, 146.0, 101.0, 66.0, 51.0, 34.0, 23.0, 12.0, 16.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.861328125, -0.8352737426757812, -0.8092193603515625, -0.7831649780273438, -0.757110595703125, -0.7310562133789062, -0.7050018310546875, -0.6789474487304688, -0.65289306640625, -0.6268386840820312, -0.6007843017578125, -0.5747299194335938, -0.548675537109375, -0.5226211547851562, -0.4965667724609375, -0.47051239013671875, -0.4444580078125, -0.41840362548828125, -0.3923492431640625, -0.36629486083984375, -0.340240478515625, -0.31418609619140625, -0.2881317138671875, -0.26207733154296875, -0.23602294921875, -0.20996856689453125, -0.1839141845703125, -0.15785980224609375, -0.131805419921875, -0.10575103759765625, -0.0796966552734375, -0.05364227294921875, -0.027587890625, -0.00153350830078125, 0.0245208740234375, 0.05057525634765625, 0.076629638671875, 0.10268402099609375, 0.1287384033203125, 0.15479278564453125, 0.18084716796875, 0.20690155029296875, 0.2329559326171875, 0.25901031494140625, 0.285064697265625, 0.31111907958984375, 0.3371734619140625, 0.36322784423828125, 0.3892822265625, 0.41533660888671875, 0.4413909912109375, 0.46744537353515625, 0.493499755859375, 0.5195541381835938, 0.5456085205078125, 0.5716629028320312, 0.59771728515625, 0.6237716674804688, 0.6498260498046875, 0.6758804321289062, 0.701934814453125, 0.7279891967773438, 0.7540435791015625, 0.7800979614257812, 0.80615234375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 10.0, 9.0, 10.0, 14.0, 15.0, 19.0, 18.0, 21.0, 22.0, 52.0, 74.0, 77.0, 117.0, 121.0, 88.0, 55.0, 52.0, 30.0, 35.0, 22.0, 18.0, 16.0, 7.0, 11.0, 10.0, 2.0, 5.0, 4.0, 8.0, 5.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0207366943359375, -0.02004241943359375, -0.01934814453125, -0.01865386962890625, -0.0179595947265625, -0.01726531982421875, -0.016571044921875, -0.01587677001953125, -0.0151824951171875, -0.01448822021484375, -0.0137939453125, -0.01309967041015625, -0.0124053955078125, -0.01171112060546875, -0.011016845703125, -0.01032257080078125, -0.0096282958984375, -0.00893402099609375, -0.00823974609375, -0.00754547119140625, -0.0068511962890625, -0.00615692138671875, -0.005462646484375, -0.00476837158203125, -0.0040740966796875, -0.00337982177734375, -0.002685546875, -0.00199127197265625, -0.0012969970703125, -0.00060272216796875, 9.1552734375e-05, 0.00078582763671875, 0.0014801025390625, 0.00217437744140625, 0.00286865234375, 0.00356292724609375, 0.0042572021484375, 0.00495147705078125, 0.005645751953125, 0.00634002685546875, 0.0070343017578125, 0.00772857666015625, 0.0084228515625, 0.00911712646484375, 0.0098114013671875, 0.01050567626953125, 0.011199951171875, 0.01189422607421875, 0.0125885009765625, 0.01328277587890625, 0.01397705078125, 0.01467132568359375, 0.0153656005859375, 0.01605987548828125, 0.016754150390625, 0.01744842529296875, 0.0181427001953125, 0.01883697509765625, 0.01953125, 0.02022552490234375, 0.0209197998046875, 0.02161407470703125, 0.022308349609375, 0.02300262451171875, 0.0236968994140625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 4.0, 7.0, 8.0, 10.0, 11.0, 7.0, 19.0, 22.0, 15.0, 21.0, 24.0, 36.0, 45.0, 50.0, 88.0, 142.0, 218.0, 466.0, 1381.0, 7823.0, 170629.0, 842964.0, 20502.0, 2552.0, 650.0, 236.0, 162.0, 84.0, 67.0, 45.0, 45.0, 37.0, 30.0, 33.0, 26.0, 22.0, 12.0, 12.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.416259765625, -0.4040870666503906, -0.39191436767578125, -0.3797416687011719, -0.3675689697265625, -0.3553962707519531, -0.34322357177734375, -0.3310508728027344, -0.318878173828125, -0.3067054748535156, -0.29453277587890625, -0.2823600769042969, -0.2701873779296875, -0.2580146789550781, -0.24584197998046875, -0.23366928100585938, -0.22149658203125, -0.20932388305664062, -0.19715118408203125, -0.18497848510742188, -0.1728057861328125, -0.16063308715820312, -0.14846038818359375, -0.13628768920898438, -0.124114990234375, -0.11194229125976562, -0.09976959228515625, -0.08759689331054688, -0.0754241943359375, -0.06325149536132812, -0.05107879638671875, -0.038906097412109375, -0.0267333984375, -0.014560699462890625, -0.00238800048828125, 0.009784698486328125, 0.0219573974609375, 0.034130096435546875, 0.04630279541015625, 0.058475494384765625, 0.070648193359375, 0.08282089233398438, 0.09499359130859375, 0.10716629028320312, 0.1193389892578125, 0.13151168823242188, 0.14368438720703125, 0.15585708618164062, 0.16802978515625, 0.18020248413085938, 0.19237518310546875, 0.20454788208007812, 0.2167205810546875, 0.22889328002929688, 0.24106597900390625, 0.2532386779785156, 0.265411376953125, 0.2775840759277344, 0.28975677490234375, 0.3019294738769531, 0.3141021728515625, 0.3262748718261719, 0.33844757080078125, 0.3506202697753906, 0.36279296875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 16.0, 56.0, 218.0, 495.0, 120.0, 57.0, 18.0, 12.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10337348282337189, -0.09560608118772507, -0.08783868700265884, -0.08007128536701202, -0.0723038911819458, -0.06453648954629898, -0.05676908791065216, -0.04900169000029564, -0.04123429208993912, -0.033466894179582596, -0.025699494406580925, -0.017932094633579254, -0.010164696723222733, -0.002397298812866211, 0.005370102822780609, 0.01313750073313713, 0.020904898643493652, 0.028672296553850174, 0.036439694464206696, 0.044207096099853516, 0.05197449401021004, 0.05974189192056656, 0.06750929355621338, 0.0752766877412796, 0.08304408937692642, 0.09081149101257324, 0.09857888519763947, 0.10634628683328629, 0.1141136884689331, 0.12188108265399933, 0.12964847683906555, 0.13741588592529297, 0.14518329501152039, 0.1529506891965866, 0.16071809828281403, 0.16848549246788025, 0.17625288665294647, 0.1840202808380127, 0.1917876899242401, 0.19955508410930634, 0.20732247829437256, 0.21508987247943878, 0.2228572815656662, 0.23062467575073242, 0.23839206993579865, 0.24615946412086487, 0.2539268732070923, 0.2616942822933197, 0.2694616913795471, 0.27722910046577454, 0.28499647974967957, 0.292763888835907, 0.3005312979221344, 0.30829867720603943, 0.31606608629226685, 0.32383349537849426, 0.3316008746623993, 0.3393682837486267, 0.34713566303253174, 0.35490307211875916, 0.3626704812049866, 0.3704378604888916, 0.378205269575119, 0.38597267866134644, 0.39374005794525146]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 6.0, 4.0, 4.0, 6.0, 16.0, 9.0, 10.0, 12.0, 17.0, 12.0, 22.0, 23.0, 26.0, 20.0, 22.0, 33.0, 35.0, 26.0, 38.0, 30.0, 44.0, 32.0, 30.0, 35.0, 49.0, 26.0, 36.0, 35.0, 43.0, 32.0, 15.0, 31.0, 39.0, 23.0, 20.0, 22.0, 22.0, 16.0, 17.0, 9.0, 10.0, 15.0, 9.0, 3.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.02029484510421753, -0.01967526413500309, -0.01905568316578865, -0.01843610219657421, -0.01781652122735977, -0.017196940258145332, -0.016577359288930893, -0.015957778319716454, -0.015338197350502014, -0.014718616381287575, -0.014099035412073135, -0.013479454442858696, -0.012859873473644257, -0.012240292504429817, -0.011620711535215378, -0.011001130566000938, -0.010381549596786499, -0.00976196862757206, -0.00914238765835762, -0.00852280668914318, -0.007903225719928741, -0.007283644750714302, -0.006664063781499863, -0.006044482812285423, -0.005424901843070984, -0.0048053208738565445, -0.004185739904642105, -0.0035661589354276657, -0.0029465779662132263, -0.002326996996998787, -0.0017074160277843475, -0.0010878350585699081, -0.00046825408935546875, 0.00015132687985897064, 0.00077090784907341, 0.0013904888182878494, 0.002010069787502289, 0.002629650756716728, 0.0032492317259311676, 0.003868812695145607, 0.004488393664360046, 0.005107974633574486, 0.005727555602788925, 0.0063471365720033646, 0.006966717541217804, 0.007586298510432243, 0.008205879479646683, 0.008825460448861122, 0.009445041418075562, 0.010064622387290001, 0.01068420335650444, 0.01130378432571888, 0.011923365294933319, 0.012542946264147758, 0.013162527233362198, 0.013782108202576637, 0.014401689171791077, 0.015021270141005516, 0.015640851110219955, 0.016260432079434395, 0.016880013048648834, 0.017499594017863274, 0.018119174987077713, 0.018738755956292152, 0.019358336925506592]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 14.0, 9.0, 17.0, 18.0, 12.0, 22.0, 22.0, 30.0, 37.0, 44.0, 27.0, 39.0, 33.0, 38.0, 59.0, 46.0, 47.0, 41.0, 45.0, 34.0, 32.0, 39.0, 35.0, 28.0, 27.0, 28.0, 27.0, 25.0, 19.0, 13.0, 15.0, 8.0, 12.0, 6.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.9296875, -13.515869140625, -13.10205078125, -12.688232421875, -12.2744140625, -11.860595703125, -11.44677734375, -11.032958984375, -10.619140625, -10.205322265625, -9.79150390625, -9.377685546875, -8.9638671875, -8.550048828125, -8.13623046875, -7.722412109375, -7.30859375, -6.894775390625, -6.48095703125, -6.067138671875, -5.6533203125, -5.239501953125, -4.82568359375, -4.411865234375, -3.998046875, -3.584228515625, -3.17041015625, -2.756591796875, -2.3427734375, -1.928955078125, -1.51513671875, -1.101318359375, -0.6875, -0.273681640625, 0.14013671875, 0.553955078125, 0.9677734375, 1.381591796875, 1.79541015625, 2.209228515625, 2.623046875, 3.036865234375, 3.45068359375, 3.864501953125, 4.2783203125, 4.692138671875, 5.10595703125, 5.519775390625, 5.93359375, 6.347412109375, 6.76123046875, 7.175048828125, 7.5888671875, 8.002685546875, 8.41650390625, 8.830322265625, 9.244140625, 9.657958984375, 10.07177734375, 10.485595703125, 10.8994140625, 11.313232421875, 11.72705078125, 12.140869140625, 12.5546875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 11.0, 25.0, 40.0, 59.0, 77.0, 174.0, 306.0, 432.0, 816.0, 1622.0, 3248.0, 7765.0, 21845.0, 71718.0, 294335.0, 486593.0, 108760.0, 31273.0, 10740.0, 4227.0, 2037.0, 1044.0, 520.0, 346.0, 194.0, 102.0, 67.0, 35.0, 32.0, 20.0, 13.0, 15.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.66192626953125, -6.4410400390625, -6.22015380859375, -5.999267578125, -5.77838134765625, -5.5574951171875, -5.33660888671875, -5.11572265625, -4.89483642578125, -4.6739501953125, -4.45306396484375, -4.232177734375, -4.01129150390625, -3.7904052734375, -3.56951904296875, -3.3486328125, -3.12774658203125, -2.9068603515625, -2.68597412109375, -2.465087890625, -2.24420166015625, -2.0233154296875, -1.80242919921875, -1.58154296875, -1.36065673828125, -1.1397705078125, -0.91888427734375, -0.697998046875, -0.47711181640625, -0.2562255859375, -0.03533935546875, 0.185546875, 0.40643310546875, 0.6273193359375, 0.84820556640625, 1.069091796875, 1.28997802734375, 1.5108642578125, 1.73175048828125, 1.95263671875, 2.17352294921875, 2.3944091796875, 2.61529541015625, 2.836181640625, 3.05706787109375, 3.2779541015625, 3.49884033203125, 3.7197265625, 3.94061279296875, 4.1614990234375, 4.38238525390625, 4.603271484375, 4.82415771484375, 5.0450439453125, 5.26593017578125, 5.48681640625, 5.70770263671875, 5.9285888671875, 6.14947509765625, 6.370361328125, 6.59124755859375, 6.8121337890625, 7.03302001953125, 7.25390625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 6.0, 10.0, 12.0, 13.0, 21.0, 20.0, 25.0, 16.0, 25.0, 30.0, 32.0, 36.0, 34.0, 33.0, 41.0, 48.0, 61.0, 1650.0, 431.0, 65.0, 36.0, 33.0, 40.0, 30.0, 35.0, 33.0, 24.0, 34.0, 23.0, 25.0, 12.0, 20.0, 16.0, 14.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.84375, -38.5146484375, -37.185546875, -35.8564453125, -34.52734375, -33.1982421875, -31.869140625, -30.5400390625, -29.2109375, -27.8818359375, -26.552734375, -25.2236328125, -23.89453125, -22.5654296875, -21.236328125, -19.9072265625, -18.578125, -17.2490234375, -15.919921875, -14.5908203125, -13.26171875, -11.9326171875, -10.603515625, -9.2744140625, -7.9453125, -6.6162109375, -5.287109375, -3.9580078125, -2.62890625, -1.2998046875, 0.029296875, 1.3583984375, 2.6875, 4.0166015625, 5.345703125, 6.6748046875, 8.00390625, 9.3330078125, 10.662109375, 11.9912109375, 13.3203125, 14.6494140625, 15.978515625, 17.3076171875, 18.63671875, 19.9658203125, 21.294921875, 22.6240234375, 23.953125, 25.2822265625, 26.611328125, 27.9404296875, 29.26953125, 30.5986328125, 31.927734375, 33.2568359375, 34.5859375, 35.9150390625, 37.244140625, 38.5732421875, 39.90234375, 41.2314453125, 42.560546875, 43.8896484375, 45.21875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 8.0, 10.0, 9.0, 16.0, 14.0, 27.0, 17.0, 30.0, 27.0, 61.0, 70.0, 78.0, 108.0, 136.0, 191.0, 270.0, 492.0, 1531.0, 64718.0, 3071773.0, 4114.0, 759.0, 355.0, 187.0, 143.0, 119.0, 104.0, 70.0, 60.0, 37.0, 29.0, 37.0, 20.0, 15.0, 13.0, 16.0, 7.0, 7.0, 10.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-80.75, -78.390625, -76.03125, -73.671875, -71.3125, -68.953125, -66.59375, -64.234375, -61.875, -59.515625, -57.15625, -54.796875, -52.4375, -50.078125, -47.71875, -45.359375, -43.0, -40.640625, -38.28125, -35.921875, -33.5625, -31.203125, -28.84375, -26.484375, -24.125, -21.765625, -19.40625, -17.046875, -14.6875, -12.328125, -9.96875, -7.609375, -5.25, -2.890625, -0.53125, 1.828125, 4.1875, 6.546875, 8.90625, 11.265625, 13.625, 15.984375, 18.34375, 20.703125, 23.0625, 25.421875, 27.78125, 30.140625, 32.5, 34.859375, 37.21875, 39.578125, 41.9375, 44.296875, 46.65625, 49.015625, 51.375, 53.734375, 56.09375, 58.453125, 60.8125, 63.171875, 65.53125, 67.890625, 70.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 12.0, 24.0, 103.0, 255.0, 284.0, 207.0, 88.0, 30.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.617923736572266, -20.640039443969727, -18.662155151367188, -16.684268951416016, -14.706384658813477, -12.728500366210938, -10.750615119934082, -8.772729873657227, -6.7948455810546875, -4.81696081161499, -2.839076042175293, -0.8611912727355957, 1.1166934967041016, 3.0945777893066406, 5.072463035583496, 7.050348281860352, 9.02823257446289, 11.00611686706543, 12.984002113342285, 14.96188735961914, 16.93977165222168, 18.91765594482422, 20.89554214477539, 22.87342643737793, 24.85131072998047, 26.829195022583008, 28.807079315185547, 30.78496551513672, 32.762847900390625, 34.7407341003418, 36.71862030029297, 38.696502685546875, 40.67439270019531, 42.652278900146484, 44.63016128540039, 46.60804748535156, 48.58592987060547, 50.56381607055664, 52.54170227050781, 54.51958465576172, 56.49747085571289, 58.47535705566406, 60.45323944091797, 62.43112564086914, 64.40901184082031, 66.38689422607422, 68.36477661132812, 70.34266662597656, 72.32054901123047, 74.29843139648438, 76.27632141113281, 78.25420379638672, 80.23208618164062, 82.20997619628906, 84.18785858154297, 86.16574096679688, 88.14363098144531, 90.12151336669922, 92.09940338134766, 94.07728576660156, 96.05516815185547, 98.03305053710938, 100.01094055175781, 101.98882293701172, 103.96670532226562]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 1.0, 10.0, 5.0, 8.0, 6.0, 13.0, 15.0, 10.0, 22.0, 29.0, 16.0, 29.0, 24.0, 27.0, 34.0, 41.0, 44.0, 33.0, 38.0, 45.0, 49.0, 37.0, 43.0, 39.0, 42.0, 25.0, 36.0, 31.0, 28.0, 33.0, 27.0, 21.0, 32.0, 16.0, 18.0, 17.0, 8.0, 11.0, 12.0, 6.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-128.55751037597656, -124.38248443603516, -120.20745086669922, -116.03242492675781, -111.85739135742188, -107.68236541748047, -103.50733947753906, -99.33230590820312, -95.15727996826172, -90.98225402832031, -86.80722045898438, -82.63219451904297, -78.45716857910156, -74.28213500976562, -70.10710906982422, -65.93208312988281, -61.757049560546875, -57.5820198059082, -53.40699005126953, -49.231964111328125, -45.05693435668945, -40.88190460205078, -36.706878662109375, -32.5318489074707, -28.35681915283203, -24.18178939819336, -20.00676155090332, -15.831732749938965, -11.65670394897461, -7.4816741943359375, -3.3066463470458984, 0.8683815002441406, 5.043426513671875, 9.21845531463623, 13.393484115600586, 17.568511962890625, 21.743541717529297, 25.91857147216797, 30.093599319458008, 34.26862716674805, 38.44365692138672, 42.61868667602539, 46.79371643066406, 50.96874237060547, 55.14377212524414, 59.31880187988281, 63.49382781982422, 67.66885375976562, 71.84388732910156, 76.01891326904297, 80.1939468383789, 84.36897277832031, 88.54400634765625, 92.71903228759766, 96.89405822753906, 101.069091796875, 105.2441177368164, 109.41914367675781, 113.59417724609375, 117.76920318603516, 121.94422912597656, 126.1192626953125, 130.29429626464844, 134.4693145751953, 138.64434814453125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 5.0, 5.0, 7.0, 9.0, 14.0, 13.0, 20.0, 15.0, 23.0, 28.0, 26.0, 35.0, 47.0, 25.0, 40.0, 33.0, 46.0, 59.0, 51.0, 34.0, 49.0, 35.0, 34.0, 34.0, 39.0, 38.0, 23.0, 32.0, 26.0, 28.0, 23.0, 15.0, 12.0, 11.0, 12.0, 8.0, 10.0, 7.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.0546875, -13.6337890625, -13.212890625, -12.7919921875, -12.37109375, -11.9501953125, -11.529296875, -11.1083984375, -10.6875, -10.2666015625, -9.845703125, -9.4248046875, -9.00390625, -8.5830078125, -8.162109375, -7.7412109375, -7.3203125, -6.8994140625, -6.478515625, -6.0576171875, -5.63671875, -5.2158203125, -4.794921875, -4.3740234375, -3.953125, -3.5322265625, -3.111328125, -2.6904296875, -2.26953125, -1.8486328125, -1.427734375, -1.0068359375, -0.5859375, -0.1650390625, 0.255859375, 0.6767578125, 1.09765625, 1.5185546875, 1.939453125, 2.3603515625, 2.78125, 3.2021484375, 3.623046875, 4.0439453125, 4.46484375, 4.8857421875, 5.306640625, 5.7275390625, 6.1484375, 6.5693359375, 6.990234375, 7.4111328125, 7.83203125, 8.2529296875, 8.673828125, 9.0947265625, 9.515625, 9.9365234375, 10.357421875, 10.7783203125, 11.19921875, 11.6201171875, 12.041015625, 12.4619140625, 12.8828125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 8.0, 12.0, 15.0, 22.0, 29.0, 34.0, 45.0, 80.0, 118.0, 161.0, 236.0, 417.0, 830.0, 1586.0, 3121.0, 7385.0, 24870.0, 2289261.0, 1828677.0, 23115.0, 7147.0, 3138.0, 1679.0, 930.0, 502.0, 263.0, 156.0, 128.0, 87.0, 66.0, 38.0, 28.0, 19.0, 12.0, 20.0, 12.0, 11.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.125, -64.234375, -62.34375, -60.453125, -58.5625, -56.671875, -54.78125, -52.890625, -51.0, -49.109375, -47.21875, -45.328125, -43.4375, -41.546875, -39.65625, -37.765625, -35.875, -33.984375, -32.09375, -30.203125, -28.3125, -26.421875, -24.53125, -22.640625, -20.75, -18.859375, -16.96875, -15.078125, -13.1875, -11.296875, -9.40625, -7.515625, -5.625, -3.734375, -1.84375, 0.046875, 1.9375, 3.828125, 5.71875, 7.609375, 9.5, 11.390625, 13.28125, 15.171875, 17.0625, 18.953125, 20.84375, 22.734375, 24.625, 26.515625, 28.40625, 30.296875, 32.1875, 34.078125, 35.96875, 37.859375, 39.75, 41.640625, 43.53125, 45.421875, 47.3125, 49.203125, 51.09375, 52.984375, 54.875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 12.0, 7.0, 13.0, 18.0, 12.0, 33.0, 44.0, 64.0, 118.0, 292.0, 626.0, 1064.0, 865.0, 422.0, 202.0, 90.0, 49.0, 36.0, 21.0, 14.0, 12.0, 7.0, 7.0, 9.0, 3.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -36.92578125, -35.7265625, -34.52734375, -33.328125, -32.12890625, -30.9296875, -29.73046875, -28.53125, -27.33203125, -26.1328125, -24.93359375, -23.734375, -22.53515625, -21.3359375, -20.13671875, -18.9375, -17.73828125, -16.5390625, -15.33984375, -14.140625, -12.94140625, -11.7421875, -10.54296875, -9.34375, -8.14453125, -6.9453125, -5.74609375, -4.546875, -3.34765625, -2.1484375, -0.94921875, 0.25, 1.44921875, 2.6484375, 3.84765625, 5.046875, 6.24609375, 7.4453125, 8.64453125, 9.84375, 11.04296875, 12.2421875, 13.44140625, 14.640625, 15.83984375, 17.0390625, 18.23828125, 19.4375, 20.63671875, 21.8359375, 23.03515625, 24.234375, 25.43359375, 26.6328125, 27.83203125, 29.03125, 30.23046875, 31.4296875, 32.62890625, 33.828125, 35.02734375, 36.2265625, 37.42578125, 38.625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 10.0, 7.0, 11.0, 13.0, 35.0, 51.0, 66.0, 113.0, 186.0, 282.0, 480.0, 763.0, 1284.0, 2206.0, 4084.0, 8124.0, 18193.0, 56896.0, 931847.0, 3030367.0, 93566.0, 24080.0, 10158.0, 4860.0, 2772.0, 1513.0, 869.0, 542.0, 336.0, 203.0, 139.0, 72.0, 52.0, 33.0, 25.0, 17.0, 12.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.0625, -53.349609375, -51.63671875, -49.923828125, -48.2109375, -46.498046875, -44.78515625, -43.072265625, -41.359375, -39.646484375, -37.93359375, -36.220703125, -34.5078125, -32.794921875, -31.08203125, -29.369140625, -27.65625, -25.943359375, -24.23046875, -22.517578125, -20.8046875, -19.091796875, -17.37890625, -15.666015625, -13.953125, -12.240234375, -10.52734375, -8.814453125, -7.1015625, -5.388671875, -3.67578125, -1.962890625, -0.25, 1.462890625, 3.17578125, 4.888671875, 6.6015625, 8.314453125, 10.02734375, 11.740234375, 13.453125, 15.166015625, 16.87890625, 18.591796875, 20.3046875, 22.017578125, 23.73046875, 25.443359375, 27.15625, 28.869140625, 30.58203125, 32.294921875, 34.0078125, 35.720703125, 37.43359375, 39.146484375, 40.859375, 42.572265625, 44.28515625, 45.998046875, 47.7109375, 49.423828125, 51.13671875, 52.849609375, 54.5625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 13.0, 21.0, 21.0, 36.0, 65.0, 80.0, 130.0, 165.0, 150.0, 97.0, 58.0, 40.0, 24.0, 16.0, 19.0, 8.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.1263427734375, -152.4529266357422, -147.7794952392578, -143.1060791015625, -138.43264770507812, -133.7592315673828, -129.0858154296875, -124.41238403320312, -119.73896789550781, -115.06554412841797, -110.39212036132812, -105.71870422363281, -101.04528045654297, -96.37185668945312, -91.69843292236328, -87.02500915527344, -82.3515853881836, -77.67816162109375, -73.0047378540039, -68.33131408691406, -63.65789794921875, -58.984474182128906, -54.31105041503906, -49.637630462646484, -44.96420669555664, -40.2907829284668, -35.61736297607422, -30.943939208984375, -26.270517349243164, -21.597095489501953, -16.92367172241211, -12.250251770019531, -7.5768280029296875, -2.9034056663513184, 1.7700166702270508, 6.443439483642578, 11.116861343383789, 15.790283203125, 20.463706970214844, 25.137126922607422, 29.810550689697266, 34.48397445678711, 39.15739440917969, 43.83081817626953, 48.504241943359375, 53.17766189575195, 57.8510856628418, 62.524505615234375, 67.19792938232422, 71.87135314941406, 76.5447769165039, 81.21820068359375, 85.89161682128906, 90.5650405883789, 95.23846435546875, 99.91188049316406, 104.58531188964844, 109.25873565673828, 113.93215942382812, 118.60557556152344, 123.27899932861328, 127.95242309570312, 132.6258544921875, 137.2992706298828, 141.97268676757812]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 12.0, 15.0, 13.0, 16.0, 16.0, 21.0, 17.0, 36.0, 39.0, 35.0, 36.0, 36.0, 60.0, 39.0, 44.0, 49.0, 38.0, 41.0, 42.0, 41.0, 40.0, 56.0, 31.0, 30.0, 28.0, 23.0, 17.0, 23.0, 22.0, 9.0, 17.0, 16.0, 9.0, 10.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.65242004394531, -82.71452331542969, -79.77661895751953, -76.8387222290039, -73.90081787109375, -70.96292114257812, -68.0250244140625, -65.08712005615234, -62.14921951293945, -59.21131896972656, -56.27341842651367, -53.33551788330078, -50.397621154785156, -47.459716796875, -44.521820068359375, -41.583919525146484, -38.646018981933594, -35.7081184387207, -32.77021789550781, -29.832319259643555, -26.894418716430664, -23.956518173217773, -21.018619537353516, -18.080718994140625, -15.142818450927734, -12.204917907714844, -9.26701831817627, -6.329118728637695, -3.3912181854248047, -0.45331764221191406, 2.4845809936523438, 5.422481536865234, 8.360374450683594, 11.298274993896484, 14.236174583435059, 17.174074172973633, 20.111974716186523, 23.049875259399414, 25.987773895263672, 28.925674438476562, 31.863574981689453, 34.801475524902344, 37.739376068115234, 40.677276611328125, 43.61517333984375, 46.553077697753906, 49.49097442626953, 52.42887496948242, 55.36677551269531, 58.3046760559082, 61.242576599121094, 64.18047332763672, 67.11837768554688, 70.0562744140625, 72.99417114257812, 75.93207550048828, 78.86997985839844, 81.80787658691406, 84.74578094482422, 87.68367767333984, 90.62158203125, 93.55947875976562, 96.49737548828125, 99.4352798461914, 102.37317657470703]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 9.0, 7.0, 9.0, 13.0, 24.0, 17.0, 16.0, 20.0, 29.0, 34.0, 30.0, 36.0, 31.0, 44.0, 47.0, 49.0, 44.0, 47.0, 55.0, 32.0, 37.0, 53.0, 50.0, 23.0, 29.0, 29.0, 30.0, 20.0, 20.0, 16.0, 13.0, 15.0, 19.0, 13.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.0758056640625, -13.643798828125, -13.2117919921875, -12.77978515625, -12.3477783203125, -11.915771484375, -11.4837646484375, -11.0517578125, -10.6197509765625, -10.187744140625, -9.7557373046875, -9.32373046875, -8.8917236328125, -8.459716796875, -8.0277099609375, -7.595703125, -7.1636962890625, -6.731689453125, -6.2996826171875, -5.86767578125, -5.4356689453125, -5.003662109375, -4.5716552734375, -4.1396484375, -3.7076416015625, -3.275634765625, -2.8436279296875, -2.41162109375, -1.9796142578125, -1.547607421875, -1.1156005859375, -0.68359375, -0.2515869140625, 0.180419921875, 0.6124267578125, 1.04443359375, 1.4764404296875, 1.908447265625, 2.3404541015625, 2.7724609375, 3.2044677734375, 3.636474609375, 4.0684814453125, 4.50048828125, 4.9324951171875, 5.364501953125, 5.7965087890625, 6.228515625, 6.6605224609375, 7.092529296875, 7.5245361328125, 7.95654296875, 8.3885498046875, 8.820556640625, 9.2525634765625, 9.6845703125, 10.1165771484375, 10.548583984375, 10.9805908203125, 11.41259765625, 11.8446044921875, 12.276611328125, 12.7086181640625, 13.140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 15.0, 19.0, 19.0, 47.0, 62.0, 92.0, 160.0, 226.0, 347.0, 516.0, 808.0, 1274.0, 1894.0, 3005.0, 4650.0, 7343.0, 11551.0, 18735.0, 31086.0, 53804.0, 101014.0, 199439.0, 267719.0, 154495.0, 78863.0, 43218.0, 25488.0, 15359.0, 9957.0, 6070.0, 3967.0, 2606.0, 1674.0, 1044.0, 696.0, 417.0, 314.0, 179.0, 123.0, 81.0, 59.0, 37.0, 27.0, 17.0, 13.0, 7.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5966796875, -1.545684814453125, -1.49468994140625, -1.443695068359375, -1.3927001953125, -1.341705322265625, -1.29071044921875, -1.239715576171875, -1.188720703125, -1.137725830078125, -1.08673095703125, -1.035736083984375, -0.9847412109375, -0.933746337890625, -0.88275146484375, -0.831756591796875, -0.78076171875, -0.729766845703125, -0.67877197265625, -0.627777099609375, -0.5767822265625, -0.525787353515625, -0.47479248046875, -0.423797607421875, -0.372802734375, -0.321807861328125, -0.27081298828125, -0.219818115234375, -0.1688232421875, -0.117828369140625, -0.06683349609375, -0.015838623046875, 0.03515625, 0.086151123046875, 0.13714599609375, 0.188140869140625, 0.2391357421875, 0.290130615234375, 0.34112548828125, 0.392120361328125, 0.443115234375, 0.494110107421875, 0.54510498046875, 0.596099853515625, 0.6470947265625, 0.698089599609375, 0.74908447265625, 0.800079345703125, 0.85107421875, 0.902069091796875, 0.95306396484375, 1.004058837890625, 1.0550537109375, 1.106048583984375, 1.15704345703125, 1.208038330078125, 1.259033203125, 1.310028076171875, 1.36102294921875, 1.412017822265625, 1.4630126953125, 1.514007568359375, 1.56500244140625, 1.615997314453125, 1.6669921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 12.0, 1.0, 11.0, 13.0, 9.0, 19.0, 19.0, 14.0, 14.0, 28.0, 25.0, 33.0, 25.0, 35.0, 27.0, 41.0, 28.0, 24.0, 33.0, 41.0, 1070.0, 44.0, 36.0, 37.0, 40.0, 28.0, 35.0, 31.0, 24.0, 32.0, 35.0, 23.0, 21.0, 15.0, 16.0, 9.0, 15.0, 6.0, 6.0, 9.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.0703125, -6.8367919921875, -6.603271484375, -6.3697509765625, -6.13623046875, -5.9027099609375, -5.669189453125, -5.4356689453125, -5.2021484375, -4.9686279296875, -4.735107421875, -4.5015869140625, -4.26806640625, -4.0345458984375, -3.801025390625, -3.5675048828125, -3.333984375, -3.1004638671875, -2.866943359375, -2.6334228515625, -2.39990234375, -2.1663818359375, -1.932861328125, -1.6993408203125, -1.4658203125, -1.2322998046875, -0.998779296875, -0.7652587890625, -0.53173828125, -0.2982177734375, -0.064697265625, 0.1688232421875, 0.40234375, 0.6358642578125, 0.869384765625, 1.1029052734375, 1.33642578125, 1.5699462890625, 1.803466796875, 2.0369873046875, 2.2705078125, 2.5040283203125, 2.737548828125, 2.9710693359375, 3.20458984375, 3.4381103515625, 3.671630859375, 3.9051513671875, 4.138671875, 4.3721923828125, 4.605712890625, 4.8392333984375, 5.07275390625, 5.3062744140625, 5.539794921875, 5.7733154296875, 6.0068359375, 6.2403564453125, 6.473876953125, 6.7073974609375, 6.94091796875, 7.1744384765625, 7.407958984375, 7.6414794921875, 7.875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 12.0, 11.0, 19.0, 22.0, 28.0, 53.0, 87.0, 132.0, 235.0, 316.0, 505.0, 750.0, 1246.0, 1986.0, 2771.0, 4439.0, 6654.0, 10150.0, 15848.0, 24633.0, 40037.0, 68162.0, 119303.0, 260851.0, 1204070.0, 135753.0, 76914.0, 44762.0, 27460.0, 17520.0, 11225.0, 7361.0, 4905.0, 3044.0, 2113.0, 1365.0, 848.0, 526.0, 369.0, 230.0, 167.0, 90.0, 67.0, 36.0, 20.0, 18.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7356338500976562, -0.7119903564453125, -0.6883468627929688, -0.664703369140625, -0.6410598754882812, -0.6174163818359375, -0.5937728881835938, -0.57012939453125, -0.5464859008789062, -0.5228424072265625, -0.49919891357421875, -0.475555419921875, -0.45191192626953125, -0.4282684326171875, -0.40462493896484375, -0.3809814453125, -0.35733795166015625, -0.3336944580078125, -0.31005096435546875, -0.286407470703125, -0.26276397705078125, -0.2391204833984375, -0.21547698974609375, -0.19183349609375, -0.16819000244140625, -0.1445465087890625, -0.12090301513671875, -0.097259521484375, -0.07361602783203125, -0.0499725341796875, -0.02632904052734375, -0.002685546875, 0.02095794677734375, 0.0446014404296875, 0.06824493408203125, 0.091888427734375, 0.11553192138671875, 0.1391754150390625, 0.16281890869140625, 0.18646240234375, 0.21010589599609375, 0.2337493896484375, 0.25739288330078125, 0.281036376953125, 0.30467987060546875, 0.3283233642578125, 0.35196685791015625, 0.3756103515625, 0.39925384521484375, 0.4228973388671875, 0.44654083251953125, 0.470184326171875, 0.49382781982421875, 0.5174713134765625, 0.5411148071289062, 0.56475830078125, 0.5884017944335938, 0.6120452880859375, 0.6356887817382812, 0.659332275390625, 0.6829757690429688, 0.7066192626953125, 0.7302627563476562, 0.75390625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 6.0, 6.0, 12.0, 11.0, 14.0, 14.0, 18.0, 48.0, 46.0, 51.0, 59.0, 76.0, 104.0, 76.0, 78.0, 68.0, 66.0, 67.0, 42.0, 33.0, 28.0, 13.0, 12.0, 5.0, 11.0, 8.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022979736328125, -0.02219676971435547, -0.021413803100585938, -0.020630836486816406, -0.019847869873046875, -0.019064903259277344, -0.018281936645507812, -0.01749897003173828, -0.01671600341796875, -0.01593303680419922, -0.015150070190429688, -0.014367103576660156, -0.013584136962890625, -0.012801170349121094, -0.012018203735351562, -0.011235237121582031, -0.0104522705078125, -0.009669303894042969, -0.008886337280273438, -0.008103370666503906, -0.007320404052734375, -0.006537437438964844, -0.0057544708251953125, -0.004971504211425781, -0.00418853759765625, -0.0034055709838867188, -0.0026226043701171875, -0.0018396377563476562, -0.001056671142578125, -0.00027370452880859375, 0.0005092620849609375, 0.0012922286987304688, 0.0020751953125, 0.0028581619262695312, 0.0036411285400390625, 0.004424095153808594, 0.005207061767578125, 0.005990028381347656, 0.0067729949951171875, 0.007555961608886719, 0.00833892822265625, 0.009121894836425781, 0.009904861450195312, 0.010687828063964844, 0.011470794677734375, 0.012253761291503906, 0.013036727905273438, 0.013819694519042969, 0.0146026611328125, 0.015385627746582031, 0.016168594360351562, 0.016951560974121094, 0.017734527587890625, 0.018517494201660156, 0.019300460815429688, 0.02008342742919922, 0.02086639404296875, 0.02164936065673828, 0.022432327270507812, 0.023215293884277344, 0.023998260498046875, 0.024781227111816406, 0.025564193725585938, 0.02634716033935547, 0.027130126953125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 2.0, 17.0, 20.0, 23.0, 33.0, 36.0, 33.0, 71.0, 90.0, 123.0, 242.0, 436.0, 1011.0, 3184.0, 23254.0, 909347.0, 101162.0, 6413.0, 1591.0, 591.0, 303.0, 160.0, 132.0, 66.0, 48.0, 32.0, 33.0, 18.0, 16.0, 12.0, 8.0, 10.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4522895812988281, -0.43802642822265625, -0.4237632751464844, -0.4095001220703125, -0.3952369689941406, -0.38097381591796875, -0.3667106628417969, -0.352447509765625, -0.3381843566894531, -0.32392120361328125, -0.3096580505371094, -0.2953948974609375, -0.2811317443847656, -0.26686859130859375, -0.2526054382324219, -0.23834228515625, -0.22407913208007812, -0.20981597900390625, -0.19555282592773438, -0.1812896728515625, -0.16702651977539062, -0.15276336669921875, -0.13850021362304688, -0.124237060546875, -0.10997390747070312, -0.09571075439453125, -0.08144760131835938, -0.0671844482421875, -0.052921295166015625, -0.03865814208984375, -0.024394989013671875, -0.0101318359375, 0.004131317138671875, 0.01839447021484375, 0.032657623291015625, 0.0469207763671875, 0.061183929443359375, 0.07544708251953125, 0.08971023559570312, 0.103973388671875, 0.11823654174804688, 0.13249969482421875, 0.14676284790039062, 0.1610260009765625, 0.17528915405273438, 0.18955230712890625, 0.20381546020507812, 0.21807861328125, 0.23234176635742188, 0.24660491943359375, 0.2608680725097656, 0.2751312255859375, 0.2893943786621094, 0.30365753173828125, 0.3179206848144531, 0.332183837890625, 0.3464469909667969, 0.36071014404296875, 0.3749732971191406, 0.3892364501953125, 0.4034996032714844, 0.41776275634765625, 0.4320259094238281, 0.4462890625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 10.0, 28.0, 68.0, 203.0, 412.0, 153.0, 63.0, 33.0, 12.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0875474140048027, -0.0810135081410408, -0.0744796097278595, -0.0679457038640976, -0.06141179800033569, -0.05487789586186409, -0.04834399372339249, -0.041810087859630585, -0.03527618572115898, -0.02874228172004223, -0.022208377718925476, -0.015674475580453873, -0.00914057157933712, -0.0026066675782203674, 0.003927234560251236, 0.010461140424013138, 0.01699504256248474, 0.023528946563601494, 0.030062850564718246, 0.03659675270318985, 0.04313065856695175, 0.049664560705423355, 0.05619846284389496, 0.06273236870765686, 0.06926627457141876, 0.07580018043518066, 0.08233407884836197, 0.08886798471212387, 0.09540189057588577, 0.10193578898906708, 0.10846969485282898, 0.11500360071659088, 0.12153749167919159, 0.1280713975429535, 0.1346053034067154, 0.1411392092704773, 0.147673100233078, 0.1542070060968399, 0.1607409119606018, 0.1672748178243637, 0.1738087236881256, 0.1803426295518875, 0.18687653541564941, 0.19341042637825012, 0.19994433224201202, 0.20647823810577393, 0.21301214396953583, 0.21954604983329773, 0.22607994079589844, 0.23261384665966034, 0.23914775252342224, 0.24568164348602295, 0.25221556425094604, 0.25874945521354675, 0.26528334617614746, 0.27181726694107056, 0.27835118770599365, 0.28488507866859436, 0.29141899943351746, 0.29795289039611816, 0.30448681116104126, 0.31102070212364197, 0.3175545930862427, 0.32408851385116577, 0.3306224048137665]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 12.0, 13.0, 15.0, 11.0, 14.0, 20.0, 17.0, 17.0, 16.0, 23.0, 26.0, 37.0, 28.0, 39.0, 44.0, 39.0, 31.0, 43.0, 44.0, 42.0, 37.0, 38.0, 34.0, 34.0, 33.0, 34.0, 33.0, 24.0, 18.0, 32.0, 25.0, 18.0, 17.0, 17.0, 17.0, 11.0, 7.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.027836382389068604, -0.027014771476387978, -0.02619316056370735, -0.025371549651026726, -0.0245499387383461, -0.023728327825665474, -0.022906716912984848, -0.022085106000304222, -0.021263495087623596, -0.02044188417494297, -0.019620273262262344, -0.01879866234958172, -0.017977051436901093, -0.017155440524220467, -0.01633382961153984, -0.015512218698859215, -0.014690607786178589, -0.013868996873497963, -0.013047385960817337, -0.012225775048136711, -0.011404164135456085, -0.01058255322277546, -0.009760942310094833, -0.008939331397414207, -0.008117720484733582, -0.007296109572052956, -0.00647449865937233, -0.005652887746691704, -0.004831276834011078, -0.004009665921330452, -0.003188055008649826, -0.0023664440959692, -0.0015448331832885742, -0.0007232222706079483, 9.838864207267761e-05, 0.0009199995547533035, 0.0017416104674339294, 0.0025632213801145554, 0.0033848322927951813, 0.004206443205475807, 0.005028054118156433, 0.005849665030837059, 0.006671275943517685, 0.007492886856198311, 0.008314497768878937, 0.009136108681559563, 0.009957719594240189, 0.010779330506920815, 0.01160094141960144, 0.012422552332282066, 0.013244163244962692, 0.014065774157643318, 0.014887385070323944, 0.01570899598300457, 0.016530606895685196, 0.017352217808365822, 0.018173828721046448, 0.018995439633727074, 0.0198170505464077, 0.020638661459088326, 0.02146027237176895, 0.022281883284449577, 0.023103494197130203, 0.02392510510981083, 0.024746716022491455]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 9.0, 7.0, 7.0, 15.0, 24.0, 16.0, 17.0, 19.0, 30.0, 34.0, 30.0, 35.0, 32.0, 44.0, 47.0, 49.0, 44.0, 47.0, 55.0, 31.0, 38.0, 53.0, 48.0, 25.0, 28.0, 30.0, 30.0, 20.0, 20.0, 16.0, 13.0, 15.0, 19.0, 13.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.08349609375, -13.6513671875, -13.21923828125, -12.787109375, -12.35498046875, -11.9228515625, -11.49072265625, -11.05859375, -10.62646484375, -10.1943359375, -9.76220703125, -9.330078125, -8.89794921875, -8.4658203125, -8.03369140625, -7.6015625, -7.16943359375, -6.7373046875, -6.30517578125, -5.873046875, -5.44091796875, -5.0087890625, -4.57666015625, -4.14453125, -3.71240234375, -3.2802734375, -2.84814453125, -2.416015625, -1.98388671875, -1.5517578125, -1.11962890625, -0.6875, -0.25537109375, 0.1767578125, 0.60888671875, 1.041015625, 1.47314453125, 1.9052734375, 2.33740234375, 2.76953125, 3.20166015625, 3.6337890625, 4.06591796875, 4.498046875, 4.93017578125, 5.3623046875, 5.79443359375, 6.2265625, 6.65869140625, 7.0908203125, 7.52294921875, 7.955078125, 8.38720703125, 8.8193359375, 9.25146484375, 9.68359375, 10.11572265625, 10.5478515625, 10.97998046875, 11.412109375, 11.84423828125, 12.2763671875, 12.70849609375, 13.140625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 10.0, 17.0, 20.0, 26.0, 45.0, 46.0, 70.0, 100.0, 157.0, 227.0, 332.0, 639.0, 1069.0, 2064.0, 4333.0, 10008.0, 26216.0, 75178.0, 251741.0, 449274.0, 148791.0, 47257.0, 17170.0, 6853.0, 3075.0, 1561.0, 850.0, 498.0, 311.0, 174.0, 114.0, 93.0, 68.0, 49.0, 27.0, 17.0, 18.0, 14.0, 13.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5390625, -7.298095703125, -7.05712890625, -6.816162109375, -6.5751953125, -6.334228515625, -6.09326171875, -5.852294921875, -5.611328125, -5.370361328125, -5.12939453125, -4.888427734375, -4.6474609375, -4.406494140625, -4.16552734375, -3.924560546875, -3.68359375, -3.442626953125, -3.20166015625, -2.960693359375, -2.7197265625, -2.478759765625, -2.23779296875, -1.996826171875, -1.755859375, -1.514892578125, -1.27392578125, -1.032958984375, -0.7919921875, -0.551025390625, -0.31005859375, -0.069091796875, 0.171875, 0.412841796875, 0.65380859375, 0.894775390625, 1.1357421875, 1.376708984375, 1.61767578125, 1.858642578125, 2.099609375, 2.340576171875, 2.58154296875, 2.822509765625, 3.0634765625, 3.304443359375, 3.54541015625, 3.786376953125, 4.02734375, 4.268310546875, 4.50927734375, 4.750244140625, 4.9912109375, 5.232177734375, 5.47314453125, 5.714111328125, 5.955078125, 6.196044921875, 6.43701171875, 6.677978515625, 6.9189453125, 7.159912109375, 7.40087890625, 7.641845703125, 7.8828125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 7.0, 7.0, 16.0, 16.0, 14.0, 21.0, 18.0, 21.0, 24.0, 24.0, 38.0, 32.0, 40.0, 52.0, 37.0, 49.0, 58.0, 130.0, 1807.0, 148.0, 76.0, 40.0, 35.0, 37.0, 33.0, 34.0, 36.0, 43.0, 27.0, 16.0, 14.0, 20.0, 9.0, 11.0, 14.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.875, -36.5947265625, -35.314453125, -34.0341796875, -32.75390625, -31.4736328125, -30.193359375, -28.9130859375, -27.6328125, -26.3525390625, -25.072265625, -23.7919921875, -22.51171875, -21.2314453125, -19.951171875, -18.6708984375, -17.390625, -16.1103515625, -14.830078125, -13.5498046875, -12.26953125, -10.9892578125, -9.708984375, -8.4287109375, -7.1484375, -5.8681640625, -4.587890625, -3.3076171875, -2.02734375, -0.7470703125, 0.533203125, 1.8134765625, 3.09375, 4.3740234375, 5.654296875, 6.9345703125, 8.21484375, 9.4951171875, 10.775390625, 12.0556640625, 13.3359375, 14.6162109375, 15.896484375, 17.1767578125, 18.45703125, 19.7373046875, 21.017578125, 22.2978515625, 23.578125, 24.8583984375, 26.138671875, 27.4189453125, 28.69921875, 29.9794921875, 31.259765625, 32.5400390625, 33.8203125, 35.1005859375, 36.380859375, 37.6611328125, 38.94140625, 40.2216796875, 41.501953125, 42.7822265625, 44.0625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 7.0, 8.0, 9.0, 17.0, 30.0, 30.0, 46.0, 57.0, 123.0, 176.0, 242.0, 599.0, 1898.0, 16542.0, 3109646.0, 13283.0, 1714.0, 535.0, 243.0, 191.0, 105.0, 58.0, 42.0, 32.0, 29.0, 19.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.75, -125.345703125, -120.94140625, -116.537109375, -112.1328125, -107.728515625, -103.32421875, -98.919921875, -94.515625, -90.111328125, -85.70703125, -81.302734375, -76.8984375, -72.494140625, -68.08984375, -63.685546875, -59.28125, -54.876953125, -50.47265625, -46.068359375, -41.6640625, -37.259765625, -32.85546875, -28.451171875, -24.046875, -19.642578125, -15.23828125, -10.833984375, -6.4296875, -2.025390625, 2.37890625, 6.783203125, 11.1875, 15.591796875, 19.99609375, 24.400390625, 28.8046875, 33.208984375, 37.61328125, 42.017578125, 46.421875, 50.826171875, 55.23046875, 59.634765625, 64.0390625, 68.443359375, 72.84765625, 77.251953125, 81.65625, 86.060546875, 90.46484375, 94.869140625, 99.2734375, 103.677734375, 108.08203125, 112.486328125, 116.890625, 121.294921875, 125.69921875, 130.103515625, 134.5078125, 138.912109375, 143.31640625, 147.720703125, 152.125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 33.0, 943.0, 45.0], "bins": [-1874.1378173828125, -1844.176513671875, -1814.215087890625, -1784.2537841796875, -1754.2923583984375, -1724.3310546875, -1694.36962890625, -1664.4083251953125, -1634.4468994140625, -1604.485595703125, -1574.524169921875, -1544.5628662109375, -1514.6014404296875, -1484.64013671875, -1454.6787109375, -1424.7174072265625, -1394.7559814453125, -1364.794677734375, -1334.833251953125, -1304.8719482421875, -1274.9105224609375, -1244.94921875, -1214.98779296875, -1185.0264892578125, -1155.0650634765625, -1125.103759765625, -1095.142333984375, -1065.1810302734375, -1035.2196044921875, -1005.2582397460938, -975.296875, -945.3355102539062, -915.3742065429688, -885.412841796875, -855.4514770507812, -825.4901123046875, -795.5287475585938, -765.5673828125, -735.6060180664062, -705.6446533203125, -675.683349609375, -645.7219848632812, -615.7606201171875, -585.7992553710938, -555.837890625, -525.8765258789062, -495.9151611328125, -465.95379638671875, -435.992431640625, -406.03106689453125, -376.0697021484375, -346.10833740234375, -316.14697265625, -286.18560791015625, -256.2242431640625, -226.2628936767578, -196.301513671875, -166.34014892578125, -136.3787841796875, -106.41742706298828, -76.45606231689453, -46.49470520019531, -16.533340454101562, 13.428024291992188, 43.38938903808594]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 3.0, 12.0, 14.0, 18.0, 18.0, 16.0, 20.0, 24.0, 30.0, 22.0, 22.0, 32.0, 40.0, 35.0, 45.0, 51.0, 50.0, 43.0, 45.0, 43.0, 49.0, 40.0, 38.0, 33.0, 22.0, 34.0, 32.0, 20.0, 13.0, 27.0, 23.0, 16.0, 14.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-125.19329071044922, -121.64056396484375, -118.08784484863281, -114.53511810302734, -110.9823989868164, -107.42967224121094, -103.876953125, -100.32422637939453, -96.77149963378906, -93.2187728881836, -89.66605377197266, -86.11332702636719, -82.56060791015625, -79.00788116455078, -75.45515441894531, -71.90243530273438, -68.34971618652344, -64.79698944091797, -61.24427032470703, -57.69154357910156, -54.138824462890625, -50.586097717285156, -47.03337478637695, -43.48065185546875, -39.92792892456055, -36.375205993652344, -32.82248306274414, -29.269758224487305, -25.7170352935791, -22.1643123626709, -18.611587524414062, -15.05886459350586, -11.506134033203125, -7.953410625457764, -4.400687217712402, -0.8479633331298828, 2.7047595977783203, 6.257482528686523, 9.81020736694336, 13.362930297851562, 16.915653228759766, 20.46837615966797, 24.021099090576172, 27.573823928833008, 31.12654685974121, 34.67926788330078, 38.23199462890625, 41.78471755981445, 45.337440490722656, 48.89016342163086, 52.44288635253906, 55.99561309814453, 59.54833221435547, 63.10105895996094, 66.65377807617188, 70.20650482177734, 73.75923156738281, 77.31195831298828, 80.86467742919922, 84.41740417480469, 87.97012329101562, 91.5228500366211, 95.07557678222656, 98.6282958984375, 102.18101501464844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 0.0, 3.0, 5.0, 15.0, 6.0, 10.0, 13.0, 16.0, 17.0, 13.0, 23.0, 23.0, 32.0, 28.0, 46.0, 36.0, 34.0, 45.0, 40.0, 51.0, 50.0, 51.0, 52.0, 40.0, 49.0, 28.0, 34.0, 26.0, 40.0, 23.0, 23.0, 22.0, 13.0, 23.0, 7.0, 19.0, 12.0, 10.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.1875, -14.73974609375, -14.2919921875, -13.84423828125, -13.396484375, -12.94873046875, -12.5009765625, -12.05322265625, -11.60546875, -11.15771484375, -10.7099609375, -10.26220703125, -9.814453125, -9.36669921875, -8.9189453125, -8.47119140625, -8.0234375, -7.57568359375, -7.1279296875, -6.68017578125, -6.232421875, -5.78466796875, -5.3369140625, -4.88916015625, -4.44140625, -3.99365234375, -3.5458984375, -3.09814453125, -2.650390625, -2.20263671875, -1.7548828125, -1.30712890625, -0.859375, -0.41162109375, 0.0361328125, 0.48388671875, 0.931640625, 1.37939453125, 1.8271484375, 2.27490234375, 2.72265625, 3.17041015625, 3.6181640625, 4.06591796875, 4.513671875, 4.96142578125, 5.4091796875, 5.85693359375, 6.3046875, 6.75244140625, 7.2001953125, 7.64794921875, 8.095703125, 8.54345703125, 8.9912109375, 9.43896484375, 9.88671875, 10.33447265625, 10.7822265625, 11.22998046875, 11.677734375, 12.12548828125, 12.5732421875, 13.02099609375, 13.46875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 13.0, 10.0, 21.0, 19.0, 26.0, 33.0, 31.0, 69.0, 91.0, 135.0, 199.0, 289.0, 486.0, 883.0, 1596.0, 3138.0, 6799.0, 16900.0, 118393.0, 3600812.0, 402175.0, 24394.0, 8973.0, 4035.0, 2040.0, 1046.0, 567.0, 362.0, 219.0, 162.0, 87.0, 56.0, 57.0, 31.0, 25.0, 32.0, 20.0, 16.0, 7.0, 11.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-58.46875, -56.78125, -55.09375, -53.40625, -51.71875, -50.03125, -48.34375, -46.65625, -44.96875, -43.28125, -41.59375, -39.90625, -38.21875, -36.53125, -34.84375, -33.15625, -31.46875, -29.78125, -28.09375, -26.40625, -24.71875, -23.03125, -21.34375, -19.65625, -17.96875, -16.28125, -14.59375, -12.90625, -11.21875, -9.53125, -7.84375, -6.15625, -4.46875, -2.78125, -1.09375, 0.59375, 2.28125, 3.96875, 5.65625, 7.34375, 9.03125, 10.71875, 12.40625, 14.09375, 15.78125, 17.46875, 19.15625, 20.84375, 22.53125, 24.21875, 25.90625, 27.59375, 29.28125, 30.96875, 32.65625, 34.34375, 36.03125, 37.71875, 39.40625, 41.09375, 42.78125, 44.46875, 46.15625, 47.84375, 49.53125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 6.0, 5.0, 10.0, 9.0, 10.0, 18.0, 24.0, 32.0, 36.0, 63.0, 114.0, 225.0, 565.0, 1099.0, 946.0, 452.0, 172.0, 80.0, 47.0, 35.0, 24.0, 18.0, 16.0, 13.0, 19.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.38623046875, -31.0849609375, -29.78369140625, -28.482421875, -27.18115234375, -25.8798828125, -24.57861328125, -23.27734375, -21.97607421875, -20.6748046875, -19.37353515625, -18.072265625, -16.77099609375, -15.4697265625, -14.16845703125, -12.8671875, -11.56591796875, -10.2646484375, -8.96337890625, -7.662109375, -6.36083984375, -5.0595703125, -3.75830078125, -2.45703125, -1.15576171875, 0.1455078125, 1.44677734375, 2.748046875, 4.04931640625, 5.3505859375, 6.65185546875, 7.953125, 9.25439453125, 10.5556640625, 11.85693359375, 13.158203125, 14.45947265625, 15.7607421875, 17.06201171875, 18.36328125, 19.66455078125, 20.9658203125, 22.26708984375, 23.568359375, 24.86962890625, 26.1708984375, 27.47216796875, 28.7734375, 30.07470703125, 31.3759765625, 32.67724609375, 33.978515625, 35.27978515625, 36.5810546875, 37.88232421875, 39.18359375, 40.48486328125, 41.7861328125, 43.08740234375, 44.388671875, 45.68994140625, 46.9912109375, 48.29248046875, 49.59375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 13.0, 11.0, 29.0, 35.0, 64.0, 94.0, 162.0, 279.0, 460.0, 969.0, 1746.0, 3484.0, 7797.0, 19178.0, 61691.0, 1551409.0, 2439790.0, 70109.0, 20745.0, 8295.0, 3757.0, 1811.0, 939.0, 567.0, 314.0, 191.0, 106.0, 59.0, 45.0, 29.0, 30.0, 18.0, 9.0, 14.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-79.0, -76.92333984375, -74.8466796875, -72.77001953125, -70.693359375, -68.61669921875, -66.5400390625, -64.46337890625, -62.38671875, -60.31005859375, -58.2333984375, -56.15673828125, -54.080078125, -52.00341796875, -49.9267578125, -47.85009765625, -45.7734375, -43.69677734375, -41.6201171875, -39.54345703125, -37.466796875, -35.39013671875, -33.3134765625, -31.23681640625, -29.16015625, -27.08349609375, -25.0068359375, -22.93017578125, -20.853515625, -18.77685546875, -16.7001953125, -14.62353515625, -12.546875, -10.47021484375, -8.3935546875, -6.31689453125, -4.240234375, -2.16357421875, -0.0869140625, 1.98974609375, 4.06640625, 6.14306640625, 8.2197265625, 10.29638671875, 12.373046875, 14.44970703125, 16.5263671875, 18.60302734375, 20.6796875, 22.75634765625, 24.8330078125, 26.90966796875, 28.986328125, 31.06298828125, 33.1396484375, 35.21630859375, 37.29296875, 39.36962890625, 41.4462890625, 43.52294921875, 45.599609375, 47.67626953125, 49.7529296875, 51.82958984375, 53.90625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 7.0, 12.0, 14.0, 29.0, 23.0, 40.0, 55.0, 101.0, 131.0, 153.0, 143.0, 97.0, 57.0, 39.0, 21.0, 17.0, 15.0, 6.0, 12.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.68331909179688, -90.7453842163086, -85.80744934082031, -80.86951446533203, -75.93157958984375, -70.99364471435547, -66.05570983886719, -61.117774963378906, -56.179840087890625, -51.241905212402344, -46.30397033691406, -41.36603546142578, -36.4281005859375, -31.49016571044922, -26.552230834960938, -21.614295959472656, -16.676361083984375, -11.738426208496094, -6.8004913330078125, -1.8625564575195312, 3.07537841796875, 8.013313293457031, 12.951248168945312, 17.889183044433594, 22.827117919921875, 27.765052795410156, 32.70298767089844, 37.64092254638672, 42.578857421875, 47.51679229736328, 52.45472717285156, 57.392662048339844, 62.330596923828125, 67.2685317993164, 72.20646667480469, 77.14440155029297, 82.08233642578125, 87.02027130126953, 91.95820617675781, 96.8961410522461, 101.83407592773438, 106.77201080322266, 111.70994567871094, 116.64788055419922, 121.5858154296875, 126.52375030517578, 131.46168518066406, 136.39962768554688, 141.33755493164062, 146.27548217773438, 151.2134246826172, 156.1513671875, 161.08929443359375, 166.0272216796875, 170.9651641845703, 175.90310668945312, 180.84103393554688, 185.77896118164062, 190.71690368652344, 195.65484619140625, 200.5927734375, 205.53070068359375, 210.46864318847656, 215.40658569335938, 220.34451293945312]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 6.0, 10.0, 4.0, 13.0, 14.0, 18.0, 15.0, 22.0, 19.0, 25.0, 35.0, 26.0, 29.0, 28.0, 26.0, 27.0, 28.0, 32.0, 30.0, 34.0, 30.0, 26.0, 36.0, 28.0, 37.0, 39.0, 42.0, 29.0, 27.0, 21.0, 27.0, 25.0, 21.0, 23.0, 17.0, 14.0, 11.0, 13.0, 7.0, 18.0, 4.0, 13.0, 8.0, 7.0, 3.0, 1.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.44918060302734, -69.10608673095703, -66.76298522949219, -64.41989135742188, -62.07678985595703, -59.73369598388672, -57.39059829711914, -55.04750061035156, -52.704402923583984, -50.361305236816406, -48.01820755004883, -45.67510986328125, -43.33201599121094, -40.988914489746094, -38.64582061767578, -36.3027229309082, -33.959625244140625, -31.616527557373047, -29.27342987060547, -26.930334091186523, -24.587236404418945, -22.244138717651367, -19.901042938232422, -17.557945251464844, -15.214847564697266, -12.871749877929688, -10.528653144836426, -8.185556411743164, -5.842458724975586, -3.499361038208008, -1.156264305114746, 1.1868324279785156, 3.5299224853515625, 5.873019695281982, 8.216116905212402, 10.559213638305664, 12.902311325073242, 15.24540901184082, 17.588504791259766, 19.931602478027344, 22.274700164794922, 24.6177978515625, 26.960895538330078, 29.303991317749023, 31.6470890045166, 33.99018859863281, 36.333282470703125, 38.6763801574707, 41.01947784423828, 43.36257553100586, 45.70567321777344, 48.048770904541016, 50.391868591308594, 52.734962463378906, 55.078060150146484, 57.42115783691406, 59.76425552368164, 62.10735321044922, 64.45044708251953, 66.79354858398438, 69.13664245605469, 71.47974395751953, 73.82283782958984, 76.16593933105469, 78.509033203125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 4.0, 11.0, 11.0, 15.0, 20.0, 22.0, 18.0, 14.0, 30.0, 32.0, 37.0, 29.0, 40.0, 40.0, 41.0, 52.0, 44.0, 56.0, 32.0, 50.0, 34.0, 38.0, 49.0, 30.0, 32.0, 26.0, 33.0, 19.0, 18.0, 18.0, 14.0, 14.0, 9.0, 7.0, 14.0, 8.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.1015625, -14.6640625, -14.2265625, -13.7890625, -13.3515625, -12.9140625, -12.4765625, -12.0390625, -11.6015625, -11.1640625, -10.7265625, -10.2890625, -9.8515625, -9.4140625, -8.9765625, -8.5390625, -8.1015625, -7.6640625, -7.2265625, -6.7890625, -6.3515625, -5.9140625, -5.4765625, -5.0390625, -4.6015625, -4.1640625, -3.7265625, -3.2890625, -2.8515625, -2.4140625, -1.9765625, -1.5390625, -1.1015625, -0.6640625, -0.2265625, 0.2109375, 0.6484375, 1.0859375, 1.5234375, 1.9609375, 2.3984375, 2.8359375, 3.2734375, 3.7109375, 4.1484375, 4.5859375, 5.0234375, 5.4609375, 5.8984375, 6.3359375, 6.7734375, 7.2109375, 7.6484375, 8.0859375, 8.5234375, 8.9609375, 9.3984375, 9.8359375, 10.2734375, 10.7109375, 11.1484375, 11.5859375, 12.0234375, 12.4609375, 12.8984375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 10.0, 7.0, 11.0, 24.0, 47.0, 64.0, 80.0, 157.0, 187.0, 353.0, 542.0, 802.0, 1300.0, 2014.0, 3027.0, 4632.0, 6996.0, 10469.0, 16438.0, 26657.0, 44942.0, 80533.0, 153109.0, 256905.0, 193934.0, 101840.0, 55475.0, 32057.0, 19737.0, 12626.0, 8317.0, 5343.0, 3391.0, 2303.0, 1480.0, 928.0, 626.0, 429.0, 255.0, 168.0, 115.0, 82.0, 47.0, 31.0, 20.0, 17.0, 8.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5283203125, -1.478515625, -1.4287109375, -1.37890625, -1.3291015625, -1.279296875, -1.2294921875, -1.1796875, -1.1298828125, -1.080078125, -1.0302734375, -0.98046875, -0.9306640625, -0.880859375, -0.8310546875, -0.78125, -0.7314453125, -0.681640625, -0.6318359375, -0.58203125, -0.5322265625, -0.482421875, -0.4326171875, -0.3828125, -0.3330078125, -0.283203125, -0.2333984375, -0.18359375, -0.1337890625, -0.083984375, -0.0341796875, 0.015625, 0.0654296875, 0.115234375, 0.1650390625, 0.21484375, 0.2646484375, 0.314453125, 0.3642578125, 0.4140625, 0.4638671875, 0.513671875, 0.5634765625, 0.61328125, 0.6630859375, 0.712890625, 0.7626953125, 0.8125, 0.8623046875, 0.912109375, 0.9619140625, 1.01171875, 1.0615234375, 1.111328125, 1.1611328125, 1.2109375, 1.2607421875, 1.310546875, 1.3603515625, 1.41015625, 1.4599609375, 1.509765625, 1.5595703125, 1.609375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 7.0, 17.0, 6.0, 16.0, 17.0, 16.0, 27.0, 27.0, 34.0, 22.0, 22.0, 36.0, 32.0, 30.0, 40.0, 36.0, 46.0, 38.0, 1067.0, 52.0, 32.0, 32.0, 36.0, 28.0, 30.0, 39.0, 28.0, 29.0, 23.0, 21.0, 10.0, 28.0, 17.0, 12.0, 13.0, 6.0, 9.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-8.6171875, -8.35107421875, -8.0849609375, -7.81884765625, -7.552734375, -7.28662109375, -7.0205078125, -6.75439453125, -6.48828125, -6.22216796875, -5.9560546875, -5.68994140625, -5.423828125, -5.15771484375, -4.8916015625, -4.62548828125, -4.359375, -4.09326171875, -3.8271484375, -3.56103515625, -3.294921875, -3.02880859375, -2.7626953125, -2.49658203125, -2.23046875, -1.96435546875, -1.6982421875, -1.43212890625, -1.166015625, -0.89990234375, -0.6337890625, -0.36767578125, -0.1015625, 0.16455078125, 0.4306640625, 0.69677734375, 0.962890625, 1.22900390625, 1.4951171875, 1.76123046875, 2.02734375, 2.29345703125, 2.5595703125, 2.82568359375, 3.091796875, 3.35791015625, 3.6240234375, 3.89013671875, 4.15625, 4.42236328125, 4.6884765625, 4.95458984375, 5.220703125, 5.48681640625, 5.7529296875, 6.01904296875, 6.28515625, 6.55126953125, 6.8173828125, 7.08349609375, 7.349609375, 7.61572265625, 7.8818359375, 8.14794921875, 8.4140625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 13.0, 9.0, 21.0, 35.0, 61.0, 95.0, 120.0, 207.0, 333.0, 469.0, 725.0, 1115.0, 1558.0, 2436.0, 3623.0, 5558.0, 8203.0, 12869.0, 19744.0, 30939.0, 49893.0, 83158.0, 143531.0, 1257732.0, 191013.0, 109577.0, 64025.0, 38848.0, 24491.0, 16012.0, 10342.0, 6905.0, 4585.0, 3052.0, 1967.0, 1308.0, 844.0, 589.0, 373.0, 259.0, 153.0, 119.0, 70.0, 49.0, 35.0, 29.0, 12.0, 12.0, 6.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.77880859375, -0.7542800903320312, -0.7297515869140625, -0.7052230834960938, -0.680694580078125, -0.6561660766601562, -0.6316375732421875, -0.6071090698242188, -0.58258056640625, -0.5580520629882812, -0.5335235595703125, -0.5089950561523438, -0.484466552734375, -0.45993804931640625, -0.4354095458984375, -0.41088104248046875, -0.3863525390625, -0.36182403564453125, -0.3372955322265625, -0.31276702880859375, -0.288238525390625, -0.26371002197265625, -0.2391815185546875, -0.21465301513671875, -0.19012451171875, -0.16559600830078125, -0.1410675048828125, -0.11653900146484375, -0.092010498046875, -0.06748199462890625, -0.0429534912109375, -0.01842498779296875, 0.006103515625, 0.03063201904296875, 0.0551605224609375, 0.07968902587890625, 0.104217529296875, 0.12874603271484375, 0.1532745361328125, 0.17780303955078125, 0.20233154296875, 0.22686004638671875, 0.2513885498046875, 0.27591705322265625, 0.300445556640625, 0.32497406005859375, 0.3495025634765625, 0.37403106689453125, 0.3985595703125, 0.42308807373046875, 0.4476165771484375, 0.47214508056640625, 0.496673583984375, 0.5212020874023438, 0.5457305908203125, 0.5702590942382812, 0.59478759765625, 0.6193161010742188, 0.6438446044921875, 0.6683731079101562, 0.692901611328125, 0.7174301147460938, 0.7419586181640625, 0.7664871215820312, 0.791015625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 6.0, 12.0, 18.0, 27.0, 39.0, 60.0, 83.0, 129.0, 183.0, 145.0, 90.0, 58.0, 28.0, 28.0, 14.0, 13.0, 11.0, 8.0, 6.0, 6.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04205322265625, -0.04076671600341797, -0.03948020935058594, -0.038193702697753906, -0.036907196044921875, -0.035620689392089844, -0.03433418273925781, -0.03304767608642578, -0.03176116943359375, -0.03047466278076172, -0.029188156127929688, -0.027901649475097656, -0.026615142822265625, -0.025328636169433594, -0.024042129516601562, -0.02275562286376953, -0.0214691162109375, -0.02018260955810547, -0.018896102905273438, -0.017609596252441406, -0.016323089599609375, -0.015036582946777344, -0.013750076293945312, -0.012463569641113281, -0.01117706298828125, -0.009890556335449219, -0.008604049682617188, -0.007317543029785156, -0.006031036376953125, -0.004744529724121094, -0.0034580230712890625, -0.0021715164184570312, -0.000885009765625, 0.00040149688720703125, 0.0016880035400390625, 0.0029745101928710938, 0.004261016845703125, 0.005547523498535156, 0.0068340301513671875, 0.008120536804199219, 0.00940704345703125, 0.010693550109863281, 0.011980056762695312, 0.013266563415527344, 0.014553070068359375, 0.015839576721191406, 0.017126083374023438, 0.01841259002685547, 0.0196990966796875, 0.02098560333251953, 0.022272109985351562, 0.023558616638183594, 0.024845123291015625, 0.026131629943847656, 0.027418136596679688, 0.02870464324951172, 0.02999114990234375, 0.03127765655517578, 0.03256416320800781, 0.033850669860839844, 0.035137176513671875, 0.036423683166503906, 0.03771018981933594, 0.03899669647216797, 0.040283203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 13.0, 13.0, 21.0, 43.0, 43.0, 97.0, 138.0, 372.0, 1727.0, 68309.0, 969309.0, 7228.0, 650.0, 259.0, 122.0, 72.0, 39.0, 19.0, 19.0, 13.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7869720458984375, -0.760955810546875, -0.7349395751953125, -0.70892333984375, -0.6829071044921875, -0.656890869140625, -0.6308746337890625, -0.6048583984375, -0.5788421630859375, -0.552825927734375, -0.5268096923828125, -0.50079345703125, -0.4747772216796875, -0.448760986328125, -0.4227447509765625, -0.396728515625, -0.3707122802734375, -0.344696044921875, -0.3186798095703125, -0.29266357421875, -0.2666473388671875, -0.240631103515625, -0.2146148681640625, -0.1885986328125, -0.1625823974609375, -0.136566162109375, -0.1105499267578125, -0.08453369140625, -0.0585174560546875, -0.032501220703125, -0.0064849853515625, 0.01953125, 0.0455474853515625, 0.071563720703125, 0.0975799560546875, 0.12359619140625, 0.1496124267578125, 0.175628662109375, 0.2016448974609375, 0.2276611328125, 0.2536773681640625, 0.279693603515625, 0.3057098388671875, 0.33172607421875, 0.3577423095703125, 0.383758544921875, 0.4097747802734375, 0.435791015625, 0.4618072509765625, 0.487823486328125, 0.5138397216796875, 0.53985595703125, 0.5658721923828125, 0.591888427734375, 0.6179046630859375, 0.6439208984375, 0.6699371337890625, 0.695953369140625, 0.7219696044921875, 0.74798583984375, 0.7740020751953125, 0.800018310546875, 0.8260345458984375, 0.85205078125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 26.0, 92.0, 425.0, 315.0, 86.0, 30.0, 17.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12032121419906616, -0.1093047633767128, -0.09828831255435944, -0.08727185428142548, -0.07625540345907211, -0.06523895263671875, -0.05422249436378479, -0.04320604354143143, -0.032189592719078064, -0.02117314003407955, -0.01015668734908104, 0.0008597671985626221, 0.011876218020915985, 0.022892668843269348, 0.03390912711620331, 0.04492557793855667, 0.055942028760910034, 0.0669584795832634, 0.07797493040561676, 0.08899138867855072, 0.10000783950090408, 0.11102429032325745, 0.1220407485961914, 0.13305720686912537, 0.14407365024089813, 0.1550901085138321, 0.16610655188560486, 0.17712301015853882, 0.18813946843147278, 0.19915591180324554, 0.2101723700761795, 0.22118881344795227, 0.23220527172088623, 0.2432217299938202, 0.25423818826675415, 0.2652546167373657, 0.2762710750102997, 0.28728753328323364, 0.2983039915561676, 0.30932044982910156, 0.32033687829971313, 0.3313533365726471, 0.34236979484558105, 0.3533862233161926, 0.3644026815891266, 0.37541913986206055, 0.3864355981349945, 0.39745205640792847, 0.4084685146808624, 0.4194849729537964, 0.43050143122673035, 0.4415178894996643, 0.4525343179702759, 0.46355077624320984, 0.4745672345161438, 0.48558369278907776, 0.4966001510620117, 0.5076165795326233, 0.5186330676078796, 0.5296494960784912, 0.5406659841537476, 0.5516824126243591, 0.5626988410949707, 0.573715329170227, 0.5847317576408386]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 9.0, 8.0, 13.0, 15.0, 10.0, 20.0, 27.0, 20.0, 26.0, 28.0, 19.0, 29.0, 27.0, 32.0, 32.0, 37.0, 27.0, 42.0, 33.0, 39.0, 44.0, 27.0, 38.0, 32.0, 56.0, 37.0, 42.0, 29.0, 30.0, 25.0, 19.0, 19.0, 19.0, 20.0, 16.0, 5.0, 9.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048168838024139404, -0.04663674533367157, -0.045104652643203735, -0.0435725562274456, -0.04204046353697777, -0.040508370846509933, -0.0389762744307518, -0.037444181740283966, -0.03591208904981613, -0.0343799963593483, -0.03284790366888046, -0.03131580725312233, -0.029783714562654495, -0.02825162187218666, -0.026719527319073677, -0.025187432765960693, -0.02365534007549286, -0.022123247385025024, -0.02059115283191204, -0.019059058278799057, -0.017526965588331223, -0.015994872897863388, -0.014462778344750404, -0.012930684722959995, -0.011398591101169586, -0.009866497479379177, -0.008334403857588768, -0.006802310235798359, -0.00527021661400795, -0.0037381229922175407, -0.0022060293704271317, -0.0006739357486367226, 0.0008581578731536865, 0.0023902514949440956, 0.003922345116734505, 0.005454438738524914, 0.006986532360315323, 0.008518625982105732, 0.010050719603896141, 0.01158281322568655, 0.01311490684747696, 0.014647000469267368, 0.016179094091057777, 0.01771118864417076, 0.019243281334638596, 0.02077537402510643, 0.022307468578219414, 0.023839563131332397, 0.025371655821800232, 0.026903748512268066, 0.02843584306538105, 0.029967937618494034, 0.03150003030896187, 0.0330321229994297, 0.034564219415187836, 0.03609631210565567, 0.037628404796123505, 0.03916049748659134, 0.040692590177059174, 0.042224686592817307, 0.04375677928328514, 0.045288871973752975, 0.04682096838951111, 0.04835306107997894, 0.04988515377044678]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 4.0, 12.0, 10.0, 17.0, 19.0, 22.0, 17.0, 14.0, 30.0, 32.0, 38.0, 28.0, 41.0, 40.0, 40.0, 52.0, 45.0, 55.0, 32.0, 50.0, 34.0, 38.0, 49.0, 30.0, 32.0, 26.0, 33.0, 19.0, 18.0, 18.0, 14.0, 14.0, 9.0, 7.0, 14.0, 8.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.09375, -14.6563720703125, -14.218994140625, -13.7816162109375, -13.34423828125, -12.9068603515625, -12.469482421875, -12.0321044921875, -11.5947265625, -11.1573486328125, -10.719970703125, -10.2825927734375, -9.84521484375, -9.4078369140625, -8.970458984375, -8.5330810546875, -8.095703125, -7.6583251953125, -7.220947265625, -6.7835693359375, -6.34619140625, -5.9088134765625, -5.471435546875, -5.0340576171875, -4.5966796875, -4.1593017578125, -3.721923828125, -3.2845458984375, -2.84716796875, -2.4097900390625, -1.972412109375, -1.5350341796875, -1.09765625, -0.6602783203125, -0.222900390625, 0.2144775390625, 0.65185546875, 1.0892333984375, 1.526611328125, 1.9639892578125, 2.4013671875, 2.8387451171875, 3.276123046875, 3.7135009765625, 4.15087890625, 4.5882568359375, 5.025634765625, 5.4630126953125, 5.900390625, 6.3377685546875, 6.775146484375, 7.2125244140625, 7.64990234375, 8.0872802734375, 8.524658203125, 8.9620361328125, 9.3994140625, 9.8367919921875, 10.274169921875, 10.7115478515625, 11.14892578125, 11.5863037109375, 12.023681640625, 12.4610595703125, 12.8984375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 13.0, 14.0, 11.0, 11.0, 20.0, 20.0, 26.0, 36.0, 52.0, 71.0, 146.0, 260.0, 708.0, 1959.0, 7229.0, 29680.0, 142554.0, 573571.0, 230662.0, 46188.0, 10642.0, 2934.0, 878.0, 332.0, 180.0, 85.0, 71.0, 26.0, 37.0, 32.0, 20.0, 15.0, 17.0, 10.0, 4.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4671630859375, -8.160888671875, -7.8546142578125, -7.54833984375, -7.2420654296875, -6.935791015625, -6.6295166015625, -6.3232421875, -6.0169677734375, -5.710693359375, -5.4044189453125, -5.09814453125, -4.7918701171875, -4.485595703125, -4.1793212890625, -3.873046875, -3.5667724609375, -3.260498046875, -2.9542236328125, -2.64794921875, -2.3416748046875, -2.035400390625, -1.7291259765625, -1.4228515625, -1.1165771484375, -0.810302734375, -0.5040283203125, -0.19775390625, 0.1085205078125, 0.414794921875, 0.7210693359375, 1.02734375, 1.3336181640625, 1.639892578125, 1.9461669921875, 2.25244140625, 2.5587158203125, 2.864990234375, 3.1712646484375, 3.4775390625, 3.7838134765625, 4.090087890625, 4.3963623046875, 4.70263671875, 5.0089111328125, 5.315185546875, 5.6214599609375, 5.927734375, 6.2340087890625, 6.540283203125, 6.8465576171875, 7.15283203125, 7.4591064453125, 7.765380859375, 8.0716552734375, 8.3779296875, 8.6842041015625, 8.990478515625, 9.2967529296875, 9.60302734375, 9.9093017578125, 10.215576171875, 10.5218505859375, 10.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 7.0, 9.0, 14.0, 13.0, 19.0, 19.0, 21.0, 25.0, 32.0, 33.0, 40.0, 55.0, 50.0, 62.0, 78.0, 350.0, 1687.0, 85.0, 55.0, 52.0, 43.0, 39.0, 36.0, 18.0, 31.0, 27.0, 26.0, 23.0, 18.0, 12.0, 9.0, 12.0, 6.0, 7.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.71875, -46.318359375, -44.91796875, -43.517578125, -42.1171875, -40.716796875, -39.31640625, -37.916015625, -36.515625, -35.115234375, -33.71484375, -32.314453125, -30.9140625, -29.513671875, -28.11328125, -26.712890625, -25.3125, -23.912109375, -22.51171875, -21.111328125, -19.7109375, -18.310546875, -16.91015625, -15.509765625, -14.109375, -12.708984375, -11.30859375, -9.908203125, -8.5078125, -7.107421875, -5.70703125, -4.306640625, -2.90625, -1.505859375, -0.10546875, 1.294921875, 2.6953125, 4.095703125, 5.49609375, 6.896484375, 8.296875, 9.697265625, 11.09765625, 12.498046875, 13.8984375, 15.298828125, 16.69921875, 18.099609375, 19.5, 20.900390625, 22.30078125, 23.701171875, 25.1015625, 26.501953125, 27.90234375, 29.302734375, 30.703125, 32.103515625, 33.50390625, 34.904296875, 36.3046875, 37.705078125, 39.10546875, 40.505859375, 41.90625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 6.0, 7.0, 11.0, 7.0, 13.0, 14.0, 21.0, 31.0, 34.0, 54.0, 60.0, 75.0, 107.0, 132.0, 191.0, 300.0, 653.0, 3671.0, 3066963.0, 70334.0, 1642.0, 480.0, 236.0, 180.0, 112.0, 84.0, 67.0, 47.0, 37.0, 29.0, 24.0, 17.0, 14.0, 11.0, 6.0, 13.0, 5.0, 7.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.6875, -87.64453125, -84.6015625, -81.55859375, -78.515625, -75.47265625, -72.4296875, -69.38671875, -66.34375, -63.30078125, -60.2578125, -57.21484375, -54.171875, -51.12890625, -48.0859375, -45.04296875, -42.0, -38.95703125, -35.9140625, -32.87109375, -29.828125, -26.78515625, -23.7421875, -20.69921875, -17.65625, -14.61328125, -11.5703125, -8.52734375, -5.484375, -2.44140625, 0.6015625, 3.64453125, 6.6875, 9.73046875, 12.7734375, 15.81640625, 18.859375, 21.90234375, 24.9453125, 27.98828125, 31.03125, 34.07421875, 37.1171875, 40.16015625, 43.203125, 46.24609375, 49.2890625, 52.33203125, 55.375, 58.41796875, 61.4609375, 64.50390625, 67.546875, 70.58984375, 73.6328125, 76.67578125, 79.71875, 82.76171875, 85.8046875, 88.84765625, 91.890625, 94.93359375, 97.9765625, 101.01953125, 104.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 930.0, 60.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-753.763671875, -740.4360961914062, -727.1084594726562, -713.7808837890625, -700.4532470703125, -687.1256713867188, -673.7980346679688, -660.470458984375, -647.142822265625, -633.8152465820312, -620.4876098632812, -607.1600341796875, -593.8323974609375, -580.5048217773438, -567.1771850585938, -553.849609375, -540.5220336914062, -527.1944580078125, -513.8668212890625, -500.5392150878906, -487.21160888671875, -473.884033203125, -460.556396484375, -447.22882080078125, -433.90118408203125, -420.5735778808594, -407.2459716796875, -393.9183654785156, -380.59075927734375, -367.26318359375, -353.935546875, -340.60797119140625, -327.28033447265625, -313.9527282714844, -300.6251220703125, -287.2975158691406, -273.96990966796875, -260.642333984375, -247.31471252441406, -233.98712158203125, -220.65951538085938, -207.3319091796875, -194.00430297851562, -180.67669677734375, -167.34910583496094, -154.02149963378906, -140.6938934326172, -127.36629486083984, -114.03868865966797, -100.7110824584961, -87.38348388671875, -74.05587768554688, -60.728275299072266, -47.400672912597656, -34.07306671142578, -20.745468139648438, -7.4178619384765625, 5.909741401672363, 19.23734474182129, 32.56494903564453, 45.89255142211914, 59.22015380859375, 72.54776000976562, 85.87535858154297, 99.20296478271484]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 11.0, 7.0, 10.0, 6.0, 14.0, 9.0, 15.0, 19.0, 18.0, 22.0, 20.0, 19.0, 27.0, 21.0, 22.0, 19.0, 17.0, 42.0, 29.0, 38.0, 45.0, 42.0, 41.0, 38.0, 43.0, 27.0, 35.0, 42.0, 34.0, 32.0, 24.0, 29.0, 31.0, 20.0, 21.0, 14.0, 25.0, 8.0, 8.0, 8.0, 8.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-97.35313415527344, -93.98736572265625, -90.62159729003906, -87.25582885742188, -83.89006042480469, -80.5242919921875, -77.15852355957031, -73.79275512695312, -70.42698669433594, -67.06121826171875, -63.69544982910156, -60.329681396484375, -56.96391296386719, -53.59814453125, -50.23237228393555, -46.86660385131836, -43.500831604003906, -40.13506317138672, -36.76929473876953, -33.403526306152344, -30.037755966186523, -26.671987533569336, -23.306217193603516, -19.940448760986328, -16.57468032836914, -13.208911895751953, -9.84314250946045, -6.477373123168945, -3.111604690551758, 0.2541637420654297, 3.61993408203125, 6.9857025146484375, 10.351463317871094, 13.717231750488281, 17.08300018310547, 20.44877052307129, 23.814538955688477, 27.180307388305664, 30.546077728271484, 33.91184616088867, 37.27761459350586, 40.64338302612305, 44.009151458740234, 47.37492370605469, 50.740692138671875, 54.10646057128906, 57.47222900390625, 60.83799743652344, 64.20376586914062, 67.56953430175781, 70.935302734375, 74.30107116699219, 77.66683959960938, 81.03260803222656, 84.39837646484375, 87.76414489746094, 91.12991333007812, 94.49568176269531, 97.8614501953125, 101.22721862792969, 104.59298706054688, 107.95875549316406, 111.32452392578125, 114.69029235839844, 118.05606842041016]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 10.0, 14.0, 17.0, 16.0, 21.0, 19.0, 18.0, 34.0, 32.0, 29.0, 44.0, 37.0, 40.0, 45.0, 45.0, 52.0, 36.0, 46.0, 41.0, 43.0, 42.0, 43.0, 31.0, 35.0, 22.0, 19.0, 21.0, 17.0, 16.0, 17.0, 11.0, 7.0, 8.0, 15.0, 9.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.1171875, -14.673828125, -14.23046875, -13.787109375, -13.34375, -12.900390625, -12.45703125, -12.013671875, -11.5703125, -11.126953125, -10.68359375, -10.240234375, -9.796875, -9.353515625, -8.91015625, -8.466796875, -8.0234375, -7.580078125, -7.13671875, -6.693359375, -6.25, -5.806640625, -5.36328125, -4.919921875, -4.4765625, -4.033203125, -3.58984375, -3.146484375, -2.703125, -2.259765625, -1.81640625, -1.373046875, -0.9296875, -0.486328125, -0.04296875, 0.400390625, 0.84375, 1.287109375, 1.73046875, 2.173828125, 2.6171875, 3.060546875, 3.50390625, 3.947265625, 4.390625, 4.833984375, 5.27734375, 5.720703125, 6.1640625, 6.607421875, 7.05078125, 7.494140625, 7.9375, 8.380859375, 8.82421875, 9.267578125, 9.7109375, 10.154296875, 10.59765625, 11.041015625, 11.484375, 11.927734375, 12.37109375, 12.814453125, 13.2578125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 4.0, 12.0, 11.0, 10.0, 19.0, 21.0, 30.0, 38.0, 37.0, 64.0, 79.0, 110.0, 214.0, 527.0, 1316.0, 3713.0, 11272.0, 132950.0, 3935442.0, 91584.0, 10679.0, 3646.0, 1341.0, 533.0, 213.0, 96.0, 63.0, 52.0, 42.0, 32.0, 33.0, 20.0, 17.0, 15.0, 12.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-83.625, -81.33203125, -79.0390625, -76.74609375, -74.453125, -72.16015625, -69.8671875, -67.57421875, -65.28125, -62.98828125, -60.6953125, -58.40234375, -56.109375, -53.81640625, -51.5234375, -49.23046875, -46.9375, -44.64453125, -42.3515625, -40.05859375, -37.765625, -35.47265625, -33.1796875, -30.88671875, -28.59375, -26.30078125, -24.0078125, -21.71484375, -19.421875, -17.12890625, -14.8359375, -12.54296875, -10.25, -7.95703125, -5.6640625, -3.37109375, -1.078125, 1.21484375, 3.5078125, 5.80078125, 8.09375, 10.38671875, 12.6796875, 14.97265625, 17.265625, 19.55859375, 21.8515625, 24.14453125, 26.4375, 28.73046875, 31.0234375, 33.31640625, 35.609375, 37.90234375, 40.1953125, 42.48828125, 44.78125, 47.07421875, 49.3671875, 51.66015625, 53.953125, 56.24609375, 58.5390625, 60.83203125, 63.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 16.0, 25.0, 34.0, 44.0, 50.0, 91.0, 234.0, 558.0, 1073.0, 1000.0, 458.0, 202.0, 73.0, 61.0, 33.0, 22.0, 10.0, 17.0, 13.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.25, -38.94677734375, -37.6435546875, -36.34033203125, -35.037109375, -33.73388671875, -32.4306640625, -31.12744140625, -29.82421875, -28.52099609375, -27.2177734375, -25.91455078125, -24.611328125, -23.30810546875, -22.0048828125, -20.70166015625, -19.3984375, -18.09521484375, -16.7919921875, -15.48876953125, -14.185546875, -12.88232421875, -11.5791015625, -10.27587890625, -8.97265625, -7.66943359375, -6.3662109375, -5.06298828125, -3.759765625, -2.45654296875, -1.1533203125, 0.14990234375, 1.453125, 2.75634765625, 4.0595703125, 5.36279296875, 6.666015625, 7.96923828125, 9.2724609375, 10.57568359375, 11.87890625, 13.18212890625, 14.4853515625, 15.78857421875, 17.091796875, 18.39501953125, 19.6982421875, 21.00146484375, 22.3046875, 23.60791015625, 24.9111328125, 26.21435546875, 27.517578125, 28.82080078125, 30.1240234375, 31.42724609375, 32.73046875, 34.03369140625, 35.3369140625, 36.64013671875, 37.943359375, 39.24658203125, 40.5498046875, 41.85302734375, 43.15625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 12.0, 16.0, 29.0, 40.0, 87.0, 195.0, 450.0, 986.0, 2660.0, 8852.0, 45940.0, 3670186.0, 431922.0, 24201.0, 5456.0, 1834.0, 712.0, 324.0, 170.0, 91.0, 42.0, 16.0, 13.0, 12.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.125, -107.83984375, -104.5546875, -101.26953125, -97.984375, -94.69921875, -91.4140625, -88.12890625, -84.84375, -81.55859375, -78.2734375, -74.98828125, -71.703125, -68.41796875, -65.1328125, -61.84765625, -58.5625, -55.27734375, -51.9921875, -48.70703125, -45.421875, -42.13671875, -38.8515625, -35.56640625, -32.28125, -28.99609375, -25.7109375, -22.42578125, -19.140625, -15.85546875, -12.5703125, -9.28515625, -6.0, -2.71484375, 0.5703125, 3.85546875, 7.140625, 10.42578125, 13.7109375, 16.99609375, 20.28125, 23.56640625, 26.8515625, 30.13671875, 33.421875, 36.70703125, 39.9921875, 43.27734375, 46.5625, 49.84765625, 53.1328125, 56.41796875, 59.703125, 62.98828125, 66.2734375, 69.55859375, 72.84375, 76.12890625, 79.4140625, 82.69921875, 85.984375, 89.26953125, 92.5546875, 95.83984375, 99.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 6.0, 13.0, 11.0, 16.0, 27.0, 20.0, 45.0, 59.0, 89.0, 102.0, 148.0, 131.0, 94.0, 73.0, 43.0, 27.0, 29.0, 13.0, 9.0, 13.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-146.2808074951172, -142.3976287841797, -138.51443481445312, -134.63125610351562, -130.74807739257812, -126.86489868164062, -122.9817123413086, -119.09852600097656, -115.21534729003906, -111.33216857910156, -107.44898223876953, -103.5657958984375, -99.6826171875, -95.7994384765625, -91.91625213623047, -88.03306579589844, -84.14988708496094, -80.26670837402344, -76.3835220336914, -72.50033569335938, -68.61715698242188, -64.73397827148438, -60.850791931152344, -56.96760940551758, -53.08442687988281, -49.20124435424805, -45.31806182861328, -41.434879302978516, -37.55169677734375, -33.668514251708984, -29.78533172607422, -25.902149200439453, -22.018959045410156, -18.13577651977539, -14.252593994140625, -10.36941146850586, -6.486228942871094, -2.603046417236328, 1.2801361083984375, 5.163318634033203, 9.046501159667969, 12.929683685302734, 16.8128662109375, 20.696048736572266, 24.57923126220703, 28.462413787841797, 32.34559631347656, 36.22877883911133, 40.111961364746094, 43.99514389038086, 47.878326416015625, 51.76150894165039, 55.644691467285156, 59.52787399291992, 63.41105651855469, 67.29423522949219, 71.17742156982422, 75.06060791015625, 78.94378662109375, 82.82696533203125, 86.71015167236328, 90.59333801269531, 94.47651672363281, 98.35969543457031, 102.24288177490234]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 7.0, 8.0, 18.0, 26.0, 17.0, 21.0, 22.0, 26.0, 36.0, 23.0, 38.0, 48.0, 40.0, 38.0, 32.0, 34.0, 41.0, 41.0, 44.0, 43.0, 37.0, 40.0, 39.0, 28.0, 30.0, 31.0, 19.0, 21.0, 12.0, 25.0, 19.0, 11.0, 14.0, 10.0, 9.0, 7.0, 4.0, 6.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.97794342041016, -72.29045104980469, -69.60296630859375, -66.91548156738281, -64.22798919677734, -61.54050064086914, -58.85301208496094, -56.165523529052734, -53.47803497314453, -50.79054641723633, -48.103057861328125, -45.41556930541992, -42.72808074951172, -40.040592193603516, -37.35310363769531, -34.66561508178711, -31.978126525878906, -29.290637969970703, -26.6031494140625, -23.915660858154297, -21.228172302246094, -18.54068374633789, -15.853195190429688, -13.165706634521484, -10.478218078613281, -7.790729522705078, -5.103240966796875, -2.415752410888672, 0.27173614501953125, 2.9592247009277344, 5.6467132568359375, 8.33420181274414, 11.021697998046875, 13.709186553955078, 16.39667510986328, 19.084163665771484, 21.771652221679688, 24.45914077758789, 27.146629333496094, 29.834117889404297, 32.5216064453125, 35.2090950012207, 37.896583557128906, 40.58407211303711, 43.27156066894531, 45.959049224853516, 48.64653778076172, 51.33402633666992, 54.021514892578125, 56.70900344848633, 59.39649200439453, 62.083980560302734, 64.77146911621094, 67.45895385742188, 70.14644622802734, 72.83393859863281, 75.52142333984375, 78.20890808105469, 80.89640045166016, 83.58389282226562, 86.27137756347656, 88.9588623046875, 91.64635467529297, 94.33384704589844, 97.02133178710938]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 10.0, 4.0, 12.0, 10.0, 12.0, 21.0, 19.0, 28.0, 31.0, 39.0, 41.0, 37.0, 44.0, 45.0, 46.0, 38.0, 44.0, 53.0, 59.0, 41.0, 45.0, 41.0, 36.0, 31.0, 30.0, 33.0, 32.0, 15.0, 16.0, 13.0, 18.0, 10.0, 11.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.71875, -16.22802734375, -15.7373046875, -15.24658203125, -14.755859375, -14.26513671875, -13.7744140625, -13.28369140625, -12.79296875, -12.30224609375, -11.8115234375, -11.32080078125, -10.830078125, -10.33935546875, -9.8486328125, -9.35791015625, -8.8671875, -8.37646484375, -7.8857421875, -7.39501953125, -6.904296875, -6.41357421875, -5.9228515625, -5.43212890625, -4.94140625, -4.45068359375, -3.9599609375, -3.46923828125, -2.978515625, -2.48779296875, -1.9970703125, -1.50634765625, -1.015625, -0.52490234375, -0.0341796875, 0.45654296875, 0.947265625, 1.43798828125, 1.9287109375, 2.41943359375, 2.91015625, 3.40087890625, 3.8916015625, 4.38232421875, 4.873046875, 5.36376953125, 5.8544921875, 6.34521484375, 6.8359375, 7.32666015625, 7.8173828125, 8.30810546875, 8.798828125, 9.28955078125, 9.7802734375, 10.27099609375, 10.76171875, 11.25244140625, 11.7431640625, 12.23388671875, 12.724609375, 13.21533203125, 13.7060546875, 14.19677734375, 14.6875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 10.0, 20.0, 21.0, 20.0, 36.0, 49.0, 55.0, 72.0, 146.0, 209.0, 292.0, 468.0, 763.0, 1097.0, 1780.0, 2777.0, 4194.0, 6669.0, 10935.0, 17791.0, 29223.0, 48866.0, 84949.0, 155109.0, 248800.0, 185444.0, 102381.0, 58099.0, 33934.0, 20425.0, 12413.0, 7886.0, 5008.0, 3044.0, 2005.0, 1199.0, 814.0, 565.0, 344.0, 243.0, 141.0, 96.0, 40.0, 40.0, 14.0, 22.0, 11.0, 13.0, 7.0, 4.0, 1.0, 5.0, 5.0, 2.0, 7.0, 0.0, 1.0, 2.0], "bins": [-1.57421875, -1.522857666015625, -1.47149658203125, -1.420135498046875, -1.3687744140625, -1.317413330078125, -1.26605224609375, -1.214691162109375, -1.163330078125, -1.111968994140625, -1.06060791015625, -1.009246826171875, -0.9578857421875, -0.906524658203125, -0.85516357421875, -0.803802490234375, -0.75244140625, -0.701080322265625, -0.64971923828125, -0.598358154296875, -0.5469970703125, -0.495635986328125, -0.44427490234375, -0.392913818359375, -0.341552734375, -0.290191650390625, -0.23883056640625, -0.187469482421875, -0.1361083984375, -0.084747314453125, -0.03338623046875, 0.017974853515625, 0.0693359375, 0.120697021484375, 0.17205810546875, 0.223419189453125, 0.2747802734375, 0.326141357421875, 0.37750244140625, 0.428863525390625, 0.480224609375, 0.531585693359375, 0.58294677734375, 0.634307861328125, 0.6856689453125, 0.737030029296875, 0.78839111328125, 0.839752197265625, 0.89111328125, 0.942474365234375, 0.99383544921875, 1.045196533203125, 1.0965576171875, 1.147918701171875, 1.19927978515625, 1.250640869140625, 1.302001953125, 1.353363037109375, 1.40472412109375, 1.456085205078125, 1.5074462890625, 1.558807373046875, 1.61016845703125, 1.661529541015625, 1.712890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 5.0, 4.0, 8.0, 10.0, 12.0, 7.0, 14.0, 17.0, 17.0, 24.0, 22.0, 28.0, 38.0, 20.0, 29.0, 38.0, 44.0, 36.0, 39.0, 34.0, 43.0, 1071.0, 45.0, 39.0, 44.0, 29.0, 32.0, 35.0, 38.0, 32.0, 20.0, 24.0, 20.0, 16.0, 10.0, 17.0, 15.0, 10.0, 10.0, 7.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.78564453125, -7.5087890625, -7.23193359375, -6.955078125, -6.67822265625, -6.4013671875, -6.12451171875, -5.84765625, -5.57080078125, -5.2939453125, -5.01708984375, -4.740234375, -4.46337890625, -4.1865234375, -3.90966796875, -3.6328125, -3.35595703125, -3.0791015625, -2.80224609375, -2.525390625, -2.24853515625, -1.9716796875, -1.69482421875, -1.41796875, -1.14111328125, -0.8642578125, -0.58740234375, -0.310546875, -0.03369140625, 0.2431640625, 0.52001953125, 0.796875, 1.07373046875, 1.3505859375, 1.62744140625, 1.904296875, 2.18115234375, 2.4580078125, 2.73486328125, 3.01171875, 3.28857421875, 3.5654296875, 3.84228515625, 4.119140625, 4.39599609375, 4.6728515625, 4.94970703125, 5.2265625, 5.50341796875, 5.7802734375, 6.05712890625, 6.333984375, 6.61083984375, 6.8876953125, 7.16455078125, 7.44140625, 7.71826171875, 7.9951171875, 8.27197265625, 8.548828125, 8.82568359375, 9.1025390625, 9.37939453125, 9.65625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 12.0, 14.0, 26.0, 41.0, 51.0, 85.0, 171.0, 246.0, 389.0, 612.0, 932.0, 1436.0, 2379.0, 3807.0, 6178.0, 9881.0, 16273.0, 26850.0, 47361.0, 88540.0, 170944.0, 1310818.0, 187683.0, 96220.0, 51404.0, 29115.0, 17288.0, 10674.0, 6416.0, 4214.0, 2703.0, 1580.0, 1011.0, 645.0, 429.0, 241.0, 156.0, 91.0, 79.0, 35.0, 37.0, 22.0, 14.0, 13.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98193359375, -0.9517822265625, -0.921630859375, -0.8914794921875, -0.861328125, -0.8311767578125, -0.801025390625, -0.7708740234375, -0.74072265625, -0.7105712890625, -0.680419921875, -0.6502685546875, -0.6201171875, -0.5899658203125, -0.559814453125, -0.5296630859375, -0.49951171875, -0.4693603515625, -0.439208984375, -0.4090576171875, -0.37890625, -0.3487548828125, -0.318603515625, -0.2884521484375, -0.25830078125, -0.2281494140625, -0.197998046875, -0.1678466796875, -0.1376953125, -0.1075439453125, -0.077392578125, -0.0472412109375, -0.01708984375, 0.0130615234375, 0.043212890625, 0.0733642578125, 0.103515625, 0.1336669921875, 0.163818359375, 0.1939697265625, 0.22412109375, 0.2542724609375, 0.284423828125, 0.3145751953125, 0.3447265625, 0.3748779296875, 0.405029296875, 0.4351806640625, 0.46533203125, 0.4954833984375, 0.525634765625, 0.5557861328125, 0.5859375, 0.6160888671875, 0.646240234375, 0.6763916015625, 0.70654296875, 0.7366943359375, 0.766845703125, 0.7969970703125, 0.8271484375, 0.8572998046875, 0.887451171875, 0.9176025390625, 0.94775390625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 6.0, 17.0, 16.0, 14.0, 19.0, 30.0, 43.0, 57.0, 80.0, 139.0, 160.0, 131.0, 66.0, 49.0, 29.0, 24.0, 16.0, 14.0, 11.0, 16.0, 4.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05169677734375, -0.05014657974243164, -0.04859638214111328, -0.04704618453979492, -0.04549598693847656, -0.0439457893371582, -0.042395591735839844, -0.040845394134521484, -0.039295196533203125, -0.037744998931884766, -0.036194801330566406, -0.03464460372924805, -0.03309440612792969, -0.03154420852661133, -0.02999401092529297, -0.02844381332397461, -0.02689361572265625, -0.02534341812133789, -0.02379322052001953, -0.022243022918701172, -0.020692825317382812, -0.019142627716064453, -0.017592430114746094, -0.016042232513427734, -0.014492034912109375, -0.012941837310791016, -0.011391639709472656, -0.009841442108154297, -0.008291244506835938, -0.006741046905517578, -0.005190849304199219, -0.0036406517028808594, -0.0020904541015625, -0.0005402565002441406, 0.0010099411010742188, 0.002560138702392578, 0.0041103363037109375, 0.005660533905029297, 0.007210731506347656, 0.008760929107666016, 0.010311126708984375, 0.011861324310302734, 0.013411521911621094, 0.014961719512939453, 0.016511917114257812, 0.018062114715576172, 0.01961231231689453, 0.02116250991821289, 0.02271270751953125, 0.02426290512084961, 0.02581310272216797, 0.027363300323486328, 0.028913497924804688, 0.030463695526123047, 0.032013893127441406, 0.033564090728759766, 0.035114288330078125, 0.036664485931396484, 0.038214683532714844, 0.0397648811340332, 0.04131507873535156, 0.04286527633666992, 0.04441547393798828, 0.04596567153930664, 0.047515869140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 11.0, 18.0, 15.0, 33.0, 48.0, 61.0, 123.0, 227.0, 835.0, 11543.0, 984434.0, 48648.0, 1809.0, 313.0, 150.0, 84.0, 55.0, 30.0, 26.0, 21.0, 12.0, 8.0, 9.0, 7.0, 8.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0108642578125, -0.976806640625, -0.9427490234375, -0.90869140625, -0.8746337890625, -0.840576171875, -0.8065185546875, -0.7724609375, -0.7384033203125, -0.704345703125, -0.6702880859375, -0.63623046875, -0.6021728515625, -0.568115234375, -0.5340576171875, -0.5, -0.4659423828125, -0.431884765625, -0.3978271484375, -0.36376953125, -0.3297119140625, -0.295654296875, -0.2615966796875, -0.2275390625, -0.1934814453125, -0.159423828125, -0.1253662109375, -0.09130859375, -0.0572509765625, -0.023193359375, 0.0108642578125, 0.044921875, 0.0789794921875, 0.113037109375, 0.1470947265625, 0.18115234375, 0.2152099609375, 0.249267578125, 0.2833251953125, 0.3173828125, 0.3514404296875, 0.385498046875, 0.4195556640625, 0.45361328125, 0.4876708984375, 0.521728515625, 0.5557861328125, 0.58984375, 0.6239013671875, 0.657958984375, 0.6920166015625, 0.72607421875, 0.7601318359375, 0.794189453125, 0.8282470703125, 0.8623046875, 0.8963623046875, 0.930419921875, 0.9644775390625, 0.99853515625, 1.0325927734375, 1.066650390625, 1.1007080078125, 1.134765625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 13.0, 42.0, 96.0, 476.0, 221.0, 89.0, 39.0, 16.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42249006032943726, -0.4096030294895172, -0.39671602845191956, -0.3838289976119995, -0.37094199657440186, -0.3580549657344818, -0.34516793489456177, -0.3322809338569641, -0.31939390301704407, -0.306506872177124, -0.29361987113952637, -0.2807328402996063, -0.26784583926200867, -0.2549588084220886, -0.24207179248332977, -0.22918477654457092, -0.21629776060581207, -0.20341074466705322, -0.19052372872829437, -0.17763671278953552, -0.16474968194961548, -0.15186266601085663, -0.13897565007209778, -0.12608861923217773, -0.11320161074399948, -0.10031459480524063, -0.08742757141590118, -0.07454055547714233, -0.061653535813093185, -0.04876651614904404, -0.03587950021028519, -0.02299247682094574, -0.01010546088218689, 0.0027815578505396843, 0.015668576583266258, 0.028555594384670258, 0.041442614048719406, 0.054329633712768555, 0.0672166496515274, 0.08010367304086685, 0.0929906889796257, 0.10587770491838455, 0.118764728307724, 0.13165174424648285, 0.1445387601852417, 0.15742579102516174, 0.1703127920627594, 0.18319982290267944, 0.1960868388414383, 0.20897385478019714, 0.221860870718956, 0.23474788665771484, 0.2476349174976349, 0.26052194833755493, 0.2734089493751526, 0.28629598021507263, 0.2991829812526703, 0.31207001209259033, 0.324957013130188, 0.33784404397010803, 0.3507310450077057, 0.36361807584762573, 0.3765050768852234, 0.38939210772514343, 0.4022791385650635]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 5.0, 5.0, 6.0, 16.0, 7.0, 19.0, 15.0, 16.0, 24.0, 12.0, 27.0, 24.0, 30.0, 28.0, 31.0, 34.0, 44.0, 28.0, 38.0, 39.0, 37.0, 36.0, 45.0, 33.0, 36.0, 43.0, 34.0, 34.0, 43.0, 23.0, 20.0, 24.0, 21.0, 24.0, 11.0, 15.0, 8.0, 11.0, 12.0, 3.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.05724400281906128, -0.05544813722372055, -0.05365227162837982, -0.051856402307748795, -0.050060536712408066, -0.04826467111706734, -0.04646880179643631, -0.04467293620109558, -0.04287707060575485, -0.041081205010414124, -0.039285339415073395, -0.03748947009444237, -0.03569360449910164, -0.03389773890376091, -0.03210186958312988, -0.030306003987789154, -0.028510138392448425, -0.026714272797107697, -0.02491840533912182, -0.02312253788113594, -0.021326672285795212, -0.019530806690454483, -0.017734939232468605, -0.015939071774482727, -0.014143206179141998, -0.012347339652478695, -0.010551473125815392, -0.008755606599152088, -0.006959740072488785, -0.005163873545825481, -0.003368007019162178, -0.0015721404924988747, 0.0002237260341644287, 0.002019592560827732, 0.0038154590874910355, 0.005611325614154339, 0.007407192140817642, 0.009203058667480946, 0.010998925194144249, 0.012794791720807552, 0.014590658247470856, 0.016386523842811584, 0.018182391300797462, 0.01997825875878334, 0.02177412435412407, 0.023569989949464798, 0.025365857407450676, 0.027161724865436554, 0.028957590460777283, 0.03075345605611801, 0.03254932165145874, 0.03434519097208977, 0.036141056567430496, 0.037936922162771225, 0.03973279148340225, 0.04152865707874298, 0.04332452267408371, 0.04512038826942444, 0.04691625386476517, 0.048712123185396194, 0.05050798878073692, 0.05230385437607765, 0.05409972369670868, 0.05589558929204941, 0.05769145488739014]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 10.0, 4.0, 12.0, 10.0, 12.0, 21.0, 19.0, 28.0, 33.0, 37.0, 41.0, 38.0, 43.0, 45.0, 46.0, 38.0, 44.0, 54.0, 58.0, 41.0, 45.0, 41.0, 36.0, 30.0, 31.0, 33.0, 32.0, 15.0, 16.0, 13.0, 18.0, 10.0, 11.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.71875, -16.22802734375, -15.7373046875, -15.24658203125, -14.755859375, -14.26513671875, -13.7744140625, -13.28369140625, -12.79296875, -12.30224609375, -11.8115234375, -11.32080078125, -10.830078125, -10.33935546875, -9.8486328125, -9.35791015625, -8.8671875, -8.37646484375, -7.8857421875, -7.39501953125, -6.904296875, -6.41357421875, -5.9228515625, -5.43212890625, -4.94140625, -4.45068359375, -3.9599609375, -3.46923828125, -2.978515625, -2.48779296875, -1.9970703125, -1.50634765625, -1.015625, -0.52490234375, -0.0341796875, 0.45654296875, 0.947265625, 1.43798828125, 1.9287109375, 2.41943359375, 2.91015625, 3.40087890625, 3.8916015625, 4.38232421875, 4.873046875, 5.36376953125, 5.8544921875, 6.34521484375, 6.8359375, 7.32666015625, 7.8173828125, 8.30810546875, 8.798828125, 9.28955078125, 9.7802734375, 10.27099609375, 10.76171875, 11.25244140625, 11.7431640625, 12.23388671875, 12.724609375, 13.21533203125, 13.7060546875, 14.19677734375, 14.6875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 18.0, 20.0, 27.0, 41.0, 57.0, 77.0, 138.0, 199.0, 312.0, 524.0, 797.0, 1228.0, 1913.0, 3359.0, 7987.0, 29222.0, 172196.0, 646635.0, 142970.0, 25304.0, 7222.0, 3160.0, 1811.0, 1157.0, 749.0, 484.0, 314.0, 188.0, 147.0, 84.0, 62.0, 32.0, 35.0, 22.0, 16.0, 8.0, 7.0, 1.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.1304931640625, -10.776611328125, -10.4227294921875, -10.06884765625, -9.7149658203125, -9.361083984375, -9.0072021484375, -8.6533203125, -8.2994384765625, -7.945556640625, -7.5916748046875, -7.23779296875, -6.8839111328125, -6.530029296875, -6.1761474609375, -5.822265625, -5.4683837890625, -5.114501953125, -4.7606201171875, -4.40673828125, -4.0528564453125, -3.698974609375, -3.3450927734375, -2.9912109375, -2.6373291015625, -2.283447265625, -1.9295654296875, -1.57568359375, -1.2218017578125, -0.867919921875, -0.5140380859375, -0.16015625, 0.1937255859375, 0.547607421875, 0.9014892578125, 1.25537109375, 1.6092529296875, 1.963134765625, 2.3170166015625, 2.6708984375, 3.0247802734375, 3.378662109375, 3.7325439453125, 4.08642578125, 4.4403076171875, 4.794189453125, 5.1480712890625, 5.501953125, 5.8558349609375, 6.209716796875, 6.5635986328125, 6.91748046875, 7.2713623046875, 7.625244140625, 7.9791259765625, 8.3330078125, 8.6868896484375, 9.040771484375, 9.3946533203125, 9.74853515625, 10.1024169921875, 10.456298828125, 10.8101806640625, 11.1640625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 4.0, 9.0, 7.0, 13.0, 9.0, 12.0, 21.0, 18.0, 28.0, 22.0, 40.0, 30.0, 38.0, 37.0, 33.0, 45.0, 59.0, 83.0, 1756.0, 268.0, 75.0, 43.0, 39.0, 40.0, 49.0, 38.0, 29.0, 27.0, 25.0, 20.0, 20.0, 19.0, 12.0, 16.0, 11.0, 13.0, 8.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.375, -33.1806640625, -31.986328125, -30.7919921875, -29.59765625, -28.4033203125, -27.208984375, -26.0146484375, -24.8203125, -23.6259765625, -22.431640625, -21.2373046875, -20.04296875, -18.8486328125, -17.654296875, -16.4599609375, -15.265625, -14.0712890625, -12.876953125, -11.6826171875, -10.48828125, -9.2939453125, -8.099609375, -6.9052734375, -5.7109375, -4.5166015625, -3.322265625, -2.1279296875, -0.93359375, 0.2607421875, 1.455078125, 2.6494140625, 3.84375, 5.0380859375, 6.232421875, 7.4267578125, 8.62109375, 9.8154296875, 11.009765625, 12.2041015625, 13.3984375, 14.5927734375, 15.787109375, 16.9814453125, 18.17578125, 19.3701171875, 20.564453125, 21.7587890625, 22.953125, 24.1474609375, 25.341796875, 26.5361328125, 27.73046875, 28.9248046875, 30.119140625, 31.3134765625, 32.5078125, 33.7021484375, 34.896484375, 36.0908203125, 37.28515625, 38.4794921875, 39.673828125, 40.8681640625, 42.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 12.0, 19.0, 22.0, 27.0, 34.0, 42.0, 60.0, 79.0, 87.0, 124.0, 157.0, 223.0, 327.0, 864.0, 9252.0, 3121293.0, 10928.0, 885.0, 320.0, 218.0, 149.0, 140.0, 87.0, 82.0, 57.0, 48.0, 36.0, 22.0, 21.0, 14.0, 10.0, 15.0, 9.0, 11.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.3125, -95.3798828125, -92.447265625, -89.5146484375, -86.58203125, -83.6494140625, -80.716796875, -77.7841796875, -74.8515625, -71.9189453125, -68.986328125, -66.0537109375, -63.12109375, -60.1884765625, -57.255859375, -54.3232421875, -51.390625, -48.4580078125, -45.525390625, -42.5927734375, -39.66015625, -36.7275390625, -33.794921875, -30.8623046875, -27.9296875, -24.9970703125, -22.064453125, -19.1318359375, -16.19921875, -13.2666015625, -10.333984375, -7.4013671875, -4.46875, -1.5361328125, 1.396484375, 4.3291015625, 7.26171875, 10.1943359375, 13.126953125, 16.0595703125, 18.9921875, 21.9248046875, 24.857421875, 27.7900390625, 30.72265625, 33.6552734375, 36.587890625, 39.5205078125, 42.453125, 45.3857421875, 48.318359375, 51.2509765625, 54.18359375, 57.1162109375, 60.048828125, 62.9814453125, 65.9140625, 68.8466796875, 71.779296875, 74.7119140625, 77.64453125, 80.5771484375, 83.509765625, 86.4423828125, 89.375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 23.0, 134.0, 426.0, 329.0, 89.0, 12.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34568214416504, -17.37533950805664, -14.404998779296875, -11.434657096862793, -8.464315414428711, -5.493973731994629, -2.523632049560547, 0.44671058654785156, 3.417051315307617, 6.387392997741699, 9.357734680175781, 12.328076362609863, 15.298418045043945, 18.268760681152344, 21.23910140991211, 24.209444046020508, 27.179784774780273, 30.150127410888672, 33.12046813964844, 36.0908088684082, 39.06114959716797, 42.031494140625, 45.001834869384766, 47.97217559814453, 50.94252014160156, 53.91286087036133, 56.883201599121094, 59.853546142578125, 62.82388687133789, 65.79422760009766, 68.76457214355469, 71.73490905761719, 74.70524597167969, 77.67559051513672, 80.64592742919922, 83.61627197265625, 86.58660888671875, 89.55695343017578, 92.52729797363281, 95.49763488769531, 98.46797943115234, 101.43832397460938, 104.40866088867188, 107.3790054321289, 110.34934997558594, 113.31968688964844, 116.29003143310547, 119.2603759765625, 122.230712890625, 125.20105743408203, 128.17140197753906, 131.14173889160156, 134.11207580566406, 137.08242797851562, 140.05276489257812, 143.02310180664062, 145.99343872070312, 148.96377563476562, 151.9341278076172, 154.9044647216797, 157.8748016357422, 160.84515380859375, 163.81549072265625, 166.78582763671875, 169.7561798095703]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 5.0, 11.0, 7.0, 6.0, 14.0, 15.0, 16.0, 17.0, 35.0, 20.0, 38.0, 22.0, 38.0, 32.0, 42.0, 41.0, 34.0, 50.0, 49.0, 37.0, 56.0, 33.0, 36.0, 44.0, 29.0, 28.0, 35.0, 30.0, 31.0, 26.0, 22.0, 21.0, 12.0, 11.0, 8.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-108.66925811767578, -105.16291809082031, -101.65657043457031, -98.15023040771484, -94.64389038085938, -91.13754272460938, -87.6312026977539, -84.12486267089844, -80.61851501464844, -77.11217498779297, -73.60582733154297, -70.0994873046875, -66.59314727783203, -63.0868034362793, -59.58045959472656, -56.074119567871094, -52.567779541015625, -49.06143569946289, -45.55509567260742, -42.04875183105469, -38.54241180419922, -35.036067962646484, -31.52972412109375, -28.02338218688965, -24.517040252685547, -21.010698318481445, -17.504356384277344, -13.99801254272461, -10.491670608520508, -6.985328674316406, -3.478984832763672, 0.027357101440429688, 3.53369140625, 7.04003381729126, 10.54637622833252, 14.052719116210938, 17.55906105041504, 21.06540298461914, 24.571746826171875, 28.078088760375977, 31.584430694580078, 35.09077453613281, 38.59711456298828, 42.103458404541016, 45.60980224609375, 49.11614227294922, 52.62248611450195, 56.12882995605469, 59.635169982910156, 63.14151382446289, 66.64785766601562, 70.1541976928711, 73.66053771972656, 77.16688537597656, 80.67322540283203, 84.1795654296875, 87.6859130859375, 91.19225311279297, 94.69860076904297, 98.20494079589844, 101.7112808227539, 105.21762084960938, 108.72396850585938, 112.23030853271484, 115.73664855957031]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 8.0, 4.0, 11.0, 11.0, 12.0, 19.0, 18.0, 30.0, 21.0, 40.0, 36.0, 33.0, 49.0, 45.0, 44.0, 45.0, 45.0, 49.0, 58.0, 39.0, 41.0, 44.0, 41.0, 33.0, 39.0, 28.0, 28.0, 20.0, 17.0, 14.0, 10.0, 18.0, 7.0, 14.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.03125, -16.536376953125, -16.04150390625, -15.546630859375, -15.0517578125, -14.556884765625, -14.06201171875, -13.567138671875, -13.072265625, -12.577392578125, -12.08251953125, -11.587646484375, -11.0927734375, -10.597900390625, -10.10302734375, -9.608154296875, -9.11328125, -8.618408203125, -8.12353515625, -7.628662109375, -7.1337890625, -6.638916015625, -6.14404296875, -5.649169921875, -5.154296875, -4.659423828125, -4.16455078125, -3.669677734375, -3.1748046875, -2.679931640625, -2.18505859375, -1.690185546875, -1.1953125, -0.700439453125, -0.20556640625, 0.289306640625, 0.7841796875, 1.279052734375, 1.77392578125, 2.268798828125, 2.763671875, 3.258544921875, 3.75341796875, 4.248291015625, 4.7431640625, 5.238037109375, 5.73291015625, 6.227783203125, 6.72265625, 7.217529296875, 7.71240234375, 8.207275390625, 8.7021484375, 9.197021484375, 9.69189453125, 10.186767578125, 10.681640625, 11.176513671875, 11.67138671875, 12.166259765625, 12.6611328125, 13.156005859375, 13.65087890625, 14.145751953125, 14.640625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 11.0, 20.0, 23.0, 26.0, 32.0, 55.0, 74.0, 92.0, 134.0, 243.0, 332.0, 554.0, 1051.0, 2062.0, 4452.0, 10937.0, 111921.0, 3753620.0, 282946.0, 14641.0, 5390.0, 2503.0, 1255.0, 683.0, 411.0, 256.0, 166.0, 123.0, 69.0, 52.0, 45.0, 32.0, 24.0, 16.0, 8.0, 13.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.375, -62.56689453125, -60.7587890625, -58.95068359375, -57.142578125, -55.33447265625, -53.5263671875, -51.71826171875, -49.91015625, -48.10205078125, -46.2939453125, -44.48583984375, -42.677734375, -40.86962890625, -39.0615234375, -37.25341796875, -35.4453125, -33.63720703125, -31.8291015625, -30.02099609375, -28.212890625, -26.40478515625, -24.5966796875, -22.78857421875, -20.98046875, -19.17236328125, -17.3642578125, -15.55615234375, -13.748046875, -11.93994140625, -10.1318359375, -8.32373046875, -6.515625, -4.70751953125, -2.8994140625, -1.09130859375, 0.716796875, 2.52490234375, 4.3330078125, 6.14111328125, 7.94921875, 9.75732421875, 11.5654296875, 13.37353515625, 15.181640625, 16.98974609375, 18.7978515625, 20.60595703125, 22.4140625, 24.22216796875, 26.0302734375, 27.83837890625, 29.646484375, 31.45458984375, 33.2626953125, 35.07080078125, 36.87890625, 38.68701171875, 40.4951171875, 42.30322265625, 44.111328125, 45.91943359375, 47.7275390625, 49.53564453125, 51.34375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 7.0, 7.0, 2.0, 15.0, 14.0, 15.0, 15.0, 21.0, 27.0, 51.0, 92.0, 157.0, 367.0, 581.0, 893.0, 733.0, 465.0, 243.0, 102.0, 70.0, 39.0, 42.0, 20.0, 12.0, 14.0, 6.0, 9.0, 3.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.267333984375, -27.31591796875, -26.364501953125, -25.4130859375, -24.461669921875, -23.51025390625, -22.558837890625, -21.607421875, -20.656005859375, -19.70458984375, -18.753173828125, -17.8017578125, -16.850341796875, -15.89892578125, -14.947509765625, -13.99609375, -13.044677734375, -12.09326171875, -11.141845703125, -10.1904296875, -9.239013671875, -8.28759765625, -7.336181640625, -6.384765625, -5.433349609375, -4.48193359375, -3.530517578125, -2.5791015625, -1.627685546875, -0.67626953125, 0.275146484375, 1.2265625, 2.177978515625, 3.12939453125, 4.080810546875, 5.0322265625, 5.983642578125, 6.93505859375, 7.886474609375, 8.837890625, 9.789306640625, 10.74072265625, 11.692138671875, 12.6435546875, 13.594970703125, 14.54638671875, 15.497802734375, 16.44921875, 17.400634765625, 18.35205078125, 19.303466796875, 20.2548828125, 21.206298828125, 22.15771484375, 23.109130859375, 24.060546875, 25.011962890625, 25.96337890625, 26.914794921875, 27.8662109375, 28.817626953125, 29.76904296875, 30.720458984375, 31.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 6.0, 6.0, 1.0, 9.0, 9.0, 14.0, 8.0, 21.0, 27.0, 44.0, 86.0, 143.0, 251.0, 543.0, 1259.0, 2961.0, 8229.0, 26313.0, 285671.0, 3774374.0, 70076.0, 15186.0, 5221.0, 2041.0, 837.0, 415.0, 198.0, 102.0, 62.0, 44.0, 28.0, 22.0, 15.0, 14.0, 10.0, 2.0, 4.0, 8.0, 8.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.625, -79.1728515625, -76.720703125, -74.2685546875, -71.81640625, -69.3642578125, -66.912109375, -64.4599609375, -62.0078125, -59.5556640625, -57.103515625, -54.6513671875, -52.19921875, -49.7470703125, -47.294921875, -44.8427734375, -42.390625, -39.9384765625, -37.486328125, -35.0341796875, -32.58203125, -30.1298828125, -27.677734375, -25.2255859375, -22.7734375, -20.3212890625, -17.869140625, -15.4169921875, -12.96484375, -10.5126953125, -8.060546875, -5.6083984375, -3.15625, -0.7041015625, 1.748046875, 4.2001953125, 6.65234375, 9.1044921875, 11.556640625, 14.0087890625, 16.4609375, 18.9130859375, 21.365234375, 23.8173828125, 26.26953125, 28.7216796875, 31.173828125, 33.6259765625, 36.078125, 38.5302734375, 40.982421875, 43.4345703125, 45.88671875, 48.3388671875, 50.791015625, 53.2431640625, 55.6953125, 58.1474609375, 60.599609375, 63.0517578125, 65.50390625, 67.9560546875, 70.408203125, 72.8603515625, 75.3125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 21.0, 36.0, 60.0, 147.0, 274.0, 238.0, 100.0, 46.0, 30.0, 19.0, 11.0, 9.0, 3.0, 1.0, 2.0], "bins": [-413.81341552734375, -406.13128662109375, -398.44915771484375, -390.76702880859375, -383.08489990234375, -375.40277099609375, -367.72064208984375, -360.03851318359375, -352.35638427734375, -344.67425537109375, -336.99212646484375, -329.30999755859375, -321.62786865234375, -313.94573974609375, -306.26361083984375, -298.58148193359375, -290.8993835449219, -283.2172546386719, -275.5351257324219, -267.8529968261719, -260.1708679199219, -252.48873901367188, -244.80661010742188, -237.12449645996094, -229.44235229492188, -221.76022338867188, -214.07809448242188, -206.39596557617188, -198.71383666992188, -191.03170776367188, -183.34957885742188, -175.66746520996094, -167.98533630371094, -160.30320739746094, -152.62107849121094, -144.93894958496094, -137.25682067871094, -129.57470703125, -121.89257049560547, -114.21044921875, -106.5283203125, -98.84619140625, -91.1640625, -83.48193359375, -75.79981231689453, -68.11768341064453, -60.43555450439453, -52.7534294128418, -45.07129669189453, -37.38916778564453, -29.707042694091797, -22.024913787841797, -14.34278678894043, -6.6606597900390625, 1.0214691162109375, 8.703594207763672, 16.385723114013672, 24.06785011291504, 31.749977111816406, 39.432106018066406, 47.114234924316406, 54.79636001586914, 62.47848892211914, 70.16061401367188, 77.84274291992188]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 13.0, 7.0, 7.0, 11.0, 6.0, 6.0, 19.0, 19.0, 21.0, 28.0, 23.0, 30.0, 33.0, 37.0, 39.0, 41.0, 40.0, 47.0, 34.0, 43.0, 36.0, 38.0, 30.0, 34.0, 31.0, 34.0, 29.0, 39.0, 26.0, 21.0, 20.0, 19.0, 25.0, 17.0, 22.0, 10.0, 10.0, 7.0, 5.0, 11.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-72.63909912109375, -70.26516723632812, -67.8912353515625, -65.51730346679688, -63.143367767333984, -60.76943588256836, -58.39550018310547, -56.021568298339844, -53.64763641357422, -51.273704528808594, -48.89977264404297, -46.52583694458008, -44.15190505981445, -41.77797317504883, -39.40403747558594, -37.03010559082031, -34.65617370605469, -32.28224182128906, -29.908308029174805, -27.534374237060547, -25.160442352294922, -22.786510467529297, -20.41257667541504, -18.03864288330078, -15.664710998535156, -13.290778160095215, -10.916845321655273, -8.542912483215332, -6.168979644775391, -3.795046806335449, -1.4211139678955078, 0.95281982421875, 3.326751708984375, 5.700684547424316, 8.074617385864258, 10.4485502243042, 12.82248306274414, 15.196415901184082, 17.570348739624023, 19.94428253173828, 22.318214416503906, 24.69214630126953, 27.06608009338379, 29.440013885498047, 31.813945770263672, 34.1878776550293, 36.56181335449219, 38.93574523925781, 41.30967712402344, 43.68360900878906, 46.05754089355469, 48.43147659301758, 50.8054084777832, 53.17934036254883, 55.55327606201172, 57.927207946777344, 60.30113983154297, 62.675071716308594, 65.04900360107422, 67.42293548583984, 69.796875, 72.17080688476562, 74.54473876953125, 76.91867065429688, 79.2926025390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 6.0, 5.0, 8.0, 12.0, 7.0, 15.0, 21.0, 28.0, 32.0, 33.0, 33.0, 32.0, 36.0, 48.0, 38.0, 48.0, 46.0, 41.0, 41.0, 47.0, 39.0, 52.0, 45.0, 46.0, 29.0, 28.0, 35.0, 22.0, 19.0, 22.0, 16.0, 22.0, 15.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.776123046875, -16.28662109375, -15.797119140625, -15.3076171875, -14.818115234375, -14.32861328125, -13.839111328125, -13.349609375, -12.860107421875, -12.37060546875, -11.881103515625, -11.3916015625, -10.902099609375, -10.41259765625, -9.923095703125, -9.43359375, -8.944091796875, -8.45458984375, -7.965087890625, -7.4755859375, -6.986083984375, -6.49658203125, -6.007080078125, -5.517578125, -5.028076171875, -4.53857421875, -4.049072265625, -3.5595703125, -3.070068359375, -2.58056640625, -2.091064453125, -1.6015625, -1.112060546875, -0.62255859375, -0.133056640625, 0.3564453125, 0.845947265625, 1.33544921875, 1.824951171875, 2.314453125, 2.803955078125, 3.29345703125, 3.782958984375, 4.2724609375, 4.761962890625, 5.25146484375, 5.740966796875, 6.23046875, 6.719970703125, 7.20947265625, 7.698974609375, 8.1884765625, 8.677978515625, 9.16748046875, 9.656982421875, 10.146484375, 10.635986328125, 11.12548828125, 11.614990234375, 12.1044921875, 12.593994140625, 13.08349609375, 13.572998046875, 14.0625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 11.0, 15.0, 29.0, 20.0, 34.0, 55.0, 84.0, 115.0, 212.0, 363.0, 599.0, 1031.0, 1705.0, 2989.0, 5123.0, 8803.0, 15294.0, 26289.0, 46211.0, 85184.0, 165906.0, 268557.0, 194419.0, 99739.0, 53834.0, 30074.0, 17503.0, 10105.0, 5849.0, 3417.0, 2015.0, 1198.0, 673.0, 424.0, 255.0, 162.0, 90.0, 57.0, 39.0, 19.0, 16.0, 11.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5732421875, -1.518280029296875, -1.46331787109375, -1.408355712890625, -1.3533935546875, -1.298431396484375, -1.24346923828125, -1.188507080078125, -1.133544921875, -1.078582763671875, -1.02362060546875, -0.968658447265625, -0.9136962890625, -0.858734130859375, -0.80377197265625, -0.748809814453125, -0.69384765625, -0.638885498046875, -0.58392333984375, -0.528961181640625, -0.4739990234375, -0.419036865234375, -0.36407470703125, -0.309112548828125, -0.254150390625, -0.199188232421875, -0.14422607421875, -0.089263916015625, -0.0343017578125, 0.020660400390625, 0.07562255859375, 0.130584716796875, 0.185546875, 0.240509033203125, 0.29547119140625, 0.350433349609375, 0.4053955078125, 0.460357666015625, 0.51531982421875, 0.570281982421875, 0.625244140625, 0.680206298828125, 0.73516845703125, 0.790130615234375, 0.8450927734375, 0.900054931640625, 0.95501708984375, 1.009979248046875, 1.06494140625, 1.119903564453125, 1.17486572265625, 1.229827880859375, 1.2847900390625, 1.339752197265625, 1.39471435546875, 1.449676513671875, 1.504638671875, 1.559600830078125, 1.61456298828125, 1.669525146484375, 1.7244873046875, 1.779449462890625, 1.83441162109375, 1.889373779296875, 1.9443359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 3.0, 7.0, 11.0, 4.0, 8.0, 9.0, 11.0, 13.0, 23.0, 17.0, 20.0, 23.0, 34.0, 43.0, 30.0, 26.0, 30.0, 32.0, 28.0, 42.0, 41.0, 1056.0, 36.0, 32.0, 30.0, 36.0, 35.0, 26.0, 40.0, 22.0, 32.0, 23.0, 23.0, 29.0, 23.0, 12.0, 22.0, 18.0, 13.0, 7.0, 10.0, 6.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0], "bins": [-8.75, -8.50531005859375, -8.2606201171875, -8.01593017578125, -7.771240234375, -7.52655029296875, -7.2818603515625, -7.03717041015625, -6.79248046875, -6.54779052734375, -6.3031005859375, -6.05841064453125, -5.813720703125, -5.56903076171875, -5.3243408203125, -5.07965087890625, -4.8349609375, -4.59027099609375, -4.3455810546875, -4.10089111328125, -3.856201171875, -3.61151123046875, -3.3668212890625, -3.12213134765625, -2.87744140625, -2.63275146484375, -2.3880615234375, -2.14337158203125, -1.898681640625, -1.65399169921875, -1.4093017578125, -1.16461181640625, -0.919921875, -0.67523193359375, -0.4305419921875, -0.18585205078125, 0.058837890625, 0.30352783203125, 0.5482177734375, 0.79290771484375, 1.03759765625, 1.28228759765625, 1.5269775390625, 1.77166748046875, 2.016357421875, 2.26104736328125, 2.5057373046875, 2.75042724609375, 2.9951171875, 3.23980712890625, 3.4844970703125, 3.72918701171875, 3.973876953125, 4.21856689453125, 4.4632568359375, 4.70794677734375, 4.95263671875, 5.19732666015625, 5.4420166015625, 5.68670654296875, 5.931396484375, 6.17608642578125, 6.4207763671875, 6.66546630859375, 6.91015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 13.0, 17.0, 29.0, 32.0, 67.0, 100.0, 148.0, 239.0, 378.0, 567.0, 851.0, 1315.0, 1965.0, 3017.0, 4505.0, 6672.0, 10281.0, 15328.0, 24063.0, 38290.0, 63832.0, 108523.0, 182786.0, 1256414.0, 148022.0, 87460.0, 51897.0, 31899.0, 20022.0, 12958.0, 8563.0, 5598.0, 3839.0, 2485.0, 1710.0, 1146.0, 721.0, 464.0, 322.0, 221.0, 118.0, 81.0, 64.0, 39.0, 20.0, 15.0, 8.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.83154296875, -0.8065719604492188, -0.7816009521484375, -0.7566299438476562, -0.731658935546875, -0.7066879272460938, -0.6817169189453125, -0.6567459106445312, -0.63177490234375, -0.6068038940429688, -0.5818328857421875, -0.5568618774414062, -0.531890869140625, -0.5069198608398438, -0.4819488525390625, -0.45697784423828125, -0.4320068359375, -0.40703582763671875, -0.3820648193359375, -0.35709381103515625, -0.332122802734375, -0.30715179443359375, -0.2821807861328125, -0.25720977783203125, -0.23223876953125, -0.20726776123046875, -0.1822967529296875, -0.15732574462890625, -0.132354736328125, -0.10738372802734375, -0.0824127197265625, -0.05744171142578125, -0.032470703125, -0.00749969482421875, 0.0174713134765625, 0.04244232177734375, 0.067413330078125, 0.09238433837890625, 0.1173553466796875, 0.14232635498046875, 0.16729736328125, 0.19226837158203125, 0.2172393798828125, 0.24221038818359375, 0.267181396484375, 0.29215240478515625, 0.3171234130859375, 0.34209442138671875, 0.3670654296875, 0.39203643798828125, 0.4170074462890625, 0.44197845458984375, 0.466949462890625, 0.49192047119140625, 0.5168914794921875, 0.5418624877929688, 0.56683349609375, 0.5918045043945312, 0.6167755126953125, 0.6417465209960938, 0.666717529296875, 0.6916885375976562, 0.7166595458984375, 0.7416305541992188, 0.7666015625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 1.0, 6.0, 10.0, 14.0, 9.0, 22.0, 14.0, 29.0, 31.0, 46.0, 53.0, 86.0, 135.0, 152.0, 117.0, 67.0, 41.0, 38.0, 32.0, 19.0, 14.0, 10.0, 9.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0419921875, -0.04059648513793945, -0.039200782775878906, -0.03780508041381836, -0.03640937805175781, -0.035013675689697266, -0.03361797332763672, -0.03222227096557617, -0.030826568603515625, -0.029430866241455078, -0.02803516387939453, -0.026639461517333984, -0.025243759155273438, -0.02384805679321289, -0.022452354431152344, -0.021056652069091797, -0.01966094970703125, -0.018265247344970703, -0.016869544982910156, -0.01547384262084961, -0.014078140258789062, -0.012682437896728516, -0.011286735534667969, -0.009891033172607422, -0.008495330810546875, -0.007099628448486328, -0.005703926086425781, -0.004308223724365234, -0.0029125213623046875, -0.0015168190002441406, -0.00012111663818359375, 0.0012745857238769531, 0.0026702880859375, 0.004065990447998047, 0.005461692810058594, 0.006857395172119141, 0.008253097534179688, 0.009648799896240234, 0.011044502258300781, 0.012440204620361328, 0.013835906982421875, 0.015231609344482422, 0.01662731170654297, 0.018023014068603516, 0.019418716430664062, 0.02081441879272461, 0.022210121154785156, 0.023605823516845703, 0.02500152587890625, 0.026397228240966797, 0.027792930603027344, 0.02918863296508789, 0.030584335327148438, 0.031980037689208984, 0.03337574005126953, 0.03477144241333008, 0.036167144775390625, 0.03756284713745117, 0.03895854949951172, 0.040354251861572266, 0.04174995422363281, 0.04314565658569336, 0.044541358947753906, 0.04593706130981445, 0.047332763671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 10.0, 8.0, 7.0, 7.0, 17.0, 18.0, 20.0, 19.0, 47.0, 67.0, 117.0, 284.0, 1967.0, 785502.0, 258488.0, 1393.0, 280.0, 103.0, 59.0, 39.0, 26.0, 24.0, 13.0, 15.0, 11.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.0842742919921875, -1.051361083984375, -1.0184478759765625, -0.98553466796875, -0.9526214599609375, -0.919708251953125, -0.8867950439453125, -0.8538818359375, -0.8209686279296875, -0.788055419921875, -0.7551422119140625, -0.72222900390625, -0.6893157958984375, -0.656402587890625, -0.6234893798828125, -0.590576171875, -0.5576629638671875, -0.524749755859375, -0.4918365478515625, -0.45892333984375, -0.4260101318359375, -0.393096923828125, -0.3601837158203125, -0.3272705078125, -0.2943572998046875, -0.261444091796875, -0.2285308837890625, -0.19561767578125, -0.1627044677734375, -0.129791259765625, -0.0968780517578125, -0.06396484375, -0.0310516357421875, 0.001861572265625, 0.0347747802734375, 0.06768798828125, 0.1006011962890625, 0.133514404296875, 0.1664276123046875, 0.1993408203125, 0.2322540283203125, 0.265167236328125, 0.2980804443359375, 0.33099365234375, 0.3639068603515625, 0.396820068359375, 0.4297332763671875, 0.462646484375, 0.4955596923828125, 0.528472900390625, 0.5613861083984375, 0.59429931640625, 0.6272125244140625, 0.660125732421875, 0.6930389404296875, 0.7259521484375, 0.7588653564453125, 0.791778564453125, 0.8246917724609375, 0.85760498046875, 0.8905181884765625, 0.923431396484375, 0.9563446044921875, 0.9892578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 13.0, 41.0, 70.0, 196.0, 383.0, 168.0, 63.0, 25.0, 23.0, 8.0, 2.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07136602699756622, -0.0644640251994133, -0.05756201595067978, -0.050660014152526855, -0.04375800862908363, -0.03685600310564041, -0.029954001307487488, -0.023051995784044266, -0.016149990260601044, -0.009247985668480396, -0.002345981076359749, 0.004556022584438324, 0.011458028107881546, 0.018360033631324768, 0.02526203542947769, 0.032164040952920914, 0.039066046476364136, 0.04596805199980736, 0.05287005752325058, 0.0597720593214035, 0.06667406857013702, 0.07357607036828995, 0.08047807216644287, 0.08738008141517639, 0.09428208321332932, 0.10118408501148224, 0.10808609426021576, 0.11498809605836868, 0.1218900978565216, 0.12879210710525513, 0.13569411635398865, 0.14259611070156097, 0.1494981050491333, 0.15640011429786682, 0.16330210864543915, 0.17020411789417267, 0.1771061271429062, 0.18400812149047852, 0.19091013073921204, 0.19781213998794556, 0.20471414923667908, 0.2116161584854126, 0.21851815283298492, 0.22542016208171844, 0.23232217133045197, 0.2392241656780243, 0.2461261749267578, 0.25302818417549133, 0.25993019342422485, 0.2668322026729584, 0.2737342119216919, 0.280636191368103, 0.28753820061683655, 0.29444020986557007, 0.3013422191143036, 0.3082442283630371, 0.31514620780944824, 0.32204821705818176, 0.3289502263069153, 0.3358522057533264, 0.34275421500205994, 0.34965622425079346, 0.356558233499527, 0.3634602427482605, 0.370362251996994]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 25.0, 16.0, 23.0, 33.0, 19.0, 27.0, 23.0, 26.0, 50.0, 36.0, 29.0, 52.0, 37.0, 52.0, 32.0, 48.0, 49.0, 34.0, 46.0, 47.0, 31.0, 39.0, 35.0, 23.0, 26.0, 29.0, 26.0, 11.0, 7.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06251299381256104, -0.060667648911476135, -0.05882230028510094, -0.05697695165872574, -0.05513160675764084, -0.05328626185655594, -0.05144091323018074, -0.04959556460380554, -0.04775021970272064, -0.04590487480163574, -0.044059526175260544, -0.042214177548885345, -0.040368832647800446, -0.038523487746715546, -0.03667813912034035, -0.03483279049396515, -0.03298744559288025, -0.0311420988291502, -0.02929675206542015, -0.0274514053016901, -0.025606058537960052, -0.023760711774230003, -0.021915365010499954, -0.020070018246769905, -0.018224671483039856, -0.016379324719309807, -0.014533977955579758, -0.012688631191849709, -0.01084328442811966, -0.00899793766438961, -0.007152590900659561, -0.005307244136929512, -0.003461897373199463, -0.0016165506094694138, 0.00022879615426063538, 0.0020741429179906845, 0.003919489681720734, 0.005764836445450783, 0.007610183209180832, 0.009455529972910881, 0.01130087673664093, 0.01314622350037098, 0.014991570264101028, 0.016836917027831078, 0.018682263791561127, 0.020527610555291176, 0.022372957319021225, 0.024218304082751274, 0.026063650846481323, 0.027908997610211372, 0.02975434437394142, 0.03159969300031662, 0.03344503790140152, 0.03529038280248642, 0.03713573142886162, 0.038981080055236816, 0.040826424956321716, 0.042671769857406616, 0.044517118483781815, 0.04636246711015701, 0.04820781201124191, 0.05005315691232681, 0.05189850553870201, 0.05374385416507721, 0.05558919906616211]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 6.0, 5.0, 8.0, 12.0, 7.0, 16.0, 19.0, 29.0, 32.0, 33.0, 33.0, 32.0, 36.0, 48.0, 38.0, 48.0, 46.0, 40.0, 42.0, 47.0, 39.0, 53.0, 44.0, 46.0, 29.0, 28.0, 34.0, 23.0, 20.0, 21.0, 16.0, 22.0, 15.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.776123046875, -16.28662109375, -15.797119140625, -15.3076171875, -14.818115234375, -14.32861328125, -13.839111328125, -13.349609375, -12.860107421875, -12.37060546875, -11.881103515625, -11.3916015625, -10.902099609375, -10.41259765625, -9.923095703125, -9.43359375, -8.944091796875, -8.45458984375, -7.965087890625, -7.4755859375, -6.986083984375, -6.49658203125, -6.007080078125, -5.517578125, -5.028076171875, -4.53857421875, -4.049072265625, -3.5595703125, -3.070068359375, -2.58056640625, -2.091064453125, -1.6015625, -1.112060546875, -0.62255859375, -0.133056640625, 0.3564453125, 0.845947265625, 1.33544921875, 1.824951171875, 2.314453125, 2.803955078125, 3.29345703125, 3.782958984375, 4.2724609375, 4.761962890625, 5.25146484375, 5.740966796875, 6.23046875, 6.719970703125, 7.20947265625, 7.698974609375, 8.1884765625, 8.677978515625, 9.16748046875, 9.656982421875, 10.146484375, 10.635986328125, 11.12548828125, 11.614990234375, 12.1044921875, 12.593994140625, 13.08349609375, 13.572998046875, 14.0625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 8.0, 6.0, 10.0, 14.0, 11.0, 18.0, 32.0, 47.0, 65.0, 78.0, 124.0, 159.0, 309.0, 567.0, 1421.0, 4979.0, 24291.0, 222755.0, 709317.0, 68524.0, 11145.0, 2647.0, 915.0, 422.0, 212.0, 145.0, 100.0, 52.0, 40.0, 33.0, 25.0, 27.0, 18.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-16.078125, -15.6221923828125, -15.166259765625, -14.7103271484375, -14.25439453125, -13.7984619140625, -13.342529296875, -12.8865966796875, -12.4306640625, -11.9747314453125, -11.518798828125, -11.0628662109375, -10.60693359375, -10.1510009765625, -9.695068359375, -9.2391357421875, -8.783203125, -8.3272705078125, -7.871337890625, -7.4154052734375, -6.95947265625, -6.5035400390625, -6.047607421875, -5.5916748046875, -5.1357421875, -4.6798095703125, -4.223876953125, -3.7679443359375, -3.31201171875, -2.8560791015625, -2.400146484375, -1.9442138671875, -1.48828125, -1.0323486328125, -0.576416015625, -0.1204833984375, 0.33544921875, 0.7913818359375, 1.247314453125, 1.7032470703125, 2.1591796875, 2.6151123046875, 3.071044921875, 3.5269775390625, 3.98291015625, 4.4388427734375, 4.894775390625, 5.3507080078125, 5.806640625, 6.2625732421875, 6.718505859375, 7.1744384765625, 7.63037109375, 8.0863037109375, 8.542236328125, 8.9981689453125, 9.4541015625, 9.9100341796875, 10.365966796875, 10.8218994140625, 11.27783203125, 11.7337646484375, 12.189697265625, 12.6456298828125, 13.1015625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 3.0, 12.0, 12.0, 16.0, 12.0, 10.0, 18.0, 30.0, 23.0, 29.0, 26.0, 31.0, 27.0, 36.0, 41.0, 33.0, 41.0, 50.0, 192.0, 1886.0, 81.0, 34.0, 43.0, 46.0, 28.0, 32.0, 40.0, 28.0, 19.0, 18.0, 20.0, 13.0, 19.0, 16.0, 13.0, 13.0, 12.0, 6.0, 4.0, 5.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.59375, -34.45654296875, -33.3193359375, -32.18212890625, -31.044921875, -29.90771484375, -28.7705078125, -27.63330078125, -26.49609375, -25.35888671875, -24.2216796875, -23.08447265625, -21.947265625, -20.81005859375, -19.6728515625, -18.53564453125, -17.3984375, -16.26123046875, -15.1240234375, -13.98681640625, -12.849609375, -11.71240234375, -10.5751953125, -9.43798828125, -8.30078125, -7.16357421875, -6.0263671875, -4.88916015625, -3.751953125, -2.61474609375, -1.4775390625, -0.34033203125, 0.796875, 1.93408203125, 3.0712890625, 4.20849609375, 5.345703125, 6.48291015625, 7.6201171875, 8.75732421875, 9.89453125, 11.03173828125, 12.1689453125, 13.30615234375, 14.443359375, 15.58056640625, 16.7177734375, 17.85498046875, 18.9921875, 20.12939453125, 21.2666015625, 22.40380859375, 23.541015625, 24.67822265625, 25.8154296875, 26.95263671875, 28.08984375, 29.22705078125, 30.3642578125, 31.50146484375, 32.638671875, 33.77587890625, 34.9130859375, 36.05029296875, 37.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 7.0, 5.0, 4.0, 14.0, 16.0, 14.0, 18.0, 23.0, 19.0, 30.0, 42.0, 55.0, 79.0, 102.0, 110.0, 140.0, 214.0, 316.0, 693.0, 3998.0, 3116559.0, 20711.0, 1087.0, 398.0, 243.0, 173.0, 125.0, 104.0, 89.0, 55.0, 53.0, 36.0, 37.0, 24.0, 20.0, 21.0, 12.0, 18.0, 10.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-78.25, -75.85546875, -73.4609375, -71.06640625, -68.671875, -66.27734375, -63.8828125, -61.48828125, -59.09375, -56.69921875, -54.3046875, -51.91015625, -49.515625, -47.12109375, -44.7265625, -42.33203125, -39.9375, -37.54296875, -35.1484375, -32.75390625, -30.359375, -27.96484375, -25.5703125, -23.17578125, -20.78125, -18.38671875, -15.9921875, -13.59765625, -11.203125, -8.80859375, -6.4140625, -4.01953125, -1.625, 0.76953125, 3.1640625, 5.55859375, 7.953125, 10.34765625, 12.7421875, 15.13671875, 17.53125, 19.92578125, 22.3203125, 24.71484375, 27.109375, 29.50390625, 31.8984375, 34.29296875, 36.6875, 39.08203125, 41.4765625, 43.87109375, 46.265625, 48.66015625, 51.0546875, 53.44921875, 55.84375, 58.23828125, 60.6328125, 63.02734375, 65.421875, 67.81640625, 70.2109375, 72.60546875, 75.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [7.0, 51.0, 376.0, 502.0, 83.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.273372650146484, -6.994553565979004, -3.7157340049743652, -0.43691444396972656, 2.841904640197754, 6.120723724365234, 9.399543762207031, 12.678361892700195, 15.957181930541992, 19.23600196838379, 22.514820098876953, 25.79364013671875, 29.072460174560547, 32.351280212402344, 35.630096435546875, 38.90891647338867, 42.18773651123047, 45.466556549072266, 48.74537658691406, 52.024192810058594, 55.30301284790039, 58.58183288574219, 61.860652923583984, 65.13947296142578, 68.41828918457031, 71.69710540771484, 74.9759292602539, 78.25474548339844, 81.5335693359375, 84.81238555908203, 88.09120178222656, 91.37002563476562, 94.64884185791016, 97.92765808105469, 101.20648193359375, 104.48529815673828, 107.76412200927734, 111.04293823242188, 114.32176208496094, 117.60057830810547, 120.87939453125, 124.15821075439453, 127.4370346069336, 130.71585083007812, 133.9946746826172, 137.27349853515625, 140.55230712890625, 143.8311309814453, 147.10995483398438, 150.38877868652344, 153.66758728027344, 156.9464111328125, 160.22523498535156, 163.50405883789062, 166.78286743164062, 170.0616912841797, 173.3404998779297, 176.61932373046875, 179.89813232421875, 183.1769561767578, 186.45578002929688, 189.73458862304688, 193.01341247558594, 196.292236328125, 199.57106018066406]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 6.0, 4.0, 11.0, 17.0, 15.0, 21.0, 15.0, 28.0, 23.0, 28.0, 33.0, 34.0, 43.0, 37.0, 31.0, 46.0, 42.0, 59.0, 45.0, 35.0, 39.0, 38.0, 40.0, 39.0, 48.0, 35.0, 27.0, 22.0, 19.0, 21.0, 16.0, 13.0, 11.0, 9.0, 7.0, 10.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-119.44609832763672, -115.95172119140625, -112.45734405517578, -108.96296691894531, -105.46858978271484, -101.97421264648438, -98.47984313964844, -94.98545837402344, -91.4910888671875, -87.99671173095703, -84.50233459472656, -81.0079574584961, -77.51358032226562, -74.01920318603516, -70.52482604980469, -67.03045654296875, -63.53607177734375, -60.04169464111328, -56.54731750488281, -53.052940368652344, -49.558563232421875, -46.064186096191406, -42.5698127746582, -39.075435638427734, -35.581058502197266, -32.0866813659668, -28.592304229736328, -25.097929000854492, -21.603551864624023, -18.109174728393555, -14.614799499511719, -11.12042236328125, -7.6260528564453125, -4.131676197052002, -0.6372995376586914, 2.857076644897461, 6.35145378112793, 9.845830917358398, 13.340206146240234, 16.834583282470703, 20.328960418701172, 23.82333755493164, 27.31771469116211, 30.812089920043945, 34.30646514892578, 37.80084228515625, 41.29521942138672, 44.78959655761719, 48.283973693847656, 51.778350830078125, 55.272727966308594, 58.76710510253906, 62.26148223876953, 65.755859375, 69.25022888183594, 72.74461364746094, 76.23898315429688, 79.73336029052734, 83.22773742675781, 86.72211456298828, 90.21649169921875, 93.71086883544922, 97.20524597167969, 100.69961547851562, 104.19400024414062]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 13.0, 7.0, 17.0, 24.0, 24.0, 33.0, 36.0, 35.0, 31.0, 35.0, 46.0, 43.0, 40.0, 47.0, 35.0, 53.0, 40.0, 48.0, 45.0, 48.0, 39.0, 28.0, 29.0, 31.0, 26.0, 21.0, 18.0, 19.0, 18.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.078125, -16.59130859375, -16.1044921875, -15.61767578125, -15.130859375, -14.64404296875, -14.1572265625, -13.67041015625, -13.18359375, -12.69677734375, -12.2099609375, -11.72314453125, -11.236328125, -10.74951171875, -10.2626953125, -9.77587890625, -9.2890625, -8.80224609375, -8.3154296875, -7.82861328125, -7.341796875, -6.85498046875, -6.3681640625, -5.88134765625, -5.39453125, -4.90771484375, -4.4208984375, -3.93408203125, -3.447265625, -2.96044921875, -2.4736328125, -1.98681640625, -1.5, -1.01318359375, -0.5263671875, -0.03955078125, 0.447265625, 0.93408203125, 1.4208984375, 1.90771484375, 2.39453125, 2.88134765625, 3.3681640625, 3.85498046875, 4.341796875, 4.82861328125, 5.3154296875, 5.80224609375, 6.2890625, 6.77587890625, 7.2626953125, 7.74951171875, 8.236328125, 8.72314453125, 9.2099609375, 9.69677734375, 10.18359375, 10.67041015625, 11.1572265625, 11.64404296875, 12.130859375, 12.61767578125, 13.1044921875, 13.59130859375, 14.078125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 10.0, 16.0, 29.0, 33.0, 37.0, 74.0, 101.0, 123.0, 165.0, 253.0, 356.0, 524.0, 781.0, 1157.0, 1786.0, 3200.0, 5471.0, 10970.0, 61006.0, 1049730.0, 2836047.0, 187401.0, 17036.0, 7198.0, 3879.0, 2288.0, 1437.0, 964.0, 620.0, 429.0, 330.0, 208.0, 159.0, 117.0, 93.0, 73.0, 46.0, 41.0, 28.0, 19.0, 11.0, 10.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0], "bins": [-38.78125, -37.710205078125, -36.63916015625, -35.568115234375, -34.4970703125, -33.426025390625, -32.35498046875, -31.283935546875, -30.212890625, -29.141845703125, -28.07080078125, -26.999755859375, -25.9287109375, -24.857666015625, -23.78662109375, -22.715576171875, -21.64453125, -20.573486328125, -19.50244140625, -18.431396484375, -17.3603515625, -16.289306640625, -15.21826171875, -14.147216796875, -13.076171875, -12.005126953125, -10.93408203125, -9.863037109375, -8.7919921875, -7.720947265625, -6.64990234375, -5.578857421875, -4.5078125, -3.436767578125, -2.36572265625, -1.294677734375, -0.2236328125, 0.847412109375, 1.91845703125, 2.989501953125, 4.060546875, 5.131591796875, 6.20263671875, 7.273681640625, 8.3447265625, 9.415771484375, 10.48681640625, 11.557861328125, 12.62890625, 13.699951171875, 14.77099609375, 15.842041015625, 16.9130859375, 17.984130859375, 19.05517578125, 20.126220703125, 21.197265625, 22.268310546875, 23.33935546875, 24.410400390625, 25.4814453125, 26.552490234375, 27.62353515625, 28.694580078125, 29.765625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 11.0, 7.0, 15.0, 15.0, 17.0, 25.0, 37.0, 62.0, 104.0, 183.0, 369.0, 599.0, 949.0, 660.0, 412.0, 234.0, 115.0, 62.0, 42.0, 26.0, 27.0, 16.0, 13.0, 11.0, 8.0, 7.0, 4.0, 3.0, 4.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.40625, -28.503662109375, -27.60107421875, -26.698486328125, -25.7958984375, -24.893310546875, -23.99072265625, -23.088134765625, -22.185546875, -21.282958984375, -20.38037109375, -19.477783203125, -18.5751953125, -17.672607421875, -16.77001953125, -15.867431640625, -14.96484375, -14.062255859375, -13.15966796875, -12.257080078125, -11.3544921875, -10.451904296875, -9.54931640625, -8.646728515625, -7.744140625, -6.841552734375, -5.93896484375, -5.036376953125, -4.1337890625, -3.231201171875, -2.32861328125, -1.426025390625, -0.5234375, 0.379150390625, 1.28173828125, 2.184326171875, 3.0869140625, 3.989501953125, 4.89208984375, 5.794677734375, 6.697265625, 7.599853515625, 8.50244140625, 9.405029296875, 10.3076171875, 11.210205078125, 12.11279296875, 13.015380859375, 13.91796875, 14.820556640625, 15.72314453125, 16.625732421875, 17.5283203125, 18.430908203125, 19.33349609375, 20.236083984375, 21.138671875, 22.041259765625, 22.94384765625, 23.846435546875, 24.7490234375, 25.651611328125, 26.55419921875, 27.456787109375, 28.359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 6.0, 6.0, 13.0, 18.0, 22.0, 28.0, 40.0, 48.0, 98.0, 198.0, 511.0, 1429.0, 5719.0, 35389.0, 3839211.0, 291125.0, 15584.0, 3169.0, 890.0, 361.0, 175.0, 71.0, 44.0, 33.0, 14.0, 21.0, 13.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.5, -102.07421875, -98.6484375, -95.22265625, -91.796875, -88.37109375, -84.9453125, -81.51953125, -78.09375, -74.66796875, -71.2421875, -67.81640625, -64.390625, -60.96484375, -57.5390625, -54.11328125, -50.6875, -47.26171875, -43.8359375, -40.41015625, -36.984375, -33.55859375, -30.1328125, -26.70703125, -23.28125, -19.85546875, -16.4296875, -13.00390625, -9.578125, -6.15234375, -2.7265625, 0.69921875, 4.125, 7.55078125, 10.9765625, 14.40234375, 17.828125, 21.25390625, 24.6796875, 28.10546875, 31.53125, 34.95703125, 38.3828125, 41.80859375, 45.234375, 48.66015625, 52.0859375, 55.51171875, 58.9375, 62.36328125, 65.7890625, 69.21484375, 72.640625, 76.06640625, 79.4921875, 82.91796875, 86.34375, 89.76953125, 93.1953125, 96.62109375, 100.046875, 103.47265625, 106.8984375, 110.32421875, 113.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 27.0, 50.0, 103.0, 242.0, 304.0, 159.0, 50.0, 25.0, 20.0, 6.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.51565551757812, -179.0924835205078, -171.6693115234375, -164.2461395263672, -156.82296752929688, -149.3997802734375, -141.9766082763672, -134.55343627929688, -127.13026428222656, -119.70709228515625, -112.28392028808594, -104.8607406616211, -97.43756866455078, -90.01439666748047, -82.59121704101562, -75.16804504394531, -67.744873046875, -60.32170104980469, -52.89852523803711, -45.47534942626953, -38.05217742919922, -30.629005432128906, -23.205829620361328, -15.78265380859375, -8.359481811523438, -0.9363079071044922, 6.486865997314453, 13.910039901733398, 21.333213806152344, 28.756385803222656, 36.179561614990234, 43.60273742675781, 51.025909423828125, 58.44908142089844, 65.87225341796875, 73.2954330444336, 80.7186050415039, 88.14177703857422, 95.56495666503906, 102.98812866210938, 110.41130065917969, 117.83447265625, 125.25764465332031, 132.68081665039062, 140.10400390625, 147.52716064453125, 154.95034790039062, 162.37351989746094, 169.79669189453125, 177.21986389160156, 184.64303588867188, 192.0662078857422, 199.4893798828125, 206.91256713867188, 214.3357391357422, 221.7589111328125, 229.1820831298828, 236.60525512695312, 244.02842712402344, 251.45159912109375, 258.8747863769531, 266.2979431152344, 273.72113037109375, 281.144287109375, 288.5674743652344]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 2.0, 3.0, 12.0, 8.0, 4.0, 13.0, 12.0, 17.0, 21.0, 18.0, 19.0, 27.0, 24.0, 22.0, 28.0, 36.0, 39.0, 41.0, 34.0, 43.0, 39.0, 31.0, 45.0, 50.0, 37.0, 29.0, 38.0, 32.0, 31.0, 32.0, 23.0, 27.0, 26.0, 16.0, 26.0, 21.0, 15.0, 9.0, 5.0, 12.0, 7.0, 8.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.77050018310547, -64.57345581054688, -62.37641906738281, -60.179378509521484, -57.982337951660156, -55.78529739379883, -53.5882568359375, -51.39121627807617, -49.194175720214844, -46.997135162353516, -44.80009460449219, -42.60305404663086, -40.40601348876953, -38.2089729309082, -36.011932373046875, -33.81489181518555, -31.61785125732422, -29.42081069946289, -27.223770141601562, -25.026729583740234, -22.829689025878906, -20.632648468017578, -18.43560791015625, -16.238567352294922, -14.041526794433594, -11.844486236572266, -9.647445678710938, -7.450405120849609, -5.253364562988281, -3.056324005126953, -0.859283447265625, 1.3377571105957031, 3.5348052978515625, 5.731845855712891, 7.928886413574219, 10.125926971435547, 12.322967529296875, 14.520008087158203, 16.71704864501953, 18.91408920288086, 21.111129760742188, 23.308170318603516, 25.505210876464844, 27.702251434326172, 29.8992919921875, 32.09633255004883, 34.293373107910156, 36.490413665771484, 38.68745422363281, 40.88449478149414, 43.08153533935547, 45.2785758972168, 47.475616455078125, 49.67265701293945, 51.86969757080078, 54.06673812866211, 56.26377868652344, 58.460819244384766, 60.657859802246094, 62.85490036010742, 65.05194091796875, 67.24897766113281, 69.4460220336914, 71.64306640625, 73.84010314941406]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 2.0, 13.0, 17.0, 16.0, 21.0, 21.0, 14.0, 30.0, 30.0, 36.0, 25.0, 42.0, 40.0, 39.0, 46.0, 41.0, 44.0, 33.0, 41.0, 47.0, 37.0, 35.0, 44.0, 37.0, 28.0, 29.0, 23.0, 26.0, 21.0, 14.0, 23.0, 16.0, 6.0, 12.0, 5.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-15.5078125, -15.05712890625, -14.6064453125, -14.15576171875, -13.705078125, -13.25439453125, -12.8037109375, -12.35302734375, -11.90234375, -11.45166015625, -11.0009765625, -10.55029296875, -10.099609375, -9.64892578125, -9.1982421875, -8.74755859375, -8.296875, -7.84619140625, -7.3955078125, -6.94482421875, -6.494140625, -6.04345703125, -5.5927734375, -5.14208984375, -4.69140625, -4.24072265625, -3.7900390625, -3.33935546875, -2.888671875, -2.43798828125, -1.9873046875, -1.53662109375, -1.0859375, -0.63525390625, -0.1845703125, 0.26611328125, 0.716796875, 1.16748046875, 1.6181640625, 2.06884765625, 2.51953125, 2.97021484375, 3.4208984375, 3.87158203125, 4.322265625, 4.77294921875, 5.2236328125, 5.67431640625, 6.125, 6.57568359375, 7.0263671875, 7.47705078125, 7.927734375, 8.37841796875, 8.8291015625, 9.27978515625, 9.73046875, 10.18115234375, 10.6318359375, 11.08251953125, 11.533203125, 11.98388671875, 12.4345703125, 12.88525390625, 13.3359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 21.0, 60.0, 67.0, 112.0, 179.0, 267.0, 424.0, 672.0, 1006.0, 1576.0, 2409.0, 4022.0, 6631.0, 10590.0, 17131.0, 28886.0, 48958.0, 87852.0, 160691.0, 245979.0, 187165.0, 102853.0, 56345.0, 32985.0, 19904.0, 12085.0, 7445.0, 4542.0, 2870.0, 1717.0, 1092.0, 694.0, 443.0, 259.0, 201.0, 126.0, 101.0, 52.0, 45.0, 16.0, 16.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.6201171875, -1.573333740234375, -1.52655029296875, -1.479766845703125, -1.4329833984375, -1.386199951171875, -1.33941650390625, -1.292633056640625, -1.245849609375, -1.199066162109375, -1.15228271484375, -1.105499267578125, -1.0587158203125, -1.011932373046875, -0.96514892578125, -0.918365478515625, -0.87158203125, -0.824798583984375, -0.77801513671875, -0.731231689453125, -0.6844482421875, -0.637664794921875, -0.59088134765625, -0.544097900390625, -0.497314453125, -0.450531005859375, -0.40374755859375, -0.356964111328125, -0.3101806640625, -0.263397216796875, -0.21661376953125, -0.169830322265625, -0.123046875, -0.076263427734375, -0.02947998046875, 0.017303466796875, 0.0640869140625, 0.110870361328125, 0.15765380859375, 0.204437255859375, 0.251220703125, 0.298004150390625, 0.34478759765625, 0.391571044921875, 0.4383544921875, 0.485137939453125, 0.53192138671875, 0.578704833984375, 0.62548828125, 0.672271728515625, 0.71905517578125, 0.765838623046875, 0.8126220703125, 0.859405517578125, 0.90618896484375, 0.952972412109375, 0.999755859375, 1.046539306640625, 1.09332275390625, 1.140106201171875, 1.1868896484375, 1.233673095703125, 1.28045654296875, 1.327239990234375, 1.3740234375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 6.0, 6.0, 10.0, 5.0, 8.0, 13.0, 17.0, 20.0, 18.0, 27.0, 19.0, 24.0, 26.0, 26.0, 35.0, 33.0, 27.0, 30.0, 54.0, 41.0, 45.0, 1061.0, 38.0, 35.0, 44.0, 44.0, 42.0, 37.0, 34.0, 25.0, 19.0, 21.0, 23.0, 18.0, 18.0, 14.0, 16.0, 9.0, 14.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.4609375, -9.17529296875, -8.8896484375, -8.60400390625, -8.318359375, -8.03271484375, -7.7470703125, -7.46142578125, -7.17578125, -6.89013671875, -6.6044921875, -6.31884765625, -6.033203125, -5.74755859375, -5.4619140625, -5.17626953125, -4.890625, -4.60498046875, -4.3193359375, -4.03369140625, -3.748046875, -3.46240234375, -3.1767578125, -2.89111328125, -2.60546875, -2.31982421875, -2.0341796875, -1.74853515625, -1.462890625, -1.17724609375, -0.8916015625, -0.60595703125, -0.3203125, -0.03466796875, 0.2509765625, 0.53662109375, 0.822265625, 1.10791015625, 1.3935546875, 1.67919921875, 1.96484375, 2.25048828125, 2.5361328125, 2.82177734375, 3.107421875, 3.39306640625, 3.6787109375, 3.96435546875, 4.25, 4.53564453125, 4.8212890625, 5.10693359375, 5.392578125, 5.67822265625, 5.9638671875, 6.24951171875, 6.53515625, 6.82080078125, 7.1064453125, 7.39208984375, 7.677734375, 7.96337890625, 8.2490234375, 8.53466796875, 8.8203125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 11.0, 10.0, 16.0, 35.0, 64.0, 71.0, 101.0, 141.0, 248.0, 395.0, 579.0, 884.0, 1398.0, 2110.0, 3416.0, 5117.0, 8038.0, 12141.0, 19383.0, 31642.0, 53554.0, 94284.0, 170547.0, 1291756.0, 169470.0, 93207.0, 53342.0, 31380.0, 19408.0, 11856.0, 7876.0, 5095.0, 3377.0, 2169.0, 1393.0, 942.0, 619.0, 378.0, 227.0, 141.0, 100.0, 79.0, 46.0, 30.0, 29.0, 12.0, 9.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.88232421875, -0.85430908203125, -0.8262939453125, -0.79827880859375, -0.770263671875, -0.74224853515625, -0.7142333984375, -0.68621826171875, -0.658203125, -0.63018798828125, -0.6021728515625, -0.57415771484375, -0.546142578125, -0.51812744140625, -0.4901123046875, -0.46209716796875, -0.43408203125, -0.40606689453125, -0.3780517578125, -0.35003662109375, -0.322021484375, -0.29400634765625, -0.2659912109375, -0.23797607421875, -0.2099609375, -0.18194580078125, -0.1539306640625, -0.12591552734375, -0.097900390625, -0.06988525390625, -0.0418701171875, -0.01385498046875, 0.01416015625, 0.04217529296875, 0.0701904296875, 0.09820556640625, 0.126220703125, 0.15423583984375, 0.1822509765625, 0.21026611328125, 0.23828125, 0.26629638671875, 0.2943115234375, 0.32232666015625, 0.350341796875, 0.37835693359375, 0.4063720703125, 0.43438720703125, 0.46240234375, 0.49041748046875, 0.5184326171875, 0.54644775390625, 0.574462890625, 0.60247802734375, 0.6304931640625, 0.65850830078125, 0.6865234375, 0.71453857421875, 0.7425537109375, 0.77056884765625, 0.798583984375, 0.82659912109375, 0.8546142578125, 0.88262939453125, 0.91064453125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 37.0, 36.0, 64.0, 99.0, 126.0, 148.0, 149.0, 112.0, 75.0, 58.0, 29.0, 21.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0391845703125, -0.03802061080932617, -0.036856651306152344, -0.035692691802978516, -0.03452873229980469, -0.03336477279663086, -0.03220081329345703, -0.031036853790283203, -0.029872894287109375, -0.028708934783935547, -0.02754497528076172, -0.02638101577758789, -0.025217056274414062, -0.024053096771240234, -0.022889137268066406, -0.021725177764892578, -0.02056121826171875, -0.019397258758544922, -0.018233299255371094, -0.017069339752197266, -0.015905380249023438, -0.01474142074584961, -0.013577461242675781, -0.012413501739501953, -0.011249542236328125, -0.010085582733154297, -0.008921623229980469, -0.007757663726806641, -0.0065937042236328125, -0.005429744720458984, -0.004265785217285156, -0.003101825714111328, -0.0019378662109375, -0.0007739067077636719, 0.00039005279541015625, 0.0015540122985839844, 0.0027179718017578125, 0.0038819313049316406, 0.005045890808105469, 0.006209850311279297, 0.007373809814453125, 0.008537769317626953, 0.009701728820800781, 0.01086568832397461, 0.012029647827148438, 0.013193607330322266, 0.014357566833496094, 0.015521526336669922, 0.01668548583984375, 0.017849445343017578, 0.019013404846191406, 0.020177364349365234, 0.021341323852539062, 0.02250528335571289, 0.02366924285888672, 0.024833202362060547, 0.025997161865234375, 0.027161121368408203, 0.02832508087158203, 0.02948904037475586, 0.030652999877929688, 0.031816959381103516, 0.032980918884277344, 0.03414487838745117, 0.035308837890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 8.0, 11.0, 16.0, 38.0, 80.0, 160.0, 359.0, 4417.0, 1037842.0, 4938.0, 356.0, 151.0, 70.0, 46.0, 10.0, 16.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.7405319213867188, -0.7154388427734375, -0.6903457641601562, -0.665252685546875, -0.6401596069335938, -0.6150665283203125, -0.5899734497070312, -0.56488037109375, -0.5397872924804688, -0.5146942138671875, -0.48960113525390625, -0.464508056640625, -0.43941497802734375, -0.4143218994140625, -0.38922882080078125, -0.3641357421875, -0.33904266357421875, -0.3139495849609375, -0.28885650634765625, -0.263763427734375, -0.23867034912109375, -0.2135772705078125, -0.18848419189453125, -0.16339111328125, -0.13829803466796875, -0.1132049560546875, -0.08811187744140625, -0.063018798828125, -0.03792572021484375, -0.0128326416015625, 0.01226043701171875, 0.037353515625, 0.06244659423828125, 0.0875396728515625, 0.11263275146484375, 0.137725830078125, 0.16281890869140625, 0.1879119873046875, 0.21300506591796875, 0.23809814453125, 0.26319122314453125, 0.2882843017578125, 0.31337738037109375, 0.338470458984375, 0.36356353759765625, 0.3886566162109375, 0.41374969482421875, 0.4388427734375, 0.46393585205078125, 0.4890289306640625, 0.5141220092773438, 0.539215087890625, 0.5643081665039062, 0.5894012451171875, 0.6144943237304688, 0.63958740234375, 0.6646804809570312, 0.6897735595703125, 0.7148666381835938, 0.739959716796875, 0.7650527954101562, 0.7901458740234375, 0.8152389526367188, 0.84033203125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 35.0, 146.0, 600.0, 165.0, 39.0, 17.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025875117629766464, -0.02000894397497177, -0.014142771251499653, -0.008276598528027534, -0.0024104248732328415, 0.0034557487815618515, 0.009321920573711395, 0.015188094228506088, 0.02105426788330078, 0.026920441538095474, 0.03278661519289017, 0.03865278512239456, 0.04451896250247955, 0.05038513243198395, 0.05625130608677864, 0.062117479741573334, 0.06798365712165833, 0.07384982705116272, 0.07971600443124771, 0.0855821743607521, 0.0914483517408371, 0.09731452167034149, 0.10318069159984589, 0.10904686897993088, 0.11491303890943527, 0.12077920883893967, 0.12664538621902466, 0.13251155614852905, 0.13837772607803345, 0.14424391090869904, 0.15011008083820343, 0.15597625076770782, 0.16184242069721222, 0.1677085906267166, 0.173574760556221, 0.1794409453868866, 0.185307115316391, 0.19117328524589539, 0.19703945517539978, 0.20290562510490417, 0.20877180993556976, 0.21463797986507416, 0.22050414979457855, 0.22637033462524414, 0.23223650455474854, 0.23810267448425293, 0.24396884441375732, 0.24983501434326172, 0.2557011842727661, 0.2615673542022705, 0.2674335241317749, 0.2732996940612793, 0.2791658639907837, 0.2850320637226105, 0.29089823365211487, 0.29676440358161926, 0.30263057351112366, 0.30849674344062805, 0.31436291337013245, 0.32022908329963684, 0.32609525322914124, 0.331961452960968, 0.3378276228904724, 0.3436937928199768, 0.3495599627494812]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 9.0, 8.0, 11.0, 14.0, 11.0, 13.0, 13.0, 14.0, 21.0, 15.0, 23.0, 24.0, 26.0, 28.0, 26.0, 32.0, 30.0, 31.0, 36.0, 29.0, 34.0, 31.0, 41.0, 48.0, 31.0, 42.0, 43.0, 26.0, 31.0, 34.0, 32.0, 29.0, 22.0, 21.0, 19.0, 15.0, 18.0, 16.0, 14.0, 6.0, 5.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.030151307582855225, -0.02926386147737503, -0.028376417234539986, -0.02748897299170494, -0.026601526886224747, -0.025714080780744553, -0.024826636537909508, -0.023939192295074463, -0.02305174618959427, -0.022164300084114075, -0.02127685584127903, -0.020389411598443985, -0.01950196549296379, -0.018614519387483597, -0.017727075144648552, -0.016839630901813507, -0.015952184796333313, -0.015064739622175694, -0.014177294448018074, -0.013289849273860455, -0.012402404099702835, -0.011514958925545216, -0.010627513751387596, -0.009740068577229977, -0.008852623403072357, -0.007965178228914738, -0.007077733054757118, -0.006190287880599499, -0.005302842706441879, -0.00441539753228426, -0.0035279523581266403, -0.002640507183969021, -0.0017530620098114014, -0.0008656168356537819, 2.1828338503837585e-05, 0.0009092735126614571, 0.0017967186868190765, 0.002684163860976696, 0.0035716090351343155, 0.004459054209291935, 0.0053464993834495544, 0.006233944557607174, 0.007121389731764793, 0.008008834905922413, 0.008896280080080032, 0.009783725254237652, 0.010671170428395271, 0.01155861560255289, 0.01244606077671051, 0.01333350595086813, 0.01422095112502575, 0.015108396299183369, 0.015995841473340988, 0.016883287578821182, 0.017770731821656227, 0.018658176064491272, 0.019545622169971466, 0.02043306827545166, 0.021320512518286705, 0.02220795676112175, 0.023095402866601944, 0.023982848972082138, 0.024870293214917183, 0.025757737457752228, 0.026645183563232422]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 2.0, 13.0, 17.0, 16.0, 21.0, 21.0, 14.0, 30.0, 30.0, 36.0, 25.0, 42.0, 40.0, 39.0, 46.0, 41.0, 44.0, 33.0, 41.0, 47.0, 37.0, 35.0, 44.0, 37.0, 28.0, 29.0, 24.0, 25.0, 21.0, 14.0, 23.0, 16.0, 6.0, 12.0, 5.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-15.5078125, -15.05712890625, -14.6064453125, -14.15576171875, -13.705078125, -13.25439453125, -12.8037109375, -12.35302734375, -11.90234375, -11.45166015625, -11.0009765625, -10.55029296875, -10.099609375, -9.64892578125, -9.1982421875, -8.74755859375, -8.296875, -7.84619140625, -7.3955078125, -6.94482421875, -6.494140625, -6.04345703125, -5.5927734375, -5.14208984375, -4.69140625, -4.24072265625, -3.7900390625, -3.33935546875, -2.888671875, -2.43798828125, -1.9873046875, -1.53662109375, -1.0859375, -0.63525390625, -0.1845703125, 0.26611328125, 0.716796875, 1.16748046875, 1.6181640625, 2.06884765625, 2.51953125, 2.97021484375, 3.4208984375, 3.87158203125, 4.322265625, 4.77294921875, 5.2236328125, 5.67431640625, 6.125, 6.57568359375, 7.0263671875, 7.47705078125, 7.927734375, 8.37841796875, 8.8291015625, 9.27978515625, 9.73046875, 10.18115234375, 10.6318359375, 11.08251953125, 11.533203125, 11.98388671875, 12.4345703125, 12.88525390625, 13.3359375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 9.0, 10.0, 15.0, 21.0, 30.0, 38.0, 52.0, 107.0, 120.0, 186.0, 253.0, 380.0, 657.0, 1056.0, 1894.0, 3259.0, 6343.0, 13059.0, 29137.0, 70294.0, 188489.0, 418975.0, 187956.0, 69596.0, 29076.0, 13193.0, 6322.0, 3240.0, 1843.0, 1067.0, 617.0, 395.0, 275.0, 164.0, 118.0, 92.0, 57.0, 40.0, 35.0, 23.0, 16.0, 13.0, 8.0, 7.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0], "bins": [-6.91796875, -6.72308349609375, -6.5281982421875, -6.33331298828125, -6.138427734375, -5.94354248046875, -5.7486572265625, -5.55377197265625, -5.35888671875, -5.16400146484375, -4.9691162109375, -4.77423095703125, -4.579345703125, -4.38446044921875, -4.1895751953125, -3.99468994140625, -3.7998046875, -3.60491943359375, -3.4100341796875, -3.21514892578125, -3.020263671875, -2.82537841796875, -2.6304931640625, -2.43560791015625, -2.24072265625, -2.04583740234375, -1.8509521484375, -1.65606689453125, -1.461181640625, -1.26629638671875, -1.0714111328125, -0.87652587890625, -0.681640625, -0.48675537109375, -0.2918701171875, -0.09698486328125, 0.097900390625, 0.29278564453125, 0.4876708984375, 0.68255615234375, 0.87744140625, 1.07232666015625, 1.2672119140625, 1.46209716796875, 1.656982421875, 1.85186767578125, 2.0467529296875, 2.24163818359375, 2.4365234375, 2.63140869140625, 2.8262939453125, 3.02117919921875, 3.216064453125, 3.41094970703125, 3.6058349609375, 3.80072021484375, 3.99560546875, 4.19049072265625, 4.3853759765625, 4.58026123046875, 4.775146484375, 4.97003173828125, 5.1649169921875, 5.35980224609375, 5.5546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 12.0, 19.0, 15.0, 27.0, 32.0, 30.0, 34.0, 45.0, 39.0, 38.0, 42.0, 60.0, 105.0, 1847.0, 188.0, 73.0, 58.0, 38.0, 43.0, 42.0, 39.0, 24.0, 29.0, 19.0, 23.0, 19.0, 11.0, 14.0, 8.0, 13.0, 3.0, 7.0, 7.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.625, -48.2705078125, -46.916015625, -45.5615234375, -44.20703125, -42.8525390625, -41.498046875, -40.1435546875, -38.7890625, -37.4345703125, -36.080078125, -34.7255859375, -33.37109375, -32.0166015625, -30.662109375, -29.3076171875, -27.953125, -26.5986328125, -25.244140625, -23.8896484375, -22.53515625, -21.1806640625, -19.826171875, -18.4716796875, -17.1171875, -15.7626953125, -14.408203125, -13.0537109375, -11.69921875, -10.3447265625, -8.990234375, -7.6357421875, -6.28125, -4.9267578125, -3.572265625, -2.2177734375, -0.86328125, 0.4912109375, 1.845703125, 3.2001953125, 4.5546875, 5.9091796875, 7.263671875, 8.6181640625, 9.97265625, 11.3271484375, 12.681640625, 14.0361328125, 15.390625, 16.7451171875, 18.099609375, 19.4541015625, 20.80859375, 22.1630859375, 23.517578125, 24.8720703125, 26.2265625, 27.5810546875, 28.935546875, 30.2900390625, 31.64453125, 32.9990234375, 34.353515625, 35.7080078125, 37.0625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 4.0, 8.0, 13.0, 13.0, 21.0, 27.0, 30.0, 40.0, 57.0, 68.0, 89.0, 121.0, 158.0, 252.0, 421.0, 1104.0, 18260.0, 3117897.0, 5152.0, 782.0, 354.0, 218.0, 152.0, 114.0, 85.0, 57.0, 43.0, 44.0, 19.0, 21.0, 16.0, 12.0, 8.0, 6.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-87.9375, -84.7236328125, -81.509765625, -78.2958984375, -75.08203125, -71.8681640625, -68.654296875, -65.4404296875, -62.2265625, -59.0126953125, -55.798828125, -52.5849609375, -49.37109375, -46.1572265625, -42.943359375, -39.7294921875, -36.515625, -33.3017578125, -30.087890625, -26.8740234375, -23.66015625, -20.4462890625, -17.232421875, -14.0185546875, -10.8046875, -7.5908203125, -4.376953125, -1.1630859375, 2.05078125, 5.2646484375, 8.478515625, 11.6923828125, 14.90625, 18.1201171875, 21.333984375, 24.5478515625, 27.76171875, 30.9755859375, 34.189453125, 37.4033203125, 40.6171875, 43.8310546875, 47.044921875, 50.2587890625, 53.47265625, 56.6865234375, 59.900390625, 63.1142578125, 66.328125, 69.5419921875, 72.755859375, 75.9697265625, 79.18359375, 82.3974609375, 85.611328125, 88.8251953125, 92.0390625, 95.2529296875, 98.466796875, 101.6806640625, 104.89453125, 108.1083984375, 111.322265625, 114.5361328125, 117.75]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 7.0, 132.0, 604.0, 255.0, 15.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84003829956055, -27.916202545166016, -22.99236488342285, -18.068527221679688, -13.144691467285156, -8.220855712890625, -3.297018051147461, 1.6268196105957031, 6.550655364990234, 11.474492073059082, 16.39832878112793, 21.322166442871094, 26.246002197265625, 31.169837951660156, 36.09367370605469, 41.017513275146484, 45.941349029541016, 50.86518478393555, 55.789024353027344, 60.712860107421875, 65.6366958618164, 70.56053161621094, 75.48436737060547, 80.408203125, 85.33204650878906, 90.2558822631836, 95.17971801757812, 100.10355377197266, 105.02738952636719, 109.95123291015625, 114.87506866455078, 119.79890441894531, 124.72274780273438, 129.64659118652344, 134.57041931152344, 139.4942626953125, 144.4180908203125, 149.34193420410156, 154.26576232910156, 159.18960571289062, 164.11343383789062, 169.0372772216797, 173.9611053466797, 178.88494873046875, 183.80877685546875, 188.7326202392578, 193.6564483642578, 198.58029174804688, 203.50413513183594, 208.427978515625, 213.351806640625, 218.27565002441406, 223.19947814941406, 228.12332153320312, 233.04714965820312, 237.9709930419922, 242.89483642578125, 247.8186798095703, 252.7425079345703, 257.6663513183594, 262.5901794433594, 267.5140075683594, 272.4378662109375, 277.3616943359375, 282.2855224609375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 2.0, 6.0, 12.0, 5.0, 12.0, 14.0, 25.0, 21.0, 21.0, 26.0, 30.0, 21.0, 37.0, 32.0, 30.0, 28.0, 42.0, 36.0, 42.0, 42.0, 42.0, 56.0, 40.0, 32.0, 47.0, 28.0, 32.0, 32.0, 33.0, 24.0, 20.0, 22.0, 17.0, 13.0, 10.0, 18.0, 10.0, 9.0, 6.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.08296203613281, -110.76636505126953, -107.44976043701172, -104.13316345214844, -100.81655883789062, -97.49996185302734, -94.18336486816406, -90.86676025390625, -87.55016326904297, -84.23356628417969, -80.91696166992188, -77.6003646850586, -74.28376770019531, -70.9671630859375, -67.65056610107422, -64.33396911621094, -61.017364501953125, -57.70076370239258, -54.38416290283203, -51.06756591796875, -47.7509651184082, -44.434364318847656, -41.117767333984375, -37.80116653442383, -34.48456573486328, -31.167964935302734, -27.85136604309082, -24.534767150878906, -21.21816635131836, -17.901565551757812, -14.584966659545898, -11.268367767333984, -7.9517669677734375, -4.635167121887207, -1.3185672760009766, 1.998032569885254, 5.314632415771484, 8.631233215332031, 11.947832107543945, 15.26443099975586, 18.581031799316406, 21.897632598876953, 25.214231491088867, 28.53083038330078, 31.847431182861328, 35.164031982421875, 38.480628967285156, 41.7972297668457, 45.11383056640625, 48.4304313659668, 51.747032165527344, 55.063629150390625, 58.38022994995117, 61.69683074951172, 65.013427734375, 68.33003234863281, 71.6466293334961, 74.96322631835938, 78.27983093261719, 81.59642791748047, 84.91302490234375, 88.22962951660156, 91.54622650146484, 94.86282348632812, 98.17942810058594]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 12.0, 25.0, 17.0, 15.0, 34.0, 25.0, 34.0, 25.0, 39.0, 45.0, 45.0, 37.0, 46.0, 43.0, 35.0, 43.0, 33.0, 36.0, 41.0, 41.0, 39.0, 33.0, 30.0, 30.0, 17.0, 26.0, 12.0, 19.0, 18.0, 6.0, 15.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0], "bins": [-15.6796875, -15.227783203125, -14.77587890625, -14.323974609375, -13.8720703125, -13.420166015625, -12.96826171875, -12.516357421875, -12.064453125, -11.612548828125, -11.16064453125, -10.708740234375, -10.2568359375, -9.804931640625, -9.35302734375, -8.901123046875, -8.44921875, -7.997314453125, -7.54541015625, -7.093505859375, -6.6416015625, -6.189697265625, -5.73779296875, -5.285888671875, -4.833984375, -4.382080078125, -3.93017578125, -3.478271484375, -3.0263671875, -2.574462890625, -2.12255859375, -1.670654296875, -1.21875, -0.766845703125, -0.31494140625, 0.136962890625, 0.5888671875, 1.040771484375, 1.49267578125, 1.944580078125, 2.396484375, 2.848388671875, 3.30029296875, 3.752197265625, 4.2041015625, 4.656005859375, 5.10791015625, 5.559814453125, 6.01171875, 6.463623046875, 6.91552734375, 7.367431640625, 7.8193359375, 8.271240234375, 8.72314453125, 9.175048828125, 9.626953125, 10.078857421875, 10.53076171875, 10.982666015625, 11.4345703125, 11.886474609375, 12.33837890625, 12.790283203125, 13.2421875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 9.0, 6.0, 11.0, 15.0, 23.0, 37.0, 47.0, 75.0, 84.0, 122.0, 193.0, 268.0, 400.0, 595.0, 911.0, 1514.0, 3256.0, 8152.0, 54044.0, 2263617.0, 1811089.0, 34622.0, 7438.0, 3292.0, 1586.0, 925.0, 570.0, 379.0, 270.0, 185.0, 142.0, 101.0, 81.0, 63.0, 24.0, 39.0, 30.0, 21.0, 14.0, 9.0, 7.0, 4.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0], "bins": [-50.65625, -49.20751953125, -47.7587890625, -46.31005859375, -44.861328125, -43.41259765625, -41.9638671875, -40.51513671875, -39.06640625, -37.61767578125, -36.1689453125, -34.72021484375, -33.271484375, -31.82275390625, -30.3740234375, -28.92529296875, -27.4765625, -26.02783203125, -24.5791015625, -23.13037109375, -21.681640625, -20.23291015625, -18.7841796875, -17.33544921875, -15.88671875, -14.43798828125, -12.9892578125, -11.54052734375, -10.091796875, -8.64306640625, -7.1943359375, -5.74560546875, -4.296875, -2.84814453125, -1.3994140625, 0.04931640625, 1.498046875, 2.94677734375, 4.3955078125, 5.84423828125, 7.29296875, 8.74169921875, 10.1904296875, 11.63916015625, 13.087890625, 14.53662109375, 15.9853515625, 17.43408203125, 18.8828125, 20.33154296875, 21.7802734375, 23.22900390625, 24.677734375, 26.12646484375, 27.5751953125, 29.02392578125, 30.47265625, 31.92138671875, 33.3701171875, 34.81884765625, 36.267578125, 37.71630859375, 39.1650390625, 40.61376953125, 42.0625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 4.0, 10.0, 6.0, 15.0, 17.0, 18.0, 19.0, 43.0, 61.0, 117.0, 242.0, 481.0, 880.0, 983.0, 579.0, 239.0, 133.0, 63.0, 38.0, 26.0, 15.0, 19.0, 14.0, 12.0, 7.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.8125, -37.79296875, -36.7734375, -35.75390625, -34.734375, -33.71484375, -32.6953125, -31.67578125, -30.65625, -29.63671875, -28.6171875, -27.59765625, -26.578125, -25.55859375, -24.5390625, -23.51953125, -22.5, -21.48046875, -20.4609375, -19.44140625, -18.421875, -17.40234375, -16.3828125, -15.36328125, -14.34375, -13.32421875, -12.3046875, -11.28515625, -10.265625, -9.24609375, -8.2265625, -7.20703125, -6.1875, -5.16796875, -4.1484375, -3.12890625, -2.109375, -1.08984375, -0.0703125, 0.94921875, 1.96875, 2.98828125, 4.0078125, 5.02734375, 6.046875, 7.06640625, 8.0859375, 9.10546875, 10.125, 11.14453125, 12.1640625, 13.18359375, 14.203125, 15.22265625, 16.2421875, 17.26171875, 18.28125, 19.30078125, 20.3203125, 21.33984375, 22.359375, 23.37890625, 24.3984375, 25.41796875, 26.4375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 12.0, 25.0, 21.0, 33.0, 64.0, 86.0, 198.0, 514.0, 1657.0, 8029.0, 83561.0, 4046108.0, 46147.0, 5669.0, 1288.0, 417.0, 179.0, 78.0, 52.0, 38.0, 26.0, 10.0, 10.0, 9.0, 8.0, 11.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.6875, -99.7607421875, -95.833984375, -91.9072265625, -87.98046875, -84.0537109375, -80.126953125, -76.2001953125, -72.2734375, -68.3466796875, -64.419921875, -60.4931640625, -56.56640625, -52.6396484375, -48.712890625, -44.7861328125, -40.859375, -36.9326171875, -33.005859375, -29.0791015625, -25.15234375, -21.2255859375, -17.298828125, -13.3720703125, -9.4453125, -5.5185546875, -1.591796875, 2.3349609375, 6.26171875, 10.1884765625, 14.115234375, 18.0419921875, 21.96875, 25.8955078125, 29.822265625, 33.7490234375, 37.67578125, 41.6025390625, 45.529296875, 49.4560546875, 53.3828125, 57.3095703125, 61.236328125, 65.1630859375, 69.08984375, 73.0166015625, 76.943359375, 80.8701171875, 84.796875, 88.7236328125, 92.650390625, 96.5771484375, 100.50390625, 104.4306640625, 108.357421875, 112.2841796875, 116.2109375, 120.1376953125, 124.064453125, 127.9912109375, 131.91796875, 135.8447265625, 139.771484375, 143.6982421875, 147.625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 5.0, 16.0, 27.0, 46.0, 84.0, 190.0, 259.0, 182.0, 91.0, 43.0, 25.0, 7.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.24630737304688, -155.5892333984375, -149.93214416503906, -144.2750701904297, -138.6179962158203, -132.96090698242188, -127.3038330078125, -121.64675903320312, -115.98967742919922, -110.33259582519531, -104.67552185058594, -99.01844024658203, -93.36135864257812, -87.70428466796875, -82.04720306396484, -76.39012145996094, -70.73304748535156, -65.07596588134766, -59.41889190673828, -53.761810302734375, -48.104732513427734, -42.447654724121094, -36.79057312011719, -31.133495330810547, -25.476417541503906, -19.819339752197266, -14.162260055541992, -8.505180358886719, -2.848102569580078, 2.8089752197265625, 8.466056823730469, 14.12313461303711, 19.780227661132812, 25.437305450439453, 31.094385147094727, 36.75146484375, 42.40854263305664, 48.06562042236328, 53.72270202636719, 59.37977981567383, 65.03685760498047, 70.69393920898438, 76.35101318359375, 82.00809478759766, 87.66517639160156, 93.32225036621094, 98.97933197021484, 104.63641357421875, 110.29348754882812, 115.95056915283203, 121.6076431274414, 127.26472473144531, 132.9217987060547, 138.57888793945312, 144.2359619140625, 149.89303588867188, 155.55010986328125, 161.20718383789062, 166.86427307128906, 172.52134704589844, 178.1784210205078, 183.83551025390625, 189.49258422851562, 195.149658203125, 200.80674743652344]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 0.0, 4.0, 8.0, 13.0, 8.0, 21.0, 10.0, 13.0, 10.0, 16.0, 22.0, 19.0, 35.0, 25.0, 25.0, 39.0, 30.0, 28.0, 41.0, 39.0, 40.0, 31.0, 40.0, 40.0, 24.0, 47.0, 40.0, 32.0, 36.0, 25.0, 29.0, 27.0, 15.0, 25.0, 22.0, 18.0, 9.0, 16.0, 10.0, 9.0, 10.0, 7.0, 9.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-61.555450439453125, -59.51859664916992, -57.481746673583984, -55.44489288330078, -53.408042907714844, -51.37118911743164, -49.33433532714844, -47.2974853515625, -45.2606315612793, -43.223777770996094, -41.186927795410156, -39.15007400512695, -37.11322021484375, -35.07637023925781, -33.03951644897461, -31.00266456604004, -28.96581268310547, -26.9289608001709, -24.892108917236328, -22.855255126953125, -20.818403244018555, -18.781551361083984, -16.74469757080078, -14.707845687866211, -12.67099380493164, -10.63414192199707, -8.597289085388184, -6.560436725616455, -4.523584365844727, -2.4867324829101562, -0.44987964630126953, 1.5869731903076172, 3.6238250732421875, 5.660677433013916, 7.6975297927856445, 9.734382629394531, 11.771234512329102, 13.808086395263672, 15.844939231872559, 17.881792068481445, 19.918643951416016, 21.955495834350586, 23.992347717285156, 26.02920150756836, 28.06605339050293, 30.1029052734375, 32.1397590637207, 34.176612854003906, 36.213462829589844, 38.25031661987305, 40.287166595458984, 42.32402038574219, 44.360870361328125, 46.39772415161133, 48.43457794189453, 50.47142791748047, 52.50828170776367, 54.545135498046875, 56.58198547363281, 58.618839263916016, 60.65569305419922, 62.692543029785156, 64.7293930053711, 66.76625061035156, 68.8031005859375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 21.0, 30.0, 16.0, 27.0, 28.0, 37.0, 24.0, 16.0, 45.0, 46.0, 34.0, 51.0, 35.0, 48.0, 38.0, 33.0, 40.0, 34.0, 27.0, 34.0, 27.0, 40.0, 28.0, 28.0, 18.0, 24.0, 19.0, 13.0, 16.0, 14.0, 8.0, 11.0, 7.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3431396484375, -12.912841796875, -12.4825439453125, -12.05224609375, -11.6219482421875, -11.191650390625, -10.7613525390625, -10.3310546875, -9.9007568359375, -9.470458984375, -9.0401611328125, -8.60986328125, -8.1795654296875, -7.749267578125, -7.3189697265625, -6.888671875, -6.4583740234375, -6.028076171875, -5.5977783203125, -5.16748046875, -4.7371826171875, -4.306884765625, -3.8765869140625, -3.4462890625, -3.0159912109375, -2.585693359375, -2.1553955078125, -1.72509765625, -1.2947998046875, -0.864501953125, -0.4342041015625, -0.00390625, 0.4263916015625, 0.856689453125, 1.2869873046875, 1.71728515625, 2.1475830078125, 2.577880859375, 3.0081787109375, 3.4384765625, 3.8687744140625, 4.299072265625, 4.7293701171875, 5.15966796875, 5.5899658203125, 6.020263671875, 6.4505615234375, 6.880859375, 7.3111572265625, 7.741455078125, 8.1717529296875, 8.60205078125, 9.0323486328125, 9.462646484375, 9.8929443359375, 10.3232421875, 10.7535400390625, 11.183837890625, 11.6141357421875, 12.04443359375, 12.4747314453125, 12.905029296875, 13.3353271484375, 13.765625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 11.0, 17.0, 42.0, 49.0, 78.0, 117.0, 138.0, 246.0, 358.0, 631.0, 940.0, 1439.0, 2209.0, 3396.0, 5431.0, 8680.0, 13729.0, 21931.0, 35402.0, 58075.0, 100568.0, 177974.0, 237592.0, 155526.0, 87870.0, 51425.0, 31761.0, 19473.0, 12170.0, 7757.0, 5011.0, 3120.0, 1905.0, 1218.0, 762.0, 507.0, 340.0, 219.0, 147.0, 95.0, 66.0, 44.0, 22.0, 20.0, 6.0, 6.0, 9.0, 6.0, 8.0, 1.0, 0.0, 2.0], "bins": [-1.53125, -1.4867095947265625, -1.442169189453125, -1.3976287841796875, -1.35308837890625, -1.3085479736328125, -1.264007568359375, -1.2194671630859375, -1.1749267578125, -1.1303863525390625, -1.085845947265625, -1.0413055419921875, -0.99676513671875, -0.9522247314453125, -0.907684326171875, -0.8631439208984375, -0.818603515625, -0.7740631103515625, -0.729522705078125, -0.6849822998046875, -0.64044189453125, -0.5959014892578125, -0.551361083984375, -0.5068206787109375, -0.4622802734375, -0.4177398681640625, -0.373199462890625, -0.3286590576171875, -0.28411865234375, -0.2395782470703125, -0.195037841796875, -0.1504974365234375, -0.10595703125, -0.0614166259765625, -0.016876220703125, 0.0276641845703125, 0.07220458984375, 0.1167449951171875, 0.161285400390625, 0.2058258056640625, 0.2503662109375, 0.2949066162109375, 0.339447021484375, 0.3839874267578125, 0.42852783203125, 0.4730682373046875, 0.517608642578125, 0.5621490478515625, 0.606689453125, 0.6512298583984375, 0.695770263671875, 0.7403106689453125, 0.78485107421875, 0.8293914794921875, 0.873931884765625, 0.9184722900390625, 0.9630126953125, 1.0075531005859375, 1.052093505859375, 1.0966339111328125, 1.14117431640625, 1.1857147216796875, 1.230255126953125, 1.2747955322265625, 1.3193359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 24.0, 18.0, 11.0, 14.0, 19.0, 29.0, 20.0, 31.0, 29.0, 29.0, 29.0, 39.0, 39.0, 45.0, 38.0, 38.0, 1062.0, 37.0, 50.0, 43.0, 32.0, 36.0, 38.0, 30.0, 36.0, 25.0, 27.0, 14.0, 14.0, 25.0, 9.0, 17.0, 13.0, 8.0, 10.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.0994873046875, -7.823974609375, -7.5484619140625, -7.27294921875, -6.9974365234375, -6.721923828125, -6.4464111328125, -6.1708984375, -5.8953857421875, -5.619873046875, -5.3443603515625, -5.06884765625, -4.7933349609375, -4.517822265625, -4.2423095703125, -3.966796875, -3.6912841796875, -3.415771484375, -3.1402587890625, -2.86474609375, -2.5892333984375, -2.313720703125, -2.0382080078125, -1.7626953125, -1.4871826171875, -1.211669921875, -0.9361572265625, -0.66064453125, -0.3851318359375, -0.109619140625, 0.1658935546875, 0.44140625, 0.7169189453125, 0.992431640625, 1.2679443359375, 1.54345703125, 1.8189697265625, 2.094482421875, 2.3699951171875, 2.6455078125, 2.9210205078125, 3.196533203125, 3.4720458984375, 3.74755859375, 4.0230712890625, 4.298583984375, 4.5740966796875, 4.849609375, 5.1251220703125, 5.400634765625, 5.6761474609375, 5.95166015625, 6.2271728515625, 6.502685546875, 6.7781982421875, 7.0537109375, 7.3292236328125, 7.604736328125, 7.8802490234375, 8.15576171875, 8.4312744140625, 8.706787109375, 8.9822998046875, 9.2578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 13.0, 20.0, 28.0, 32.0, 93.0, 116.0, 167.0, 261.0, 401.0, 562.0, 888.0, 1375.0, 2069.0, 3192.0, 4884.0, 7660.0, 12195.0, 19286.0, 31544.0, 54478.0, 95248.0, 172042.0, 1285713.0, 170968.0, 95191.0, 53792.0, 31456.0, 19506.0, 11935.0, 7802.0, 4970.0, 3230.0, 2021.0, 1421.0, 867.0, 560.0, 355.0, 258.0, 202.0, 107.0, 75.0, 54.0, 21.0, 8.0, 16.0, 20.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.90087890625, -0.8739852905273438, -0.8470916748046875, -0.8201980590820312, -0.793304443359375, -0.7664108276367188, -0.7395172119140625, -0.7126235961914062, -0.68572998046875, -0.6588363647460938, -0.6319427490234375, -0.6050491333007812, -0.578155517578125, -0.5512619018554688, -0.5243682861328125, -0.49747467041015625, -0.4705810546875, -0.44368743896484375, -0.4167938232421875, -0.38990020751953125, -0.363006591796875, -0.33611297607421875, -0.3092193603515625, -0.28232574462890625, -0.25543212890625, -0.22853851318359375, -0.2016448974609375, -0.17475128173828125, -0.147857666015625, -0.12096405029296875, -0.0940704345703125, -0.06717681884765625, -0.040283203125, -0.01338958740234375, 0.0135040283203125, 0.04039764404296875, 0.067291259765625, 0.09418487548828125, 0.1210784912109375, 0.14797210693359375, 0.17486572265625, 0.20175933837890625, 0.2286529541015625, 0.25554656982421875, 0.282440185546875, 0.30933380126953125, 0.3362274169921875, 0.36312103271484375, 0.3900146484375, 0.41690826416015625, 0.4438018798828125, 0.47069549560546875, 0.497589111328125, 0.5244827270507812, 0.5513763427734375, 0.5782699584960938, 0.60516357421875, 0.6320571899414062, 0.6589508056640625, 0.6858444213867188, 0.712738037109375, 0.7396316528320312, 0.7665252685546875, 0.7934188842773438, 0.8203125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 6.0, 4.0, 13.0, 4.0, 14.0, 15.0, 24.0, 20.0, 24.0, 24.0, 30.0, 30.0, 30.0, 52.0, 68.0, 77.0, 92.0, 78.0, 60.0, 45.0, 36.0, 32.0, 39.0, 25.0, 25.0, 17.0, 18.0, 13.0, 10.0, 9.0, 10.0, 6.0, 5.0, 2.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0145721435546875, -0.01407313346862793, -0.01357412338256836, -0.013075113296508789, -0.012576103210449219, -0.012077093124389648, -0.011578083038330078, -0.011079072952270508, -0.010580062866210938, -0.010081052780151367, -0.009582042694091797, -0.009083032608032227, -0.008584022521972656, -0.008085012435913086, -0.007586002349853516, -0.007086992263793945, -0.006587982177734375, -0.006088972091674805, -0.005589962005615234, -0.005090951919555664, -0.004591941833496094, -0.0040929317474365234, -0.003593921661376953, -0.003094911575317383, -0.0025959014892578125, -0.002096891403198242, -0.0015978813171386719, -0.0010988712310791016, -0.0005998611450195312, -0.00010085105895996094, 0.0003981590270996094, 0.0008971691131591797, 0.00139617919921875, 0.0018951892852783203, 0.0023941993713378906, 0.002893209457397461, 0.0033922195434570312, 0.0038912296295166016, 0.004390239715576172, 0.004889249801635742, 0.0053882598876953125, 0.005887269973754883, 0.006386280059814453, 0.0068852901458740234, 0.007384300231933594, 0.007883310317993164, 0.008382320404052734, 0.008881330490112305, 0.009380340576171875, 0.009879350662231445, 0.010378360748291016, 0.010877370834350586, 0.011376380920410156, 0.011875391006469727, 0.012374401092529297, 0.012873411178588867, 0.013372421264648438, 0.013871431350708008, 0.014370441436767578, 0.014869451522827148, 0.015368461608886719, 0.01586747169494629, 0.01636648178100586, 0.01686549186706543, 0.017364501953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 9.0, 7.0, 9.0, 7.0, 13.0, 14.0, 14.0, 22.0, 15.0, 15.0, 30.0, 44.0, 64.0, 72.0, 95.0, 186.0, 283.0, 1037.0, 19707.0, 991344.0, 33322.0, 1336.0, 304.0, 155.0, 109.0, 75.0, 50.0, 39.0, 36.0, 30.0, 18.0, 24.0, 10.0, 5.0, 12.0, 7.0, 5.0, 11.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.34716796875, -0.336822509765625, -0.32647705078125, -0.316131591796875, -0.3057861328125, -0.295440673828125, -0.28509521484375, -0.274749755859375, -0.264404296875, -0.254058837890625, -0.24371337890625, -0.233367919921875, -0.2230224609375, -0.212677001953125, -0.20233154296875, -0.191986083984375, -0.181640625, -0.171295166015625, -0.16094970703125, -0.150604248046875, -0.1402587890625, -0.129913330078125, -0.11956787109375, -0.109222412109375, -0.098876953125, -0.088531494140625, -0.07818603515625, -0.067840576171875, -0.0574951171875, -0.047149658203125, -0.03680419921875, -0.026458740234375, -0.01611328125, -0.005767822265625, 0.00457763671875, 0.014923095703125, 0.0252685546875, 0.035614013671875, 0.04595947265625, 0.056304931640625, 0.066650390625, 0.076995849609375, 0.08734130859375, 0.097686767578125, 0.1080322265625, 0.118377685546875, 0.12872314453125, 0.139068603515625, 0.1494140625, 0.159759521484375, 0.17010498046875, 0.180450439453125, 0.1907958984375, 0.201141357421875, 0.21148681640625, 0.221832275390625, 0.232177734375, 0.242523193359375, 0.25286865234375, 0.263214111328125, 0.2735595703125, 0.283905029296875, 0.29425048828125, 0.304595947265625, 0.31494140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 20.0, 130.0, 664.0, 146.0, 44.0, 9.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04348637908697128, -0.037645310163497925, -0.031804244965314865, -0.025963177904486656, -0.020122110843658447, -0.014281043782830238, -0.00843997672200203, -0.0025989115238189697, 0.0032421573996543884, 0.009083224460482597, 0.014924291521310806, 0.020765358582139015, 0.026606425642967224, 0.03244749456644058, 0.03828855976462364, 0.0441296249628067, 0.04997069388628006, 0.05581176280975342, 0.06165282800793648, 0.06749389320611954, 0.0733349621295929, 0.07917603105306625, 0.08501709997653961, 0.09085816144943237, 0.09669923037290573, 0.10254029929637909, 0.10838136076927185, 0.11422242969274521, 0.12006349861621857, 0.12590456008911133, 0.13174563646316528, 0.13758669793605804, 0.1434277594089508, 0.14926882088184357, 0.15510989725589752, 0.16095095872879028, 0.16679203510284424, 0.172633096575737, 0.17847415804862976, 0.18431523442268372, 0.19015629589557648, 0.19599735736846924, 0.2018384337425232, 0.20767949521541595, 0.21352055668830872, 0.21936163306236267, 0.22520269453525543, 0.2310437560081482, 0.23688483238220215, 0.2427258938550949, 0.24856697022914886, 0.2544080317020416, 0.2602491080760956, 0.26609015464782715, 0.2719312310218811, 0.27777230739593506, 0.283613383769989, 0.28945446014404297, 0.29529550671577454, 0.3011365830898285, 0.30697765946388245, 0.312818706035614, 0.31865978240966797, 0.3245008587837219, 0.3303419053554535]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 7.0, 9.0, 10.0, 10.0, 13.0, 18.0, 18.0, 26.0, 31.0, 24.0, 24.0, 32.0, 33.0, 28.0, 33.0, 43.0, 44.0, 49.0, 39.0, 46.0, 43.0, 51.0, 43.0, 36.0, 33.0, 38.0, 27.0, 25.0, 22.0, 29.0, 21.0, 20.0, 16.0, 8.0, 11.0, 8.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02180624008178711, -0.021124038845300674, -0.02044183947145939, -0.019759640097618103, -0.019077438861131668, -0.018395237624645233, -0.017713038250803947, -0.017030838876962662, -0.016348637640476227, -0.015666436403989792, -0.014984237030148506, -0.014302036724984646, -0.013619836419820786, -0.012937636114656925, -0.012255435809493065, -0.011573235504329205, -0.010891035199165344, -0.010208834894001484, -0.009526634588837624, -0.008844434283673763, -0.008162233978509903, -0.007480033673346043, -0.006797833368182182, -0.006115633063018322, -0.005433432757854462, -0.004751232452690601, -0.004069032147526741, -0.0033868318423628807, -0.0027046315371990204, -0.00202243123203516, -0.0013402309268712997, -0.0006580306217074394, 2.41696834564209e-05, 0.0007063699886202812, 0.0013885702937841415, 0.002070770598948002, 0.002752970904111862, 0.0034351712092757225, 0.004117371514439583, 0.004799571819603443, 0.0054817721247673035, 0.006163972429931164, 0.006846172735095024, 0.007528373040258884, 0.008210573345422745, 0.008892773650586605, 0.009574973955750465, 0.010257174260914326, 0.010939374566078186, 0.011621574871242046, 0.012303775176405907, 0.012985975481569767, 0.013668175786733627, 0.014350376091897488, 0.015032576397061348, 0.015714775770902634, 0.01639697700738907, 0.017079178243875504, 0.01776137761771679, 0.018443576991558075, 0.01912577822804451, 0.019807979464530945, 0.02049017883837223, 0.021172378212213516, 0.02185457944869995]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 21.0, 30.0, 16.0, 27.0, 28.0, 37.0, 24.0, 16.0, 44.0, 47.0, 34.0, 51.0, 35.0, 48.0, 38.0, 33.0, 40.0, 34.0, 27.0, 35.0, 25.0, 41.0, 28.0, 28.0, 18.0, 24.0, 19.0, 13.0, 16.0, 14.0, 8.0, 11.0, 7.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3431396484375, -12.912841796875, -12.4825439453125, -12.05224609375, -11.6219482421875, -11.191650390625, -10.7613525390625, -10.3310546875, -9.9007568359375, -9.470458984375, -9.0401611328125, -8.60986328125, -8.1795654296875, -7.749267578125, -7.3189697265625, -6.888671875, -6.4583740234375, -6.028076171875, -5.5977783203125, -5.16748046875, -4.7371826171875, -4.306884765625, -3.8765869140625, -3.4462890625, -3.0159912109375, -2.585693359375, -2.1553955078125, -1.72509765625, -1.2947998046875, -0.864501953125, -0.4342041015625, -0.00390625, 0.4263916015625, 0.856689453125, 1.2869873046875, 1.71728515625, 2.1475830078125, 2.577880859375, 3.0081787109375, 3.4384765625, 3.8687744140625, 4.299072265625, 4.7293701171875, 5.15966796875, 5.5899658203125, 6.020263671875, 6.4505615234375, 6.880859375, 7.3111572265625, 7.741455078125, 8.1717529296875, 8.60205078125, 9.0323486328125, 9.462646484375, 9.8929443359375, 10.3232421875, 10.7535400390625, 11.183837890625, 11.6141357421875, 12.04443359375, 12.4747314453125, 12.905029296875, 13.3353271484375, 13.765625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 15.0, 14.0, 20.0, 21.0, 48.0, 41.0, 71.0, 91.0, 106.0, 186.0, 263.0, 355.0, 528.0, 777.0, 1205.0, 2070.0, 3838.0, 9849.0, 44511.0, 345375.0, 549715.0, 65372.0, 12964.0, 4767.0, 2388.0, 1328.0, 897.0, 503.0, 342.0, 229.0, 163.0, 120.0, 92.0, 67.0, 53.0, 45.0, 24.0, 25.0, 20.0, 11.0, 9.0, 8.0, 9.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-16.96875, -16.47119140625, -15.9736328125, -15.47607421875, -14.978515625, -14.48095703125, -13.9833984375, -13.48583984375, -12.98828125, -12.49072265625, -11.9931640625, -11.49560546875, -10.998046875, -10.50048828125, -10.0029296875, -9.50537109375, -9.0078125, -8.51025390625, -8.0126953125, -7.51513671875, -7.017578125, -6.52001953125, -6.0224609375, -5.52490234375, -5.02734375, -4.52978515625, -4.0322265625, -3.53466796875, -3.037109375, -2.53955078125, -2.0419921875, -1.54443359375, -1.046875, -0.54931640625, -0.0517578125, 0.44580078125, 0.943359375, 1.44091796875, 1.9384765625, 2.43603515625, 2.93359375, 3.43115234375, 3.9287109375, 4.42626953125, 4.923828125, 5.42138671875, 5.9189453125, 6.41650390625, 6.9140625, 7.41162109375, 7.9091796875, 8.40673828125, 8.904296875, 9.40185546875, 9.8994140625, 10.39697265625, 10.89453125, 11.39208984375, 11.8896484375, 12.38720703125, 12.884765625, 13.38232421875, 13.8798828125, 14.37744140625, 14.875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 8.0, 8.0, 9.0, 12.0, 17.0, 18.0, 18.0, 17.0, 23.0, 11.0, 22.0, 42.0, 34.0, 41.0, 52.0, 42.0, 78.0, 108.0, 1855.0, 146.0, 52.0, 72.0, 36.0, 42.0, 33.0, 36.0, 29.0, 30.0, 21.0, 29.0, 23.0, 14.0, 17.0, 8.0, 10.0, 4.0, 5.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.6875, -35.52685546875, -34.3662109375, -33.20556640625, -32.044921875, -30.88427734375, -29.7236328125, -28.56298828125, -27.40234375, -26.24169921875, -25.0810546875, -23.92041015625, -22.759765625, -21.59912109375, -20.4384765625, -19.27783203125, -18.1171875, -16.95654296875, -15.7958984375, -14.63525390625, -13.474609375, -12.31396484375, -11.1533203125, -9.99267578125, -8.83203125, -7.67138671875, -6.5107421875, -5.35009765625, -4.189453125, -3.02880859375, -1.8681640625, -0.70751953125, 0.453125, 1.61376953125, 2.7744140625, 3.93505859375, 5.095703125, 6.25634765625, 7.4169921875, 8.57763671875, 9.73828125, 10.89892578125, 12.0595703125, 13.22021484375, 14.380859375, 15.54150390625, 16.7021484375, 17.86279296875, 19.0234375, 20.18408203125, 21.3447265625, 22.50537109375, 23.666015625, 24.82666015625, 25.9873046875, 27.14794921875, 28.30859375, 29.46923828125, 30.6298828125, 31.79052734375, 32.951171875, 34.11181640625, 35.2724609375, 36.43310546875, 37.59375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 5.0, 17.0, 19.0, 36.0, 78.0, 137.0, 335.0, 728.0, 9750.0, 3129398.0, 4076.0, 593.0, 256.0, 110.0, 64.0, 44.0, 22.0, 13.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.25, -164.25390625, -158.2578125, -152.26171875, -146.265625, -140.26953125, -134.2734375, -128.27734375, -122.28125, -116.28515625, -110.2890625, -104.29296875, -98.296875, -92.30078125, -86.3046875, -80.30859375, -74.3125, -68.31640625, -62.3203125, -56.32421875, -50.328125, -44.33203125, -38.3359375, -32.33984375, -26.34375, -20.34765625, -14.3515625, -8.35546875, -2.359375, 3.63671875, 9.6328125, 15.62890625, 21.625, 27.62109375, 33.6171875, 39.61328125, 45.609375, 51.60546875, 57.6015625, 63.59765625, 69.59375, 75.58984375, 81.5859375, 87.58203125, 93.578125, 99.57421875, 105.5703125, 111.56640625, 117.5625, 123.55859375, 129.5546875, 135.55078125, 141.546875, 147.54296875, 153.5390625, 159.53515625, 165.53125, 171.52734375, 177.5234375, 183.51953125, 189.515625, 195.51171875, 201.5078125, 207.50390625, 213.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 30.0, 265.0, 542.0, 146.0, 20.0, 7.0], "bins": [-374.1932678222656, -367.989501953125, -361.7857666015625, -355.5820007324219, -349.3782653808594, -343.17449951171875, -336.9707336425781, -330.7669982910156, -324.563232421875, -318.3594665527344, -312.1557312011719, -305.95196533203125, -299.74822998046875, -293.5444641113281, -287.3406982421875, -281.136962890625, -274.9331970214844, -268.72943115234375, -262.52569580078125, -256.3219299316406, -250.11817932128906, -243.9144287109375, -237.71067810058594, -231.50692749023438, -225.3031768798828, -219.09942626953125, -212.8956756591797, -206.69190979003906, -200.4881591796875, -194.28440856933594, -188.08065795898438, -181.87689208984375, -175.6731414794922, -169.46939086914062, -163.26564025878906, -157.06187438964844, -150.85812377929688, -144.6543731689453, -138.45062255859375, -132.24685668945312, -126.0431137084961, -119.83936309814453, -113.63560485839844, -107.43185424804688, -101.22809600830078, -95.02434539794922, -88.82058715820312, -82.61683654785156, -76.41307830810547, -70.2093276977539, -64.00556945800781, -57.80181884765625, -51.598060607910156, -45.394309997558594, -39.190555572509766, -32.98680114746094, -26.783048629760742, -20.579294204711914, -14.375540733337402, -8.17178726196289, -1.9680328369140625, 4.235721588134766, 10.439474105834961, 16.64322853088379, 22.846982955932617]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 14.0, 20.0, 11.0, 18.0, 18.0, 16.0, 18.0, 28.0, 26.0, 37.0, 29.0, 37.0, 55.0, 38.0, 33.0, 40.0, 65.0, 44.0, 36.0, 30.0, 37.0, 30.0, 33.0, 35.0, 33.0, 34.0, 21.0, 24.0, 20.0, 21.0, 14.0, 14.0, 15.0, 9.0, 7.0, 8.0, 7.0, 2.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.68331146240234, -103.46924591064453, -100.25518035888672, -97.0411148071289, -93.8270492553711, -90.61298370361328, -87.39892578125, -84.18486022949219, -80.97079467773438, -77.75672912597656, -74.54266357421875, -71.32859802246094, -68.11453247070312, -64.90046691894531, -61.686405181884766, -58.47233963012695, -55.258270263671875, -52.04420471191406, -48.83013916015625, -45.61607360839844, -42.402008056640625, -39.18794250488281, -35.973880767822266, -32.75981521606445, -29.54574966430664, -26.331684112548828, -23.117618560791016, -19.903554916381836, -16.689489364624023, -13.475423812866211, -10.261360168457031, -7.047294616699219, -3.8332366943359375, -0.6191716194152832, 2.594893455505371, 5.808958053588867, 9.02302360534668, 12.237089157104492, 15.451152801513672, 18.665218353271484, 21.879283905029297, 25.09334945678711, 28.307415008544922, 31.5214786529541, 34.73554229736328, 37.949607849121094, 41.163673400878906, 44.37773895263672, 47.59180450439453, 50.805870056152344, 54.019935607910156, 57.23400115966797, 60.44806671142578, 63.662132263183594, 66.87619018554688, 70.09025573730469, 73.3043212890625, 76.51838684082031, 79.73245239257812, 82.94651794433594, 86.16058349609375, 89.37464904785156, 92.58871459960938, 95.80278015136719, 99.016845703125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 19.0, 19.0, 21.0, 25.0, 31.0, 14.0, 34.0, 37.0, 30.0, 33.0, 37.0, 41.0, 55.0, 37.0, 26.0, 45.0, 35.0, 54.0, 35.0, 40.0, 35.0, 25.0, 30.0, 23.0, 27.0, 26.0, 26.0, 16.0, 19.0, 15.0, 9.0, 11.0, 14.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.7265625, -14.269287109375, -13.81201171875, -13.354736328125, -12.8974609375, -12.440185546875, -11.98291015625, -11.525634765625, -11.068359375, -10.611083984375, -10.15380859375, -9.696533203125, -9.2392578125, -8.781982421875, -8.32470703125, -7.867431640625, -7.41015625, -6.952880859375, -6.49560546875, -6.038330078125, -5.5810546875, -5.123779296875, -4.66650390625, -4.209228515625, -3.751953125, -3.294677734375, -2.83740234375, -2.380126953125, -1.9228515625, -1.465576171875, -1.00830078125, -0.551025390625, -0.09375, 0.363525390625, 0.82080078125, 1.278076171875, 1.7353515625, 2.192626953125, 2.64990234375, 3.107177734375, 3.564453125, 4.021728515625, 4.47900390625, 4.936279296875, 5.3935546875, 5.850830078125, 6.30810546875, 6.765380859375, 7.22265625, 7.679931640625, 8.13720703125, 8.594482421875, 9.0517578125, 9.509033203125, 9.96630859375, 10.423583984375, 10.880859375, 11.338134765625, 11.79541015625, 12.252685546875, 12.7099609375, 13.167236328125, 13.62451171875, 14.081787109375, 14.5390625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 11.0, 20.0, 25.0, 27.0, 39.0, 48.0, 79.0, 140.0, 253.0, 481.0, 882.0, 1786.0, 3367.0, 7261.0, 39342.0, 2579382.0, 1524498.0, 23037.0, 6514.0, 3038.0, 1714.0, 948.0, 520.0, 311.0, 184.0, 115.0, 77.0, 36.0, 33.0, 18.0, 17.0, 17.0, 8.0, 8.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.5, -52.84521484375, -51.1904296875, -49.53564453125, -47.880859375, -46.22607421875, -44.5712890625, -42.91650390625, -41.26171875, -39.60693359375, -37.9521484375, -36.29736328125, -34.642578125, -32.98779296875, -31.3330078125, -29.67822265625, -28.0234375, -26.36865234375, -24.7138671875, -23.05908203125, -21.404296875, -19.74951171875, -18.0947265625, -16.43994140625, -14.78515625, -13.13037109375, -11.4755859375, -9.82080078125, -8.166015625, -6.51123046875, -4.8564453125, -3.20166015625, -1.546875, 0.10791015625, 1.7626953125, 3.41748046875, 5.072265625, 6.72705078125, 8.3818359375, 10.03662109375, 11.69140625, 13.34619140625, 15.0009765625, 16.65576171875, 18.310546875, 19.96533203125, 21.6201171875, 23.27490234375, 24.9296875, 26.58447265625, 28.2392578125, 29.89404296875, 31.548828125, 33.20361328125, 34.8583984375, 36.51318359375, 38.16796875, 39.82275390625, 41.4775390625, 43.13232421875, 44.787109375, 46.44189453125, 48.0966796875, 49.75146484375, 51.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 8.0, 8.0, 9.0, 9.0, 16.0, 18.0, 24.0, 39.0, 65.0, 124.0, 218.0, 484.0, 783.0, 947.0, 626.0, 305.0, 145.0, 79.0, 35.0, 27.0, 17.0, 20.0, 10.0, 6.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.6396484375, -30.685546875, -29.7314453125, -28.77734375, -27.8232421875, -26.869140625, -25.9150390625, -24.9609375, -24.0068359375, -23.052734375, -22.0986328125, -21.14453125, -20.1904296875, -19.236328125, -18.2822265625, -17.328125, -16.3740234375, -15.419921875, -14.4658203125, -13.51171875, -12.5576171875, -11.603515625, -10.6494140625, -9.6953125, -8.7412109375, -7.787109375, -6.8330078125, -5.87890625, -4.9248046875, -3.970703125, -3.0166015625, -2.0625, -1.1083984375, -0.154296875, 0.7998046875, 1.75390625, 2.7080078125, 3.662109375, 4.6162109375, 5.5703125, 6.5244140625, 7.478515625, 8.4326171875, 9.38671875, 10.3408203125, 11.294921875, 12.2490234375, 13.203125, 14.1572265625, 15.111328125, 16.0654296875, 17.01953125, 17.9736328125, 18.927734375, 19.8818359375, 20.8359375, 21.7900390625, 22.744140625, 23.6982421875, 24.65234375, 25.6064453125, 26.560546875, 27.5146484375, 28.46875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 2.0, 8.0, 3.0, 7.0, 11.0, 14.0, 16.0, 35.0, 58.0, 84.0, 190.0, 422.0, 1450.0, 6925.0, 64026.0, 4069577.0, 43877.0, 5578.0, 1191.0, 379.0, 162.0, 77.0, 57.0, 38.0, 21.0, 14.0, 9.0, 7.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.4375, -121.1767578125, -116.916015625, -112.6552734375, -108.39453125, -104.1337890625, -99.873046875, -95.6123046875, -91.3515625, -87.0908203125, -82.830078125, -78.5693359375, -74.30859375, -70.0478515625, -65.787109375, -61.5263671875, -57.265625, -53.0048828125, -48.744140625, -44.4833984375, -40.22265625, -35.9619140625, -31.701171875, -27.4404296875, -23.1796875, -18.9189453125, -14.658203125, -10.3974609375, -6.13671875, -1.8759765625, 2.384765625, 6.6455078125, 10.90625, 15.1669921875, 19.427734375, 23.6884765625, 27.94921875, 32.2099609375, 36.470703125, 40.7314453125, 44.9921875, 49.2529296875, 53.513671875, 57.7744140625, 62.03515625, 66.2958984375, 70.556640625, 74.8173828125, 79.078125, 83.3388671875, 87.599609375, 91.8603515625, 96.12109375, 100.3818359375, 104.642578125, 108.9033203125, 113.1640625, 117.4248046875, 121.685546875, 125.9462890625, 130.20703125, 134.4677734375, 138.728515625, 142.9892578125, 147.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 3.0, 11.0, 9.0, 14.0, 16.0, 31.0, 36.0, 44.0, 75.0, 121.0, 120.0, 141.0, 98.0, 74.0, 55.0, 33.0, 26.0, 23.0, 14.0, 14.0, 10.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-116.70932006835938, -113.93148803710938, -111.15364837646484, -108.37581634521484, -105.59797668457031, -102.82014465332031, -100.04231262207031, -97.26447296142578, -94.48663330078125, -91.70880126953125, -88.93096160888672, -86.15312957763672, -83.37528991699219, -80.59745788574219, -77.81962585449219, -75.04178619384766, -72.26395416259766, -69.48612213134766, -66.70828247070312, -63.930450439453125, -61.152610778808594, -58.374778747558594, -55.59694290161133, -52.81910705566406, -50.0412712097168, -47.26343536376953, -44.485599517822266, -41.707763671875, -38.929931640625, -36.15209197998047, -33.37425994873047, -30.596424102783203, -27.818580627441406, -25.04074478149414, -22.262908935546875, -19.485074996948242, -16.707239151000977, -13.929403305053711, -11.151569366455078, -8.373733520507812, -5.595897674560547, -2.8180623054504395, -0.04022693634033203, 2.737607955932617, 5.515443801879883, 8.293279647827148, 11.071113586425781, 13.848949432373047, 16.626785278320312, 19.404621124267578, 22.182456970214844, 24.960290908813477, 27.738126754760742, 30.515962600708008, 33.29379653930664, 36.071632385253906, 38.84946823120117, 41.62730407714844, 44.4051399230957, 47.18297576904297, 49.96080780029297, 52.7386474609375, 55.5164794921875, 58.294315338134766, 61.07215118408203]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 13.0, 13.0, 11.0, 14.0, 21.0, 15.0, 25.0, 27.0, 29.0, 28.0, 29.0, 28.0, 19.0, 37.0, 31.0, 34.0, 36.0, 47.0, 53.0, 43.0, 44.0, 39.0, 30.0, 19.0, 29.0, 24.0, 39.0, 20.0, 27.0, 26.0, 17.0, 20.0, 10.0, 14.0, 13.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-63.53112030029297, -61.490440368652344, -59.44975662231445, -57.40907669067383, -55.36839294433594, -53.32771301269531, -51.28703308105469, -49.24635314941406, -47.20566940307617, -45.16498947143555, -43.124305725097656, -41.08362579345703, -39.042945861816406, -37.002262115478516, -34.96158218383789, -32.9208984375, -30.880218505859375, -28.839536666870117, -26.79885482788086, -24.758174896240234, -22.717493057250977, -20.67681121826172, -18.636131286621094, -16.595449447631836, -14.554767608642578, -12.51408576965332, -10.473404884338379, -8.432723999023438, -6.39204216003418, -4.351360321044922, -2.3106794357299805, -0.26999855041503906, 1.7706756591796875, 3.811357021331787, 5.852038383483887, 7.892719745635986, 9.933401107788086, 11.974082946777344, 14.014763832092285, 16.055444717407227, 18.096126556396484, 20.136808395385742, 22.177490234375, 24.218170166015625, 26.258852005004883, 28.29953384399414, 30.340213775634766, 32.380897521972656, 34.42157745361328, 36.462257385253906, 38.5029411315918, 40.54362106323242, 42.58430480957031, 44.62498474121094, 46.66566467285156, 48.70634460449219, 50.74702835083008, 52.7877082824707, 54.828392028808594, 56.86907196044922, 58.909751892089844, 60.950435638427734, 62.99111557006836, 65.03179931640625, 67.07247924804688]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 6.0, 9.0, 10.0, 7.0, 17.0, 13.0, 15.0, 30.0, 21.0, 20.0, 23.0, 42.0, 30.0, 30.0, 36.0, 40.0, 31.0, 46.0, 44.0, 54.0, 26.0, 38.0, 41.0, 44.0, 22.0, 28.0, 33.0, 22.0, 25.0, 34.0, 25.0, 16.0, 23.0, 15.0, 10.0, 19.0, 11.0, 5.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.0078125, -13.567138671875, -13.12646484375, -12.685791015625, -12.2451171875, -11.804443359375, -11.36376953125, -10.923095703125, -10.482421875, -10.041748046875, -9.60107421875, -9.160400390625, -8.7197265625, -8.279052734375, -7.83837890625, -7.397705078125, -6.95703125, -6.516357421875, -6.07568359375, -5.635009765625, -5.1943359375, -4.753662109375, -4.31298828125, -3.872314453125, -3.431640625, -2.990966796875, -2.55029296875, -2.109619140625, -1.6689453125, -1.228271484375, -0.78759765625, -0.346923828125, 0.09375, 0.534423828125, 0.97509765625, 1.415771484375, 1.8564453125, 2.297119140625, 2.73779296875, 3.178466796875, 3.619140625, 4.059814453125, 4.50048828125, 4.941162109375, 5.3818359375, 5.822509765625, 6.26318359375, 6.703857421875, 7.14453125, 7.585205078125, 8.02587890625, 8.466552734375, 8.9072265625, 9.347900390625, 9.78857421875, 10.229248046875, 10.669921875, 11.110595703125, 11.55126953125, 11.991943359375, 12.4326171875, 12.873291015625, 13.31396484375, 13.754638671875, 14.1953125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 5.0, 14.0, 25.0, 39.0, 79.0, 69.0, 142.0, 186.0, 292.0, 491.0, 786.0, 1312.0, 2064.0, 3266.0, 5161.0, 8408.0, 13775.0, 22336.0, 38546.0, 68898.0, 127093.0, 230479.0, 231079.0, 127808.0, 68982.0, 38884.0, 22626.0, 13638.0, 8588.0, 5125.0, 3149.0, 1926.0, 1240.0, 729.0, 452.0, 279.0, 198.0, 135.0, 72.0, 61.0, 32.0, 37.0, 15.0, 11.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.639678955078125, -1.58502197265625, -1.530364990234375, -1.4757080078125, -1.421051025390625, -1.36639404296875, -1.311737060546875, -1.257080078125, -1.202423095703125, -1.14776611328125, -1.093109130859375, -1.0384521484375, -0.983795166015625, -0.92913818359375, -0.874481201171875, -0.81982421875, -0.765167236328125, -0.71051025390625, -0.655853271484375, -0.6011962890625, -0.546539306640625, -0.49188232421875, -0.437225341796875, -0.382568359375, -0.327911376953125, -0.27325439453125, -0.218597412109375, -0.1639404296875, -0.109283447265625, -0.05462646484375, 3.0517578125e-05, 0.0546875, 0.109344482421875, 0.16400146484375, 0.218658447265625, 0.2733154296875, 0.327972412109375, 0.38262939453125, 0.437286376953125, 0.491943359375, 0.546600341796875, 0.60125732421875, 0.655914306640625, 0.7105712890625, 0.765228271484375, 0.81988525390625, 0.874542236328125, 0.92919921875, 0.983856201171875, 1.03851318359375, 1.093170166015625, 1.1478271484375, 1.202484130859375, 1.25714111328125, 1.311798095703125, 1.366455078125, 1.421112060546875, 1.47576904296875, 1.530426025390625, 1.5850830078125, 1.639739990234375, 1.69439697265625, 1.749053955078125, 1.8037109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 24.0, 20.0, 18.0, 29.0, 34.0, 32.0, 36.0, 28.0, 47.0, 50.0, 41.0, 42.0, 55.0, 1077.0, 46.0, 57.0, 38.0, 40.0, 38.0, 43.0, 40.0, 22.0, 20.0, 23.0, 21.0, 14.0, 11.0, 10.0, 12.0, 8.0, 10.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.7578125, -12.40869140625, -12.0595703125, -11.71044921875, -11.361328125, -11.01220703125, -10.6630859375, -10.31396484375, -9.96484375, -9.61572265625, -9.2666015625, -8.91748046875, -8.568359375, -8.21923828125, -7.8701171875, -7.52099609375, -7.171875, -6.82275390625, -6.4736328125, -6.12451171875, -5.775390625, -5.42626953125, -5.0771484375, -4.72802734375, -4.37890625, -4.02978515625, -3.6806640625, -3.33154296875, -2.982421875, -2.63330078125, -2.2841796875, -1.93505859375, -1.5859375, -1.23681640625, -0.8876953125, -0.53857421875, -0.189453125, 0.15966796875, 0.5087890625, 0.85791015625, 1.20703125, 1.55615234375, 1.9052734375, 2.25439453125, 2.603515625, 2.95263671875, 3.3017578125, 3.65087890625, 4.0, 4.34912109375, 4.6982421875, 5.04736328125, 5.396484375, 5.74560546875, 6.0947265625, 6.44384765625, 6.79296875, 7.14208984375, 7.4912109375, 7.84033203125, 8.189453125, 8.53857421875, 8.8876953125, 9.23681640625, 9.5859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 10.0, 16.0, 21.0, 28.0, 42.0, 65.0, 95.0, 192.0, 326.0, 551.0, 973.0, 1722.0, 3121.0, 5675.0, 10432.0, 19693.0, 39379.0, 81452.0, 179045.0, 1363997.0, 204800.0, 92700.0, 44281.0, 22203.0, 11837.0, 6463.0, 3571.0, 1865.0, 1069.0, 596.0, 351.0, 210.0, 94.0, 72.0, 45.0, 43.0, 29.0, 21.0, 11.0, 6.0, 6.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.151611328125, -1.10986328125, -1.068115234375, -1.0263671875, -0.984619140625, -0.94287109375, -0.901123046875, -0.859375, -0.817626953125, -0.77587890625, -0.734130859375, -0.6923828125, -0.650634765625, -0.60888671875, -0.567138671875, -0.525390625, -0.483642578125, -0.44189453125, -0.400146484375, -0.3583984375, -0.316650390625, -0.27490234375, -0.233154296875, -0.19140625, -0.149658203125, -0.10791015625, -0.066162109375, -0.0244140625, 0.017333984375, 0.05908203125, 0.100830078125, 0.142578125, 0.184326171875, 0.22607421875, 0.267822265625, 0.3095703125, 0.351318359375, 0.39306640625, 0.434814453125, 0.4765625, 0.518310546875, 0.56005859375, 0.601806640625, 0.6435546875, 0.685302734375, 0.72705078125, 0.768798828125, 0.810546875, 0.852294921875, 0.89404296875, 0.935791015625, 0.9775390625, 1.019287109375, 1.06103515625, 1.102783203125, 1.14453125, 1.186279296875, 1.22802734375, 1.269775390625, 1.3115234375, 1.353271484375, 1.39501953125, 1.436767578125, 1.478515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 1.0, 6.0, 4.0, 5.0, 11.0, 6.0, 12.0, 23.0, 27.0, 41.0, 38.0, 34.0, 58.0, 72.0, 55.0, 114.0, 98.0, 81.0, 44.0, 40.0, 40.0, 36.0, 31.0, 25.0, 17.0, 12.0, 13.0, 9.0, 7.0, 10.0, 3.0, 6.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07080078125, -0.06871604919433594, -0.06663131713867188, -0.06454658508300781, -0.06246185302734375, -0.06037712097167969, -0.058292388916015625, -0.05620765686035156, -0.0541229248046875, -0.05203819274902344, -0.049953460693359375, -0.04786872863769531, -0.04578399658203125, -0.04369926452636719, -0.041614532470703125, -0.03952980041503906, -0.037445068359375, -0.03536033630371094, -0.033275604248046875, -0.031190872192382812, -0.02910614013671875, -0.027021408081054688, -0.024936676025390625, -0.022851943969726562, -0.0207672119140625, -0.018682479858398438, -0.016597747802734375, -0.014513015747070312, -0.01242828369140625, -0.010343551635742188, -0.008258819580078125, -0.0061740875244140625, -0.00408935546875, -0.0020046234130859375, 8.0108642578125e-05, 0.0021648406982421875, 0.00424957275390625, 0.0063343048095703125, 0.008419036865234375, 0.010503768920898438, 0.0125885009765625, 0.014673233032226562, 0.016757965087890625, 0.018842697143554688, 0.02092742919921875, 0.023012161254882812, 0.025096893310546875, 0.027181625366210938, 0.029266357421875, 0.03135108947753906, 0.033435821533203125, 0.03552055358886719, 0.03760528564453125, 0.03969001770019531, 0.041774749755859375, 0.04385948181152344, 0.0459442138671875, 0.04802894592285156, 0.050113677978515625, 0.05219841003417969, 0.05428314208984375, 0.05636787414550781, 0.058452606201171875, 0.06053733825683594, 0.0626220703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 8.0, 14.0, 10.0, 17.0, 24.0, 22.0, 38.0, 56.0, 72.0, 98.0, 136.0, 256.0, 950.0, 21276.0, 1004926.0, 18970.0, 836.0, 280.0, 154.0, 99.0, 72.0, 60.0, 30.0, 35.0, 20.0, 12.0, 15.0, 7.0, 8.0, 8.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3105316162109375, -1.267547607421875, -1.2245635986328125, -1.18157958984375, -1.1385955810546875, -1.095611572265625, -1.0526275634765625, -1.0096435546875, -0.9666595458984375, -0.923675537109375, -0.8806915283203125, -0.83770751953125, -0.7947235107421875, -0.751739501953125, -0.7087554931640625, -0.665771484375, -0.6227874755859375, -0.579803466796875, -0.5368194580078125, -0.49383544921875, -0.4508514404296875, -0.407867431640625, -0.3648834228515625, -0.3218994140625, -0.2789154052734375, -0.235931396484375, -0.1929473876953125, -0.14996337890625, -0.1069793701171875, -0.063995361328125, -0.0210113525390625, 0.02197265625, 0.0649566650390625, 0.107940673828125, 0.1509246826171875, 0.19390869140625, 0.2368927001953125, 0.279876708984375, 0.3228607177734375, 0.3658447265625, 0.4088287353515625, 0.451812744140625, 0.4947967529296875, 0.53778076171875, 0.5807647705078125, 0.623748779296875, 0.6667327880859375, 0.709716796875, 0.7527008056640625, 0.795684814453125, 0.8386688232421875, 0.88165283203125, 0.9246368408203125, 0.967620849609375, 1.0106048583984375, 1.0535888671875, 1.0965728759765625, 1.139556884765625, 1.1825408935546875, 1.22552490234375, 1.2685089111328125, 1.311492919921875, 1.3544769287109375, 1.3974609375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 17.0, 89.0, 729.0, 153.0, 25.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4743356704711914, -1.4370964765548706, -1.3998572826385498, -1.362618088722229, -1.3253788948059082, -1.288139820098877, -1.2509005069732666, -1.2136614322662354, -1.1764222383499146, -1.1391830444335938, -1.101943850517273, -1.0647046566009521, -1.0274654626846313, -0.9902263283729553, -0.9529871344566345, -0.9157480001449585, -0.8785087466239929, -0.8412695527076721, -0.8040303587913513, -0.7667912244796753, -0.7295520305633545, -0.6923128366470337, -0.6550736427307129, -0.6178344488143921, -0.5805952548980713, -0.5433560609817505, -0.5061168670654297, -0.4688777029514313, -0.43163853883743286, -0.39439934492111206, -0.35716015100479126, -0.31992098689079285, -0.2826818823814392, -0.2454427033662796, -0.20820352435112, -0.1709643304347992, -0.1337251514196396, -0.09648597240447998, -0.05924677848815918, -0.022007614374160767, 0.015231579542160034, 0.05247076228260994, 0.08970994502305984, 0.12694913148880005, 0.16418831050395966, 0.20142748951911926, 0.23866668343544006, 0.2759058475494385, 0.3131450414657593, 0.3503842353820801, 0.3876233994960785, 0.4248625934123993, 0.4621017575263977, 0.4993409514427185, 0.5365801453590393, 0.5738192796707153, 0.6110584735870361, 0.6482976675033569, 0.6855368614196777, 0.7227760553359985, 0.7600151896476746, 0.7972543835639954, 0.8344935774803162, 0.8717327117919922, 0.9089719653129578]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 8.0, 6.0, 7.0, 5.0, 7.0, 15.0, 12.0, 25.0, 17.0, 18.0, 19.0, 40.0, 32.0, 33.0, 45.0, 44.0, 39.0, 49.0, 33.0, 48.0, 45.0, 49.0, 40.0, 43.0, 38.0, 40.0, 33.0, 26.0, 29.0, 34.0, 23.0, 24.0, 19.0, 16.0, 9.0, 11.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1353248953819275, -0.1309289038181305, -0.1265329122543335, -0.1221369281411171, -0.1177409365773201, -0.1133449450135231, -0.1089489609003067, -0.1045529693365097, -0.10015697777271271, -0.09576098620891571, -0.09136499464511871, -0.08696901053190231, -0.08257301896810532, -0.07817702740430832, -0.07378104329109192, -0.06938505172729492, -0.06498906016349792, -0.06059306859970093, -0.05619708076119423, -0.05180109292268753, -0.04740510135889053, -0.043009109795093536, -0.03861312195658684, -0.03421713411808014, -0.029821142554283142, -0.025425152853131294, -0.021029163151979446, -0.0166331734508276, -0.01223718374967575, -0.007841194048523903, -0.003445204347372055, 0.0009507853537797928, 0.005346775054931641, 0.009742764756083488, 0.014138754457235336, 0.018534744158387184, 0.022930733859539032, 0.02732672356069088, 0.03172271326184273, 0.036118701100349426, 0.04051469266414642, 0.04491068422794342, 0.04930667206645012, 0.05370265990495682, 0.058098651468753815, 0.06249464303255081, 0.06689062714576721, 0.07128661870956421, 0.0756826102733612, 0.0800786018371582, 0.0844745934009552, 0.0888705775141716, 0.0932665690779686, 0.0976625606417656, 0.102058544754982, 0.10645453631877899, 0.11085052788257599, 0.11524651944637299, 0.11964251101016998, 0.12403849512338638, 0.12843447923660278, 0.13283047080039978, 0.13722646236419678, 0.14162245392799377, 0.14601844549179077]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 7.0, 8.0, 10.0, 7.0, 17.0, 13.0, 15.0, 30.0, 21.0, 20.0, 23.0, 40.0, 32.0, 31.0, 35.0, 40.0, 31.0, 45.0, 44.0, 56.0, 25.0, 36.0, 40.0, 47.0, 21.0, 29.0, 33.0, 22.0, 25.0, 34.0, 25.0, 16.0, 23.0, 15.0, 10.0, 19.0, 11.0, 5.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.0078125, -13.5672607421875, -13.126708984375, -12.6861572265625, -12.24560546875, -11.8050537109375, -11.364501953125, -10.9239501953125, -10.4833984375, -10.0428466796875, -9.602294921875, -9.1617431640625, -8.72119140625, -8.2806396484375, -7.840087890625, -7.3995361328125, -6.958984375, -6.5184326171875, -6.077880859375, -5.6373291015625, -5.19677734375, -4.7562255859375, -4.315673828125, -3.8751220703125, -3.4345703125, -2.9940185546875, -2.553466796875, -2.1129150390625, -1.67236328125, -1.2318115234375, -0.791259765625, -0.3507080078125, 0.08984375, 0.5303955078125, 0.970947265625, 1.4114990234375, 1.85205078125, 2.2926025390625, 2.733154296875, 3.1737060546875, 3.6142578125, 4.0548095703125, 4.495361328125, 4.9359130859375, 5.37646484375, 5.8170166015625, 6.257568359375, 6.6981201171875, 7.138671875, 7.5792236328125, 8.019775390625, 8.4603271484375, 8.90087890625, 9.3414306640625, 9.781982421875, 10.2225341796875, 10.6630859375, 11.1036376953125, 11.544189453125, 11.9847412109375, 12.42529296875, 12.8658447265625, 13.306396484375, 13.7469482421875, 14.1875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 10.0, 14.0, 15.0, 27.0, 29.0, 37.0, 62.0, 55.0, 94.0, 112.0, 181.0, 249.0, 434.0, 707.0, 1264.0, 2504.0, 6432.0, 35287.0, 762145.0, 214454.0, 15709.0, 4246.0, 1875.0, 943.0, 514.0, 362.0, 211.0, 133.0, 112.0, 78.0, 47.0, 42.0, 29.0, 24.0, 27.0, 18.0, 7.0, 8.0, 9.0, 6.0, 10.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-23.96875, -23.215087890625, -22.46142578125, -21.707763671875, -20.9541015625, -20.200439453125, -19.44677734375, -18.693115234375, -17.939453125, -17.185791015625, -16.43212890625, -15.678466796875, -14.9248046875, -14.171142578125, -13.41748046875, -12.663818359375, -11.91015625, -11.156494140625, -10.40283203125, -9.649169921875, -8.8955078125, -8.141845703125, -7.38818359375, -6.634521484375, -5.880859375, -5.127197265625, -4.37353515625, -3.619873046875, -2.8662109375, -2.112548828125, -1.35888671875, -0.605224609375, 0.1484375, 0.902099609375, 1.65576171875, 2.409423828125, 3.1630859375, 3.916748046875, 4.67041015625, 5.424072265625, 6.177734375, 6.931396484375, 7.68505859375, 8.438720703125, 9.1923828125, 9.946044921875, 10.69970703125, 11.453369140625, 12.20703125, 12.960693359375, 13.71435546875, 14.468017578125, 15.2216796875, 15.975341796875, 16.72900390625, 17.482666015625, 18.236328125, 18.989990234375, 19.74365234375, 20.497314453125, 21.2509765625, 22.004638671875, 22.75830078125, 23.511962890625, 24.265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 11.0, 6.0, 9.0, 14.0, 17.0, 14.0, 23.0, 22.0, 22.0, 26.0, 28.0, 44.0, 41.0, 42.0, 54.0, 50.0, 80.0, 182.0, 1830.0, 93.0, 50.0, 50.0, 45.0, 40.0, 29.0, 30.0, 27.0, 21.0, 22.0, 19.0, 13.0, 15.0, 18.0, 8.0, 8.0, 8.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.81640625, -30.6015625, -29.38671875, -28.171875, -26.95703125, -25.7421875, -24.52734375, -23.3125, -22.09765625, -20.8828125, -19.66796875, -18.453125, -17.23828125, -16.0234375, -14.80859375, -13.59375, -12.37890625, -11.1640625, -9.94921875, -8.734375, -7.51953125, -6.3046875, -5.08984375, -3.875, -2.66015625, -1.4453125, -0.23046875, 0.984375, 2.19921875, 3.4140625, 4.62890625, 5.84375, 7.05859375, 8.2734375, 9.48828125, 10.703125, 11.91796875, 13.1328125, 14.34765625, 15.5625, 16.77734375, 17.9921875, 19.20703125, 20.421875, 21.63671875, 22.8515625, 24.06640625, 25.28125, 26.49609375, 27.7109375, 28.92578125, 30.140625, 31.35546875, 32.5703125, 33.78515625, 35.0, 36.21484375, 37.4296875, 38.64453125, 39.859375, 41.07421875, 42.2890625, 43.50390625, 44.71875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 10.0, 8.0, 6.0, 16.0, 16.0, 14.0, 21.0, 19.0, 26.0, 26.0, 49.0, 50.0, 94.0, 132.0, 203.0, 451.0, 2084.0, 2880214.0, 259496.0, 1598.0, 421.0, 222.0, 117.0, 87.0, 68.0, 41.0, 33.0, 21.0, 27.0, 22.0, 18.0, 16.0, 17.0, 9.0, 4.0, 9.0, 8.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0], "bins": [-130.625, -127.0888671875, -123.552734375, -120.0166015625, -116.48046875, -112.9443359375, -109.408203125, -105.8720703125, -102.3359375, -98.7998046875, -95.263671875, -91.7275390625, -88.19140625, -84.6552734375, -81.119140625, -77.5830078125, -74.046875, -70.5107421875, -66.974609375, -63.4384765625, -59.90234375, -56.3662109375, -52.830078125, -49.2939453125, -45.7578125, -42.2216796875, -38.685546875, -35.1494140625, -31.61328125, -28.0771484375, -24.541015625, -21.0048828125, -17.46875, -13.9326171875, -10.396484375, -6.8603515625, -3.32421875, 0.2119140625, 3.748046875, 7.2841796875, 10.8203125, 14.3564453125, 17.892578125, 21.4287109375, 24.96484375, 28.5009765625, 32.037109375, 35.5732421875, 39.109375, 42.6455078125, 46.181640625, 49.7177734375, 53.25390625, 56.7900390625, 60.326171875, 63.8623046875, 67.3984375, 70.9345703125, 74.470703125, 78.0068359375, 81.54296875, 85.0791015625, 88.615234375, 92.1513671875, 95.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 81.0, 542.0, 359.0, 31.0], "bins": [-239.0032501220703, -235.13783264160156, -231.2724151611328, -227.40699768066406, -223.54159545898438, -219.67617797851562, -215.81076049804688, -211.94534301757812, -208.07992553710938, -204.21450805664062, -200.34909057617188, -196.48367309570312, -192.61825561523438, -188.7528533935547, -184.88743591308594, -181.0220184326172, -177.15660095214844, -173.2911834716797, -169.42576599121094, -165.5603485107422, -161.6949462890625, -157.82952880859375, -153.964111328125, -150.09869384765625, -146.2332763671875, -142.36785888671875, -138.50244140625, -134.63702392578125, -130.7716064453125, -126.90619659423828, -123.04078674316406, -119.17536926269531, -115.30994415283203, -111.44452667236328, -107.57911682128906, -103.71369934082031, -99.84828186035156, -95.98286437988281, -92.11744689941406, -88.25203704833984, -84.3866195678711, -80.52120208740234, -76.65579223632812, -72.79037475585938, -68.92495727539062, -65.05953979492188, -61.19412612915039, -57.328712463378906, -53.463294982910156, -49.597877502441406, -45.73246383666992, -41.86705017089844, -38.00163269042969, -34.13621520996094, -30.270801544189453, -26.405385971069336, -22.53997039794922, -18.6745548248291, -14.809139251708984, -10.943723678588867, -7.07830810546875, -3.212892532348633, 0.6525230407714844, 4.517938613891602, 8.383353233337402]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 11.0, 10.0, 9.0, 18.0, 17.0, 20.0, 17.0, 20.0, 28.0, 39.0, 22.0, 33.0, 37.0, 45.0, 41.0, 44.0, 44.0, 40.0, 45.0, 42.0, 47.0, 37.0, 45.0, 32.0, 32.0, 38.0, 37.0, 15.0, 19.0, 14.0, 14.0, 17.0, 14.0, 10.0, 8.0, 12.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-117.60169219970703, -114.11853790283203, -110.63538360595703, -107.15222930908203, -103.66907501220703, -100.18592071533203, -96.7027587890625, -93.2196044921875, -89.7364501953125, -86.2532958984375, -82.7701416015625, -79.2869873046875, -75.8038330078125, -72.3206787109375, -68.8375244140625, -65.3543701171875, -61.8712158203125, -58.3880615234375, -54.9049072265625, -51.4217529296875, -47.9385986328125, -44.4554443359375, -40.972286224365234, -37.489131927490234, -34.005977630615234, -30.522823333740234, -27.039669036865234, -23.5565128326416, -20.0733585357666, -16.5902042388916, -13.107048034667969, -9.623893737792969, -6.1407318115234375, -2.6575770378112793, 0.8255777359008789, 4.308732986450195, 7.791887283325195, 11.275041580200195, 14.758197784423828, 18.241352081298828, 21.724506378173828, 25.207660675048828, 28.690814971923828, 32.173973083496094, 35.657127380371094, 39.140281677246094, 42.623435974121094, 46.106590270996094, 49.589744567871094, 53.072898864746094, 56.556053161621094, 60.039207458496094, 63.522361755371094, 67.0055160522461, 70.48867797851562, 73.97183227539062, 77.45498657226562, 80.93814086914062, 84.42129516601562, 87.90444946289062, 91.38760375976562, 94.87075805664062, 98.35391235351562, 101.83706665039062, 105.32022094726562]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 7.0, 9.0, 8.0, 12.0, 15.0, 16.0, 19.0, 28.0, 14.0, 25.0, 25.0, 36.0, 26.0, 37.0, 40.0, 32.0, 37.0, 42.0, 42.0, 36.0, 42.0, 37.0, 38.0, 42.0, 25.0, 31.0, 23.0, 24.0, 28.0, 25.0, 22.0, 27.0, 16.0, 13.0, 18.0, 14.0, 9.0, 15.0, 5.0, 2.0, 5.0, 4.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-13.7265625, -13.29345703125, -12.8603515625, -12.42724609375, -11.994140625, -11.56103515625, -11.1279296875, -10.69482421875, -10.26171875, -9.82861328125, -9.3955078125, -8.96240234375, -8.529296875, -8.09619140625, -7.6630859375, -7.22998046875, -6.796875, -6.36376953125, -5.9306640625, -5.49755859375, -5.064453125, -4.63134765625, -4.1982421875, -3.76513671875, -3.33203125, -2.89892578125, -2.4658203125, -2.03271484375, -1.599609375, -1.16650390625, -0.7333984375, -0.30029296875, 0.1328125, 0.56591796875, 0.9990234375, 1.43212890625, 1.865234375, 2.29833984375, 2.7314453125, 3.16455078125, 3.59765625, 4.03076171875, 4.4638671875, 4.89697265625, 5.330078125, 5.76318359375, 6.1962890625, 6.62939453125, 7.0625, 7.49560546875, 7.9287109375, 8.36181640625, 8.794921875, 9.22802734375, 9.6611328125, 10.09423828125, 10.52734375, 10.96044921875, 11.3935546875, 11.82666015625, 12.259765625, 12.69287109375, 13.1259765625, 13.55908203125, 13.9921875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 9.0, 8.0, 5.0, 18.0, 28.0, 21.0, 40.0, 55.0, 72.0, 121.0, 129.0, 207.0, 330.0, 495.0, 758.0, 1164.0, 1899.0, 3121.0, 5497.0, 9304.0, 26234.0, 234277.0, 2488211.0, 1296852.0, 90545.0, 14695.0, 7375.0, 4566.0, 2765.0, 1720.0, 1186.0, 805.0, 498.0, 339.0, 245.0, 175.0, 148.0, 96.0, 71.0, 51.0, 34.0, 38.0, 16.0, 19.0, 7.0, 15.0, 4.0, 6.0, 4.0, 2.0, 4.0, 9.0], "bins": [-34.15625, -33.17578125, -32.1953125, -31.21484375, -30.234375, -29.25390625, -28.2734375, -27.29296875, -26.3125, -25.33203125, -24.3515625, -23.37109375, -22.390625, -21.41015625, -20.4296875, -19.44921875, -18.46875, -17.48828125, -16.5078125, -15.52734375, -14.546875, -13.56640625, -12.5859375, -11.60546875, -10.625, -9.64453125, -8.6640625, -7.68359375, -6.703125, -5.72265625, -4.7421875, -3.76171875, -2.78125, -1.80078125, -0.8203125, 0.16015625, 1.140625, 2.12109375, 3.1015625, 4.08203125, 5.0625, 6.04296875, 7.0234375, 8.00390625, 8.984375, 9.96484375, 10.9453125, 11.92578125, 12.90625, 13.88671875, 14.8671875, 15.84765625, 16.828125, 17.80859375, 18.7890625, 19.76953125, 20.75, 21.73046875, 22.7109375, 23.69140625, 24.671875, 25.65234375, 26.6328125, 27.61328125, 28.59375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 10.0, 9.0, 13.0, 21.0, 18.0, 37.0, 56.0, 101.0, 203.0, 516.0, 1003.0, 1045.0, 544.0, 242.0, 102.0, 58.0, 20.0, 20.0, 19.0, 11.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.28125, -38.94091796875, -37.6005859375, -36.26025390625, -34.919921875, -33.57958984375, -32.2392578125, -30.89892578125, -29.55859375, -28.21826171875, -26.8779296875, -25.53759765625, -24.197265625, -22.85693359375, -21.5166015625, -20.17626953125, -18.8359375, -17.49560546875, -16.1552734375, -14.81494140625, -13.474609375, -12.13427734375, -10.7939453125, -9.45361328125, -8.11328125, -6.77294921875, -5.4326171875, -4.09228515625, -2.751953125, -1.41162109375, -0.0712890625, 1.26904296875, 2.609375, 3.94970703125, 5.2900390625, 6.63037109375, 7.970703125, 9.31103515625, 10.6513671875, 11.99169921875, 13.33203125, 14.67236328125, 16.0126953125, 17.35302734375, 18.693359375, 20.03369140625, 21.3740234375, 22.71435546875, 24.0546875, 25.39501953125, 26.7353515625, 28.07568359375, 29.416015625, 30.75634765625, 32.0966796875, 33.43701171875, 34.77734375, 36.11767578125, 37.4580078125, 38.79833984375, 40.138671875, 41.47900390625, 42.8193359375, 44.15966796875, 45.5]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 17.0, 39.0, 91.0, 161.0, 355.0, 881.0, 2906.0, 18016.0, 3249942.0, 904265.0, 13719.0, 2437.0, 773.0, 309.0, 149.0, 71.0, 47.0, 32.0, 10.0, 13.0, 8.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.25, -135.9921875, -131.734375, -127.4765625, -123.21875, -118.9609375, -114.703125, -110.4453125, -106.1875, -101.9296875, -97.671875, -93.4140625, -89.15625, -84.8984375, -80.640625, -76.3828125, -72.125, -67.8671875, -63.609375, -59.3515625, -55.09375, -50.8359375, -46.578125, -42.3203125, -38.0625, -33.8046875, -29.546875, -25.2890625, -21.03125, -16.7734375, -12.515625, -8.2578125, -4.0, 0.2578125, 4.515625, 8.7734375, 13.03125, 17.2890625, 21.546875, 25.8046875, 30.0625, 34.3203125, 38.578125, 42.8359375, 47.09375, 51.3515625, 55.609375, 59.8671875, 64.125, 68.3828125, 72.640625, 76.8984375, 81.15625, 85.4140625, 89.671875, 93.9296875, 98.1875, 102.4453125, 106.703125, 110.9609375, 115.21875, 119.4765625, 123.734375, 127.9921875, 132.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 17.0, 134.0, 651.0, 177.0, 31.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1150.5255126953125, -1130.531982421875, -1110.5384521484375, -1090.544921875, -1070.551513671875, -1050.5579833984375, -1030.564453125, -1010.5709228515625, -990.577392578125, -970.5838623046875, -950.59033203125, -930.5968627929688, -910.6033325195312, -890.6098022460938, -870.6163330078125, -850.622802734375, -830.6292724609375, -810.6357421875, -790.6422119140625, -770.6487426757812, -750.6552124023438, -730.6616821289062, -710.668212890625, -690.6746826171875, -670.68115234375, -650.6876220703125, -630.694091796875, -610.7006225585938, -590.7070922851562, -570.7135620117188, -550.7200927734375, -530.7265625, -510.7330322265625, -490.739501953125, -470.7460021972656, -450.75250244140625, -430.75897216796875, -410.76544189453125, -390.7719421386719, -370.7784423828125, -350.784912109375, -330.7913818359375, -310.7978820800781, -290.80438232421875, -270.81085205078125, -250.8173370361328, -230.82382202148438, -210.83030700683594, -190.83680725097656, -170.84329223632812, -150.8497772216797, -130.85626220703125, -110.86274719238281, -90.86923217773438, -70.87571716308594, -50.8822021484375, -30.888687133789062, -10.895172119140625, 9.098342895507812, 29.09185791015625, 49.08537292480469, 69.07888793945312, 89.07240295410156, 109.06591796875, 129.05943298339844]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 6.0, 2.0, 12.0, 12.0, 17.0, 15.0, 15.0, 19.0, 35.0, 21.0, 32.0, 28.0, 28.0, 40.0, 27.0, 42.0, 35.0, 56.0, 39.0, 41.0, 37.0, 52.0, 33.0, 36.0, 40.0, 23.0, 30.0, 24.0, 36.0, 26.0, 19.0, 10.0, 27.0, 17.0, 12.0, 9.0, 5.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.24681091308594, -72.58232116699219, -69.91783142089844, -67.25334930419922, -64.58885955810547, -61.92436981201172, -59.25988006591797, -56.595394134521484, -53.930908203125, -51.26641845703125, -48.601932525634766, -45.937442779541016, -43.27295684814453, -40.60846710205078, -37.94397735595703, -35.27949142456055, -32.6150016784668, -29.95051383972168, -27.286026000976562, -24.621536254882812, -21.957050323486328, -19.292560577392578, -16.62807273864746, -13.963584899902344, -11.299097061157227, -8.63460922241211, -5.970120906829834, -3.3056325912475586, -0.6411447525024414, 2.023343086242676, 4.687831878662109, 7.352319717407227, 10.016807556152344, 12.681295394897461, 15.345783233642578, 18.010272979736328, 20.674758911132812, 23.339248657226562, 26.00373649597168, 28.668224334716797, 31.332712173461914, 33.99720001220703, 36.66168975830078, 39.326175689697266, 41.990665435791016, 44.6551513671875, 47.31964111328125, 49.984130859375, 52.648616790771484, 55.313106536865234, 57.97759246826172, 60.64208221435547, 63.30656814575195, 65.97105407714844, 68.63554382324219, 71.30003356933594, 73.96452331542969, 76.62901306152344, 79.29350280761719, 81.9579849243164, 84.62247467041016, 87.2869644165039, 89.95145416259766, 92.61593627929688, 95.28042602539062]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 12.0, 14.0, 11.0, 15.0, 14.0, 17.0, 20.0, 22.0, 34.0, 36.0, 36.0, 32.0, 33.0, 37.0, 35.0, 34.0, 40.0, 43.0, 34.0, 40.0, 46.0, 31.0, 34.0, 39.0, 30.0, 27.0, 29.0, 22.0, 21.0, 17.0, 15.0, 22.0, 13.0, 8.0, 11.0, 10.0, 11.0, 8.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.53125, -13.0953369140625, -12.659423828125, -12.2235107421875, -11.78759765625, -11.3516845703125, -10.915771484375, -10.4798583984375, -10.0439453125, -9.6080322265625, -9.172119140625, -8.7362060546875, -8.30029296875, -7.8643798828125, -7.428466796875, -6.9925537109375, -6.556640625, -6.1207275390625, -5.684814453125, -5.2489013671875, -4.81298828125, -4.3770751953125, -3.941162109375, -3.5052490234375, -3.0693359375, -2.6334228515625, -2.197509765625, -1.7615966796875, -1.32568359375, -0.8897705078125, -0.453857421875, -0.0179443359375, 0.41796875, 0.8538818359375, 1.289794921875, 1.7257080078125, 2.16162109375, 2.5975341796875, 3.033447265625, 3.4693603515625, 3.9052734375, 4.3411865234375, 4.777099609375, 5.2130126953125, 5.64892578125, 6.0848388671875, 6.520751953125, 6.9566650390625, 7.392578125, 7.8284912109375, 8.264404296875, 8.7003173828125, 9.13623046875, 9.5721435546875, 10.008056640625, 10.4439697265625, 10.8798828125, 11.3157958984375, 11.751708984375, 12.1876220703125, 12.62353515625, 13.0594482421875, 13.495361328125, 13.9312744140625, 14.3671875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 17.0, 23.0, 31.0, 49.0, 52.0, 80.0, 106.0, 158.0, 225.0, 329.0, 523.0, 804.0, 1201.0, 1852.0, 2654.0, 4044.0, 6028.0, 9039.0, 14282.0, 22323.0, 35359.0, 57702.0, 99588.0, 172832.0, 225357.0, 158613.0, 90612.0, 52813.0, 32557.0, 20423.0, 13487.0, 8526.0, 5690.0, 3761.0, 2375.0, 1632.0, 1067.0, 707.0, 518.0, 338.0, 218.0, 200.0, 118.0, 85.0, 52.0, 28.0, 16.0, 20.0, 7.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 3.0], "bins": [-1.412109375, -1.3685455322265625, -1.324981689453125, -1.2814178466796875, -1.23785400390625, -1.1942901611328125, -1.150726318359375, -1.1071624755859375, -1.0635986328125, -1.0200347900390625, -0.976470947265625, -0.9329071044921875, -0.88934326171875, -0.8457794189453125, -0.802215576171875, -0.7586517333984375, -0.715087890625, -0.6715240478515625, -0.627960205078125, -0.5843963623046875, -0.54083251953125, -0.4972686767578125, -0.453704833984375, -0.4101409912109375, -0.3665771484375, -0.3230133056640625, -0.279449462890625, -0.2358856201171875, -0.19232177734375, -0.1487579345703125, -0.105194091796875, -0.0616302490234375, -0.01806640625, 0.0254974365234375, 0.069061279296875, 0.1126251220703125, 0.15618896484375, 0.1997528076171875, 0.243316650390625, 0.2868804931640625, 0.3304443359375, 0.3740081787109375, 0.417572021484375, 0.4611358642578125, 0.50469970703125, 0.5482635498046875, 0.591827392578125, 0.6353912353515625, 0.678955078125, 0.7225189208984375, 0.766082763671875, 0.8096466064453125, 0.85321044921875, 0.8967742919921875, 0.940338134765625, 0.9839019775390625, 1.0274658203125, 1.0710296630859375, 1.114593505859375, 1.1581573486328125, 1.20172119140625, 1.2452850341796875, 1.288848876953125, 1.3324127197265625, 1.3759765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 6.0, 8.0, 7.0, 6.0, 13.0, 18.0, 19.0, 12.0, 18.0, 28.0, 27.0, 23.0, 32.0, 35.0, 40.0, 35.0, 31.0, 44.0, 37.0, 37.0, 1064.0, 51.0, 35.0, 24.0, 28.0, 29.0, 34.0, 34.0, 32.0, 32.0, 24.0, 27.0, 16.0, 17.0, 22.0, 14.0, 10.0, 5.0, 3.0, 8.0, 10.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.8046875, -9.519775390625, -9.23486328125, -8.949951171875, -8.6650390625, -8.380126953125, -8.09521484375, -7.810302734375, -7.525390625, -7.240478515625, -6.95556640625, -6.670654296875, -6.3857421875, -6.100830078125, -5.81591796875, -5.531005859375, -5.24609375, -4.961181640625, -4.67626953125, -4.391357421875, -4.1064453125, -3.821533203125, -3.53662109375, -3.251708984375, -2.966796875, -2.681884765625, -2.39697265625, -2.112060546875, -1.8271484375, -1.542236328125, -1.25732421875, -0.972412109375, -0.6875, -0.402587890625, -0.11767578125, 0.167236328125, 0.4521484375, 0.737060546875, 1.02197265625, 1.306884765625, 1.591796875, 1.876708984375, 2.16162109375, 2.446533203125, 2.7314453125, 3.016357421875, 3.30126953125, 3.586181640625, 3.87109375, 4.156005859375, 4.44091796875, 4.725830078125, 5.0107421875, 5.295654296875, 5.58056640625, 5.865478515625, 6.150390625, 6.435302734375, 6.72021484375, 7.005126953125, 7.2900390625, 7.574951171875, 7.85986328125, 8.144775390625, 8.4296875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 10.0, 20.0, 20.0, 31.0, 48.0, 73.0, 104.0, 190.0, 335.0, 476.0, 671.0, 984.0, 1596.0, 2376.0, 3612.0, 5473.0, 8504.0, 13286.0, 20977.0, 33131.0, 53987.0, 90250.0, 154340.0, 1264957.0, 174459.0, 103169.0, 61633.0, 37325.0, 23043.0, 14643.0, 9583.0, 6059.0, 4064.0, 2684.0, 1694.0, 1077.0, 804.0, 517.0, 307.0, 231.0, 137.0, 91.0, 44.0, 36.0, 29.0, 17.0, 8.0, 11.0, 9.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8246994018554688, -0.7968597412109375, -0.7690200805664062, -0.741180419921875, -0.7133407592773438, -0.6855010986328125, -0.6576614379882812, -0.62982177734375, -0.6019821166992188, -0.5741424560546875, -0.5463027954101562, -0.518463134765625, -0.49062347412109375, -0.4627838134765625, -0.43494415283203125, -0.4071044921875, -0.37926483154296875, -0.3514251708984375, -0.32358551025390625, -0.295745849609375, -0.26790618896484375, -0.2400665283203125, -0.21222686767578125, -0.18438720703125, -0.15654754638671875, -0.1287078857421875, -0.10086822509765625, -0.073028564453125, -0.04518890380859375, -0.0173492431640625, 0.01049041748046875, 0.038330078125, 0.06616973876953125, 0.0940093994140625, 0.12184906005859375, 0.149688720703125, 0.17752838134765625, 0.2053680419921875, 0.23320770263671875, 0.26104736328125, 0.28888702392578125, 0.3167266845703125, 0.34456634521484375, 0.372406005859375, 0.40024566650390625, 0.4280853271484375, 0.45592498779296875, 0.4837646484375, 0.5116043090820312, 0.5394439697265625, 0.5672836303710938, 0.595123291015625, 0.6229629516601562, 0.6508026123046875, 0.6786422729492188, 0.70648193359375, 0.7343215942382812, 0.7621612548828125, 0.7900009155273438, 0.817840576171875, 0.8456802368164062, 0.8735198974609375, 0.9013595581054688, 0.92919921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 3.0, 6.0, 7.0, 11.0, 5.0, 7.0, 14.0, 15.0, 11.0, 13.0, 20.0, 19.0, 40.0, 42.0, 65.0, 95.0, 126.0, 134.0, 95.0, 80.0, 41.0, 34.0, 22.0, 12.0, 18.0, 13.0, 15.0, 11.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.03857421875, -0.03747081756591797, -0.03636741638183594, -0.035264015197753906, -0.034160614013671875, -0.033057212829589844, -0.03195381164550781, -0.03085041046142578, -0.02974700927734375, -0.02864360809326172, -0.027540206909179688, -0.026436805725097656, -0.025333404541015625, -0.024230003356933594, -0.023126602172851562, -0.02202320098876953, -0.0209197998046875, -0.01981639862060547, -0.018712997436523438, -0.017609596252441406, -0.016506195068359375, -0.015402793884277344, -0.014299392700195312, -0.013195991516113281, -0.01209259033203125, -0.010989189147949219, -0.009885787963867188, -0.008782386779785156, -0.007678985595703125, -0.006575584411621094, -0.0054721832275390625, -0.004368782043457031, -0.003265380859375, -0.0021619796752929688, -0.0010585784912109375, 4.482269287109375e-05, 0.001148223876953125, 0.0022516250610351562, 0.0033550262451171875, 0.004458427429199219, 0.00556182861328125, 0.006665229797363281, 0.0077686309814453125, 0.008872032165527344, 0.009975433349609375, 0.011078834533691406, 0.012182235717773438, 0.013285636901855469, 0.0143890380859375, 0.015492439270019531, 0.016595840454101562, 0.017699241638183594, 0.018802642822265625, 0.019906044006347656, 0.021009445190429688, 0.02211284637451172, 0.02321624755859375, 0.02431964874267578, 0.025423049926757812, 0.026526451110839844, 0.027629852294921875, 0.028733253479003906, 0.029836654663085938, 0.03094005584716797, 0.03204345703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 14.0, 15.0, 22.0, 25.0, 32.0, 32.0, 71.0, 84.0, 197.0, 541.0, 7681.0, 974562.0, 63152.0, 1405.0, 242.0, 118.0, 87.0, 53.0, 42.0, 31.0, 27.0, 12.0, 19.0, 9.0, 12.0, 9.0, 10.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6790084838867188, -0.6553802490234375, -0.6317520141601562, -0.608123779296875, -0.5844955444335938, -0.5608673095703125, -0.5372390747070312, -0.51361083984375, -0.48998260498046875, -0.4663543701171875, -0.44272613525390625, -0.419097900390625, -0.39546966552734375, -0.3718414306640625, -0.34821319580078125, -0.3245849609375, -0.30095672607421875, -0.2773284912109375, -0.25370025634765625, -0.230072021484375, -0.20644378662109375, -0.1828155517578125, -0.15918731689453125, -0.13555908203125, -0.11193084716796875, -0.0883026123046875, -0.06467437744140625, -0.041046142578125, -0.01741790771484375, 0.0062103271484375, 0.02983856201171875, 0.053466796875, 0.07709503173828125, 0.1007232666015625, 0.12435150146484375, 0.147979736328125, 0.17160797119140625, 0.1952362060546875, 0.21886444091796875, 0.24249267578125, 0.26612091064453125, 0.2897491455078125, 0.31337738037109375, 0.337005615234375, 0.36063385009765625, 0.3842620849609375, 0.40789031982421875, 0.4315185546875, 0.45514678955078125, 0.4787750244140625, 0.5024032592773438, 0.526031494140625, 0.5496597290039062, 0.5732879638671875, 0.5969161987304688, 0.62054443359375, 0.6441726684570312, 0.6678009033203125, 0.6914291381835938, 0.715057373046875, 0.7386856079101562, 0.7623138427734375, 0.7859420776367188, 0.8095703125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 30.0, 104.0, 576.0, 227.0, 51.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3132428526878357, -0.3014827072620392, -0.2897225618362427, -0.27796244621276855, -0.26620230078697205, -0.25444215536117554, -0.24268202483654022, -0.2309218943119049, -0.2191617488861084, -0.2074016034603119, -0.19564147293567657, -0.18388134241104126, -0.17212119698524475, -0.16036105155944824, -0.14860092103481293, -0.1368407905101776, -0.1250806450843811, -0.11332050710916519, -0.10156036913394928, -0.08980023115873337, -0.07804009318351746, -0.06627995520830154, -0.05451981723308563, -0.04275967925786972, -0.03099954128265381, -0.019239403307437897, -0.007479265332221985, 0.004280872642993927, 0.01604101061820984, 0.02780114859342575, 0.03956128656864166, 0.051321424543857574, 0.06308159232139587, 0.07484173029661179, 0.0866018682718277, 0.09836200624704361, 0.11012214422225952, 0.12188228219747543, 0.13364242017269135, 0.14540255069732666, 0.15716269612312317, 0.16892284154891968, 0.180682972073555, 0.1924431025981903, 0.20420324802398682, 0.21596339344978333, 0.22772352397441864, 0.23948365449905396, 0.25124379992485046, 0.263003945350647, 0.2747640609741211, 0.2865242063999176, 0.2982843518257141, 0.3100444972515106, 0.32180464267730713, 0.33356475830078125, 0.34532490372657776, 0.35708504915237427, 0.3688451647758484, 0.3806053102016449, 0.3923654556274414, 0.4041256010532379, 0.4158857464790344, 0.42764586210250854, 0.43940600752830505]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 8.0, 10.0, 6.0, 12.0, 21.0, 22.0, 18.0, 24.0, 38.0, 34.0, 28.0, 43.0, 43.0, 36.0, 39.0, 33.0, 47.0, 47.0, 36.0, 44.0, 45.0, 40.0, 47.0, 40.0, 31.0, 31.0, 26.0, 22.0, 24.0, 19.0, 18.0, 16.0, 3.0, 10.0, 10.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04542136192321777, -0.04374955594539642, -0.042077746242284775, -0.040405936539173126, -0.038734130561351776, -0.037062324583530426, -0.03539051488041878, -0.03371870517730713, -0.03204689919948578, -0.03037509135901928, -0.02870328351855278, -0.02703147567808628, -0.02535966783761978, -0.023687859997153282, -0.022016052156686783, -0.020344244316220284, -0.018672436475753784, -0.017000628635287285, -0.015328820794820786, -0.013657012954354286, -0.011985205113887787, -0.010313397273421288, -0.008641589432954788, -0.006969781592488289, -0.0052979737520217896, -0.0036261659115552902, -0.001954358071088791, -0.00028255023062229156, 0.0013892576098442078, 0.003061065450310707, 0.004732873290777206, 0.006404681131243706, 0.008076488971710205, 0.009748296812176704, 0.011420104652643204, 0.013091912493109703, 0.014763720333576202, 0.0164355281740427, 0.0181073360145092, 0.0197791438549757, 0.0214509516954422, 0.0231227595359087, 0.0247945673763752, 0.026466375216841698, 0.028138183057308197, 0.029809990897774696, 0.031481798738241196, 0.033153608441352844, 0.034825414419174194, 0.036497220396995544, 0.03816903010010719, 0.03984083980321884, 0.04151264578104019, 0.04318445175886154, 0.04485626146197319, 0.04652807116508484, 0.04819987714290619, 0.04987168312072754, 0.05154349282383919, 0.053215302526950836, 0.054887108504772186, 0.056558914482593536, 0.058230724185705185, 0.059902533888816833, 0.061574339866638184]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 11.0, 14.0, 11.0, 15.0, 14.0, 17.0, 20.0, 22.0, 34.0, 36.0, 36.0, 32.0, 33.0, 37.0, 35.0, 34.0, 41.0, 42.0, 35.0, 39.0, 46.0, 32.0, 33.0, 39.0, 30.0, 27.0, 29.0, 22.0, 22.0, 16.0, 15.0, 22.0, 13.0, 8.0, 11.0, 10.0, 11.0, 8.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.53125, -13.09521484375, -12.6591796875, -12.22314453125, -11.787109375, -11.35107421875, -10.9150390625, -10.47900390625, -10.04296875, -9.60693359375, -9.1708984375, -8.73486328125, -8.298828125, -7.86279296875, -7.4267578125, -6.99072265625, -6.5546875, -6.11865234375, -5.6826171875, -5.24658203125, -4.810546875, -4.37451171875, -3.9384765625, -3.50244140625, -3.06640625, -2.63037109375, -2.1943359375, -1.75830078125, -1.322265625, -0.88623046875, -0.4501953125, -0.01416015625, 0.421875, 0.85791015625, 1.2939453125, 1.72998046875, 2.166015625, 2.60205078125, 3.0380859375, 3.47412109375, 3.91015625, 4.34619140625, 4.7822265625, 5.21826171875, 5.654296875, 6.09033203125, 6.5263671875, 6.96240234375, 7.3984375, 7.83447265625, 8.2705078125, 8.70654296875, 9.142578125, 9.57861328125, 10.0146484375, 10.45068359375, 10.88671875, 11.32275390625, 11.7587890625, 12.19482421875, 12.630859375, 13.06689453125, 13.5029296875, 13.93896484375, 14.375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 15.0, 10.0, 25.0, 18.0, 35.0, 43.0, 38.0, 80.0, 94.0, 183.0, 266.0, 444.0, 778.0, 1567.0, 3197.0, 8605.0, 28732.0, 115311.0, 511916.0, 285972.0, 63427.0, 17201.0, 5452.0, 2356.0, 1080.0, 620.0, 386.0, 199.0, 134.0, 94.0, 62.0, 45.0, 34.0, 22.0, 16.0, 21.0, 12.0, 12.0, 6.0, 4.0, 6.0, 6.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7421875, -12.328369140625, -11.91455078125, -11.500732421875, -11.0869140625, -10.673095703125, -10.25927734375, -9.845458984375, -9.431640625, -9.017822265625, -8.60400390625, -8.190185546875, -7.7763671875, -7.362548828125, -6.94873046875, -6.534912109375, -6.12109375, -5.707275390625, -5.29345703125, -4.879638671875, -4.4658203125, -4.052001953125, -3.63818359375, -3.224365234375, -2.810546875, -2.396728515625, -1.98291015625, -1.569091796875, -1.1552734375, -0.741455078125, -0.32763671875, 0.086181640625, 0.5, 0.913818359375, 1.32763671875, 1.741455078125, 2.1552734375, 2.569091796875, 2.98291015625, 3.396728515625, 3.810546875, 4.224365234375, 4.63818359375, 5.052001953125, 5.4658203125, 5.879638671875, 6.29345703125, 6.707275390625, 7.12109375, 7.534912109375, 7.94873046875, 8.362548828125, 8.7763671875, 9.190185546875, 9.60400390625, 10.017822265625, 10.431640625, 10.845458984375, 11.25927734375, 11.673095703125, 12.0869140625, 12.500732421875, 12.91455078125, 13.328369140625, 13.7421875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 7.0, 1.0, 9.0, 13.0, 10.0, 14.0, 11.0, 10.0, 15.0, 21.0, 29.0, 20.0, 31.0, 36.0, 34.0, 38.0, 44.0, 55.0, 84.0, 309.0, 1680.0, 98.0, 79.0, 49.0, 44.0, 40.0, 36.0, 25.0, 31.0, 35.0, 18.0, 19.0, 20.0, 13.0, 10.0, 9.0, 18.0, 9.0, 11.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5, -34.24072265625, -32.9814453125, -31.72216796875, -30.462890625, -29.20361328125, -27.9443359375, -26.68505859375, -25.42578125, -24.16650390625, -22.9072265625, -21.64794921875, -20.388671875, -19.12939453125, -17.8701171875, -16.61083984375, -15.3515625, -14.09228515625, -12.8330078125, -11.57373046875, -10.314453125, -9.05517578125, -7.7958984375, -6.53662109375, -5.27734375, -4.01806640625, -2.7587890625, -1.49951171875, -0.240234375, 1.01904296875, 2.2783203125, 3.53759765625, 4.796875, 6.05615234375, 7.3154296875, 8.57470703125, 9.833984375, 11.09326171875, 12.3525390625, 13.61181640625, 14.87109375, 16.13037109375, 17.3896484375, 18.64892578125, 19.908203125, 21.16748046875, 22.4267578125, 23.68603515625, 24.9453125, 26.20458984375, 27.4638671875, 28.72314453125, 29.982421875, 31.24169921875, 32.5009765625, 33.76025390625, 35.01953125, 36.27880859375, 37.5380859375, 38.79736328125, 40.056640625, 41.31591796875, 42.5751953125, 43.83447265625, 45.09375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 11.0, 10.0, 10.0, 12.0, 15.0, 16.0, 15.0, 23.0, 37.0, 38.0, 82.0, 84.0, 73.0, 128.0, 127.0, 236.0, 342.0, 782.0, 5367.0, 2787641.0, 345786.0, 3152.0, 661.0, 282.0, 194.0, 139.0, 101.0, 90.0, 52.0, 52.0, 35.0, 24.0, 18.0, 12.0, 17.0, 8.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-76.25, -74.1259765625, -72.001953125, -69.8779296875, -67.75390625, -65.6298828125, -63.505859375, -61.3818359375, -59.2578125, -57.1337890625, -55.009765625, -52.8857421875, -50.76171875, -48.6376953125, -46.513671875, -44.3896484375, -42.265625, -40.1416015625, -38.017578125, -35.8935546875, -33.76953125, -31.6455078125, -29.521484375, -27.3974609375, -25.2734375, -23.1494140625, -21.025390625, -18.9013671875, -16.77734375, -14.6533203125, -12.529296875, -10.4052734375, -8.28125, -6.1572265625, -4.033203125, -1.9091796875, 0.21484375, 2.3388671875, 4.462890625, 6.5869140625, 8.7109375, 10.8349609375, 12.958984375, 15.0830078125, 17.20703125, 19.3310546875, 21.455078125, 23.5791015625, 25.703125, 27.8271484375, 29.951171875, 32.0751953125, 34.19921875, 36.3232421875, 38.447265625, 40.5712890625, 42.6953125, 44.8193359375, 46.943359375, 49.0673828125, 51.19140625, 53.3154296875, 55.439453125, 57.5634765625, 59.6875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [203.0, 807.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.93674373626709, -2.113966941833496, 7.708809852600098, 17.531585693359375, 27.35436248779297, 37.17713928222656, 46.999916076660156, 56.82269287109375, 66.64546966552734, 76.46824645996094, 86.29102325439453, 96.11380004882812, 105.93657684326172, 115.75935363769531, 125.5821304321289, 135.4049072265625, 145.22769165039062, 155.05047607421875, 164.8732452392578, 174.69601440429688, 184.518798828125, 194.34158325195312, 204.1643524169922, 213.98712158203125, 223.80990600585938, 233.6326904296875, 243.45545959472656, 253.27822875976562, 263.10101318359375, 272.9237976074219, 282.74658203125, 292.5693359375, 302.39208984375, 312.2148742675781, 322.03765869140625, 331.86041259765625, 341.6831970214844, 351.5059814453125, 361.3287353515625, 371.1515197753906, 380.97430419921875, 390.7970886230469, 400.619873046875, 410.442626953125, 420.2654113769531, 430.08819580078125, 439.91094970703125, 449.7337341308594, 459.5565185546875, 469.3793029785156, 479.20208740234375, 489.02484130859375, 498.8476257324219, 508.67041015625, 518.4931640625, 528.3159790039062, 538.1387329101562, 547.9614868164062, 557.7843017578125, 567.6070556640625, 577.4298095703125, 587.2526245117188, 597.0753784179688, 606.898193359375, 616.720947265625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 9.0, 16.0, 14.0, 23.0, 20.0, 27.0, 35.0, 32.0, 31.0, 39.0, 42.0, 36.0, 38.0, 53.0, 59.0, 33.0, 44.0, 35.0, 49.0, 37.0, 39.0, 36.0, 27.0, 21.0, 29.0, 22.0, 26.0, 16.0, 25.0, 15.0, 13.0, 8.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-99.80734252929688, -96.58840942382812, -93.3694839477539, -90.15055084228516, -86.9316177368164, -83.71269226074219, -80.49375915527344, -77.27482604980469, -74.05590057373047, -70.83696746826172, -67.6180419921875, -64.39910888671875, -61.180179595947266, -57.96125030517578, -54.74231719970703, -51.52338790893555, -48.3044548034668, -45.08552551269531, -41.86659240722656, -38.64766311645508, -35.428733825683594, -32.209800720214844, -28.99087142944336, -25.771942138671875, -22.553010940551758, -19.33407974243164, -16.115150451660156, -12.896219253540039, -9.677289009094238, -6.4583587646484375, -3.2394275665283203, -0.020498275756835938, 3.1984329223632812, 6.417363166809082, 9.636293411254883, 12.855224609375, 16.074153900146484, 19.2930850982666, 22.51201629638672, 25.730945587158203, 28.94987678527832, 32.16880798339844, 35.38773727416992, 38.606666564941406, 41.825599670410156, 45.04452896118164, 48.263458251953125, 51.482391357421875, 54.70132064819336, 57.920249938964844, 61.139183044433594, 64.35810852050781, 67.57704162597656, 70.79597473144531, 74.01490783691406, 77.23383331298828, 80.45276641845703, 83.67169952392578, 86.890625, 90.10955810546875, 93.3284912109375, 96.54741668701172, 99.76634979248047, 102.98527526855469, 106.20420837402344]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 4.0, 14.0, 7.0, 15.0, 8.0, 13.0, 14.0, 20.0, 21.0, 29.0, 29.0, 33.0, 39.0, 27.0, 33.0, 43.0, 41.0, 33.0, 42.0, 40.0, 29.0, 33.0, 47.0, 52.0, 30.0, 35.0, 29.0, 32.0, 20.0, 27.0, 18.0, 14.0, 17.0, 24.0, 11.0, 15.0, 12.0, 8.0, 7.0, 7.0, 6.0, 2.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.6953125, -13.2537841796875, -12.812255859375, -12.3707275390625, -11.92919921875, -11.4876708984375, -11.046142578125, -10.6046142578125, -10.1630859375, -9.7215576171875, -9.280029296875, -8.8385009765625, -8.39697265625, -7.9554443359375, -7.513916015625, -7.0723876953125, -6.630859375, -6.1893310546875, -5.747802734375, -5.3062744140625, -4.86474609375, -4.4232177734375, -3.981689453125, -3.5401611328125, -3.0986328125, -2.6571044921875, -2.215576171875, -1.7740478515625, -1.33251953125, -0.8909912109375, -0.449462890625, -0.0079345703125, 0.43359375, 0.8751220703125, 1.316650390625, 1.7581787109375, 2.19970703125, 2.6412353515625, 3.082763671875, 3.5242919921875, 3.9658203125, 4.4073486328125, 4.848876953125, 5.2904052734375, 5.73193359375, 6.1734619140625, 6.614990234375, 7.0565185546875, 7.498046875, 7.9395751953125, 8.381103515625, 8.8226318359375, 9.26416015625, 9.7056884765625, 10.147216796875, 10.5887451171875, 11.0302734375, 11.4718017578125, 11.913330078125, 12.3548583984375, 12.79638671875, 13.2379150390625, 13.679443359375, 14.1209716796875, 14.5625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 17.0, 15.0, 22.0, 47.0, 51.0, 57.0, 109.0, 155.0, 172.0, 240.0, 379.0, 567.0, 868.0, 1394.0, 2152.0, 3603.0, 6416.0, 11777.0, 35894.0, 644258.0, 3312807.0, 134022.0, 17523.0, 8507.0, 4757.0, 2791.0, 1800.0, 1181.0, 768.0, 533.0, 379.0, 259.0, 178.0, 144.0, 112.0, 66.0, 63.0, 41.0, 42.0, 20.0, 22.0, 10.0, 19.0, 14.0, 4.0, 4.0, 3.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0], "bins": [-43.09375, -41.7158203125, -40.337890625, -38.9599609375, -37.58203125, -36.2041015625, -34.826171875, -33.4482421875, -32.0703125, -30.6923828125, -29.314453125, -27.9365234375, -26.55859375, -25.1806640625, -23.802734375, -22.4248046875, -21.046875, -19.6689453125, -18.291015625, -16.9130859375, -15.53515625, -14.1572265625, -12.779296875, -11.4013671875, -10.0234375, -8.6455078125, -7.267578125, -5.8896484375, -4.51171875, -3.1337890625, -1.755859375, -0.3779296875, 1.0, 2.3779296875, 3.755859375, 5.1337890625, 6.51171875, 7.8896484375, 9.267578125, 10.6455078125, 12.0234375, 13.4013671875, 14.779296875, 16.1572265625, 17.53515625, 18.9130859375, 20.291015625, 21.6689453125, 23.046875, 24.4248046875, 25.802734375, 27.1806640625, 28.55859375, 29.9365234375, 31.314453125, 32.6923828125, 34.0703125, 35.4482421875, 36.826171875, 38.2041015625, 39.58203125, 40.9599609375, 42.337890625, 43.7158203125, 45.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 11.0, 9.0, 6.0, 7.0, 14.0, 13.0, 18.0, 16.0, 28.0, 46.0, 89.0, 200.0, 402.0, 907.0, 1146.0, 556.0, 278.0, 137.0, 46.0, 42.0, 32.0, 19.0, 13.0, 7.0, 10.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.625, -29.40869140625, -28.1923828125, -26.97607421875, -25.759765625, -24.54345703125, -23.3271484375, -22.11083984375, -20.89453125, -19.67822265625, -18.4619140625, -17.24560546875, -16.029296875, -14.81298828125, -13.5966796875, -12.38037109375, -11.1640625, -9.94775390625, -8.7314453125, -7.51513671875, -6.298828125, -5.08251953125, -3.8662109375, -2.64990234375, -1.43359375, -0.21728515625, 0.9990234375, 2.21533203125, 3.431640625, 4.64794921875, 5.8642578125, 7.08056640625, 8.296875, 9.51318359375, 10.7294921875, 11.94580078125, 13.162109375, 14.37841796875, 15.5947265625, 16.81103515625, 18.02734375, 19.24365234375, 20.4599609375, 21.67626953125, 22.892578125, 24.10888671875, 25.3251953125, 26.54150390625, 27.7578125, 28.97412109375, 30.1904296875, 31.40673828125, 32.623046875, 33.83935546875, 35.0556640625, 36.27197265625, 37.48828125, 38.70458984375, 39.9208984375, 41.13720703125, 42.353515625, 43.56982421875, 44.7861328125, 46.00244140625, 47.21875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 19.0, 25.0, 45.0, 77.0, 139.0, 255.0, 477.0, 1139.0, 3008.0, 9798.0, 44884.0, 3789779.0, 313598.0, 21512.0, 5883.0, 2066.0, 735.0, 347.0, 185.0, 95.0, 54.0, 41.0, 25.0, 24.0, 11.0, 10.0, 9.0, 6.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-133.125, -129.693359375, -126.26171875, -122.830078125, -119.3984375, -115.966796875, -112.53515625, -109.103515625, -105.671875, -102.240234375, -98.80859375, -95.376953125, -91.9453125, -88.513671875, -85.08203125, -81.650390625, -78.21875, -74.787109375, -71.35546875, -67.923828125, -64.4921875, -61.060546875, -57.62890625, -54.197265625, -50.765625, -47.333984375, -43.90234375, -40.470703125, -37.0390625, -33.607421875, -30.17578125, -26.744140625, -23.3125, -19.880859375, -16.44921875, -13.017578125, -9.5859375, -6.154296875, -2.72265625, 0.708984375, 4.140625, 7.572265625, 11.00390625, 14.435546875, 17.8671875, 21.298828125, 24.73046875, 28.162109375, 31.59375, 35.025390625, 38.45703125, 41.888671875, 45.3203125, 48.751953125, 52.18359375, 55.615234375, 59.046875, 62.478515625, 65.91015625, 69.341796875, 72.7734375, 76.205078125, 79.63671875, 83.068359375, 86.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 3.0, 4.0, 7.0, 3.0, 11.0, 12.0, 9.0, 8.0, 13.0, 21.0, 43.0, 58.0, 70.0, 119.0, 122.0, 136.0, 115.0, 65.0, 50.0, 40.0, 27.0, 19.0, 13.0, 5.0, 4.0, 14.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.74673461914062, -79.55815887451172, -76.36959075927734, -73.18101501464844, -69.99243927001953, -66.80386352539062, -63.61529541015625, -60.426719665527344, -57.2381477355957, -54.04957580566406, -50.861000061035156, -47.672428131103516, -44.483856201171875, -41.29528045654297, -38.10670852661133, -34.91813659667969, -31.72956085205078, -28.540987014770508, -25.352413177490234, -22.163841247558594, -18.97526741027832, -15.786693572998047, -12.598121643066406, -9.409547805786133, -6.220973968505859, -3.032400608062744, 0.1561727523803711, 3.344745635986328, 6.533319473266602, 9.721893310546875, 12.910465240478516, 16.09903907775879, 19.28760528564453, 22.476179122924805, 25.664752960205078, 28.85332489013672, 32.041900634765625, 35.230472564697266, 38.419044494628906, 41.60762023925781, 44.79619216918945, 47.984764099121094, 51.17333984375, 54.36191177368164, 57.55048370361328, 60.73905944824219, 63.92763137817383, 67.11620330810547, 70.30477905273438, 73.49335479736328, 76.68192291259766, 79.87049865722656, 83.05907440185547, 86.24765014648438, 89.43621826171875, 92.62479400634766, 95.81336975097656, 99.00194549560547, 102.19051361083984, 105.37908935546875, 108.56766510009766, 111.75624084472656, 114.94480895996094, 118.13338470458984, 121.32195281982422]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 3.0, 20.0, 18.0, 11.0, 14.0, 18.0, 15.0, 23.0, 23.0, 20.0, 24.0, 38.0, 29.0, 21.0, 33.0, 38.0, 45.0, 33.0, 47.0, 44.0, 49.0, 34.0, 36.0, 46.0, 38.0, 28.0, 24.0, 28.0, 29.0, 20.0, 22.0, 18.0, 14.0, 13.0, 9.0, 7.0, 7.0, 7.0, 6.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-87.6893310546875, -85.1355209350586, -82.58171081542969, -80.02790069580078, -77.47409057617188, -74.92028045654297, -72.36647033691406, -69.81266021728516, -67.25885009765625, -64.70503997802734, -62.15122985839844, -59.59741973876953, -57.043609619140625, -54.48979949951172, -51.93598937988281, -49.382179260253906, -46.828369140625, -44.274559020996094, -41.72074890136719, -39.16693878173828, -36.613128662109375, -34.05931854248047, -31.505508422851562, -28.951698303222656, -26.39788818359375, -23.844078063964844, -21.290267944335938, -18.73645782470703, -16.182647705078125, -13.628837585449219, -11.075027465820312, -8.521217346191406, -5.9674072265625, -3.4135971069335938, -0.8597869873046875, 1.6940231323242188, 4.247833251953125, 6.801643371582031, 9.355453491210938, 11.909263610839844, 14.46307373046875, 17.016883850097656, 19.570693969726562, 22.12450408935547, 24.678314208984375, 27.23212432861328, 29.785934448242188, 32.339744567871094, 34.8935546875, 37.447364807128906, 40.00117492675781, 42.55498504638672, 45.108795166015625, 47.66260528564453, 50.21641540527344, 52.770225524902344, 55.32403564453125, 57.877845764160156, 60.43165588378906, 62.98546600341797, 65.53927612304688, 68.09308624267578, 70.64689636230469, 73.2007064819336, 75.7545166015625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 9.0, 7.0, 11.0, 19.0, 18.0, 16.0, 20.0, 15.0, 44.0, 27.0, 41.0, 44.0, 29.0, 41.0, 37.0, 35.0, 47.0, 50.0, 28.0, 41.0, 42.0, 35.0, 26.0, 36.0, 37.0, 34.0, 24.0, 24.0, 20.0, 27.0, 16.0, 12.0, 10.0, 13.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.671875, -13.199462890625, -12.72705078125, -12.254638671875, -11.7822265625, -11.309814453125, -10.83740234375, -10.364990234375, -9.892578125, -9.420166015625, -8.94775390625, -8.475341796875, -8.0029296875, -7.530517578125, -7.05810546875, -6.585693359375, -6.11328125, -5.640869140625, -5.16845703125, -4.696044921875, -4.2236328125, -3.751220703125, -3.27880859375, -2.806396484375, -2.333984375, -1.861572265625, -1.38916015625, -0.916748046875, -0.4443359375, 0.028076171875, 0.50048828125, 0.972900390625, 1.4453125, 1.917724609375, 2.39013671875, 2.862548828125, 3.3349609375, 3.807373046875, 4.27978515625, 4.752197265625, 5.224609375, 5.697021484375, 6.16943359375, 6.641845703125, 7.1142578125, 7.586669921875, 8.05908203125, 8.531494140625, 9.00390625, 9.476318359375, 9.94873046875, 10.421142578125, 10.8935546875, 11.365966796875, 11.83837890625, 12.310791015625, 12.783203125, 13.255615234375, 13.72802734375, 14.200439453125, 14.6728515625, 15.145263671875, 15.61767578125, 16.090087890625, 16.5625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 17.0, 12.0, 20.0, 21.0, 55.0, 66.0, 101.0, 126.0, 208.0, 300.0, 428.0, 614.0, 851.0, 1348.0, 1912.0, 2938.0, 4329.0, 6731.0, 10152.0, 15813.0, 25121.0, 40856.0, 67392.0, 115292.0, 192308.0, 213042.0, 137765.0, 80315.0, 47702.0, 29584.0, 18251.0, 11729.0, 7733.0, 5089.0, 3230.0, 2245.0, 1569.0, 1039.0, 699.0, 511.0, 350.0, 210.0, 159.0, 111.0, 86.0, 47.0, 31.0, 17.0, 17.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.41796875, -1.375213623046875, -1.33245849609375, -1.289703369140625, -1.2469482421875, -1.204193115234375, -1.16143798828125, -1.118682861328125, -1.075927734375, -1.033172607421875, -0.99041748046875, -0.947662353515625, -0.9049072265625, -0.862152099609375, -0.81939697265625, -0.776641845703125, -0.73388671875, -0.691131591796875, -0.64837646484375, -0.605621337890625, -0.5628662109375, -0.520111083984375, -0.47735595703125, -0.434600830078125, -0.391845703125, -0.349090576171875, -0.30633544921875, -0.263580322265625, -0.2208251953125, -0.178070068359375, -0.13531494140625, -0.092559814453125, -0.0498046875, -0.007049560546875, 0.03570556640625, 0.078460693359375, 0.1212158203125, 0.163970947265625, 0.20672607421875, 0.249481201171875, 0.292236328125, 0.334991455078125, 0.37774658203125, 0.420501708984375, 0.4632568359375, 0.506011962890625, 0.54876708984375, 0.591522216796875, 0.63427734375, 0.677032470703125, 0.71978759765625, 0.762542724609375, 0.8052978515625, 0.848052978515625, 0.89080810546875, 0.933563232421875, 0.976318359375, 1.019073486328125, 1.06182861328125, 1.104583740234375, 1.1473388671875, 1.190093994140625, 1.23284912109375, 1.275604248046875, 1.318359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 6.0, 4.0, 7.0, 8.0, 11.0, 15.0, 21.0, 18.0, 25.0, 23.0, 24.0, 27.0, 25.0, 34.0, 53.0, 37.0, 39.0, 37.0, 37.0, 1070.0, 33.0, 31.0, 39.0, 40.0, 41.0, 45.0, 21.0, 33.0, 24.0, 23.0, 17.0, 21.0, 16.0, 13.0, 18.0, 17.0, 15.0, 9.0, 6.0, 11.0, 5.0, 1.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.6640625, -8.3651123046875, -8.066162109375, -7.7672119140625, -7.46826171875, -7.1693115234375, -6.870361328125, -6.5714111328125, -6.2724609375, -5.9735107421875, -5.674560546875, -5.3756103515625, -5.07666015625, -4.7777099609375, -4.478759765625, -4.1798095703125, -3.880859375, -3.5819091796875, -3.282958984375, -2.9840087890625, -2.68505859375, -2.3861083984375, -2.087158203125, -1.7882080078125, -1.4892578125, -1.1903076171875, -0.891357421875, -0.5924072265625, -0.29345703125, 0.0054931640625, 0.304443359375, 0.6033935546875, 0.90234375, 1.2012939453125, 1.500244140625, 1.7991943359375, 2.09814453125, 2.3970947265625, 2.696044921875, 2.9949951171875, 3.2939453125, 3.5928955078125, 3.891845703125, 4.1907958984375, 4.48974609375, 4.7886962890625, 5.087646484375, 5.3865966796875, 5.685546875, 5.9844970703125, 6.283447265625, 6.5823974609375, 6.88134765625, 7.1802978515625, 7.479248046875, 7.7781982421875, 8.0771484375, 8.3760986328125, 8.675048828125, 8.9739990234375, 9.27294921875, 9.5718994140625, 9.870849609375, 10.1697998046875, 10.46875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 10.0, 11.0, 15.0, 24.0, 51.0, 64.0, 113.0, 145.0, 217.0, 374.0, 531.0, 802.0, 1195.0, 1794.0, 2867.0, 4254.0, 6304.0, 9799.0, 14847.0, 23022.0, 35995.0, 59865.0, 102566.0, 172255.0, 1267219.0, 154451.0, 91146.0, 53887.0, 32700.0, 20929.0, 13567.0, 9096.0, 5772.0, 3866.0, 2546.0, 1668.0, 1145.0, 646.0, 481.0, 311.0, 201.0, 149.0, 93.0, 51.0, 40.0, 17.0, 12.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.92724609375, -0.89862060546875, -0.8699951171875, -0.84136962890625, -0.812744140625, -0.78411865234375, -0.7554931640625, -0.72686767578125, -0.6982421875, -0.66961669921875, -0.6409912109375, -0.61236572265625, -0.583740234375, -0.55511474609375, -0.5264892578125, -0.49786376953125, -0.46923828125, -0.44061279296875, -0.4119873046875, -0.38336181640625, -0.354736328125, -0.32611083984375, -0.2974853515625, -0.26885986328125, -0.240234375, -0.21160888671875, -0.1829833984375, -0.15435791015625, -0.125732421875, -0.09710693359375, -0.0684814453125, -0.03985595703125, -0.01123046875, 0.01739501953125, 0.0460205078125, 0.07464599609375, 0.103271484375, 0.13189697265625, 0.1605224609375, 0.18914794921875, 0.2177734375, 0.24639892578125, 0.2750244140625, 0.30364990234375, 0.332275390625, 0.36090087890625, 0.3895263671875, 0.41815185546875, 0.44677734375, 0.47540283203125, 0.5040283203125, 0.53265380859375, 0.561279296875, 0.58990478515625, 0.6185302734375, 0.64715576171875, 0.67578125, 0.70440673828125, 0.7330322265625, 0.76165771484375, 0.790283203125, 0.81890869140625, 0.8475341796875, 0.87615966796875, 0.90478515625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 5.0, 6.0, 5.0, 18.0, 14.0, 19.0, 21.0, 29.0, 37.0, 33.0, 43.0, 75.0, 75.0, 106.0, 124.0, 85.0, 58.0, 42.0, 37.0, 25.0, 27.0, 23.0, 16.0, 13.0, 16.0, 5.0, 5.0, 10.0, 10.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.027130126953125, -0.02639603614807129, -0.025661945343017578, -0.024927854537963867, -0.024193763732910156, -0.023459672927856445, -0.022725582122802734, -0.021991491317749023, -0.021257400512695312, -0.0205233097076416, -0.01978921890258789, -0.01905512809753418, -0.01832103729248047, -0.017586946487426758, -0.016852855682373047, -0.016118764877319336, -0.015384674072265625, -0.014650583267211914, -0.013916492462158203, -0.013182401657104492, -0.012448310852050781, -0.01171422004699707, -0.01098012924194336, -0.010246038436889648, -0.009511947631835938, -0.008777856826782227, -0.008043766021728516, -0.007309675216674805, -0.006575584411621094, -0.005841493606567383, -0.005107402801513672, -0.004373311996459961, -0.00363922119140625, -0.002905130386352539, -0.002171039581298828, -0.0014369487762451172, -0.0007028579711914062, 3.123283386230469e-05, 0.0007653236389160156, 0.0014994144439697266, 0.0022335052490234375, 0.0029675960540771484, 0.0037016868591308594, 0.00443577766418457, 0.005169868469238281, 0.005903959274291992, 0.006638050079345703, 0.007372140884399414, 0.008106231689453125, 0.008840322494506836, 0.009574413299560547, 0.010308504104614258, 0.011042594909667969, 0.01177668571472168, 0.01251077651977539, 0.013244867324829102, 0.013978958129882812, 0.014713048934936523, 0.015447139739990234, 0.016181230545043945, 0.016915321350097656, 0.017649412155151367, 0.018383502960205078, 0.01911759376525879, 0.0198516845703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 10.0, 9.0, 10.0, 20.0, 20.0, 25.0, 38.0, 41.0, 58.0, 109.0, 185.0, 459.0, 1652.0, 10564.0, 820204.0, 207076.0, 5964.0, 1213.0, 349.0, 158.0, 93.0, 65.0, 43.0, 40.0, 24.0, 25.0, 14.0, 12.0, 11.0, 9.0, 8.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374755859375, -0.3608131408691406, -0.34687042236328125, -0.3329277038574219, -0.3189849853515625, -0.3050422668457031, -0.29109954833984375, -0.2771568298339844, -0.263214111328125, -0.24927139282226562, -0.23532867431640625, -0.22138595581054688, -0.2074432373046875, -0.19350051879882812, -0.17955780029296875, -0.16561508178710938, -0.15167236328125, -0.13772964477539062, -0.12378692626953125, -0.10984420776367188, -0.0959014892578125, -0.08195877075195312, -0.06801605224609375, -0.054073333740234375, -0.040130615234375, -0.026187896728515625, -0.01224517822265625, 0.001697540283203125, 0.0156402587890625, 0.029582977294921875, 0.04352569580078125, 0.057468414306640625, 0.0714111328125, 0.08535385131835938, 0.09929656982421875, 0.11323928833007812, 0.1271820068359375, 0.14112472534179688, 0.15506744384765625, 0.16901016235351562, 0.182952880859375, 0.19689559936523438, 0.21083831787109375, 0.22478103637695312, 0.2387237548828125, 0.2526664733886719, 0.26660919189453125, 0.2805519104003906, 0.29449462890625, 0.3084373474121094, 0.32238006591796875, 0.3363227844238281, 0.3502655029296875, 0.3642082214355469, 0.37815093994140625, 0.3920936584472656, 0.406036376953125, 0.4199790954589844, 0.43392181396484375, 0.4478645324707031, 0.4618072509765625, 0.4757499694824219, 0.48969268798828125, 0.5036354064941406, 0.517578125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 5.0, 7.0, 26.0, 51.0, 146.0, 386.0, 225.0, 85.0, 43.0, 13.0, 12.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034176044166088104, -0.029731385409832, -0.025286724790930748, -0.020842064172029495, -0.01639740541577339, -0.011952746659517288, -0.0075080860406160355, -0.0030634254217147827, 0.0013812333345413208, 0.005825893022119999, 0.010270552709698677, 0.014715212397277355, 0.019159872084856033, 0.023604530841112137, 0.02804919146001339, 0.03249385207891464, 0.036938510835170746, 0.04138316959142685, 0.04582782834768295, 0.050272490829229355, 0.05471714958548546, 0.05916180834174156, 0.06360647082328796, 0.06805112957954407, 0.07249578833580017, 0.07694044709205627, 0.08138510584831238, 0.08582976460456848, 0.09027442336082458, 0.09471908211708069, 0.09916374832391739, 0.10360840708017349, 0.108053058385849, 0.1124977171421051, 0.1169423758983612, 0.12138703465461731, 0.1258316934108734, 0.13027635216712952, 0.13472101092338562, 0.13916566967964172, 0.14361032843589783, 0.14805498719215393, 0.15249964594841003, 0.15694430470466614, 0.16138896346092224, 0.16583362221717834, 0.17027828097343445, 0.17472293972969055, 0.17916761338710785, 0.18361227214336395, 0.18805693089962006, 0.19250158965587616, 0.19694624841213226, 0.20139090716838837, 0.20583556592464447, 0.21028023958206177, 0.21472489833831787, 0.21916955709457397, 0.22361421585083008, 0.22805887460708618, 0.23250353336334229, 0.2369481921195984, 0.2413928508758545, 0.2458375096321106, 0.2502821683883667]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 5.0, 7.0, 10.0, 10.0, 10.0, 12.0, 27.0, 16.0, 19.0, 21.0, 26.0, 27.0, 22.0, 43.0, 29.0, 26.0, 38.0, 49.0, 47.0, 43.0, 45.0, 39.0, 42.0, 42.0, 41.0, 40.0, 41.0, 24.0, 18.0, 24.0, 30.0, 25.0, 16.0, 19.0, 15.0, 12.0, 12.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024921059608459473, -0.02416166290640831, -0.023402266204357147, -0.022642869502305984, -0.021883472800254822, -0.02112407609820366, -0.020364679396152496, -0.019605282694101334, -0.01884588599205017, -0.018086489289999008, -0.017327092587947845, -0.016567695885896683, -0.01580829918384552, -0.015048902481794357, -0.014289505779743195, -0.013530109077692032, -0.01277071237564087, -0.012011315673589706, -0.011251918971538544, -0.010492522269487381, -0.009733125567436218, -0.008973728865385056, -0.008214332163333893, -0.00745493546128273, -0.006695538759231567, -0.005936142057180405, -0.005176745355129242, -0.004417348653078079, -0.0036579519510269165, -0.002898555248975754, -0.002139158546924591, -0.0013797618448734283, -0.0006203651428222656, 0.0001390315592288971, 0.0008984282612800598, 0.0016578249633312225, 0.0024172216653823853, 0.003176618367433548, 0.003936015069484711, 0.004695411771535873, 0.005454808473587036, 0.006214205175638199, 0.006973601877689362, 0.007732998579740524, 0.008492395281791687, 0.00925179198384285, 0.010011188685894012, 0.010770585387945175, 0.011529982089996338, 0.0122893787920475, 0.013048775494098663, 0.013808172196149826, 0.014567568898200989, 0.015326965600252151, 0.016086362302303314, 0.016845759004354477, 0.01760515570640564, 0.018364552408456802, 0.019123949110507965, 0.019883345812559128, 0.02064274251461029, 0.021402139216661453, 0.022161535918712616, 0.02292093262076378, 0.02368032932281494]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 9.0, 7.0, 11.0, 18.0, 19.0, 16.0, 20.0, 15.0, 44.0, 27.0, 41.0, 44.0, 28.0, 42.0, 37.0, 35.0, 47.0, 49.0, 29.0, 40.0, 43.0, 34.0, 26.0, 37.0, 36.0, 35.0, 24.0, 24.0, 20.0, 26.0, 17.0, 11.0, 11.0, 13.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6796875, -13.2071533203125, -12.734619140625, -12.2620849609375, -11.78955078125, -11.3170166015625, -10.844482421875, -10.3719482421875, -9.8994140625, -9.4268798828125, -8.954345703125, -8.4818115234375, -8.00927734375, -7.5367431640625, -7.064208984375, -6.5916748046875, -6.119140625, -5.6466064453125, -5.174072265625, -4.7015380859375, -4.22900390625, -3.7564697265625, -3.283935546875, -2.8114013671875, -2.3388671875, -1.8663330078125, -1.393798828125, -0.9212646484375, -0.44873046875, 0.0238037109375, 0.496337890625, 0.9688720703125, 1.44140625, 1.9139404296875, 2.386474609375, 2.8590087890625, 3.33154296875, 3.8040771484375, 4.276611328125, 4.7491455078125, 5.2216796875, 5.6942138671875, 6.166748046875, 6.6392822265625, 7.11181640625, 7.5843505859375, 8.056884765625, 8.5294189453125, 9.001953125, 9.4744873046875, 9.947021484375, 10.4195556640625, 10.89208984375, 11.3646240234375, 11.837158203125, 12.3096923828125, 12.7822265625, 13.2547607421875, 13.727294921875, 14.1998291015625, 14.67236328125, 15.1448974609375, 15.617431640625, 16.0899658203125, 16.5625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 4.0, 8.0, 9.0, 13.0, 14.0, 19.0, 31.0, 28.0, 40.0, 41.0, 79.0, 77.0, 123.0, 193.0, 276.0, 589.0, 1366.0, 4357.0, 24323.0, 459637.0, 523852.0, 25985.0, 4483.0, 1400.0, 562.0, 335.0, 198.0, 117.0, 85.0, 67.0, 50.0, 40.0, 27.0, 19.0, 19.0, 18.0, 11.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.109375, -26.175048828125, -25.24072265625, -24.306396484375, -23.3720703125, -22.437744140625, -21.50341796875, -20.569091796875, -19.634765625, -18.700439453125, -17.76611328125, -16.831787109375, -15.8974609375, -14.963134765625, -14.02880859375, -13.094482421875, -12.16015625, -11.225830078125, -10.29150390625, -9.357177734375, -8.4228515625, -7.488525390625, -6.55419921875, -5.619873046875, -4.685546875, -3.751220703125, -2.81689453125, -1.882568359375, -0.9482421875, -0.013916015625, 0.92041015625, 1.854736328125, 2.7890625, 3.723388671875, 4.65771484375, 5.592041015625, 6.5263671875, 7.460693359375, 8.39501953125, 9.329345703125, 10.263671875, 11.197998046875, 12.13232421875, 13.066650390625, 14.0009765625, 14.935302734375, 15.86962890625, 16.803955078125, 17.73828125, 18.672607421875, 19.60693359375, 20.541259765625, 21.4755859375, 22.409912109375, 23.34423828125, 24.278564453125, 25.212890625, 26.147216796875, 27.08154296875, 28.015869140625, 28.9501953125, 29.884521484375, 30.81884765625, 31.753173828125, 32.6875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 17.0, 17.0, 13.0, 19.0, 23.0, 29.0, 28.0, 35.0, 34.0, 45.0, 46.0, 46.0, 56.0, 80.0, 1538.0, 483.0, 82.0, 63.0, 39.0, 53.0, 35.0, 35.0, 40.0, 35.0, 31.0, 19.0, 18.0, 17.0, 13.0, 8.0, 9.0, 12.0, 3.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.03125, -44.63525390625, -43.2392578125, -41.84326171875, -40.447265625, -39.05126953125, -37.6552734375, -36.25927734375, -34.86328125, -33.46728515625, -32.0712890625, -30.67529296875, -29.279296875, -27.88330078125, -26.4873046875, -25.09130859375, -23.6953125, -22.29931640625, -20.9033203125, -19.50732421875, -18.111328125, -16.71533203125, -15.3193359375, -13.92333984375, -12.52734375, -11.13134765625, -9.7353515625, -8.33935546875, -6.943359375, -5.54736328125, -4.1513671875, -2.75537109375, -1.359375, 0.03662109375, 1.4326171875, 2.82861328125, 4.224609375, 5.62060546875, 7.0166015625, 8.41259765625, 9.80859375, 11.20458984375, 12.6005859375, 13.99658203125, 15.392578125, 16.78857421875, 18.1845703125, 19.58056640625, 20.9765625, 22.37255859375, 23.7685546875, 25.16455078125, 26.560546875, 27.95654296875, 29.3525390625, 30.74853515625, 32.14453125, 33.54052734375, 34.9365234375, 36.33251953125, 37.728515625, 39.12451171875, 40.5205078125, 41.91650390625, 43.3125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 9.0, 9.0, 10.0, 14.0, 20.0, 12.0, 30.0, 34.0, 36.0, 46.0, 74.0, 94.0, 143.0, 250.0, 719.0, 2670.0, 163846.0, 2970994.0, 4839.0, 957.0, 305.0, 165.0, 100.0, 69.0, 49.0, 50.0, 38.0, 22.0, 21.0, 14.0, 21.0, 13.0, 6.0, 3.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.375, -96.1826171875, -92.990234375, -89.7978515625, -86.60546875, -83.4130859375, -80.220703125, -77.0283203125, -73.8359375, -70.6435546875, -67.451171875, -64.2587890625, -61.06640625, -57.8740234375, -54.681640625, -51.4892578125, -48.296875, -45.1044921875, -41.912109375, -38.7197265625, -35.52734375, -32.3349609375, -29.142578125, -25.9501953125, -22.7578125, -19.5654296875, -16.373046875, -13.1806640625, -9.98828125, -6.7958984375, -3.603515625, -0.4111328125, 2.78125, 5.9736328125, 9.166015625, 12.3583984375, 15.55078125, 18.7431640625, 21.935546875, 25.1279296875, 28.3203125, 31.5126953125, 34.705078125, 37.8974609375, 41.08984375, 44.2822265625, 47.474609375, 50.6669921875, 53.859375, 57.0517578125, 60.244140625, 63.4365234375, 66.62890625, 69.8212890625, 73.013671875, 76.2060546875, 79.3984375, 82.5908203125, 85.783203125, 88.9755859375, 92.16796875, 95.3603515625, 98.552734375, 101.7451171875, 104.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 48.0, 670.0, 282.0, 15.0], "bins": [-483.9574279785156, -476.1205749511719, -468.28375244140625, -460.4468994140625, -452.61004638671875, -444.7732238769531, -436.9363708496094, -429.0995178222656, -421.2626953125, -413.42584228515625, -405.5890197753906, -397.7521667480469, -389.9153137207031, -382.0784912109375, -374.24163818359375, -366.40478515625, -358.56793212890625, -350.7310791015625, -342.8942565917969, -335.0574035644531, -327.2205505371094, -319.38372802734375, -311.546875, -303.71002197265625, -295.8731994628906, -288.0363464355469, -280.19952392578125, -272.3626708984375, -264.52581787109375, -256.6889953613281, -248.85214233398438, -241.0153045654297, -233.178466796875, -225.3416290283203, -217.50477600097656, -209.66793823242188, -201.8311004638672, -193.9942626953125, -186.15740966796875, -178.32057189941406, -170.4837188720703, -162.64688110351562, -154.81002807617188, -146.9731903076172, -139.1363525390625, -131.29949951171875, -123.46266174316406, -115.62582397460938, -107.78898620605469, -99.95214080810547, -92.11530303955078, -84.27845764160156, -76.44161987304688, -68.60477447509766, -60.76792907714844, -52.931087493896484, -45.09424591064453, -37.25740432739258, -29.420560836791992, -21.583717346191406, -13.746875762939453, -5.9100341796875, 1.9268112182617188, 9.763652801513672, 17.600496292114258]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 8.0, 5.0, 6.0, 6.0, 8.0, 13.0, 12.0, 12.0, 18.0, 20.0, 25.0, 18.0, 20.0, 27.0, 37.0, 26.0, 25.0, 36.0, 44.0, 32.0, 37.0, 41.0, 39.0, 50.0, 45.0, 33.0, 40.0, 34.0, 42.0, 25.0, 34.0, 25.0, 19.0, 23.0, 21.0, 14.0, 9.0, 9.0, 11.0, 9.0, 13.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-89.78470611572266, -86.94556427001953, -84.10641479492188, -81.26727294921875, -78.42813110351562, -75.58898162841797, -72.74983978271484, -69.91069030761719, -67.07154846191406, -64.23240661621094, -61.39325714111328, -58.554115295410156, -55.714969635009766, -52.875823974609375, -50.03668212890625, -47.19753646850586, -44.35839080810547, -41.51924514770508, -38.68009948730469, -35.84095764160156, -33.00181198120117, -30.16266632080078, -27.323522567749023, -24.484378814697266, -21.645233154296875, -18.806087493896484, -15.966943740844727, -13.127799034118652, -10.288654327392578, -7.449509620666504, -4.61036491394043, -1.7712211608886719, 1.0679168701171875, 3.9070615768432617, 6.746206283569336, 9.58535099029541, 12.424495697021484, 15.263640403747559, 18.102785110473633, 20.94192886352539, 23.78107452392578, 26.620220184326172, 29.45936393737793, 32.29850769042969, 35.13765335083008, 37.97679901123047, 40.815940856933594, 43.655086517333984, 46.494232177734375, 49.333377838134766, 52.172523498535156, 55.01166534423828, 57.85081100463867, 60.68995666503906, 63.52909851074219, 66.36824035644531, 69.20738983154297, 72.0465316772461, 74.88568115234375, 77.72482299804688, 80.56396484375, 83.40311431884766, 86.24225616455078, 89.08140563964844, 91.92054748535156]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 14.0, 14.0, 12.0, 25.0, 21.0, 22.0, 18.0, 39.0, 32.0, 43.0, 31.0, 44.0, 36.0, 50.0, 37.0, 42.0, 51.0, 45.0, 29.0, 40.0, 41.0, 38.0, 33.0, 33.0, 26.0, 24.0, 25.0, 22.0, 12.0, 13.0, 12.0, 14.0, 6.0, 9.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.53125, -14.0341796875, -13.537109375, -13.0400390625, -12.54296875, -12.0458984375, -11.548828125, -11.0517578125, -10.5546875, -10.0576171875, -9.560546875, -9.0634765625, -8.56640625, -8.0693359375, -7.572265625, -7.0751953125, -6.578125, -6.0810546875, -5.583984375, -5.0869140625, -4.58984375, -4.0927734375, -3.595703125, -3.0986328125, -2.6015625, -2.1044921875, -1.607421875, -1.1103515625, -0.61328125, -0.1162109375, 0.380859375, 0.8779296875, 1.375, 1.8720703125, 2.369140625, 2.8662109375, 3.36328125, 3.8603515625, 4.357421875, 4.8544921875, 5.3515625, 5.8486328125, 6.345703125, 6.8427734375, 7.33984375, 7.8369140625, 8.333984375, 8.8310546875, 9.328125, 9.8251953125, 10.322265625, 10.8193359375, 11.31640625, 11.8134765625, 12.310546875, 12.8076171875, 13.3046875, 13.8017578125, 14.298828125, 14.7958984375, 15.29296875, 15.7900390625, 16.287109375, 16.7841796875, 17.28125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 11.0, 21.0, 32.0, 40.0, 66.0, 85.0, 106.0, 159.0, 236.0, 329.0, 470.0, 683.0, 988.0, 1484.0, 2304.0, 3622.0, 6171.0, 11434.0, 30881.0, 435719.0, 3427722.0, 223826.0, 22039.0, 10135.0, 5557.0, 3337.0, 2119.0, 1402.0, 945.0, 675.0, 453.0, 351.0, 222.0, 189.0, 121.0, 85.0, 74.0, 52.0, 40.0, 24.0, 22.0, 15.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.28125, -42.87109375, -41.4609375, -40.05078125, -38.640625, -37.23046875, -35.8203125, -34.41015625, -33.0, -31.58984375, -30.1796875, -28.76953125, -27.359375, -25.94921875, -24.5390625, -23.12890625, -21.71875, -20.30859375, -18.8984375, -17.48828125, -16.078125, -14.66796875, -13.2578125, -11.84765625, -10.4375, -9.02734375, -7.6171875, -6.20703125, -4.796875, -3.38671875, -1.9765625, -0.56640625, 0.84375, 2.25390625, 3.6640625, 5.07421875, 6.484375, 7.89453125, 9.3046875, 10.71484375, 12.125, 13.53515625, 14.9453125, 16.35546875, 17.765625, 19.17578125, 20.5859375, 21.99609375, 23.40625, 24.81640625, 26.2265625, 27.63671875, 29.046875, 30.45703125, 31.8671875, 33.27734375, 34.6875, 36.09765625, 37.5078125, 38.91796875, 40.328125, 41.73828125, 43.1484375, 44.55859375, 45.96875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 7.0, 4.0, 8.0, 7.0, 5.0, 14.0, 17.0, 30.0, 44.0, 74.0, 117.0, 262.0, 568.0, 1033.0, 907.0, 446.0, 191.0, 106.0, 61.0, 40.0, 28.0, 16.0, 24.0, 14.0, 9.0, 9.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.0, -34.8701171875, -33.740234375, -32.6103515625, -31.48046875, -30.3505859375, -29.220703125, -28.0908203125, -26.9609375, -25.8310546875, -24.701171875, -23.5712890625, -22.44140625, -21.3115234375, -20.181640625, -19.0517578125, -17.921875, -16.7919921875, -15.662109375, -14.5322265625, -13.40234375, -12.2724609375, -11.142578125, -10.0126953125, -8.8828125, -7.7529296875, -6.623046875, -5.4931640625, -4.36328125, -3.2333984375, -2.103515625, -0.9736328125, 0.15625, 1.2861328125, 2.416015625, 3.5458984375, 4.67578125, 5.8056640625, 6.935546875, 8.0654296875, 9.1953125, 10.3251953125, 11.455078125, 12.5849609375, 13.71484375, 14.8447265625, 15.974609375, 17.1044921875, 18.234375, 19.3642578125, 20.494140625, 21.6240234375, 22.75390625, 23.8837890625, 25.013671875, 26.1435546875, 27.2734375, 28.4033203125, 29.533203125, 30.6630859375, 31.79296875, 32.9228515625, 34.052734375, 35.1826171875, 36.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 8.0, 24.0, 27.0, 34.0, 52.0, 81.0, 120.0, 164.0, 268.0, 440.0, 739.0, 1366.0, 2609.0, 5369.0, 12553.0, 33772.0, 216700.0, 3723575.0, 145125.0, 29649.0, 11207.0, 4873.0, 2374.0, 1312.0, 705.0, 390.0, 250.0, 150.0, 103.0, 65.0, 52.0, 32.0, 20.0, 21.0, 9.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.23828125, -61.2265625, -59.21484375, -57.203125, -55.19140625, -53.1796875, -51.16796875, -49.15625, -47.14453125, -45.1328125, -43.12109375, -41.109375, -39.09765625, -37.0859375, -35.07421875, -33.0625, -31.05078125, -29.0390625, -27.02734375, -25.015625, -23.00390625, -20.9921875, -18.98046875, -16.96875, -14.95703125, -12.9453125, -10.93359375, -8.921875, -6.91015625, -4.8984375, -2.88671875, -0.875, 1.13671875, 3.1484375, 5.16015625, 7.171875, 9.18359375, 11.1953125, 13.20703125, 15.21875, 17.23046875, 19.2421875, 21.25390625, 23.265625, 25.27734375, 27.2890625, 29.30078125, 31.3125, 33.32421875, 35.3359375, 37.34765625, 39.359375, 41.37109375, 43.3828125, 45.39453125, 47.40625, 49.41796875, 51.4296875, 53.44140625, 55.453125, 57.46484375, 59.4765625, 61.48828125, 63.5]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 6.0, 18.0, 18.0, 18.0, 48.0, 91.0, 189.0, 237.0, 173.0, 80.0, 55.0, 28.0, 16.0, 11.0, 4.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-263.5518798828125, -258.11639404296875, -252.68087768554688, -247.24539184570312, -241.8098907470703, -236.3743896484375, -230.9388885498047, -225.50338745117188, -220.06788635253906, -214.63238525390625, -209.19688415527344, -203.76138305664062, -198.32589721679688, -192.89039611816406, -187.45489501953125, -182.01939392089844, -176.58389282226562, -171.1483917236328, -165.712890625, -160.27740478515625, -154.84190368652344, -149.40640258789062, -143.9709014892578, -138.535400390625, -133.09991455078125, -127.66441345214844, -122.22891998291016, -116.79341888427734, -111.35791778564453, -105.92242431640625, -100.48692321777344, -95.05142211914062, -89.61591339111328, -84.18041229248047, -78.74491882324219, -73.30941772460938, -67.87391662597656, -62.438419342041016, -57.00292205810547, -51.567420959472656, -46.13192367553711, -40.69642639160156, -35.26092529296875, -29.825428009033203, -24.389928817749023, -18.954429626464844, -13.518932342529297, -8.083431243896484, -2.6479339599609375, 2.787564754486084, 8.223063468933105, 13.658561706542969, 19.09406089782715, 24.529560089111328, 29.965057373046875, 35.40055847167969, 40.836055755615234, 46.27155303955078, 51.707054138183594, 57.14255142211914, 62.57804870605469, 68.0135498046875, 73.44905090332031, 78.88455200195312, 84.3200454711914]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 5.0, 4.0, 3.0, 8.0, 11.0, 12.0, 12.0, 18.0, 11.0, 21.0, 26.0, 33.0, 31.0, 26.0, 41.0, 34.0, 33.0, 33.0, 44.0, 44.0, 39.0, 41.0, 38.0, 34.0, 39.0, 22.0, 39.0, 46.0, 36.0, 23.0, 28.0, 24.0, 22.0, 18.0, 11.0, 18.0, 11.0, 9.0, 9.0, 4.0, 8.0, 5.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-76.08663940429688, -73.7289810180664, -71.37132263183594, -69.01365661621094, -66.65599822998047, -64.29833984375, -61.94068145751953, -59.5830192565918, -57.22535705566406, -54.867698669433594, -52.51003646850586, -50.15237808227539, -47.794715881347656, -45.43705749511719, -43.07939910888672, -40.721736907958984, -38.364078521728516, -36.00642013549805, -33.64875793457031, -31.291099548339844, -28.93343734741211, -26.57577896118164, -24.21811866760254, -21.860458374023438, -19.502798080444336, -17.145137786865234, -14.787477493286133, -12.429818153381348, -10.072157859802246, -7.7144975662231445, -5.356838226318359, -2.999177932739258, -0.6415176391601562, 1.7161424160003662, 4.073802471160889, 6.431462287902832, 8.789122581481934, 11.146782875061035, 13.50444221496582, 15.862102508544922, 18.219762802124023, 20.577423095703125, 22.935083389282227, 25.292743682861328, 27.650402069091797, 30.00806427001953, 32.36572265625, 34.72338104248047, 37.0810432434082, 39.43870162963867, 41.796363830566406, 44.154022216796875, 46.51168441772461, 48.86934280395508, 51.22700500488281, 53.58466339111328, 55.94232177734375, 58.29998016357422, 60.65764236450195, 63.01530075073242, 65.37296295166016, 67.73062133789062, 70.0882797241211, 72.44593811035156, 74.80360412597656]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 10.0, 12.0, 14.0, 15.0, 19.0, 19.0, 35.0, 21.0, 27.0, 36.0, 30.0, 54.0, 41.0, 54.0, 38.0, 66.0, 39.0, 36.0, 46.0, 35.0, 33.0, 38.0, 29.0, 31.0, 27.0, 25.0, 28.0, 11.0, 19.0, 18.0, 15.0, 11.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.375, -14.84765625, -14.3203125, -13.79296875, -13.265625, -12.73828125, -12.2109375, -11.68359375, -11.15625, -10.62890625, -10.1015625, -9.57421875, -9.046875, -8.51953125, -7.9921875, -7.46484375, -6.9375, -6.41015625, -5.8828125, -5.35546875, -4.828125, -4.30078125, -3.7734375, -3.24609375, -2.71875, -2.19140625, -1.6640625, -1.13671875, -0.609375, -0.08203125, 0.4453125, 0.97265625, 1.5, 2.02734375, 2.5546875, 3.08203125, 3.609375, 4.13671875, 4.6640625, 5.19140625, 5.71875, 6.24609375, 6.7734375, 7.30078125, 7.828125, 8.35546875, 8.8828125, 9.41015625, 9.9375, 10.46484375, 10.9921875, 11.51953125, 12.046875, 12.57421875, 13.1015625, 13.62890625, 14.15625, 14.68359375, 15.2109375, 15.73828125, 16.265625, 16.79296875, 17.3203125, 17.84765625, 18.375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 19.0, 25.0, 44.0, 82.0, 85.0, 130.0, 209.0, 287.0, 451.0, 628.0, 965.0, 1451.0, 2218.0, 3282.0, 4880.0, 7854.0, 12262.0, 19500.0, 31677.0, 53839.0, 94914.0, 167898.0, 238075.0, 170552.0, 96226.0, 54066.0, 32359.0, 19536.0, 12206.0, 7868.0, 5001.0, 3319.0, 2161.0, 1463.0, 957.0, 654.0, 464.0, 281.0, 200.0, 146.0, 87.0, 67.0, 46.0, 32.0, 19.0, 11.0, 19.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.276092529296875, -1.23284912109375, -1.189605712890625, -1.1463623046875, -1.103118896484375, -1.05987548828125, -1.016632080078125, -0.973388671875, -0.930145263671875, -0.88690185546875, -0.843658447265625, -0.8004150390625, -0.757171630859375, -0.71392822265625, -0.670684814453125, -0.62744140625, -0.584197998046875, -0.54095458984375, -0.497711181640625, -0.4544677734375, -0.411224365234375, -0.36798095703125, -0.324737548828125, -0.281494140625, -0.238250732421875, -0.19500732421875, -0.151763916015625, -0.1085205078125, -0.065277099609375, -0.02203369140625, 0.021209716796875, 0.064453125, 0.107696533203125, 0.15093994140625, 0.194183349609375, 0.2374267578125, 0.280670166015625, 0.32391357421875, 0.367156982421875, 0.410400390625, 0.453643798828125, 0.49688720703125, 0.540130615234375, 0.5833740234375, 0.626617431640625, 0.66986083984375, 0.713104248046875, 0.75634765625, 0.799591064453125, 0.84283447265625, 0.886077880859375, 0.9293212890625, 0.972564697265625, 1.01580810546875, 1.059051513671875, 1.102294921875, 1.145538330078125, 1.18878173828125, 1.232025146484375, 1.2752685546875, 1.318511962890625, 1.36175537109375, 1.404998779296875, 1.4482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 9.0, 6.0, 10.0, 13.0, 9.0, 17.0, 16.0, 19.0, 19.0, 21.0, 32.0, 21.0, 25.0, 43.0, 38.0, 38.0, 30.0, 29.0, 37.0, 1071.0, 37.0, 55.0, 56.0, 31.0, 35.0, 40.0, 31.0, 25.0, 26.0, 23.0, 20.0, 21.0, 16.0, 23.0, 13.0, 13.0, 8.0, 12.0, 3.0, 4.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-10.875, -10.5626220703125, -10.250244140625, -9.9378662109375, -9.62548828125, -9.3131103515625, -9.000732421875, -8.6883544921875, -8.3759765625, -8.0635986328125, -7.751220703125, -7.4388427734375, -7.12646484375, -6.8140869140625, -6.501708984375, -6.1893310546875, -5.876953125, -5.5645751953125, -5.252197265625, -4.9398193359375, -4.62744140625, -4.3150634765625, -4.002685546875, -3.6903076171875, -3.3779296875, -3.0655517578125, -2.753173828125, -2.4407958984375, -2.12841796875, -1.8160400390625, -1.503662109375, -1.1912841796875, -0.87890625, -0.5665283203125, -0.254150390625, 0.0582275390625, 0.37060546875, 0.6829833984375, 0.995361328125, 1.3077392578125, 1.6201171875, 1.9324951171875, 2.244873046875, 2.5572509765625, 2.86962890625, 3.1820068359375, 3.494384765625, 3.8067626953125, 4.119140625, 4.4315185546875, 4.743896484375, 5.0562744140625, 5.36865234375, 5.6810302734375, 5.993408203125, 6.3057861328125, 6.6181640625, 6.9305419921875, 7.242919921875, 7.5552978515625, 7.86767578125, 8.1800537109375, 8.492431640625, 8.8048095703125, 9.1171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 4.0, 18.0, 22.0, 25.0, 44.0, 71.0, 89.0, 114.0, 178.0, 307.0, 369.0, 596.0, 842.0, 1234.0, 1854.0, 2676.0, 4073.0, 6158.0, 9350.0, 14124.0, 21754.0, 34670.0, 56338.0, 94814.0, 159783.0, 1261147.0, 166306.0, 99157.0, 58575.0, 36074.0, 22768.0, 14614.0, 9510.0, 6340.0, 4188.0, 2855.0, 1980.0, 1284.0, 900.0, 637.0, 408.0, 302.0, 178.0, 127.0, 95.0, 56.0, 40.0, 36.0, 14.0, 7.0, 14.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.83935546875, -0.810943603515625, -0.78253173828125, -0.754119873046875, -0.7257080078125, -0.697296142578125, -0.66888427734375, -0.640472412109375, -0.612060546875, -0.583648681640625, -0.55523681640625, -0.526824951171875, -0.4984130859375, -0.470001220703125, -0.44158935546875, -0.413177490234375, -0.384765625, -0.356353759765625, -0.32794189453125, -0.299530029296875, -0.2711181640625, -0.242706298828125, -0.21429443359375, -0.185882568359375, -0.157470703125, -0.129058837890625, -0.10064697265625, -0.072235107421875, -0.0438232421875, -0.015411376953125, 0.01300048828125, 0.041412353515625, 0.06982421875, 0.098236083984375, 0.12664794921875, 0.155059814453125, 0.1834716796875, 0.211883544921875, 0.24029541015625, 0.268707275390625, 0.297119140625, 0.325531005859375, 0.35394287109375, 0.382354736328125, 0.4107666015625, 0.439178466796875, 0.46759033203125, 0.496002197265625, 0.5244140625, 0.552825927734375, 0.58123779296875, 0.609649658203125, 0.6380615234375, 0.666473388671875, 0.69488525390625, 0.723297119140625, 0.751708984375, 0.780120849609375, 0.80853271484375, 0.836944580078125, 0.8653564453125, 0.893768310546875, 0.92218017578125, 0.950592041015625, 0.97900390625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 7.0, 13.0, 16.0, 15.0, 19.0, 23.0, 39.0, 65.0, 62.0, 71.0, 83.0, 85.0, 84.0, 79.0, 52.0, 44.0, 39.0, 33.0, 21.0, 8.0, 11.0, 19.0, 13.0, 15.0, 6.0, 8.0, 3.0, 6.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.01629638671875, -0.015798449516296387, -0.015300512313842773, -0.01480257511138916, -0.014304637908935547, -0.013806700706481934, -0.01330876350402832, -0.012810826301574707, -0.012312889099121094, -0.01181495189666748, -0.011317014694213867, -0.010819077491760254, -0.01032114028930664, -0.009823203086853027, -0.009325265884399414, -0.0088273286819458, -0.008329391479492188, -0.007831454277038574, -0.007333517074584961, -0.006835579872131348, -0.006337642669677734, -0.005839705467224121, -0.005341768264770508, -0.0048438310623168945, -0.004345893859863281, -0.003847956657409668, -0.0033500194549560547, -0.0028520822525024414, -0.002354145050048828, -0.0018562078475952148, -0.0013582706451416016, -0.0008603334426879883, -0.000362396240234375, 0.00013554096221923828, 0.0006334781646728516, 0.0011314153671264648, 0.0016293525695800781, 0.0021272897720336914, 0.0026252269744873047, 0.003123164176940918, 0.0036211013793945312, 0.0041190385818481445, 0.004616975784301758, 0.005114912986755371, 0.005612850189208984, 0.006110787391662598, 0.006608724594116211, 0.007106661796569824, 0.0076045989990234375, 0.00810253620147705, 0.008600473403930664, 0.009098410606384277, 0.00959634780883789, 0.010094285011291504, 0.010592222213745117, 0.01109015941619873, 0.011588096618652344, 0.012086033821105957, 0.01258397102355957, 0.013081908226013184, 0.013579845428466797, 0.01407778263092041, 0.014575719833374023, 0.015073657035827637, 0.01557159423828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 12.0, 5.0, 11.0, 8.0, 16.0, 12.0, 22.0, 16.0, 28.0, 24.0, 30.0, 68.0, 109.0, 142.0, 265.0, 1319.0, 104703.0, 936137.0, 4583.0, 414.0, 189.0, 114.0, 79.0, 51.0, 47.0, 28.0, 21.0, 18.0, 8.0, 17.0, 8.0, 12.0, 4.0, 4.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3623046875, -0.35105133056640625, -0.3397979736328125, -0.32854461669921875, -0.317291259765625, -0.30603790283203125, -0.2947845458984375, -0.28353118896484375, -0.27227783203125, -0.26102447509765625, -0.2497711181640625, -0.23851776123046875, -0.227264404296875, -0.21601104736328125, -0.2047576904296875, -0.19350433349609375, -0.1822509765625, -0.17099761962890625, -0.1597442626953125, -0.14849090576171875, -0.137237548828125, -0.12598419189453125, -0.1147308349609375, -0.10347747802734375, -0.09222412109375, -0.08097076416015625, -0.0697174072265625, -0.05846405029296875, -0.047210693359375, -0.03595733642578125, -0.0247039794921875, -0.01345062255859375, -0.002197265625, 0.00905609130859375, 0.0203094482421875, 0.03156280517578125, 0.042816162109375, 0.05406951904296875, 0.0653228759765625, 0.07657623291015625, 0.08782958984375, 0.09908294677734375, 0.1103363037109375, 0.12158966064453125, 0.132843017578125, 0.14409637451171875, 0.1553497314453125, 0.16660308837890625, 0.1778564453125, 0.18910980224609375, 0.2003631591796875, 0.21161651611328125, 0.222869873046875, 0.23412322998046875, 0.2453765869140625, 0.25662994384765625, 0.26788330078125, 0.27913665771484375, 0.2903900146484375, 0.30164337158203125, 0.312896728515625, 0.32415008544921875, 0.3354034423828125, 0.34665679931640625, 0.35791015625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 446.0, 461.0, 50.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0415981188416481, -0.03640041500329971, -0.031202707439661026, -0.026005001738667488, -0.02080729603767395, -0.015609590336680412, -0.010411884635686874, -0.005214177072048187, -1.6473233699798584e-05, 0.005181232467293739, 0.010378938168287277, 0.015576643869280815, 0.020774349570274353, 0.02597205527126789, 0.03116976097226143, 0.036367468535900116, 0.041565172374248505, 0.04676287621259689, 0.05196058377623558, 0.05715829133987427, 0.062355995178222656, 0.06755369901657104, 0.07275140285491943, 0.07794911414384842, 0.08314681798219681, 0.0883445218205452, 0.09354223310947418, 0.09873993694782257, 0.10393764078617096, 0.10913534462451935, 0.11433304846286774, 0.11953075975179672, 0.12472847104072571, 0.1299261748790741, 0.13512387871742249, 0.14032158255577087, 0.14551928639411926, 0.15071700513362885, 0.15591470897197723, 0.16111241281032562, 0.166310116648674, 0.1715078204870224, 0.1767055243253708, 0.18190322816371918, 0.18710094690322876, 0.19229865074157715, 0.19749635457992554, 0.20269405841827393, 0.20789176225662231, 0.2130894660949707, 0.2182871699333191, 0.22348487377166748, 0.22868257761001587, 0.23388029634952545, 0.23907800018787384, 0.24427570402622223, 0.24947340786457062, 0.2546711266040802, 0.2598688304424286, 0.265066534280777, 0.27026423811912537, 0.27546194195747375, 0.28065964579582214, 0.28585734963417053, 0.2910550534725189]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 13.0, 8.0, 13.0, 13.0, 16.0, 19.0, 18.0, 30.0, 31.0, 37.0, 34.0, 35.0, 40.0, 45.0, 47.0, 46.0, 38.0, 44.0, 51.0, 53.0, 41.0, 46.0, 39.0, 31.0, 21.0, 23.0, 24.0, 29.0, 19.0, 18.0, 16.0, 8.0, 4.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021617889404296875, -0.020996319130063057, -0.02037474885582924, -0.01975317858159542, -0.019131608307361603, -0.018510038033127785, -0.017888467758893967, -0.01726689748466015, -0.01664532721042633, -0.016023756936192513, -0.015402186661958694, -0.014780616387724876, -0.014159046113491058, -0.01353747583925724, -0.012915905565023422, -0.012294335290789604, -0.011672765016555786, -0.011051194742321968, -0.01042962446808815, -0.009808054193854332, -0.009186483919620514, -0.008564913645386696, -0.007943343371152878, -0.00732177309691906, -0.006700202822685242, -0.006078632548451424, -0.005457062274217606, -0.0048354919999837875, -0.0042139217257499695, -0.0035923514515161514, -0.0029707811772823334, -0.0023492109030485153, -0.0017276406288146973, -0.0011060703545808792, -0.00048450008034706116, 0.0001370701938867569, 0.000758640468120575, 0.001380210742354393, 0.002001781016588211, 0.002623351290822029, 0.003244921565055847, 0.0038664918392896652, 0.004488062113523483, 0.005109632387757301, 0.005731202661991119, 0.0063527729362249374, 0.0069743432104587555, 0.0075959134846925735, 0.008217483758926392, 0.00883905403316021, 0.009460624307394028, 0.010082194581627846, 0.010703764855861664, 0.011325335130095482, 0.0119469054043293, 0.012568475678563118, 0.013190045952796936, 0.013811616227030754, 0.014433186501264572, 0.01505475677549839, 0.015676327049732208, 0.016297897323966026, 0.016919467598199844, 0.017541037872433662, 0.01816260814666748]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 10.0, 12.0, 14.0, 15.0, 19.0, 19.0, 35.0, 21.0, 27.0, 36.0, 30.0, 54.0, 41.0, 54.0, 38.0, 66.0, 39.0, 36.0, 46.0, 35.0, 33.0, 38.0, 29.0, 31.0, 27.0, 25.0, 28.0, 11.0, 19.0, 18.0, 15.0, 11.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.375, -14.84765625, -14.3203125, -13.79296875, -13.265625, -12.73828125, -12.2109375, -11.68359375, -11.15625, -10.62890625, -10.1015625, -9.57421875, -9.046875, -8.51953125, -7.9921875, -7.46484375, -6.9375, -6.41015625, -5.8828125, -5.35546875, -4.828125, -4.30078125, -3.7734375, -3.24609375, -2.71875, -2.19140625, -1.6640625, -1.13671875, -0.609375, -0.08203125, 0.4453125, 0.97265625, 1.5, 2.02734375, 2.5546875, 3.08203125, 3.609375, 4.13671875, 4.6640625, 5.19140625, 5.71875, 6.24609375, 6.7734375, 7.30078125, 7.828125, 8.35546875, 8.8828125, 9.41015625, 9.9375, 10.46484375, 10.9921875, 11.51953125, 12.046875, 12.57421875, 13.1015625, 13.62890625, 14.15625, 14.68359375, 15.2109375, 15.73828125, 16.265625, 16.79296875, 17.3203125, 17.84765625, 18.375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 14.0, 18.0, 17.0, 26.0, 26.0, 33.0, 46.0, 60.0, 91.0, 126.0, 176.0, 263.0, 402.0, 604.0, 1109.0, 2096.0, 4891.0, 16219.0, 202429.0, 781536.0, 25821.0, 6502.0, 2583.0, 1268.0, 717.0, 444.0, 282.0, 207.0, 142.0, 96.0, 64.0, 55.0, 30.0, 37.0, 23.0, 20.0, 17.0, 11.0, 11.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.75, -35.48876953125, -34.2275390625, -32.96630859375, -31.705078125, -30.44384765625, -29.1826171875, -27.92138671875, -26.66015625, -25.39892578125, -24.1376953125, -22.87646484375, -21.615234375, -20.35400390625, -19.0927734375, -17.83154296875, -16.5703125, -15.30908203125, -14.0478515625, -12.78662109375, -11.525390625, -10.26416015625, -9.0029296875, -7.74169921875, -6.48046875, -5.21923828125, -3.9580078125, -2.69677734375, -1.435546875, -0.17431640625, 1.0869140625, 2.34814453125, 3.609375, 4.87060546875, 6.1318359375, 7.39306640625, 8.654296875, 9.91552734375, 11.1767578125, 12.43798828125, 13.69921875, 14.96044921875, 16.2216796875, 17.48291015625, 18.744140625, 20.00537109375, 21.2666015625, 22.52783203125, 23.7890625, 25.05029296875, 26.3115234375, 27.57275390625, 28.833984375, 30.09521484375, 31.3564453125, 32.61767578125, 33.87890625, 35.14013671875, 36.4013671875, 37.66259765625, 38.923828125, 40.18505859375, 41.4462890625, 42.70751953125, 43.96875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 2.0, 7.0, 8.0, 3.0, 11.0, 8.0, 11.0, 10.0, 19.0, 16.0, 15.0, 22.0, 29.0, 21.0, 31.0, 42.0, 37.0, 38.0, 44.0, 69.0, 92.0, 1605.0, 382.0, 100.0, 52.0, 44.0, 35.0, 36.0, 30.0, 30.0, 32.0, 26.0, 22.0, 20.0, 26.0, 21.0, 13.0, 12.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5625, -35.341796875, -34.12109375, -32.900390625, -31.6796875, -30.458984375, -29.23828125, -28.017578125, -26.796875, -25.576171875, -24.35546875, -23.134765625, -21.9140625, -20.693359375, -19.47265625, -18.251953125, -17.03125, -15.810546875, -14.58984375, -13.369140625, -12.1484375, -10.927734375, -9.70703125, -8.486328125, -7.265625, -6.044921875, -4.82421875, -3.603515625, -2.3828125, -1.162109375, 0.05859375, 1.279296875, 2.5, 3.720703125, 4.94140625, 6.162109375, 7.3828125, 8.603515625, 9.82421875, 11.044921875, 12.265625, 13.486328125, 14.70703125, 15.927734375, 17.1484375, 18.369140625, 19.58984375, 20.810546875, 22.03125, 23.251953125, 24.47265625, 25.693359375, 26.9140625, 28.134765625, 29.35546875, 30.576171875, 31.796875, 33.017578125, 34.23828125, 35.458984375, 36.6796875, 37.900390625, 39.12109375, 40.341796875, 41.5625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 1.0, 12.0, 5.0, 10.0, 12.0, 16.0, 20.0, 32.0, 24.0, 15.0, 40.0, 37.0, 57.0, 47.0, 82.0, 140.0, 265.0, 747.0, 4257.0, 125838.0, 3002292.0, 9512.0, 1250.0, 332.0, 173.0, 108.0, 66.0, 64.0, 44.0, 22.0, 26.0, 16.0, 17.0, 17.0, 20.0, 14.0, 9.0, 12.0, 9.0, 8.0, 5.0, 4.0, 7.0, 1.0, 6.0, 1.0, 2.0, 4.0], "bins": [-107.4375, -104.4677734375, -101.498046875, -98.5283203125, -95.55859375, -92.5888671875, -89.619140625, -86.6494140625, -83.6796875, -80.7099609375, -77.740234375, -74.7705078125, -71.80078125, -68.8310546875, -65.861328125, -62.8916015625, -59.921875, -56.9521484375, -53.982421875, -51.0126953125, -48.04296875, -45.0732421875, -42.103515625, -39.1337890625, -36.1640625, -33.1943359375, -30.224609375, -27.2548828125, -24.28515625, -21.3154296875, -18.345703125, -15.3759765625, -12.40625, -9.4365234375, -6.466796875, -3.4970703125, -0.52734375, 2.4423828125, 5.412109375, 8.3818359375, 11.3515625, 14.3212890625, 17.291015625, 20.2607421875, 23.23046875, 26.2001953125, 29.169921875, 32.1396484375, 35.109375, 38.0791015625, 41.048828125, 44.0185546875, 46.98828125, 49.9580078125, 52.927734375, 55.8974609375, 58.8671875, 61.8369140625, 64.806640625, 67.7763671875, 70.74609375, 73.7158203125, 76.685546875, 79.6552734375, 82.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 18.0, 19.0, 52.0, 95.0, 171.0, 178.0, 191.0, 116.0, 73.0, 42.0, 30.0, 8.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.6999626159668, -51.271575927734375, -49.84318923950195, -48.41480255126953, -46.986419677734375, -45.55803298950195, -44.12964630126953, -42.70125961303711, -41.27287292480469, -39.844486236572266, -38.416099548339844, -36.98771286010742, -35.559326171875, -34.130943298339844, -32.70255661010742, -31.274169921875, -29.845783233642578, -28.417396545410156, -26.989009857177734, -25.560625076293945, -24.132238388061523, -22.7038516998291, -21.275466918945312, -19.84708023071289, -18.41869354248047, -16.990306854248047, -15.561921119689941, -14.133535385131836, -12.705148696899414, -11.276762008666992, -9.848376274108887, -8.419990539550781, -6.991600036621094, -5.56321382522583, -4.134827613830566, -2.7064414024353027, -1.278055191040039, 0.1503310203552246, 1.5787172317504883, 3.0071029663085938, 4.435489654541016, 5.863875865936279, 7.292262077331543, 8.720647811889648, 10.14903450012207, 11.577421188354492, 13.005806922912598, 14.434192657470703, 15.862579345703125, 17.290966033935547, 18.71935272216797, 20.147737503051758, 21.57612419128418, 23.0045108795166, 24.43289566040039, 25.861282348632812, 27.289669036865234, 28.718055725097656, 30.146442413330078, 31.574827194213867, 33.003211975097656, 34.43159866333008, 35.8599853515625, 37.28837203979492, 38.716758728027344]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 13.0, 3.0, 17.0, 17.0, 9.0, 19.0, 20.0, 24.0, 25.0, 27.0, 24.0, 32.0, 51.0, 33.0, 50.0, 42.0, 60.0, 58.0, 49.0, 48.0, 56.0, 37.0, 45.0, 35.0, 33.0, 30.0, 18.0, 24.0, 24.0, 17.0, 18.0, 11.0, 7.0, 4.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.44855499267578, -112.91067504882812, -109.37279510498047, -105.83491516113281, -102.29703521728516, -98.7591552734375, -95.22127532958984, -91.68339538574219, -88.14551544189453, -84.60763549804688, -81.06975555419922, -77.53187561035156, -73.9939956665039, -70.45611572265625, -66.9182357788086, -63.38035583496094, -59.84247589111328, -56.304595947265625, -52.76671600341797, -49.22883605957031, -45.690956115722656, -42.153076171875, -38.615196228027344, -35.07731628417969, -31.53943634033203, -28.001556396484375, -24.46367645263672, -20.925796508789062, -17.387916564941406, -13.85003662109375, -10.312156677246094, -6.7742767333984375, -3.2363967895507812, 0.301483154296875, 3.8393630981445312, 7.3772430419921875, 10.915122985839844, 14.4530029296875, 17.990882873535156, 21.528762817382812, 25.06664276123047, 28.604522705078125, 32.14240264892578, 35.68028259277344, 39.218162536621094, 42.75604248046875, 46.293922424316406, 49.83180236816406, 53.36968231201172, 56.907562255859375, 60.44544219970703, 63.98332214355469, 67.52120208740234, 71.05908203125, 74.59696197509766, 78.13484191894531, 81.67272186279297, 85.21060180664062, 88.74848175048828, 92.28636169433594, 95.8242416381836, 99.36212158203125, 102.9000015258789, 106.43788146972656, 109.97576141357422]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 9.0, 8.0, 8.0, 18.0, 18.0, 15.0, 22.0, 25.0, 26.0, 25.0, 34.0, 30.0, 58.0, 43.0, 52.0, 56.0, 57.0, 41.0, 35.0, 40.0, 39.0, 33.0, 30.0, 39.0, 34.0, 31.0, 21.0, 18.0, 25.0, 22.0, 15.0, 9.0, 8.0, 12.0, 5.0, 8.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.1717529296875, -14.632568359375, -14.0933837890625, -13.55419921875, -13.0150146484375, -12.475830078125, -11.9366455078125, -11.3974609375, -10.8582763671875, -10.319091796875, -9.7799072265625, -9.24072265625, -8.7015380859375, -8.162353515625, -7.6231689453125, -7.083984375, -6.5447998046875, -6.005615234375, -5.4664306640625, -4.92724609375, -4.3880615234375, -3.848876953125, -3.3096923828125, -2.7705078125, -2.2313232421875, -1.692138671875, -1.1529541015625, -0.61376953125, -0.0745849609375, 0.464599609375, 1.0037841796875, 1.54296875, 2.0821533203125, 2.621337890625, 3.1605224609375, 3.69970703125, 4.2388916015625, 4.778076171875, 5.3172607421875, 5.8564453125, 6.3956298828125, 6.934814453125, 7.4739990234375, 8.01318359375, 8.5523681640625, 9.091552734375, 9.6307373046875, 10.169921875, 10.7091064453125, 11.248291015625, 11.7874755859375, 12.32666015625, 12.8658447265625, 13.405029296875, 13.9442138671875, 14.4833984375, 15.0225830078125, 15.561767578125, 16.1009521484375, 16.64013671875, 17.1793212890625, 17.718505859375, 18.2576904296875, 18.796875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 17.0, 19.0, 35.0, 43.0, 60.0, 78.0, 131.0, 211.0, 235.0, 401.0, 577.0, 762.0, 1144.0, 1702.0, 2490.0, 3921.0, 6220.0, 10670.0, 21423.0, 125635.0, 2499357.0, 1402652.0, 72797.0, 17484.0, 9533.0, 5612.0, 3583.0, 2280.0, 1575.0, 1058.0, 763.0, 498.0, 373.0, 291.0, 181.0, 124.0, 92.0, 79.0, 43.0, 29.0, 26.0, 24.0, 19.0, 5.0, 14.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.4375, -36.14208984375, -34.8466796875, -33.55126953125, -32.255859375, -30.96044921875, -29.6650390625, -28.36962890625, -27.07421875, -25.77880859375, -24.4833984375, -23.18798828125, -21.892578125, -20.59716796875, -19.3017578125, -18.00634765625, -16.7109375, -15.41552734375, -14.1201171875, -12.82470703125, -11.529296875, -10.23388671875, -8.9384765625, -7.64306640625, -6.34765625, -5.05224609375, -3.7568359375, -2.46142578125, -1.166015625, 0.12939453125, 1.4248046875, 2.72021484375, 4.015625, 5.31103515625, 6.6064453125, 7.90185546875, 9.197265625, 10.49267578125, 11.7880859375, 13.08349609375, 14.37890625, 15.67431640625, 16.9697265625, 18.26513671875, 19.560546875, 20.85595703125, 22.1513671875, 23.44677734375, 24.7421875, 26.03759765625, 27.3330078125, 28.62841796875, 29.923828125, 31.21923828125, 32.5146484375, 33.81005859375, 35.10546875, 36.40087890625, 37.6962890625, 38.99169921875, 40.287109375, 41.58251953125, 42.8779296875, 44.17333984375, 45.46875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 10.0, 13.0, 21.0, 25.0, 29.0, 30.0, 43.0, 109.0, 228.0, 451.0, 899.0, 1006.0, 576.0, 267.0, 124.0, 46.0, 41.0, 22.0, 17.0, 17.0, 10.0, 19.0, 10.0, 6.0, 5.0, 5.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-38.9375, -37.7978515625, -36.658203125, -35.5185546875, -34.37890625, -33.2392578125, -32.099609375, -30.9599609375, -29.8203125, -28.6806640625, -27.541015625, -26.4013671875, -25.26171875, -24.1220703125, -22.982421875, -21.8427734375, -20.703125, -19.5634765625, -18.423828125, -17.2841796875, -16.14453125, -15.0048828125, -13.865234375, -12.7255859375, -11.5859375, -10.4462890625, -9.306640625, -8.1669921875, -7.02734375, -5.8876953125, -4.748046875, -3.6083984375, -2.46875, -1.3291015625, -0.189453125, 0.9501953125, 2.08984375, 3.2294921875, 4.369140625, 5.5087890625, 6.6484375, 7.7880859375, 8.927734375, 10.0673828125, 11.20703125, 12.3466796875, 13.486328125, 14.6259765625, 15.765625, 16.9052734375, 18.044921875, 19.1845703125, 20.32421875, 21.4638671875, 22.603515625, 23.7431640625, 24.8828125, 26.0224609375, 27.162109375, 28.3017578125, 29.44140625, 30.5810546875, 31.720703125, 32.8603515625, 34.0]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 7.0, 8.0, 27.0, 30.0, 65.0, 83.0, 152.0, 287.0, 456.0, 891.0, 1724.0, 3470.0, 8036.0, 22015.0, 96617.0, 3747038.0, 260475.0, 32777.0, 10853.0, 4566.0, 2206.0, 1084.0, 621.0, 333.0, 163.0, 104.0, 62.0, 46.0, 21.0, 14.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.5, -74.083984375, -71.66796875, -69.251953125, -66.8359375, -64.419921875, -62.00390625, -59.587890625, -57.171875, -54.755859375, -52.33984375, -49.923828125, -47.5078125, -45.091796875, -42.67578125, -40.259765625, -37.84375, -35.427734375, -33.01171875, -30.595703125, -28.1796875, -25.763671875, -23.34765625, -20.931640625, -18.515625, -16.099609375, -13.68359375, -11.267578125, -8.8515625, -6.435546875, -4.01953125, -1.603515625, 0.8125, 3.228515625, 5.64453125, 8.060546875, 10.4765625, 12.892578125, 15.30859375, 17.724609375, 20.140625, 22.556640625, 24.97265625, 27.388671875, 29.8046875, 32.220703125, 34.63671875, 37.052734375, 39.46875, 41.884765625, 44.30078125, 46.716796875, 49.1328125, 51.548828125, 53.96484375, 56.380859375, 58.796875, 61.212890625, 63.62890625, 66.044921875, 68.4609375, 70.876953125, 73.29296875, 75.708984375, 78.125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 50.0, 829.0, 127.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1635.44873046875, -1597.9898681640625, -1560.531005859375, -1523.072265625, -1485.6134033203125, -1448.154541015625, -1410.69580078125, -1373.2369384765625, -1335.778076171875, -1298.3192138671875, -1260.8603515625, -1223.401611328125, -1185.9427490234375, -1148.48388671875, -1111.025146484375, -1073.5662841796875, -1036.107421875, -998.6485595703125, -961.1897583007812, -923.73095703125, -886.2720947265625, -848.813232421875, -811.3544311523438, -773.8956298828125, -736.436767578125, -698.9779052734375, -661.5191040039062, -624.060302734375, -586.6014404296875, -549.142578125, -511.68377685546875, -474.2249450683594, -436.7659912109375, -399.3071594238281, -361.84832763671875, -324.3894958496094, -286.9306640625, -249.47183227539062, -212.01300048828125, -174.55416870117188, -137.0953369140625, -99.63650512695312, -62.17767333984375, -24.718841552734375, 12.739990234375, 50.198822021484375, 87.65765380859375, 125.11648559570312, 162.5753173828125, 200.03414916992188, 237.49298095703125, 274.9518127441406, 312.41064453125, 349.8694763183594, 387.32830810546875, 424.7871398925781, 462.2459716796875, 499.7048034667969, 537.1636352539062, 574.6224365234375, 612.081298828125, 649.5401611328125, 686.9989624023438, 724.457763671875, 761.9166259765625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 1.0, 13.0, 15.0, 24.0, 11.0, 22.0, 20.0, 20.0, 23.0, 25.0, 28.0, 40.0, 34.0, 36.0, 45.0, 39.0, 50.0, 38.0, 44.0, 36.0, 42.0, 48.0, 31.0, 42.0, 24.0, 28.0, 37.0, 35.0, 20.0, 30.0, 20.0, 17.0, 14.0, 19.0, 10.0, 7.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.83078002929688, -72.99639129638672, -70.16200256347656, -67.32760620117188, -64.49321746826172, -61.65882873535156, -58.824440002441406, -55.99005126953125, -53.15565872192383, -50.32126998901367, -47.48687744140625, -44.652488708496094, -41.81809997558594, -38.983707427978516, -36.14931869506836, -33.31492614746094, -30.48053741455078, -27.646146774291992, -24.811756134033203, -21.977367401123047, -19.142976760864258, -16.30858612060547, -13.474197387695312, -10.639806747436523, -7.805416107177734, -4.9710259437561035, -2.1366357803344727, 0.69775390625, 3.532144546508789, 6.366535186767578, 9.200923919677734, 12.035314559936523, 14.869705200195312, 17.7040958404541, 20.53848648071289, 23.372875213623047, 26.207265853881836, 29.041656494140625, 31.87604522705078, 34.71043395996094, 37.54482650756836, 40.379215240478516, 43.21360778808594, 46.047996520996094, 48.88238525390625, 51.71677780151367, 54.55116653442383, 57.38555908203125, 60.219947814941406, 63.05433654785156, 65.88872528076172, 68.72311401367188, 71.55751037597656, 74.39189910888672, 77.22628784179688, 80.06067657470703, 82.89506530761719, 85.72945404052734, 88.5638427734375, 91.39823913574219, 94.23262786865234, 97.0670166015625, 99.90140533447266, 102.73579406738281, 105.5701904296875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 4.0, 11.0, 6.0, 15.0, 21.0, 15.0, 26.0, 28.0, 38.0, 34.0, 36.0, 38.0, 41.0, 56.0, 47.0, 48.0, 41.0, 55.0, 37.0, 34.0, 37.0, 29.0, 29.0, 34.0, 31.0, 33.0, 20.0, 24.0, 25.0, 18.0, 17.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.0, -16.428955078125, -15.85791015625, -15.286865234375, -14.7158203125, -14.144775390625, -13.57373046875, -13.002685546875, -12.431640625, -11.860595703125, -11.28955078125, -10.718505859375, -10.1474609375, -9.576416015625, -9.00537109375, -8.434326171875, -7.86328125, -7.292236328125, -6.72119140625, -6.150146484375, -5.5791015625, -5.008056640625, -4.43701171875, -3.865966796875, -3.294921875, -2.723876953125, -2.15283203125, -1.581787109375, -1.0107421875, -0.439697265625, 0.13134765625, 0.702392578125, 1.2734375, 1.844482421875, 2.41552734375, 2.986572265625, 3.5576171875, 4.128662109375, 4.69970703125, 5.270751953125, 5.841796875, 6.412841796875, 6.98388671875, 7.554931640625, 8.1259765625, 8.697021484375, 9.26806640625, 9.839111328125, 10.41015625, 10.981201171875, 11.55224609375, 12.123291015625, 12.6943359375, 13.265380859375, 13.83642578125, 14.407470703125, 14.978515625, 15.549560546875, 16.12060546875, 16.691650390625, 17.2626953125, 17.833740234375, 18.40478515625, 18.975830078125, 19.546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 15.0, 18.0, 46.0, 48.0, 71.0, 124.0, 168.0, 230.0, 381.0, 638.0, 940.0, 1517.0, 2458.0, 4013.0, 6551.0, 10620.0, 18128.0, 30339.0, 52715.0, 94724.0, 175377.0, 249634.0, 175765.0, 95123.0, 52520.0, 30402.0, 18007.0, 10777.0, 6476.0, 3963.0, 2450.0, 1579.0, 988.0, 605.0, 415.0, 219.0, 171.0, 93.0, 70.0, 43.0, 45.0, 32.0, 17.0, 13.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-1.732421875, -1.6807098388671875, -1.628997802734375, -1.5772857666015625, -1.52557373046875, -1.4738616943359375, -1.422149658203125, -1.3704376220703125, -1.3187255859375, -1.2670135498046875, -1.215301513671875, -1.1635894775390625, -1.11187744140625, -1.0601654052734375, -1.008453369140625, -0.9567413330078125, -0.905029296875, -0.8533172607421875, -0.801605224609375, -0.7498931884765625, -0.69818115234375, -0.6464691162109375, -0.594757080078125, -0.5430450439453125, -0.4913330078125, -0.4396209716796875, -0.387908935546875, -0.3361968994140625, -0.28448486328125, -0.2327728271484375, -0.181060791015625, -0.1293487548828125, -0.07763671875, -0.0259246826171875, 0.025787353515625, 0.0774993896484375, 0.12921142578125, 0.1809234619140625, 0.232635498046875, 0.2843475341796875, 0.3360595703125, 0.3877716064453125, 0.439483642578125, 0.4911956787109375, 0.54290771484375, 0.5946197509765625, 0.646331787109375, 0.6980438232421875, 0.749755859375, 0.8014678955078125, 0.853179931640625, 0.9048919677734375, 0.95660400390625, 1.0083160400390625, 1.060028076171875, 1.1117401123046875, 1.1634521484375, 1.2151641845703125, 1.266876220703125, 1.3185882568359375, 1.37030029296875, 1.4220123291015625, 1.473724365234375, 1.5254364013671875, 1.5771484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 2.0, 11.0, 11.0, 8.0, 10.0, 8.0, 16.0, 14.0, 19.0, 13.0, 23.0, 18.0, 21.0, 20.0, 29.0, 32.0, 26.0, 38.0, 35.0, 38.0, 44.0, 39.0, 1053.0, 42.0, 48.0, 35.0, 28.0, 31.0, 34.0, 31.0, 27.0, 24.0, 24.0, 23.0, 15.0, 18.0, 12.0, 6.0, 18.0, 22.0, 18.0, 9.0, 7.0, 6.0, 8.0, 1.0, 2.0, 1.0, 4.0], "bins": [-11.2734375, -10.9713134765625, -10.669189453125, -10.3670654296875, -10.06494140625, -9.7628173828125, -9.460693359375, -9.1585693359375, -8.8564453125, -8.5543212890625, -8.252197265625, -7.9500732421875, -7.64794921875, -7.3458251953125, -7.043701171875, -6.7415771484375, -6.439453125, -6.1373291015625, -5.835205078125, -5.5330810546875, -5.23095703125, -4.9288330078125, -4.626708984375, -4.3245849609375, -4.0224609375, -3.7203369140625, -3.418212890625, -3.1160888671875, -2.81396484375, -2.5118408203125, -2.209716796875, -1.9075927734375, -1.60546875, -1.3033447265625, -1.001220703125, -0.6990966796875, -0.39697265625, -0.0948486328125, 0.207275390625, 0.5093994140625, 0.8115234375, 1.1136474609375, 1.415771484375, 1.7178955078125, 2.02001953125, 2.3221435546875, 2.624267578125, 2.9263916015625, 3.228515625, 3.5306396484375, 3.832763671875, 4.1348876953125, 4.43701171875, 4.7391357421875, 5.041259765625, 5.3433837890625, 5.6455078125, 5.9476318359375, 6.249755859375, 6.5518798828125, 6.85400390625, 7.1561279296875, 7.458251953125, 7.7603759765625, 8.0625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 13.0, 27.0, 27.0, 34.0, 54.0, 81.0, 141.0, 220.0, 343.0, 522.0, 837.0, 1266.0, 1989.0, 3107.0, 4716.0, 7361.0, 11002.0, 16892.0, 26878.0, 43223.0, 72961.0, 125473.0, 556828.0, 901353.0, 127222.0, 74001.0, 44220.0, 27248.0, 17078.0, 11029.0, 7285.0, 4732.0, 3177.0, 2074.0, 1339.0, 846.0, 586.0, 334.0, 215.0, 145.0, 72.0, 57.0, 37.0, 35.0, 14.0, 13.0, 9.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.0029296875, -0.9716033935546875, -0.940277099609375, -0.9089508056640625, -0.87762451171875, -0.8462982177734375, -0.814971923828125, -0.7836456298828125, -0.7523193359375, -0.7209930419921875, -0.689666748046875, -0.6583404541015625, -0.62701416015625, -0.5956878662109375, -0.564361572265625, -0.5330352783203125, -0.501708984375, -0.4703826904296875, -0.439056396484375, -0.4077301025390625, -0.37640380859375, -0.3450775146484375, -0.313751220703125, -0.2824249267578125, -0.2510986328125, -0.2197723388671875, -0.188446044921875, -0.1571197509765625, -0.12579345703125, -0.0944671630859375, -0.063140869140625, -0.0318145751953125, -0.00048828125, 0.0308380126953125, 0.062164306640625, 0.0934906005859375, 0.12481689453125, 0.1561431884765625, 0.187469482421875, 0.2187957763671875, 0.2501220703125, 0.2814483642578125, 0.312774658203125, 0.3441009521484375, 0.37542724609375, 0.4067535400390625, 0.438079833984375, 0.4694061279296875, 0.500732421875, 0.5320587158203125, 0.563385009765625, 0.5947113037109375, 0.62603759765625, 0.6573638916015625, 0.688690185546875, 0.7200164794921875, 0.7513427734375, 0.7826690673828125, 0.813995361328125, 0.8453216552734375, 0.87664794921875, 0.9079742431640625, 0.939300537109375, 0.9706268310546875, 1.001953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 7.0, 8.0, 18.0, 20.0, 19.0, 26.0, 32.0, 30.0, 40.0, 55.0, 66.0, 95.0, 104.0, 121.0, 81.0, 52.0, 35.0, 35.0, 33.0, 26.0, 20.0, 15.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04522705078125, -0.043990135192871094, -0.04275321960449219, -0.04151630401611328, -0.040279388427734375, -0.03904247283935547, -0.03780555725097656, -0.036568641662597656, -0.03533172607421875, -0.034094810485839844, -0.03285789489746094, -0.03162097930908203, -0.030384063720703125, -0.02914714813232422, -0.027910232543945312, -0.026673316955566406, -0.0254364013671875, -0.024199485778808594, -0.022962570190429688, -0.02172565460205078, -0.020488739013671875, -0.01925182342529297, -0.018014907836914062, -0.016777992248535156, -0.01554107666015625, -0.014304161071777344, -0.013067245483398438, -0.011830329895019531, -0.010593414306640625, -0.009356498718261719, -0.008119583129882812, -0.006882667541503906, -0.005645751953125, -0.004408836364746094, -0.0031719207763671875, -0.0019350051879882812, -0.000698089599609375, 0.0005388259887695312, 0.0017757415771484375, 0.0030126571655273438, 0.00424957275390625, 0.005486488342285156, 0.0067234039306640625, 0.007960319519042969, 0.009197235107421875, 0.010434150695800781, 0.011671066284179688, 0.012907981872558594, 0.0141448974609375, 0.015381813049316406, 0.016618728637695312, 0.01785564422607422, 0.019092559814453125, 0.02032947540283203, 0.021566390991210938, 0.022803306579589844, 0.02404022216796875, 0.025277137756347656, 0.026514053344726562, 0.02775096893310547, 0.028987884521484375, 0.03022480010986328, 0.03146171569824219, 0.032698631286621094, 0.033935546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 11.0, 11.0, 9.0, 13.0, 15.0, 12.0, 25.0, 30.0, 39.0, 72.0, 97.0, 132.0, 274.0, 647.0, 9911.0, 1032676.0, 3327.0, 549.0, 221.0, 127.0, 90.0, 68.0, 47.0, 41.0, 28.0, 22.0, 14.0, 9.0, 6.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.67181396484375, -0.6463623046875, -0.62091064453125, -0.595458984375, -0.57000732421875, -0.5445556640625, -0.51910400390625, -0.49365234375, -0.46820068359375, -0.4427490234375, -0.41729736328125, -0.391845703125, -0.36639404296875, -0.3409423828125, -0.31549072265625, -0.2900390625, -0.26458740234375, -0.2391357421875, -0.21368408203125, -0.188232421875, -0.16278076171875, -0.1373291015625, -0.11187744140625, -0.08642578125, -0.06097412109375, -0.0355224609375, -0.01007080078125, 0.015380859375, 0.04083251953125, 0.0662841796875, 0.09173583984375, 0.1171875, 0.14263916015625, 0.1680908203125, 0.19354248046875, 0.218994140625, 0.24444580078125, 0.2698974609375, 0.29534912109375, 0.32080078125, 0.34625244140625, 0.3717041015625, 0.39715576171875, 0.422607421875, 0.44805908203125, 0.4735107421875, 0.49896240234375, 0.5244140625, 0.54986572265625, 0.5753173828125, 0.60076904296875, 0.626220703125, 0.65167236328125, 0.6771240234375, 0.70257568359375, 0.72802734375, 0.75347900390625, 0.7789306640625, 0.80438232421875, 0.829833984375, 0.85528564453125, 0.8807373046875, 0.90618896484375, 0.931640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 27.0, 919.0, 65.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15368282794952393, -0.1356232464313507, -0.11756366491317749, -0.09950407594442368, -0.08144449442625046, -0.06338491290807724, -0.045325323939323425, -0.027265742421150208, -0.00920616090297699, 0.008853422477841377, 0.026913005858659744, 0.04497259110212326, 0.06303217262029648, 0.0810917541384697, 0.09915134310722351, 0.11721092462539673, 0.13527050614356995, 0.15333008766174316, 0.17138966917991638, 0.1894492506980896, 0.20750883221626282, 0.22556841373443604, 0.24362801015377045, 0.26168757677078247, 0.2797471880912781, 0.2978067696094513, 0.3158663511276245, 0.33392593264579773, 0.35198551416397095, 0.37004509568214417, 0.3881046772003174, 0.406164288520813, 0.4242238402366638, 0.44228342175483704, 0.46034300327301025, 0.47840258479118347, 0.4964621663093567, 0.5145217776298523, 0.5325813293457031, 0.5506409406661987, 0.5687004923820496, 0.5867601037025452, 0.604819655418396, 0.6228792667388916, 0.6409388184547424, 0.658998429775238, 0.6770579814910889, 0.6951175928115845, 0.7131772041320801, 0.7312368154525757, 0.7492963671684265, 0.7673559784889221, 0.785415530204773, 0.8034751415252686, 0.8215346932411194, 0.839594304561615, 0.8576538562774658, 0.8757134675979614, 0.8937730193138123, 0.9118326306343079, 0.9298921823501587, 0.9479517936706543, 0.9660113453865051, 0.9840709567070007, 1.0021305084228516]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 10.0, 16.0, 13.0, 15.0, 15.0, 23.0, 23.0, 22.0, 45.0, 37.0, 34.0, 40.0, 37.0, 46.0, 49.0, 45.0, 45.0, 46.0, 51.0, 30.0, 40.0, 31.0, 52.0, 31.0, 31.0, 29.0, 25.0, 22.0, 18.0, 15.0, 16.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05918377637863159, -0.05743154510855675, -0.0556793138384819, -0.05392708256840706, -0.052174851298332214, -0.05042262002825737, -0.048670388758182526, -0.04691815748810768, -0.04516592621803284, -0.04341369494795799, -0.04166146367788315, -0.039909232407808304, -0.03815700113773346, -0.036404769867658615, -0.03465253859758377, -0.032900307327508926, -0.031148076057434082, -0.029395844787359238, -0.027643613517284393, -0.02589138224720955, -0.024139150977134705, -0.02238691970705986, -0.020634688436985016, -0.01888245716691017, -0.017130225896835327, -0.015377994626760483, -0.013625763356685638, -0.011873532086610794, -0.01012130081653595, -0.008369069546461105, -0.006616838276386261, -0.004864607006311417, -0.0031123757362365723, -0.001360144466161728, 0.00039208680391311646, 0.002144318073987961, 0.003896549344062805, 0.0056487806141376495, 0.007401011884212494, 0.009153243154287338, 0.010905474424362183, 0.012657705694437027, 0.014409936964511871, 0.016162168234586716, 0.01791439950466156, 0.019666630774736404, 0.02141886204481125, 0.023171093314886093, 0.024923324584960938, 0.026675555855035782, 0.028427787125110626, 0.03018001839518547, 0.031932249665260315, 0.03368448093533516, 0.035436712205410004, 0.03718894347548485, 0.03894117474555969, 0.04069340601563454, 0.04244563728570938, 0.044197868555784225, 0.04595009982585907, 0.047702331095933914, 0.04945456236600876, 0.0512067936360836, 0.05295902490615845]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 4.0, 11.0, 6.0, 15.0, 21.0, 16.0, 25.0, 28.0, 38.0, 34.0, 36.0, 39.0, 41.0, 56.0, 46.0, 48.0, 40.0, 56.0, 37.0, 35.0, 36.0, 29.0, 30.0, 33.0, 31.0, 33.0, 20.0, 24.0, 25.0, 18.0, 17.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.0, -16.428955078125, -15.85791015625, -15.286865234375, -14.7158203125, -14.144775390625, -13.57373046875, -13.002685546875, -12.431640625, -11.860595703125, -11.28955078125, -10.718505859375, -10.1474609375, -9.576416015625, -9.00537109375, -8.434326171875, -7.86328125, -7.292236328125, -6.72119140625, -6.150146484375, -5.5791015625, -5.008056640625, -4.43701171875, -3.865966796875, -3.294921875, -2.723876953125, -2.15283203125, -1.581787109375, -1.0107421875, -0.439697265625, 0.13134765625, 0.702392578125, 1.2734375, 1.844482421875, 2.41552734375, 2.986572265625, 3.5576171875, 4.128662109375, 4.69970703125, 5.270751953125, 5.841796875, 6.412841796875, 6.98388671875, 7.554931640625, 8.1259765625, 8.697021484375, 9.26806640625, 9.839111328125, 10.41015625, 10.981201171875, 11.55224609375, 12.123291015625, 12.6943359375, 13.265380859375, 13.83642578125, 14.407470703125, 14.978515625, 15.549560546875, 16.12060546875, 16.691650390625, 17.2626953125, 17.833740234375, 18.40478515625, 18.975830078125, 19.546875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 11.0, 15.0, 32.0, 35.0, 44.0, 70.0, 62.0, 95.0, 148.0, 251.0, 395.0, 589.0, 953.0, 1624.0, 2853.0, 5709.0, 14598.0, 69026.0, 634492.0, 264938.0, 33080.0, 9590.0, 4166.0, 2164.0, 1310.0, 762.0, 508.0, 284.0, 204.0, 140.0, 113.0, 72.0, 69.0, 35.0, 23.0, 20.0, 17.0, 9.0, 10.0, 10.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.375, -22.563232421875, -21.75146484375, -20.939697265625, -20.1279296875, -19.316162109375, -18.50439453125, -17.692626953125, -16.880859375, -16.069091796875, -15.25732421875, -14.445556640625, -13.6337890625, -12.822021484375, -12.01025390625, -11.198486328125, -10.38671875, -9.574951171875, -8.76318359375, -7.951416015625, -7.1396484375, -6.327880859375, -5.51611328125, -4.704345703125, -3.892578125, -3.080810546875, -2.26904296875, -1.457275390625, -0.6455078125, 0.166259765625, 0.97802734375, 1.789794921875, 2.6015625, 3.413330078125, 4.22509765625, 5.036865234375, 5.8486328125, 6.660400390625, 7.47216796875, 8.283935546875, 9.095703125, 9.907470703125, 10.71923828125, 11.531005859375, 12.3427734375, 13.154541015625, 13.96630859375, 14.778076171875, 15.58984375, 16.401611328125, 17.21337890625, 18.025146484375, 18.8369140625, 19.648681640625, 20.46044921875, 21.272216796875, 22.083984375, 22.895751953125, 23.70751953125, 24.519287109375, 25.3310546875, 26.142822265625, 26.95458984375, 27.766357421875, 28.578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 13.0, 8.0, 16.0, 20.0, 25.0, 26.0, 18.0, 26.0, 44.0, 38.0, 41.0, 66.0, 70.0, 174.0, 1665.0, 231.0, 94.0, 62.0, 54.0, 36.0, 52.0, 37.0, 37.0, 28.0, 24.0, 24.0, 15.0, 17.0, 9.0, 11.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.625, -42.24560546875, -40.8662109375, -39.48681640625, -38.107421875, -36.72802734375, -35.3486328125, -33.96923828125, -32.58984375, -31.21044921875, -29.8310546875, -28.45166015625, -27.072265625, -25.69287109375, -24.3134765625, -22.93408203125, -21.5546875, -20.17529296875, -18.7958984375, -17.41650390625, -16.037109375, -14.65771484375, -13.2783203125, -11.89892578125, -10.51953125, -9.14013671875, -7.7607421875, -6.38134765625, -5.001953125, -3.62255859375, -2.2431640625, -0.86376953125, 0.515625, 1.89501953125, 3.2744140625, 4.65380859375, 6.033203125, 7.41259765625, 8.7919921875, 10.17138671875, 11.55078125, 12.93017578125, 14.3095703125, 15.68896484375, 17.068359375, 18.44775390625, 19.8271484375, 21.20654296875, 22.5859375, 23.96533203125, 25.3447265625, 26.72412109375, 28.103515625, 29.48291015625, 30.8623046875, 32.24169921875, 33.62109375, 35.00048828125, 36.3798828125, 37.75927734375, 39.138671875, 40.51806640625, 41.8974609375, 43.27685546875, 44.65625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 9.0, 17.0, 13.0, 20.0, 32.0, 51.0, 85.0, 114.0, 191.0, 334.0, 873.0, 4387.0, 146614.0, 2975866.0, 14228.0, 1722.0, 467.0, 222.0, 141.0, 95.0, 61.0, 53.0, 34.0, 22.0, 17.0, 11.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.1943359375, -63.763671875, -61.3330078125, -58.90234375, -56.4716796875, -54.041015625, -51.6103515625, -49.1796875, -46.7490234375, -44.318359375, -41.8876953125, -39.45703125, -37.0263671875, -34.595703125, -32.1650390625, -29.734375, -27.3037109375, -24.873046875, -22.4423828125, -20.01171875, -17.5810546875, -15.150390625, -12.7197265625, -10.2890625, -7.8583984375, -5.427734375, -2.9970703125, -0.56640625, 1.8642578125, 4.294921875, 6.7255859375, 9.15625, 11.5869140625, 14.017578125, 16.4482421875, 18.87890625, 21.3095703125, 23.740234375, 26.1708984375, 28.6015625, 31.0322265625, 33.462890625, 35.8935546875, 38.32421875, 40.7548828125, 43.185546875, 45.6162109375, 48.046875, 50.4775390625, 52.908203125, 55.3388671875, 57.76953125, 60.2001953125, 62.630859375, 65.0615234375, 67.4921875, 69.9228515625, 72.353515625, 74.7841796875, 77.21484375, 79.6455078125, 82.076171875, 84.5068359375, 86.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 338.0, 677.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.522544860839844, -45.73832702636719, -30.95410919189453, -16.169891357421875, -1.3856735229492188, 13.398544311523438, 28.182762145996094, 42.96697998046875, 57.751197814941406, 72.53541564941406, 87.31963348388672, 102.10385131835938, 116.88806915283203, 131.6722869873047, 146.45651245117188, 161.24072265625, 176.02493286132812, 190.80914306640625, 205.59336853027344, 220.37759399414062, 235.16180419921875, 249.94601440429688, 264.730224609375, 279.51446533203125, 294.2986755371094, 309.0828857421875, 323.86712646484375, 338.6513366699219, 353.435546875, 368.2197570800781, 383.00396728515625, 397.7882080078125, 412.57244873046875, 427.3566589355469, 442.140869140625, 456.92510986328125, 471.7093200683594, 486.4935302734375, 501.27777099609375, 516.0619506835938, 530.84619140625, 545.6304321289062, 560.4146118164062, 575.1988525390625, 589.9830322265625, 604.7672729492188, 619.551513671875, 634.335693359375, 649.1199340820312, 663.9041748046875, 678.6883544921875, 693.4725952148438, 708.2568359375, 723.041015625, 737.8252563476562, 752.6094360351562, 767.3936767578125, 782.1779174804688, 796.9620971679688, 811.746337890625, 826.530517578125, 841.3147583007812, 856.0989990234375, 870.8831787109375, 885.6674194335938]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 12.0, 5.0, 11.0, 15.0, 12.0, 26.0, 21.0, 17.0, 31.0, 31.0, 35.0, 31.0, 41.0, 37.0, 44.0, 41.0, 32.0, 43.0, 53.0, 43.0, 43.0, 35.0, 29.0, 34.0, 33.0, 38.0, 24.0, 32.0, 23.0, 20.0, 22.0, 14.0, 12.0, 11.0, 7.0, 6.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-98.87551879882812, -96.03118133544922, -93.18684387207031, -90.34249877929688, -87.49816131591797, -84.65382385253906, -81.80948638916016, -78.96514892578125, -76.12080383300781, -73.2764663696289, -70.43212890625, -67.58778381347656, -64.74344635009766, -61.89910888671875, -59.054771423339844, -56.21043395996094, -53.36609649658203, -50.521759033203125, -47.67741775512695, -44.83308029174805, -41.988739013671875, -39.14440155029297, -36.30006408691406, -33.455726623535156, -30.611385345458984, -27.767045974731445, -24.922706604003906, -22.078369140625, -19.23402976989746, -16.389690399169922, -13.545352935791016, -10.701013565063477, -7.8566741943359375, -5.012335300445557, -2.167996406555176, 0.6763420104980469, 3.520681381225586, 6.365020751953125, 9.209358215332031, 12.05369758605957, 14.89803695678711, 17.74237632751465, 20.586715698242188, 23.431053161621094, 26.275392532348633, 29.119731903076172, 31.964069366455078, 34.80841064453125, 37.652748107910156, 40.49708557128906, 43.341426849365234, 46.18576431274414, 49.03010559082031, 51.87444305419922, 54.718780517578125, 57.56311798095703, 60.4074592590332, 63.25179672241211, 66.09613800048828, 68.94047546386719, 71.7848129272461, 74.629150390625, 77.47349548339844, 80.31783294677734, 83.16217041015625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 2.0, 12.0, 8.0, 14.0, 16.0, 14.0, 17.0, 22.0, 40.0, 28.0, 37.0, 30.0, 41.0, 48.0, 39.0, 42.0, 49.0, 34.0, 47.0, 36.0, 49.0, 41.0, 38.0, 21.0, 41.0, 32.0, 15.0, 33.0, 22.0, 19.0, 15.0, 19.0, 15.0, 12.0, 8.0, 10.0, 7.0, 2.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.5, -15.9482421875, -15.396484375, -14.8447265625, -14.29296875, -13.7412109375, -13.189453125, -12.6376953125, -12.0859375, -11.5341796875, -10.982421875, -10.4306640625, -9.87890625, -9.3271484375, -8.775390625, -8.2236328125, -7.671875, -7.1201171875, -6.568359375, -6.0166015625, -5.46484375, -4.9130859375, -4.361328125, -3.8095703125, -3.2578125, -2.7060546875, -2.154296875, -1.6025390625, -1.05078125, -0.4990234375, 0.052734375, 0.6044921875, 1.15625, 1.7080078125, 2.259765625, 2.8115234375, 3.36328125, 3.9150390625, 4.466796875, 5.0185546875, 5.5703125, 6.1220703125, 6.673828125, 7.2255859375, 7.77734375, 8.3291015625, 8.880859375, 9.4326171875, 9.984375, 10.5361328125, 11.087890625, 11.6396484375, 12.19140625, 12.7431640625, 13.294921875, 13.8466796875, 14.3984375, 14.9501953125, 15.501953125, 16.0537109375, 16.60546875, 17.1572265625, 17.708984375, 18.2607421875, 18.8125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 8.0, 7.0, 18.0, 21.0, 45.0, 44.0, 73.0, 105.0, 160.0, 209.0, 356.0, 469.0, 679.0, 1018.0, 1522.0, 2263.0, 3494.0, 6048.0, 12584.0, 60364.0, 1718130.0, 2284184.0, 72465.0, 12715.0, 6125.0, 3715.0, 2447.0, 1598.0, 1102.0, 729.0, 497.0, 337.0, 221.0, 157.0, 103.0, 73.0, 59.0, 39.0, 21.0, 23.0, 14.0, 10.0, 11.0, 3.0, 0.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.75, -42.29345703125, -40.8369140625, -39.38037109375, -37.923828125, -36.46728515625, -35.0107421875, -33.55419921875, -32.09765625, -30.64111328125, -29.1845703125, -27.72802734375, -26.271484375, -24.81494140625, -23.3583984375, -21.90185546875, -20.4453125, -18.98876953125, -17.5322265625, -16.07568359375, -14.619140625, -13.16259765625, -11.7060546875, -10.24951171875, -8.79296875, -7.33642578125, -5.8798828125, -4.42333984375, -2.966796875, -1.51025390625, -0.0537109375, 1.40283203125, 2.859375, 4.31591796875, 5.7724609375, 7.22900390625, 8.685546875, 10.14208984375, 11.5986328125, 13.05517578125, 14.51171875, 15.96826171875, 17.4248046875, 18.88134765625, 20.337890625, 21.79443359375, 23.2509765625, 24.70751953125, 26.1640625, 27.62060546875, 29.0771484375, 30.53369140625, 31.990234375, 33.44677734375, 34.9033203125, 36.35986328125, 37.81640625, 39.27294921875, 40.7294921875, 42.18603515625, 43.642578125, 45.09912109375, 46.5556640625, 48.01220703125, 49.46875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 9.0, 13.0, 24.0, 24.0, 48.0, 77.0, 140.0, 330.0, 861.0, 1323.0, 645.0, 272.0, 98.0, 49.0, 38.0, 26.0, 13.0, 16.0, 9.0, 10.0, 4.0, 4.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.15625, -35.8896484375, -34.623046875, -33.3564453125, -32.08984375, -30.8232421875, -29.556640625, -28.2900390625, -27.0234375, -25.7568359375, -24.490234375, -23.2236328125, -21.95703125, -20.6904296875, -19.423828125, -18.1572265625, -16.890625, -15.6240234375, -14.357421875, -13.0908203125, -11.82421875, -10.5576171875, -9.291015625, -8.0244140625, -6.7578125, -5.4912109375, -4.224609375, -2.9580078125, -1.69140625, -0.4248046875, 0.841796875, 2.1083984375, 3.375, 4.6416015625, 5.908203125, 7.1748046875, 8.44140625, 9.7080078125, 10.974609375, 12.2412109375, 13.5078125, 14.7744140625, 16.041015625, 17.3076171875, 18.57421875, 19.8408203125, 21.107421875, 22.3740234375, 23.640625, 24.9072265625, 26.173828125, 27.4404296875, 28.70703125, 29.9736328125, 31.240234375, 32.5068359375, 33.7734375, 35.0400390625, 36.306640625, 37.5732421875, 38.83984375, 40.1064453125, 41.373046875, 42.6396484375, 43.90625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 14.0, 24.0, 27.0, 33.0, 53.0, 58.0, 95.0, 143.0, 209.0, 319.0, 506.0, 823.0, 1411.0, 2520.0, 4824.0, 9421.0, 21489.0, 66133.0, 1215697.0, 2733632.0, 88540.0, 25078.0, 10891.0, 5312.0, 2731.0, 1638.0, 935.0, 594.0, 388.0, 223.0, 150.0, 106.0, 62.0, 46.0, 40.0, 32.0, 18.0, 12.0, 13.0, 9.0, 8.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-54.34375, -52.794921875, -51.24609375, -49.697265625, -48.1484375, -46.599609375, -45.05078125, -43.501953125, -41.953125, -40.404296875, -38.85546875, -37.306640625, -35.7578125, -34.208984375, -32.66015625, -31.111328125, -29.5625, -28.013671875, -26.46484375, -24.916015625, -23.3671875, -21.818359375, -20.26953125, -18.720703125, -17.171875, -15.623046875, -14.07421875, -12.525390625, -10.9765625, -9.427734375, -7.87890625, -6.330078125, -4.78125, -3.232421875, -1.68359375, -0.134765625, 1.4140625, 2.962890625, 4.51171875, 6.060546875, 7.609375, 9.158203125, 10.70703125, 12.255859375, 13.8046875, 15.353515625, 16.90234375, 18.451171875, 20.0, 21.548828125, 23.09765625, 24.646484375, 26.1953125, 27.744140625, 29.29296875, 30.841796875, 32.390625, 33.939453125, 35.48828125, 37.037109375, 38.5859375, 40.134765625, 41.68359375, 43.232421875, 44.78125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 16.0, 32.0, 65.0, 162.0, 302.0, 212.0, 106.0, 45.0, 21.0, 17.0, 8.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-308.9152526855469, -302.4376525878906, -295.9600830078125, -289.48248291015625, -283.0048828125, -276.52728271484375, -270.0497131347656, -263.5721130371094, -257.0945129394531, -250.61692810058594, -244.1393280029297, -237.6617431640625, -231.18414306640625, -224.70655822753906, -218.2289581298828, -211.75137329101562, -205.27377319335938, -198.7961883544922, -192.31858825683594, -185.84100341796875, -179.3634033203125, -172.8858184814453, -166.40821838378906, -159.93063354492188, -153.4530487060547, -146.9754638671875, -140.49786376953125, -134.02027893066406, -127.54267883300781, -121.06509399414062, -114.58749389648438, -108.10990905761719, -101.63230895996094, -95.15471649169922, -88.6771240234375, -82.19953155517578, -75.72193908691406, -69.24435424804688, -62.76675796508789, -56.28916549682617, -49.81157302856445, -43.333980560302734, -36.856388092041016, -30.37879753112793, -23.90120506286621, -17.423614501953125, -10.946022033691406, -4.4684295654296875, 2.0091629028320312, 8.48675537109375, 14.964346885681152, 21.441938400268555, 27.919530868530273, 34.39712142944336, 40.87471389770508, 47.3523063659668, 53.829898834228516, 60.307491302490234, 66.78507995605469, 73.2626724243164, 79.74026489257812, 86.21785736083984, 92.69544982910156, 99.17304229736328, 105.650634765625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 9.0, 10.0, 12.0, 6.0, 19.0, 22.0, 18.0, 26.0, 37.0, 17.0, 38.0, 36.0, 28.0, 39.0, 46.0, 41.0, 47.0, 44.0, 46.0, 40.0, 53.0, 36.0, 42.0, 44.0, 35.0, 24.0, 17.0, 33.0, 26.0, 14.0, 11.0, 15.0, 10.0, 11.0, 11.0, 5.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.68189239501953, -84.02593994140625, -81.36998748779297, -78.71403503417969, -76.05807495117188, -73.4021224975586, -70.74617004394531, -68.09021759033203, -65.43426513671875, -62.77831268310547, -60.12236022949219, -57.46640396118164, -54.81045150756836, -52.15449905395508, -49.49854278564453, -46.84259033203125, -44.18663787841797, -41.53068542480469, -38.874732971191406, -36.21877670288086, -33.56282424926758, -30.906871795654297, -28.250917434692383, -25.59496307373047, -22.939010620117188, -20.283058166503906, -17.627103805541992, -14.971150398254395, -12.315196990966797, -9.6592435836792, -7.003290176391602, -4.3473358154296875, -1.6913909912109375, 0.9645624160766602, 3.620515823364258, 6.2764692306518555, 8.932422637939453, 11.58837604522705, 14.244329452514648, 16.900283813476562, 19.556236267089844, 22.212188720703125, 24.86814308166504, 27.524097442626953, 30.180049896240234, 32.836002349853516, 35.49195861816406, 38.147911071777344, 40.803863525390625, 43.459815979003906, 46.11576843261719, 48.771724700927734, 51.427677154541016, 54.0836296081543, 56.739585876464844, 59.395538330078125, 62.051490783691406, 64.70744323730469, 67.36339569091797, 70.01934814453125, 72.67530822753906, 75.33126068115234, 77.98721313476562, 80.6431655883789, 83.29911804199219]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 7.0, 6.0, 13.0, 17.0, 27.0, 16.0, 17.0, 27.0, 20.0, 30.0, 41.0, 51.0, 39.0, 36.0, 48.0, 48.0, 50.0, 42.0, 52.0, 46.0, 41.0, 45.0, 37.0, 41.0, 22.0, 29.0, 20.0, 31.0, 15.0, 20.0, 12.0, 15.0, 8.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.390625, -18.769287109375, -18.14794921875, -17.526611328125, -16.9052734375, -16.283935546875, -15.66259765625, -15.041259765625, -14.419921875, -13.798583984375, -13.17724609375, -12.555908203125, -11.9345703125, -11.313232421875, -10.69189453125, -10.070556640625, -9.44921875, -8.827880859375, -8.20654296875, -7.585205078125, -6.9638671875, -6.342529296875, -5.72119140625, -5.099853515625, -4.478515625, -3.857177734375, -3.23583984375, -2.614501953125, -1.9931640625, -1.371826171875, -0.75048828125, -0.129150390625, 0.4921875, 1.113525390625, 1.73486328125, 2.356201171875, 2.9775390625, 3.598876953125, 4.22021484375, 4.841552734375, 5.462890625, 6.084228515625, 6.70556640625, 7.326904296875, 7.9482421875, 8.569580078125, 9.19091796875, 9.812255859375, 10.43359375, 11.054931640625, 11.67626953125, 12.297607421875, 12.9189453125, 13.540283203125, 14.16162109375, 14.782958984375, 15.404296875, 16.025634765625, 16.64697265625, 17.268310546875, 17.8896484375, 18.510986328125, 19.13232421875, 19.753662109375, 20.375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 19.0, 24.0, 25.0, 32.0, 38.0, 60.0, 92.0, 128.0, 196.0, 286.0, 425.0, 646.0, 943.0, 1330.0, 1939.0, 2709.0, 4142.0, 6207.0, 9335.0, 14084.0, 22013.0, 34039.0, 55144.0, 93451.0, 157620.0, 215941.0, 166140.0, 98965.0, 58707.0, 36181.0, 23097.0, 14780.0, 9719.0, 6398.0, 4306.0, 2956.0, 2022.0, 1400.0, 965.0, 631.0, 408.0, 320.0, 227.0, 153.0, 109.0, 61.0, 41.0, 35.0, 16.0, 11.0, 12.0, 11.0, 5.0, 7.0, 6.0], "bins": [-1.5771484375, -1.5315093994140625, -1.485870361328125, -1.4402313232421875, -1.39459228515625, -1.3489532470703125, -1.303314208984375, -1.2576751708984375, -1.2120361328125, -1.1663970947265625, -1.120758056640625, -1.0751190185546875, -1.02947998046875, -0.9838409423828125, -0.938201904296875, -0.8925628662109375, -0.846923828125, -0.8012847900390625, -0.755645751953125, -0.7100067138671875, -0.66436767578125, -0.6187286376953125, -0.573089599609375, -0.5274505615234375, -0.4818115234375, -0.4361724853515625, -0.390533447265625, -0.3448944091796875, -0.29925537109375, -0.2536163330078125, -0.207977294921875, -0.1623382568359375, -0.11669921875, -0.0710601806640625, -0.025421142578125, 0.0202178955078125, 0.06585693359375, 0.1114959716796875, 0.157135009765625, 0.2027740478515625, 0.2484130859375, 0.2940521240234375, 0.339691162109375, 0.3853302001953125, 0.43096923828125, 0.4766082763671875, 0.522247314453125, 0.5678863525390625, 0.613525390625, 0.6591644287109375, 0.704803466796875, 0.7504425048828125, 0.79608154296875, 0.8417205810546875, 0.887359619140625, 0.9329986572265625, 0.9786376953125, 1.0242767333984375, 1.069915771484375, 1.1155548095703125, 1.16119384765625, 1.2068328857421875, 1.252471923828125, 1.2981109619140625, 1.34375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 7.0, 6.0, 4.0, 6.0, 2.0, 10.0, 15.0, 11.0, 18.0, 19.0, 21.0, 24.0, 33.0, 36.0, 30.0, 26.0, 42.0, 48.0, 27.0, 55.0, 36.0, 1065.0, 35.0, 41.0, 38.0, 43.0, 37.0, 38.0, 29.0, 37.0, 23.0, 28.0, 25.0, 21.0, 19.0, 12.0, 7.0, 15.0, 6.0, 5.0, 6.0, 5.0, 8.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.78125, -11.4287109375, -11.076171875, -10.7236328125, -10.37109375, -10.0185546875, -9.666015625, -9.3134765625, -8.9609375, -8.6083984375, -8.255859375, -7.9033203125, -7.55078125, -7.1982421875, -6.845703125, -6.4931640625, -6.140625, -5.7880859375, -5.435546875, -5.0830078125, -4.73046875, -4.3779296875, -4.025390625, -3.6728515625, -3.3203125, -2.9677734375, -2.615234375, -2.2626953125, -1.91015625, -1.5576171875, -1.205078125, -0.8525390625, -0.5, -0.1474609375, 0.205078125, 0.5576171875, 0.91015625, 1.2626953125, 1.615234375, 1.9677734375, 2.3203125, 2.6728515625, 3.025390625, 3.3779296875, 3.73046875, 4.0830078125, 4.435546875, 4.7880859375, 5.140625, 5.4931640625, 5.845703125, 6.1982421875, 6.55078125, 6.9033203125, 7.255859375, 7.6083984375, 7.9609375, 8.3134765625, 8.666015625, 9.0185546875, 9.37109375, 9.7236328125, 10.076171875, 10.4287109375, 10.78125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 18.0, 27.0, 32.0, 52.0, 77.0, 114.0, 178.0, 231.0, 369.0, 581.0, 794.0, 1126.0, 1688.0, 2558.0, 3772.0, 5627.0, 8519.0, 13480.0, 21531.0, 35566.0, 59306.0, 101973.0, 173945.0, 1269289.0, 159732.0, 93371.0, 54483.0, 32078.0, 19914.0, 12514.0, 7935.0, 5312.0, 3533.0, 2400.0, 1531.0, 1113.0, 770.0, 484.0, 359.0, 252.0, 161.0, 110.0, 87.0, 46.0, 35.0, 18.0, 3.0, 7.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-1.05078125, -1.017333984375, -0.98388671875, -0.950439453125, -0.9169921875, -0.883544921875, -0.85009765625, -0.816650390625, -0.783203125, -0.749755859375, -0.71630859375, -0.682861328125, -0.6494140625, -0.615966796875, -0.58251953125, -0.549072265625, -0.515625, -0.482177734375, -0.44873046875, -0.415283203125, -0.3818359375, -0.348388671875, -0.31494140625, -0.281494140625, -0.248046875, -0.214599609375, -0.18115234375, -0.147705078125, -0.1142578125, -0.080810546875, -0.04736328125, -0.013916015625, 0.01953125, 0.052978515625, 0.08642578125, 0.119873046875, 0.1533203125, 0.186767578125, 0.22021484375, 0.253662109375, 0.287109375, 0.320556640625, 0.35400390625, 0.387451171875, 0.4208984375, 0.454345703125, 0.48779296875, 0.521240234375, 0.5546875, 0.588134765625, 0.62158203125, 0.655029296875, 0.6884765625, 0.721923828125, 0.75537109375, 0.788818359375, 0.822265625, 0.855712890625, 0.88916015625, 0.922607421875, 0.9560546875, 0.989501953125, 1.02294921875, 1.056396484375, 1.08984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 11.0, 7.0, 10.0, 14.0, 32.0, 29.0, 38.0, 71.0, 73.0, 97.0, 122.0, 112.0, 86.0, 76.0, 49.0, 26.0, 17.0, 18.0, 10.0, 9.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0310516357421875, -0.030129194259643555, -0.02920675277709961, -0.028284311294555664, -0.02736186981201172, -0.026439428329467773, -0.025516986846923828, -0.024594545364379883, -0.023672103881835938, -0.022749662399291992, -0.021827220916748047, -0.0209047794342041, -0.019982337951660156, -0.01905989646911621, -0.018137454986572266, -0.01721501350402832, -0.016292572021484375, -0.01537013053894043, -0.014447689056396484, -0.013525247573852539, -0.012602806091308594, -0.011680364608764648, -0.010757923126220703, -0.009835481643676758, -0.008913040161132812, -0.007990598678588867, -0.007068157196044922, -0.0061457157135009766, -0.005223274230957031, -0.004300832748413086, -0.0033783912658691406, -0.0024559497833251953, -0.00153350830078125, -0.0006110668182373047, 0.0003113746643066406, 0.001233816146850586, 0.0021562576293945312, 0.0030786991119384766, 0.004001140594482422, 0.004923582077026367, 0.0058460235595703125, 0.006768465042114258, 0.007690906524658203, 0.008613348007202148, 0.009535789489746094, 0.010458230972290039, 0.011380672454833984, 0.01230311393737793, 0.013225555419921875, 0.01414799690246582, 0.015070438385009766, 0.01599287986755371, 0.016915321350097656, 0.0178377628326416, 0.018760204315185547, 0.019682645797729492, 0.020605087280273438, 0.021527528762817383, 0.022449970245361328, 0.023372411727905273, 0.02429485321044922, 0.025217294692993164, 0.02613973617553711, 0.027062177658081055, 0.027984619140625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 5.0, 11.0, 6.0, 12.0, 15.0, 27.0, 16.0, 31.0, 48.0, 49.0, 67.0, 92.0, 189.0, 368.0, 1567.0, 42559.0, 988117.0, 13636.0, 893.0, 265.0, 152.0, 109.0, 78.0, 51.0, 38.0, 28.0, 20.0, 22.0, 9.0, 5.0, 10.0, 6.0, 10.0, 2.0, 8.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5244140625, -0.5059280395507812, -0.4874420166015625, -0.46895599365234375, -0.450469970703125, -0.43198394775390625, -0.4134979248046875, -0.39501190185546875, -0.37652587890625, -0.35803985595703125, -0.3395538330078125, -0.32106781005859375, -0.302581787109375, -0.28409576416015625, -0.2656097412109375, -0.24712371826171875, -0.2286376953125, -0.21015167236328125, -0.1916656494140625, -0.17317962646484375, -0.154693603515625, -0.13620758056640625, -0.1177215576171875, -0.09923553466796875, -0.08074951171875, -0.06226348876953125, -0.0437774658203125, -0.02529144287109375, -0.006805419921875, 0.01168060302734375, 0.0301666259765625, 0.04865264892578125, 0.067138671875, 0.08562469482421875, 0.1041107177734375, 0.12259674072265625, 0.141082763671875, 0.15956878662109375, 0.1780548095703125, 0.19654083251953125, 0.21502685546875, 0.23351287841796875, 0.2519989013671875, 0.27048492431640625, 0.288970947265625, 0.30745697021484375, 0.3259429931640625, 0.34442901611328125, 0.3629150390625, 0.38140106201171875, 0.3998870849609375, 0.41837310791015625, 0.436859130859375, 0.45534515380859375, 0.4738311767578125, 0.49231719970703125, 0.51080322265625, 0.5292892456054688, 0.5477752685546875, 0.5662612915039062, 0.584747314453125, 0.6032333374023438, 0.6217193603515625, 0.6402053833007812, 0.65869140625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 19.0, 82.0, 429.0, 376.0, 76.0, 18.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09516280889511108, -0.08785489201545715, -0.08054696768522263, -0.0732390433549881, -0.06593112647533417, -0.05862320587038994, -0.05131528526544571, -0.04400736466050148, -0.03669944405555725, -0.029391523450613022, -0.022083602845668793, -0.014775682240724564, -0.0074677616357803345, -0.00015984103083610535, 0.007148079574108124, 0.014456000179052353, 0.021763920783996582, 0.02907184138894081, 0.03637976199388504, 0.04368768259882927, 0.0509956032037735, 0.05830352380871773, 0.06561144441366196, 0.07291936874389648, 0.08022728562355042, 0.08753520250320435, 0.09484312683343887, 0.1021510511636734, 0.10945896804332733, 0.11676688492298126, 0.12407480925321579, 0.13138273358345032, 0.13869065046310425, 0.14599856734275818, 0.1533064842224121, 0.16061441600322723, 0.16792233288288116, 0.1752302497625351, 0.18253818154335022, 0.18984609842300415, 0.19715401530265808, 0.204461932182312, 0.21176984906196594, 0.21907778084278107, 0.226385697722435, 0.23369361460208893, 0.24100154638290405, 0.24830946326255798, 0.2556173801422119, 0.26292529702186584, 0.2702332139015198, 0.2775411307811737, 0.28484904766082764, 0.29215699434280396, 0.2994649112224579, 0.3067728281021118, 0.31408074498176575, 0.3213886618614197, 0.3286965787410736, 0.33600449562072754, 0.34331244230270386, 0.3506203591823578, 0.3579282760620117, 0.36523619294166565, 0.3725441098213196]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 13.0, 17.0, 16.0, 14.0, 18.0, 18.0, 24.0, 22.0, 30.0, 28.0, 28.0, 35.0, 38.0, 39.0, 42.0, 41.0, 36.0, 54.0, 38.0, 44.0, 35.0, 38.0, 30.0, 25.0, 35.0, 32.0, 32.0, 24.0, 28.0, 23.0, 18.0, 14.0, 12.0, 13.0, 9.0, 5.0, 4.0, 8.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023150980472564697, -0.02247793599963188, -0.021804893389344215, -0.02113185077905655, -0.020458806306123734, -0.019785761833190918, -0.01911271922290325, -0.018439676612615585, -0.01776663213968277, -0.017093587666749954, -0.016420545056462288, -0.01574750244617462, -0.015074457973241806, -0.014401414431631565, -0.013728370890021324, -0.013055327348411083, -0.012382283806800842, -0.011709240265190601, -0.01103619672358036, -0.01036315318197012, -0.009690109640359879, -0.009017066098749638, -0.008344022557139397, -0.007670979015529156, -0.006997935473918915, -0.006324891932308674, -0.005651848390698433, -0.004978804849088192, -0.004305761307477951, -0.00363271776586771, -0.002959674224257469, -0.0022866306826472282, -0.0016135871410369873, -0.0009405435994267464, -0.00026750005781650543, 0.0004055434837937355, 0.0010785870254039764, 0.0017516305670142174, 0.0024246741086244583, 0.0030977176502346992, 0.00377076119184494, 0.004443804733455181, 0.005116848275065422, 0.005789891816675663, 0.006462935358285904, 0.007135978899896145, 0.007809022441506386, 0.008482065983116627, 0.009155109524726868, 0.009828153066337109, 0.01050119660794735, 0.01117424014955759, 0.011847283691167831, 0.012520327232778072, 0.013193370774388313, 0.013866414315998554, 0.014539457857608795, 0.015212501399219036, 0.015885544940829277, 0.016558587551116943, 0.01723163202404976, 0.017904676496982574, 0.01857771910727024, 0.019250761717557907, 0.019923806190490723]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 9.0, 6.0, 13.0, 16.0, 27.0, 17.0, 17.0, 27.0, 20.0, 30.0, 40.0, 51.0, 39.0, 37.0, 47.0, 49.0, 50.0, 40.0, 54.0, 46.0, 41.0, 45.0, 36.0, 41.0, 22.0, 29.0, 21.0, 31.0, 15.0, 19.0, 13.0, 15.0, 8.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.40625, -18.78466796875, -18.1630859375, -17.54150390625, -16.919921875, -16.29833984375, -15.6767578125, -15.05517578125, -14.43359375, -13.81201171875, -13.1904296875, -12.56884765625, -11.947265625, -11.32568359375, -10.7041015625, -10.08251953125, -9.4609375, -8.83935546875, -8.2177734375, -7.59619140625, -6.974609375, -6.35302734375, -5.7314453125, -5.10986328125, -4.48828125, -3.86669921875, -3.2451171875, -2.62353515625, -2.001953125, -1.38037109375, -0.7587890625, -0.13720703125, 0.484375, 1.10595703125, 1.7275390625, 2.34912109375, 2.970703125, 3.59228515625, 4.2138671875, 4.83544921875, 5.45703125, 6.07861328125, 6.7001953125, 7.32177734375, 7.943359375, 8.56494140625, 9.1865234375, 9.80810546875, 10.4296875, 11.05126953125, 11.6728515625, 12.29443359375, 12.916015625, 13.53759765625, 14.1591796875, 14.78076171875, 15.40234375, 16.02392578125, 16.6455078125, 17.26708984375, 17.888671875, 18.51025390625, 19.1318359375, 19.75341796875, 20.375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 14.0, 13.0, 22.0, 44.0, 45.0, 75.0, 115.0, 153.0, 211.0, 318.0, 399.0, 644.0, 992.0, 1492.0, 2295.0, 3649.0, 6111.0, 10691.0, 22904.0, 81049.0, 553788.0, 278153.0, 46526.0, 16545.0, 8434.0, 4942.0, 3054.0, 1929.0, 1272.0, 869.0, 542.0, 379.0, 245.0, 172.0, 141.0, 92.0, 59.0, 49.0, 25.0, 29.0, 12.0, 15.0, 10.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-24.71875, -23.91650390625, -23.1142578125, -22.31201171875, -21.509765625, -20.70751953125, -19.9052734375, -19.10302734375, -18.30078125, -17.49853515625, -16.6962890625, -15.89404296875, -15.091796875, -14.28955078125, -13.4873046875, -12.68505859375, -11.8828125, -11.08056640625, -10.2783203125, -9.47607421875, -8.673828125, -7.87158203125, -7.0693359375, -6.26708984375, -5.46484375, -4.66259765625, -3.8603515625, -3.05810546875, -2.255859375, -1.45361328125, -0.6513671875, 0.15087890625, 0.953125, 1.75537109375, 2.5576171875, 3.35986328125, 4.162109375, 4.96435546875, 5.7666015625, 6.56884765625, 7.37109375, 8.17333984375, 8.9755859375, 9.77783203125, 10.580078125, 11.38232421875, 12.1845703125, 12.98681640625, 13.7890625, 14.59130859375, 15.3935546875, 16.19580078125, 16.998046875, 17.80029296875, 18.6025390625, 19.40478515625, 20.20703125, 21.00927734375, 21.8115234375, 22.61376953125, 23.416015625, 24.21826171875, 25.0205078125, 25.82275390625, 26.625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 9.0, 14.0, 12.0, 11.0, 13.0, 15.0, 12.0, 25.0, 26.0, 26.0, 25.0, 31.0, 38.0, 32.0, 48.0, 69.0, 89.0, 220.0, 1584.0, 208.0, 99.0, 58.0, 44.0, 51.0, 25.0, 33.0, 34.0, 19.0, 16.0, 23.0, 15.0, 17.0, 15.0, 18.0, 11.0, 8.0, 10.0, 10.0, 4.0, 4.0, 2.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.65625, -36.53076171875, -35.4052734375, -34.27978515625, -33.154296875, -32.02880859375, -30.9033203125, -29.77783203125, -28.65234375, -27.52685546875, -26.4013671875, -25.27587890625, -24.150390625, -23.02490234375, -21.8994140625, -20.77392578125, -19.6484375, -18.52294921875, -17.3974609375, -16.27197265625, -15.146484375, -14.02099609375, -12.8955078125, -11.77001953125, -10.64453125, -9.51904296875, -8.3935546875, -7.26806640625, -6.142578125, -5.01708984375, -3.8916015625, -2.76611328125, -1.640625, -0.51513671875, 0.6103515625, 1.73583984375, 2.861328125, 3.98681640625, 5.1123046875, 6.23779296875, 7.36328125, 8.48876953125, 9.6142578125, 10.73974609375, 11.865234375, 12.99072265625, 14.1162109375, 15.24169921875, 16.3671875, 17.49267578125, 18.6181640625, 19.74365234375, 20.869140625, 21.99462890625, 23.1201171875, 24.24560546875, 25.37109375, 26.49658203125, 27.6220703125, 28.74755859375, 29.873046875, 30.99853515625, 32.1240234375, 33.24951171875, 34.375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 11.0, 17.0, 26.0, 39.0, 55.0, 78.0, 146.0, 256.0, 631.0, 3047.0, 45225.0, 3072325.0, 20743.0, 1993.0, 480.0, 247.0, 126.0, 74.0, 47.0, 36.0, 20.0, 17.0, 10.0, 9.0, 6.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.75, -88.400390625, -85.05078125, -81.701171875, -78.3515625, -75.001953125, -71.65234375, -68.302734375, -64.953125, -61.603515625, -58.25390625, -54.904296875, -51.5546875, -48.205078125, -44.85546875, -41.505859375, -38.15625, -34.806640625, -31.45703125, -28.107421875, -24.7578125, -21.408203125, -18.05859375, -14.708984375, -11.359375, -8.009765625, -4.66015625, -1.310546875, 2.0390625, 5.388671875, 8.73828125, 12.087890625, 15.4375, 18.787109375, 22.13671875, 25.486328125, 28.8359375, 32.185546875, 35.53515625, 38.884765625, 42.234375, 45.583984375, 48.93359375, 52.283203125, 55.6328125, 58.982421875, 62.33203125, 65.681640625, 69.03125, 72.380859375, 75.73046875, 79.080078125, 82.4296875, 85.779296875, 89.12890625, 92.478515625, 95.828125, 99.177734375, 102.52734375, 105.876953125, 109.2265625, 112.576171875, 115.92578125, 119.275390625, 122.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 18.0, 142.0, 495.0, 294.0, 61.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.3460578918457, -46.34069061279297, -40.33531951904297, -34.32994842529297, -28.324581146240234, -22.319211959838867, -16.3138427734375, -10.308475494384766, -4.303104400634766, 1.7022647857666016, 7.707633972167969, 13.713003158569336, 19.718372344970703, 25.72374153137207, 31.729110717773438, 37.73447799682617, 43.73984909057617, 49.745216369628906, 55.750587463378906, 61.755958557128906, 67.76132202148438, 73.76669311523438, 79.77206420898438, 85.77743530273438, 91.78280639648438, 97.78817749023438, 103.79354858398438, 109.79891204833984, 115.80428314208984, 121.80965423583984, 127.81501770019531, 133.8203887939453, 139.82574462890625, 145.83111572265625, 151.83648681640625, 157.84185791015625, 163.84722900390625, 169.8525848388672, 175.8579559326172, 181.8633270263672, 187.8686981201172, 193.8740692138672, 199.8794403076172, 205.8848114013672, 211.89016723632812, 217.89553833007812, 223.90090942382812, 229.90628051757812, 235.91165161132812, 241.91702270507812, 247.92239379882812, 253.92776489257812, 259.9331359863281, 265.9385070800781, 271.9438781738281, 277.94921875, 283.95458984375, 289.9599609375, 295.96533203125, 301.970703125, 307.97607421875, 313.9814453125, 319.98681640625, 325.9921875, 331.99755859375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 12.0, 8.0, 10.0, 8.0, 15.0, 19.0, 22.0, 23.0, 29.0, 25.0, 27.0, 32.0, 42.0, 27.0, 39.0, 36.0, 40.0, 51.0, 44.0, 35.0, 41.0, 39.0, 33.0, 34.0, 26.0, 33.0, 38.0, 31.0, 29.0, 15.0, 22.0, 12.0, 10.0, 17.0, 11.0, 9.0, 11.0, 8.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.37543487548828, -68.8658447265625, -66.35624694824219, -63.84665298461914, -61.337059020996094, -58.82746887207031, -56.317874908447266, -53.80828094482422, -51.29868698120117, -48.789093017578125, -46.27949905395508, -43.76990509033203, -41.26031494140625, -38.75071716308594, -36.241127014160156, -33.73153305053711, -31.221939086914062, -28.712345123291016, -26.20275115966797, -23.693159103393555, -21.183565139770508, -18.67397117614746, -16.164379119873047, -13.65478515625, -11.145191192626953, -8.635597229003906, -6.126004219055176, -3.616410732269287, -1.1068172454833984, 1.4027767181396484, 3.912369728088379, 6.421962738037109, 8.931556701660156, 11.441150665283203, 13.950743675231934, 16.460336685180664, 18.96993064880371, 21.479524612426758, 23.989116668701172, 26.49871063232422, 29.008304595947266, 31.517898559570312, 34.02749252319336, 36.537086486816406, 39.04667663574219, 41.5562744140625, 44.06586456298828, 46.57545852661133, 49.085052490234375, 51.59464645385742, 54.10424041748047, 56.613834381103516, 59.12342834472656, 61.633018493652344, 64.14261627197266, 66.65220642089844, 69.16180419921875, 71.67139434814453, 74.18099212646484, 76.69058227539062, 79.20018005371094, 81.70977020263672, 84.21936798095703, 86.72895812988281, 89.2385482788086]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 13.0, 6.0, 12.0, 15.0, 21.0, 19.0, 21.0, 34.0, 20.0, 31.0, 37.0, 38.0, 37.0, 42.0, 46.0, 42.0, 47.0, 50.0, 55.0, 44.0, 43.0, 39.0, 44.0, 27.0, 27.0, 30.0, 19.0, 17.0, 23.0, 27.0, 14.0, 13.0, 8.0, 11.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.750244140625, -17.14111328125, -16.531982421875, -15.9228515625, -15.313720703125, -14.70458984375, -14.095458984375, -13.486328125, -12.877197265625, -12.26806640625, -11.658935546875, -11.0498046875, -10.440673828125, -9.83154296875, -9.222412109375, -8.61328125, -8.004150390625, -7.39501953125, -6.785888671875, -6.1767578125, -5.567626953125, -4.95849609375, -4.349365234375, -3.740234375, -3.131103515625, -2.52197265625, -1.912841796875, -1.3037109375, -0.694580078125, -0.08544921875, 0.523681640625, 1.1328125, 1.741943359375, 2.35107421875, 2.960205078125, 3.5693359375, 4.178466796875, 4.78759765625, 5.396728515625, 6.005859375, 6.614990234375, 7.22412109375, 7.833251953125, 8.4423828125, 9.051513671875, 9.66064453125, 10.269775390625, 10.87890625, 11.488037109375, 12.09716796875, 12.706298828125, 13.3154296875, 13.924560546875, 14.53369140625, 15.142822265625, 15.751953125, 16.361083984375, 16.97021484375, 17.579345703125, 18.1884765625, 18.797607421875, 19.40673828125, 20.015869140625, 20.625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 10.0, 7.0, 11.0, 9.0, 9.0, 24.0, 15.0, 21.0, 30.0, 26.0, 38.0, 47.0, 55.0, 97.0, 107.0, 158.0, 244.0, 363.0, 784.0, 2674.0, 29914.0, 4142420.0, 13330.0, 1981.0, 686.0, 365.0, 223.0, 149.0, 102.0, 87.0, 54.0, 40.0, 49.0, 28.0, 29.0, 16.0, 16.0, 14.0, 10.0, 13.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-186.5, -180.365234375, -174.23046875, -168.095703125, -161.9609375, -155.826171875, -149.69140625, -143.556640625, -137.421875, -131.287109375, -125.15234375, -119.017578125, -112.8828125, -106.748046875, -100.61328125, -94.478515625, -88.34375, -82.208984375, -76.07421875, -69.939453125, -63.8046875, -57.669921875, -51.53515625, -45.400390625, -39.265625, -33.130859375, -26.99609375, -20.861328125, -14.7265625, -8.591796875, -2.45703125, 3.677734375, 9.8125, 15.947265625, 22.08203125, 28.216796875, 34.3515625, 40.486328125, 46.62109375, 52.755859375, 58.890625, 65.025390625, 71.16015625, 77.294921875, 83.4296875, 89.564453125, 95.69921875, 101.833984375, 107.96875, 114.103515625, 120.23828125, 126.373046875, 132.5078125, 138.642578125, 144.77734375, 150.912109375, 157.046875, 163.181640625, 169.31640625, 175.451171875, 181.5859375, 187.720703125, 193.85546875, 199.990234375, 206.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 10.0, 9.0, 11.0, 25.0, 23.0, 29.0, 47.0, 59.0, 92.0, 166.0, 342.0, 676.0, 1184.0, 643.0, 312.0, 165.0, 74.0, 45.0, 37.0, 21.0, 15.0, 15.0, 6.0, 6.0, 7.0, 6.0, 8.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.75, -37.65576171875, -36.5615234375, -35.46728515625, -34.373046875, -33.27880859375, -32.1845703125, -31.09033203125, -29.99609375, -28.90185546875, -27.8076171875, -26.71337890625, -25.619140625, -24.52490234375, -23.4306640625, -22.33642578125, -21.2421875, -20.14794921875, -19.0537109375, -17.95947265625, -16.865234375, -15.77099609375, -14.6767578125, -13.58251953125, -12.48828125, -11.39404296875, -10.2998046875, -9.20556640625, -8.111328125, -7.01708984375, -5.9228515625, -4.82861328125, -3.734375, -2.64013671875, -1.5458984375, -0.45166015625, 0.642578125, 1.73681640625, 2.8310546875, 3.92529296875, 5.01953125, 6.11376953125, 7.2080078125, 8.30224609375, 9.396484375, 10.49072265625, 11.5849609375, 12.67919921875, 13.7734375, 14.86767578125, 15.9619140625, 17.05615234375, 18.150390625, 19.24462890625, 20.3388671875, 21.43310546875, 22.52734375, 23.62158203125, 24.7158203125, 25.81005859375, 26.904296875, 27.99853515625, 29.0927734375, 30.18701171875, 31.28125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 4.0, 8.0, 14.0, 13.0, 7.0, 10.0, 25.0, 34.0, 40.0, 67.0, 125.0, 290.0, 626.0, 1800.0, 5757.0, 28107.0, 1850415.0, 2269737.0, 28446.0, 5746.0, 1787.0, 617.0, 261.0, 126.0, 65.0, 38.0, 23.0, 34.0, 12.0, 8.0, 10.0, 9.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.8125, -88.4130859375, -85.013671875, -81.6142578125, -78.21484375, -74.8154296875, -71.416015625, -68.0166015625, -64.6171875, -61.2177734375, -57.818359375, -54.4189453125, -51.01953125, -47.6201171875, -44.220703125, -40.8212890625, -37.421875, -34.0224609375, -30.623046875, -27.2236328125, -23.82421875, -20.4248046875, -17.025390625, -13.6259765625, -10.2265625, -6.8271484375, -3.427734375, -0.0283203125, 3.37109375, 6.7705078125, 10.169921875, 13.5693359375, 16.96875, 20.3681640625, 23.767578125, 27.1669921875, 30.56640625, 33.9658203125, 37.365234375, 40.7646484375, 44.1640625, 47.5634765625, 50.962890625, 54.3623046875, 57.76171875, 61.1611328125, 64.560546875, 67.9599609375, 71.359375, 74.7587890625, 78.158203125, 81.5576171875, 84.95703125, 88.3564453125, 91.755859375, 95.1552734375, 98.5546875, 101.9541015625, 105.353515625, 108.7529296875, 112.15234375, 115.5517578125, 118.951171875, 122.3505859375, 125.75]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 13.0, 27.0, 65.0, 212.0, 398.0, 191.0, 69.0, 22.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.3038330078125, -269.4793395996094, -260.6548156738281, -251.830322265625, -243.0058135986328, -234.18130493164062, -225.3568115234375, -216.5323028564453, -207.70779418945312, -198.88328552246094, -190.0587921142578, -181.23428344726562, -172.40977478027344, -163.58526611328125, -154.76077270507812, -145.93626403808594, -137.1117706298828, -128.28726196289062, -119.46276092529297, -110.63825988769531, -101.81375122070312, -92.98925018310547, -84.16474914550781, -75.34024047851562, -66.51573944091797, -57.69123458862305, -48.866729736328125, -40.04222869873047, -31.217723846435547, -22.393218994140625, -13.568717956542969, -4.744213104248047, 4.080291748046875, 12.90479564666748, 21.729299545288086, 30.553802490234375, 39.3783073425293, 48.20281219482422, 57.027313232421875, 65.85182189941406, 74.67632293701172, 83.50082397460938, 92.32533264160156, 101.14983367919922, 109.97433471679688, 118.79884338378906, 127.62334442138672, 136.44784545898438, 145.27235412597656, 154.09686279296875, 162.92135620117188, 171.74586486816406, 180.57037353515625, 189.39486694335938, 198.21937561035156, 207.04388427734375, 215.86837768554688, 224.69288635253906, 233.5173797607422, 242.34188842773438, 251.16639709472656, 259.99090576171875, 268.8153991699219, 277.639892578125, 286.46441650390625]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 10.0, 10.0, 13.0, 10.0, 15.0, 25.0, 22.0, 36.0, 19.0, 41.0, 35.0, 37.0, 43.0, 43.0, 50.0, 40.0, 38.0, 52.0, 39.0, 37.0, 39.0, 34.0, 42.0, 32.0, 36.0, 30.0, 30.0, 20.0, 14.0, 21.0, 16.0, 13.0, 5.0, 9.0, 5.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.40347290039062, -79.65919494628906, -76.9149169921875, -74.17063903808594, -71.4263687133789, -68.68209075927734, -65.93781280517578, -63.19353485107422, -60.44926071166992, -57.70498275756836, -54.96070861816406, -52.2164306640625, -49.47215270996094, -46.72787857055664, -43.98360061645508, -41.23932647705078, -38.49504852294922, -35.750770568847656, -33.00649642944336, -30.262218475341797, -27.517942428588867, -24.773666381835938, -22.029388427734375, -19.285112380981445, -16.540836334228516, -13.796560287475586, -11.05228328704834, -8.308006286621094, -5.563730239868164, -2.8194541931152344, -0.07517623901367188, 2.669099807739258, 5.4133758544921875, 8.157651901245117, 10.901928901672363, 13.64620590209961, 16.39048194885254, 19.13475799560547, 21.87903594970703, 24.62331199645996, 27.36758804321289, 30.11186408996582, 32.85614013671875, 35.60041809082031, 38.344696044921875, 41.08897018432617, 43.833248138427734, 46.57752227783203, 49.321800231933594, 52.066078186035156, 54.81035232543945, 57.554630279541016, 60.29890441894531, 63.043182373046875, 65.78746032714844, 68.53173828125, 71.27601623535156, 74.02029418945312, 76.76457214355469, 79.50885009765625, 82.25312042236328, 84.99739837646484, 87.7416763305664, 90.48595428466797, 93.230224609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 13.0, 10.0, 18.0, 16.0, 23.0, 14.0, 32.0, 34.0, 18.0, 31.0, 32.0, 31.0, 42.0, 51.0, 44.0, 52.0, 49.0, 40.0, 44.0, 54.0, 33.0, 49.0, 30.0, 30.0, 32.0, 25.0, 21.0, 21.0, 18.0, 17.0, 11.0, 7.0, 12.0, 9.0, 10.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.8525390625, -18.267578125, -17.6826171875, -17.09765625, -16.5126953125, -15.927734375, -15.3427734375, -14.7578125, -14.1728515625, -13.587890625, -13.0029296875, -12.41796875, -11.8330078125, -11.248046875, -10.6630859375, -10.078125, -9.4931640625, -8.908203125, -8.3232421875, -7.73828125, -7.1533203125, -6.568359375, -5.9833984375, -5.3984375, -4.8134765625, -4.228515625, -3.6435546875, -3.05859375, -2.4736328125, -1.888671875, -1.3037109375, -0.71875, -0.1337890625, 0.451171875, 1.0361328125, 1.62109375, 2.2060546875, 2.791015625, 3.3759765625, 3.9609375, 4.5458984375, 5.130859375, 5.7158203125, 6.30078125, 6.8857421875, 7.470703125, 8.0556640625, 8.640625, 9.2255859375, 9.810546875, 10.3955078125, 10.98046875, 11.5654296875, 12.150390625, 12.7353515625, 13.3203125, 13.9052734375, 14.490234375, 15.0751953125, 15.66015625, 16.2451171875, 16.830078125, 17.4150390625, 18.0]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 4.0, 11.0, 12.0, 23.0, 47.0, 46.0, 73.0, 105.0, 154.0, 240.0, 300.0, 464.0, 716.0, 1100.0, 1648.0, 2436.0, 3658.0, 5589.0, 8692.0, 13253.0, 20918.0, 32707.0, 53066.0, 89208.0, 154854.0, 225520.0, 173058.0, 99829.0, 59173.0, 36252.0, 22969.0, 14702.0, 9523.0, 6118.0, 4036.0, 2607.0, 1808.0, 1191.0, 789.0, 513.0, 366.0, 253.0, 170.0, 100.0, 70.0, 56.0, 40.0, 34.0, 13.0, 15.0, 4.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0], "bins": [-1.576171875, -1.52783203125, -1.4794921875, -1.43115234375, -1.3828125, -1.33447265625, -1.2861328125, -1.23779296875, -1.189453125, -1.14111328125, -1.0927734375, -1.04443359375, -0.99609375, -0.94775390625, -0.8994140625, -0.85107421875, -0.802734375, -0.75439453125, -0.7060546875, -0.65771484375, -0.609375, -0.56103515625, -0.5126953125, -0.46435546875, -0.416015625, -0.36767578125, -0.3193359375, -0.27099609375, -0.22265625, -0.17431640625, -0.1259765625, -0.07763671875, -0.029296875, 0.01904296875, 0.0673828125, 0.11572265625, 0.1640625, 0.21240234375, 0.2607421875, 0.30908203125, 0.357421875, 0.40576171875, 0.4541015625, 0.50244140625, 0.55078125, 0.59912109375, 0.6474609375, 0.69580078125, 0.744140625, 0.79248046875, 0.8408203125, 0.88916015625, 0.9375, 0.98583984375, 1.0341796875, 1.08251953125, 1.130859375, 1.17919921875, 1.2275390625, 1.27587890625, 1.32421875, 1.37255859375, 1.4208984375, 1.46923828125, 1.517578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 8.0, 7.0, 5.0, 7.0, 5.0, 19.0, 6.0, 16.0, 24.0, 14.0, 23.0, 22.0, 19.0, 32.0, 34.0, 25.0, 31.0, 40.0, 31.0, 39.0, 49.0, 1059.0, 38.0, 37.0, 39.0, 41.0, 32.0, 43.0, 33.0, 24.0, 26.0, 30.0, 20.0, 24.0, 21.0, 20.0, 18.0, 17.0, 11.0, 2.0, 7.0, 2.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.9453125, -10.601318359375, -10.25732421875, -9.913330078125, -9.5693359375, -9.225341796875, -8.88134765625, -8.537353515625, -8.193359375, -7.849365234375, -7.50537109375, -7.161376953125, -6.8173828125, -6.473388671875, -6.12939453125, -5.785400390625, -5.44140625, -5.097412109375, -4.75341796875, -4.409423828125, -4.0654296875, -3.721435546875, -3.37744140625, -3.033447265625, -2.689453125, -2.345458984375, -2.00146484375, -1.657470703125, -1.3134765625, -0.969482421875, -0.62548828125, -0.281494140625, 0.0625, 0.406494140625, 0.75048828125, 1.094482421875, 1.4384765625, 1.782470703125, 2.12646484375, 2.470458984375, 2.814453125, 3.158447265625, 3.50244140625, 3.846435546875, 4.1904296875, 4.534423828125, 4.87841796875, 5.222412109375, 5.56640625, 5.910400390625, 6.25439453125, 6.598388671875, 6.9423828125, 7.286376953125, 7.63037109375, 7.974365234375, 8.318359375, 8.662353515625, 9.00634765625, 9.350341796875, 9.6943359375, 10.038330078125, 10.38232421875, 10.726318359375, 11.0703125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 9.0, 25.0, 24.0, 48.0, 81.0, 123.0, 179.0, 252.0, 403.0, 644.0, 997.0, 1518.0, 2223.0, 3570.0, 5444.0, 8385.0, 12857.0, 19980.0, 32106.0, 52542.0, 90823.0, 157514.0, 1276082.0, 174760.0, 101002.0, 58478.0, 35340.0, 21875.0, 13921.0, 8896.0, 5931.0, 3876.0, 2470.0, 1655.0, 1127.0, 685.0, 446.0, 295.0, 186.0, 133.0, 82.0, 45.0, 31.0, 22.0, 13.0, 9.0, 8.0, 7.0, 5.0, 4.0, 1.0], "bins": [-1.2529296875, -1.2177352905273438, -1.1825408935546875, -1.1473464965820312, -1.112152099609375, -1.0769577026367188, -1.0417633056640625, -1.0065689086914062, -0.97137451171875, -0.9361801147460938, -0.9009857177734375, -0.8657913208007812, -0.830596923828125, -0.7954025268554688, -0.7602081298828125, -0.7250137329101562, -0.6898193359375, -0.6546249389648438, -0.6194305419921875, -0.5842361450195312, -0.549041748046875, -0.5138473510742188, -0.4786529541015625, -0.44345855712890625, -0.40826416015625, -0.37306976318359375, -0.3378753662109375, -0.30268096923828125, -0.267486572265625, -0.23229217529296875, -0.1970977783203125, -0.16190338134765625, -0.126708984375, -0.09151458740234375, -0.0563201904296875, -0.02112579345703125, 0.014068603515625, 0.04926300048828125, 0.0844573974609375, 0.11965179443359375, 0.15484619140625, 0.19004058837890625, 0.2252349853515625, 0.26042938232421875, 0.295623779296875, 0.33081817626953125, 0.3660125732421875, 0.40120697021484375, 0.4364013671875, 0.47159576416015625, 0.5067901611328125, 0.5419845581054688, 0.577178955078125, 0.6123733520507812, 0.6475677490234375, 0.6827621459960938, 0.71795654296875, 0.7531509399414062, 0.7883453369140625, 0.8235397338867188, 0.858734130859375, 0.8939285278320312, 0.9291229248046875, 0.9643173217773438, 0.99951171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 8.0, 3.0, 18.0, 14.0, 13.0, 14.0, 20.0, 22.0, 22.0, 34.0, 63.0, 71.0, 88.0, 96.0, 107.0, 80.0, 55.0, 47.0, 37.0, 23.0, 17.0, 27.0, 17.0, 9.0, 19.0, 12.0, 10.0, 4.0, 7.0, 2.0, 3.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0250701904296875, -0.02422618865966797, -0.023382186889648438, -0.022538185119628906, -0.021694183349609375, -0.020850181579589844, -0.020006179809570312, -0.01916217803955078, -0.01831817626953125, -0.01747417449951172, -0.016630172729492188, -0.015786170959472656, -0.014942169189453125, -0.014098167419433594, -0.013254165649414062, -0.012410163879394531, -0.011566162109375, -0.010722160339355469, -0.009878158569335938, -0.009034156799316406, -0.008190155029296875, -0.007346153259277344, -0.0065021514892578125, -0.005658149719238281, -0.00481414794921875, -0.003970146179199219, -0.0031261444091796875, -0.0022821426391601562, -0.001438140869140625, -0.0005941390991210938, 0.0002498626708984375, 0.0010938644409179688, 0.0019378662109375, 0.0027818679809570312, 0.0036258697509765625, 0.004469871520996094, 0.005313873291015625, 0.006157875061035156, 0.0070018768310546875, 0.007845878601074219, 0.00868988037109375, 0.009533882141113281, 0.010377883911132812, 0.011221885681152344, 0.012065887451171875, 0.012909889221191406, 0.013753890991210938, 0.014597892761230469, 0.01544189453125, 0.01628589630126953, 0.017129898071289062, 0.017973899841308594, 0.018817901611328125, 0.019661903381347656, 0.020505905151367188, 0.02134990692138672, 0.02219390869140625, 0.02303791046142578, 0.023881912231445312, 0.024725914001464844, 0.025569915771484375, 0.026413917541503906, 0.027257919311523438, 0.02810192108154297, 0.0289459228515625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 7.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 7.0, 15.0, 15.0, 16.0, 29.0, 27.0, 37.0, 50.0, 95.0, 91.0, 136.0, 277.0, 796.0, 5227.0, 147355.0, 876603.0, 15167.0, 1585.0, 405.0, 166.0, 92.0, 66.0, 55.0, 49.0, 31.0, 23.0, 19.0, 13.0, 9.0, 13.0, 2.0, 7.0, 7.0, 3.0, 8.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5251922607421875, -0.508880615234375, -0.4925689697265625, -0.47625732421875, -0.4599456787109375, -0.443634033203125, -0.4273223876953125, -0.4110107421875, -0.3946990966796875, -0.378387451171875, -0.3620758056640625, -0.34576416015625, -0.3294525146484375, -0.313140869140625, -0.2968292236328125, -0.280517578125, -0.2642059326171875, -0.247894287109375, -0.2315826416015625, -0.21527099609375, -0.1989593505859375, -0.182647705078125, -0.1663360595703125, -0.1500244140625, -0.1337127685546875, -0.117401123046875, -0.1010894775390625, -0.08477783203125, -0.0684661865234375, -0.052154541015625, -0.0358428955078125, -0.01953125, -0.0032196044921875, 0.013092041015625, 0.0294036865234375, 0.04571533203125, 0.0620269775390625, 0.078338623046875, 0.0946502685546875, 0.1109619140625, 0.1272735595703125, 0.143585205078125, 0.1598968505859375, 0.17620849609375, 0.1925201416015625, 0.208831787109375, 0.2251434326171875, 0.241455078125, 0.2577667236328125, 0.274078369140625, 0.2903900146484375, 0.30670166015625, 0.3230133056640625, 0.339324951171875, 0.3556365966796875, 0.3719482421875, 0.3882598876953125, 0.404571533203125, 0.4208831787109375, 0.43719482421875, 0.4535064697265625, 0.469818115234375, 0.4861297607421875, 0.50244140625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 14.0, 40.0, 127.0, 391.0, 297.0, 90.0, 32.0, 11.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07173629850149155, -0.06513958424329758, -0.058542877435684204, -0.051946163177490234, -0.04534945636987686, -0.03875274211168289, -0.03215603157877922, -0.02555932104587555, -0.018962610512971878, -0.012365899980068207, -0.005769188515841961, 0.000827522948384285, 0.007424233481287956, 0.014020945876836777, 0.020617656409740448, 0.02721436694264412, 0.03381107747554779, 0.04040778800845146, 0.04700449854135513, 0.0536012127995491, 0.060197919607162476, 0.06679463386535645, 0.07339134812355042, 0.07998805493116379, 0.08658476173877716, 0.09318147599697113, 0.0997781828045845, 0.10637489706277847, 0.11297160387039185, 0.11956831812858582, 0.12616503238677979, 0.13276174664497375, 0.13935844600200653, 0.1459551602602005, 0.15255187451839447, 0.15914857387542725, 0.16574528813362122, 0.17234200239181519, 0.17893871665000916, 0.18553543090820312, 0.1921321302652359, 0.19872884452342987, 0.20532555878162384, 0.21192225813865662, 0.21851897239685059, 0.22511568665504456, 0.23171240091323853, 0.2383091151714325, 0.24490582942962646, 0.25150254368782043, 0.2580992579460144, 0.2646959722042084, 0.27129268646240234, 0.2778893709182739, 0.2844860851764679, 0.29108279943466187, 0.29767951369285583, 0.3042762279510498, 0.3108729422092438, 0.31746965646743774, 0.3240663707256317, 0.3306630849838257, 0.33725976943969727, 0.34385648369789124, 0.3504531979560852]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 8.0, 19.0, 16.0, 24.0, 18.0, 33.0, 27.0, 37.0, 22.0, 41.0, 34.0, 42.0, 45.0, 56.0, 43.0, 49.0, 61.0, 34.0, 60.0, 41.0, 32.0, 47.0, 30.0, 20.0, 29.0, 33.0, 18.0, 12.0, 9.0, 12.0, 4.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020522117614746094, -0.019879672676324844, -0.019237225875258446, -0.018594779074192047, -0.017952334135770798, -0.01730988919734955, -0.01666744239628315, -0.01602499559521675, -0.015382550656795502, -0.014740104787051678, -0.014097658917307854, -0.01345521304756403, -0.012812767177820206, -0.012170321308076382, -0.011527875438332558, -0.010885429568588734, -0.01024298369884491, -0.009600537829101086, -0.008958091959357262, -0.008315646089613438, -0.007673200219869614, -0.00703075435012579, -0.006388308480381966, -0.005745862610638142, -0.005103416740894318, -0.004460970871150494, -0.0038185250014066696, -0.0031760791316628456, -0.0025336332619190216, -0.0018911873921751976, -0.0012487415224313736, -0.0006062956526875496, 3.6150217056274414e-05, 0.0006785960868000984, 0.0013210419565439224, 0.0019634878262877464, 0.0026059336960315704, 0.0032483795657753944, 0.0038908254355192184, 0.0045332713052630424, 0.0051757171750068665, 0.0058181630447506905, 0.0064606089144945145, 0.0071030547842383385, 0.0077455006539821625, 0.008387946523725986, 0.00903039239346981, 0.009672838263213634, 0.010315284132957458, 0.010957730002701283, 0.011600175872445107, 0.01224262174218893, 0.012885067611932755, 0.013527513481676579, 0.014169959351420403, 0.014812405221164227, 0.01545485109090805, 0.0160972960293293, 0.0167397428303957, 0.017382189631462097, 0.018024634569883347, 0.018667079508304596, 0.019309526309370995, 0.019951973110437393, 0.020594418048858643]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 13.0, 10.0, 18.0, 16.0, 23.0, 14.0, 32.0, 34.0, 18.0, 31.0, 32.0, 31.0, 42.0, 51.0, 44.0, 52.0, 49.0, 40.0, 44.0, 54.0, 33.0, 49.0, 30.0, 30.0, 32.0, 25.0, 21.0, 21.0, 18.0, 17.0, 11.0, 7.0, 12.0, 9.0, 10.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.8525390625, -18.267578125, -17.6826171875, -17.09765625, -16.5126953125, -15.927734375, -15.3427734375, -14.7578125, -14.1728515625, -13.587890625, -13.0029296875, -12.41796875, -11.8330078125, -11.248046875, -10.6630859375, -10.078125, -9.4931640625, -8.908203125, -8.3232421875, -7.73828125, -7.1533203125, -6.568359375, -5.9833984375, -5.3984375, -4.8134765625, -4.228515625, -3.6435546875, -3.05859375, -2.4736328125, -1.888671875, -1.3037109375, -0.71875, -0.1337890625, 0.451171875, 1.0361328125, 1.62109375, 2.2060546875, 2.791015625, 3.3759765625, 3.9609375, 4.5458984375, 5.130859375, 5.7158203125, 6.30078125, 6.8857421875, 7.470703125, 8.0556640625, 8.640625, 9.2255859375, 9.810546875, 10.3955078125, 10.98046875, 11.5654296875, 12.150390625, 12.7353515625, 13.3203125, 13.9052734375, 14.490234375, 15.0751953125, 15.66015625, 16.2451171875, 16.830078125, 17.4150390625, 18.0]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 11.0, 9.0, 12.0, 20.0, 19.0, 37.0, 48.0, 57.0, 83.0, 127.0, 157.0, 220.0, 370.0, 473.0, 724.0, 1042.0, 1647.0, 2476.0, 4712.0, 10504.0, 37189.0, 272088.0, 608668.0, 75917.0, 16479.0, 6354.0, 3186.0, 1974.0, 1226.0, 821.0, 544.0, 392.0, 277.0, 199.0, 146.0, 80.0, 75.0, 48.0, 41.0, 30.0, 27.0, 14.0, 3.0, 4.0, 13.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-33.8125, -32.794189453125, -31.77587890625, -30.757568359375, -29.7392578125, -28.720947265625, -27.70263671875, -26.684326171875, -25.666015625, -24.647705078125, -23.62939453125, -22.611083984375, -21.5927734375, -20.574462890625, -19.55615234375, -18.537841796875, -17.51953125, -16.501220703125, -15.48291015625, -14.464599609375, -13.4462890625, -12.427978515625, -11.40966796875, -10.391357421875, -9.373046875, -8.354736328125, -7.33642578125, -6.318115234375, -5.2998046875, -4.281494140625, -3.26318359375, -2.244873046875, -1.2265625, -0.208251953125, 0.81005859375, 1.828369140625, 2.8466796875, 3.864990234375, 4.88330078125, 5.901611328125, 6.919921875, 7.938232421875, 8.95654296875, 9.974853515625, 10.9931640625, 12.011474609375, 13.02978515625, 14.048095703125, 15.06640625, 16.084716796875, 17.10302734375, 18.121337890625, 19.1396484375, 20.157958984375, 21.17626953125, 22.194580078125, 23.212890625, 24.231201171875, 25.24951171875, 26.267822265625, 27.2861328125, 28.304443359375, 29.32275390625, 30.341064453125, 31.359375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 4.0, 4.0, 6.0, 11.0, 15.0, 12.0, 10.0, 21.0, 29.0, 23.0, 43.0, 23.0, 33.0, 30.0, 48.0, 55.0, 77.0, 165.0, 1599.0, 252.0, 99.0, 68.0, 74.0, 48.0, 35.0, 41.0, 35.0, 34.0, 24.0, 21.0, 14.0, 19.0, 8.0, 11.0, 6.0, 15.0, 9.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.84375, -35.71484375, -34.5859375, -33.45703125, -32.328125, -31.19921875, -30.0703125, -28.94140625, -27.8125, -26.68359375, -25.5546875, -24.42578125, -23.296875, -22.16796875, -21.0390625, -19.91015625, -18.78125, -17.65234375, -16.5234375, -15.39453125, -14.265625, -13.13671875, -12.0078125, -10.87890625, -9.75, -8.62109375, -7.4921875, -6.36328125, -5.234375, -4.10546875, -2.9765625, -1.84765625, -0.71875, 0.41015625, 1.5390625, 2.66796875, 3.796875, 4.92578125, 6.0546875, 7.18359375, 8.3125, 9.44140625, 10.5703125, 11.69921875, 12.828125, 13.95703125, 15.0859375, 16.21484375, 17.34375, 18.47265625, 19.6015625, 20.73046875, 21.859375, 22.98828125, 24.1171875, 25.24609375, 26.375, 27.50390625, 28.6328125, 29.76171875, 30.890625, 32.01953125, 33.1484375, 34.27734375, 35.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 10.0, 11.0, 5.0, 17.0, 11.0, 16.0, 21.0, 33.0, 47.0, 61.0, 98.0, 157.0, 270.0, 564.0, 1626.0, 263323.0, 2875949.0, 2103.0, 603.0, 268.0, 166.0, 97.0, 62.0, 32.0, 29.0, 19.0, 15.0, 20.0, 9.0, 15.0, 14.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-144.125, -139.16796875, -134.2109375, -129.25390625, -124.296875, -119.33984375, -114.3828125, -109.42578125, -104.46875, -99.51171875, -94.5546875, -89.59765625, -84.640625, -79.68359375, -74.7265625, -69.76953125, -64.8125, -59.85546875, -54.8984375, -49.94140625, -44.984375, -40.02734375, -35.0703125, -30.11328125, -25.15625, -20.19921875, -15.2421875, -10.28515625, -5.328125, -0.37109375, 4.5859375, 9.54296875, 14.5, 19.45703125, 24.4140625, 29.37109375, 34.328125, 39.28515625, 44.2421875, 49.19921875, 54.15625, 59.11328125, 64.0703125, 69.02734375, 73.984375, 78.94140625, 83.8984375, 88.85546875, 93.8125, 98.76953125, 103.7265625, 108.68359375, 113.640625, 118.59765625, 123.5546875, 128.51171875, 133.46875, 138.42578125, 143.3828125, 148.33984375, 153.296875, 158.25390625, 163.2109375, 168.16796875, 173.125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 41.0, 250.0, 466.0, 196.0, 35.0, 14.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-224.83074951171875, -218.1095428466797, -211.38832092285156, -204.6671142578125, -197.94589233398438, -191.2246856689453, -184.50347900390625, -177.78225708007812, -171.06105041503906, -164.33984375, -157.61862182617188, -150.8974151611328, -144.17620849609375, -137.45498657226562, -130.73377990722656, -124.01256561279297, -117.29135131835938, -110.57013702392578, -103.84892272949219, -97.12771606445312, -90.40650177001953, -83.68528747558594, -76.96408081054688, -70.24286651611328, -63.52165222167969, -56.800437927246094, -50.079227447509766, -43.35801696777344, -36.636802673339844, -29.91558837890625, -23.194377899169922, -16.473167419433594, -9.751968383789062, -3.0307559967041016, 3.6904563903808594, 10.41166877746582, 17.13288116455078, 23.854095458984375, 30.575305938720703, 37.29651641845703, 44.017730712890625, 50.73894500732422, 57.46015548706055, 64.18136596679688, 70.90258026123047, 77.62379455566406, 84.34500122070312, 91.06621551513672, 97.78742980957031, 104.5086441040039, 111.2298583984375, 117.95106506347656, 124.67227935791016, 131.39349365234375, 138.1147003173828, 144.83590698242188, 151.55712890625, 158.27833557128906, 164.9995574951172, 171.72076416015625, 178.44198608398438, 185.16319274902344, 191.8843994140625, 198.60562133789062, 205.3268280029297]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 6.0, 8.0, 8.0, 14.0, 8.0, 19.0, 17.0, 19.0, 16.0, 22.0, 28.0, 31.0, 37.0, 44.0, 38.0, 47.0, 43.0, 47.0, 46.0, 53.0, 40.0, 46.0, 36.0, 41.0, 27.0, 31.0, 31.0, 20.0, 27.0, 24.0, 18.0, 16.0, 20.0, 9.0, 12.0, 9.0, 6.0, 8.0, 4.0, 2.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.90000915527344, -89.84323120117188, -86.78644561767578, -83.72966766357422, -80.67288208007812, -77.61610412597656, -74.55931854248047, -71.5025405883789, -68.44575500488281, -65.38897705078125, -62.332191467285156, -59.27540969848633, -56.2186279296875, -53.16184616088867, -50.105064392089844, -47.04828643798828, -43.99150466918945, -40.934722900390625, -37.8779411315918, -34.82115936279297, -31.76437759399414, -28.707595825195312, -25.650815963745117, -22.59403419494629, -19.53725242614746, -16.480470657348633, -13.423688888549805, -10.366908073425293, -7.310126304626465, -4.253344535827637, -1.196563720703125, 1.8602180480957031, 4.916999816894531, 7.973781585693359, 11.030563354492188, 14.0873441696167, 17.144126892089844, 20.200908660888672, 23.257688522338867, 26.314470291137695, 29.371252059936523, 32.42803192138672, 35.48481369018555, 38.541595458984375, 41.5983772277832, 44.65515899658203, 47.71194076538086, 50.76872253417969, 53.825504302978516, 56.882286071777344, 59.93906784057617, 62.995849609375, 66.05262756347656, 69.10941314697266, 72.16619110107422, 75.22297668457031, 78.27975463867188, 81.33653259277344, 84.39331817626953, 87.4500961303711, 90.50688171386719, 93.56365966796875, 96.62044525146484, 99.6772232055664, 102.7340087890625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 9.0, 11.0, 13.0, 23.0, 25.0, 16.0, 23.0, 33.0, 30.0, 28.0, 25.0, 42.0, 38.0, 41.0, 52.0, 48.0, 41.0, 63.0, 36.0, 54.0, 41.0, 34.0, 38.0, 30.0, 23.0, 25.0, 24.0, 23.0, 10.0, 19.0, 13.0, 14.0, 11.0, 7.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.234375, -18.65576171875, -18.0771484375, -17.49853515625, -16.919921875, -16.34130859375, -15.7626953125, -15.18408203125, -14.60546875, -14.02685546875, -13.4482421875, -12.86962890625, -12.291015625, -11.71240234375, -11.1337890625, -10.55517578125, -9.9765625, -9.39794921875, -8.8193359375, -8.24072265625, -7.662109375, -7.08349609375, -6.5048828125, -5.92626953125, -5.34765625, -4.76904296875, -4.1904296875, -3.61181640625, -3.033203125, -2.45458984375, -1.8759765625, -1.29736328125, -0.71875, -0.14013671875, 0.4384765625, 1.01708984375, 1.595703125, 2.17431640625, 2.7529296875, 3.33154296875, 3.91015625, 4.48876953125, 5.0673828125, 5.64599609375, 6.224609375, 6.80322265625, 7.3818359375, 7.96044921875, 8.5390625, 9.11767578125, 9.6962890625, 10.27490234375, 10.853515625, 11.43212890625, 12.0107421875, 12.58935546875, 13.16796875, 13.74658203125, 14.3251953125, 14.90380859375, 15.482421875, 16.06103515625, 16.6396484375, 17.21826171875, 17.796875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 13.0, 5.0, 15.0, 21.0, 21.0, 36.0, 53.0, 74.0, 106.0, 144.0, 162.0, 296.0, 418.0, 633.0, 1145.0, 2125.0, 5014.0, 15315.0, 165816.0, 3441290.0, 524654.0, 24264.0, 6603.0, 2576.0, 1335.0, 703.0, 410.0, 305.0, 238.0, 128.0, 104.0, 57.0, 55.0, 27.0, 23.0, 32.0, 17.0, 8.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.40625, -57.529296875, -55.65234375, -53.775390625, -51.8984375, -50.021484375, -48.14453125, -46.267578125, -44.390625, -42.513671875, -40.63671875, -38.759765625, -36.8828125, -35.005859375, -33.12890625, -31.251953125, -29.375, -27.498046875, -25.62109375, -23.744140625, -21.8671875, -19.990234375, -18.11328125, -16.236328125, -14.359375, -12.482421875, -10.60546875, -8.728515625, -6.8515625, -4.974609375, -3.09765625, -1.220703125, 0.65625, 2.533203125, 4.41015625, 6.287109375, 8.1640625, 10.041015625, 11.91796875, 13.794921875, 15.671875, 17.548828125, 19.42578125, 21.302734375, 23.1796875, 25.056640625, 26.93359375, 28.810546875, 30.6875, 32.564453125, 34.44140625, 36.318359375, 38.1953125, 40.072265625, 41.94921875, 43.826171875, 45.703125, 47.580078125, 49.45703125, 51.333984375, 53.2109375, 55.087890625, 56.96484375, 58.841796875, 60.71875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 10.0, 12.0, 7.0, 11.0, 27.0, 14.0, 16.0, 34.0, 38.0, 49.0, 65.0, 103.0, 121.0, 197.0, 294.0, 530.0, 742.0, 619.0, 375.0, 256.0, 151.0, 90.0, 79.0, 53.0, 44.0, 29.0, 22.0, 17.0, 14.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.53125, -28.5673828125, -27.603515625, -26.6396484375, -25.67578125, -24.7119140625, -23.748046875, -22.7841796875, -21.8203125, -20.8564453125, -19.892578125, -18.9287109375, -17.96484375, -17.0009765625, -16.037109375, -15.0732421875, -14.109375, -13.1455078125, -12.181640625, -11.2177734375, -10.25390625, -9.2900390625, -8.326171875, -7.3623046875, -6.3984375, -5.4345703125, -4.470703125, -3.5068359375, -2.54296875, -1.5791015625, -0.615234375, 0.3486328125, 1.3125, 2.2763671875, 3.240234375, 4.2041015625, 5.16796875, 6.1318359375, 7.095703125, 8.0595703125, 9.0234375, 9.9873046875, 10.951171875, 11.9150390625, 12.87890625, 13.8427734375, 14.806640625, 15.7705078125, 16.734375, 17.6982421875, 18.662109375, 19.6259765625, 20.58984375, 21.5537109375, 22.517578125, 23.4814453125, 24.4453125, 25.4091796875, 26.373046875, 27.3369140625, 28.30078125, 29.2646484375, 30.228515625, 31.1923828125, 32.15625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 11.0, 16.0, 20.0, 34.0, 48.0, 73.0, 129.0, 204.0, 373.0, 763.0, 1420.0, 2985.0, 6859.0, 17269.0, 53578.0, 331777.0, 3439139.0, 264005.0, 47595.0, 15713.0, 6299.0, 2913.0, 1381.0, 715.0, 371.0, 208.0, 126.0, 70.0, 53.0, 34.0, 21.0, 21.0, 13.0, 8.0, 5.0, 1.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.96875, -49.3984375, -47.828125, -46.2578125, -44.6875, -43.1171875, -41.546875, -39.9765625, -38.40625, -36.8359375, -35.265625, -33.6953125, -32.125, -30.5546875, -28.984375, -27.4140625, -25.84375, -24.2734375, -22.703125, -21.1328125, -19.5625, -17.9921875, -16.421875, -14.8515625, -13.28125, -11.7109375, -10.140625, -8.5703125, -7.0, -5.4296875, -3.859375, -2.2890625, -0.71875, 0.8515625, 2.421875, 3.9921875, 5.5625, 7.1328125, 8.703125, 10.2734375, 11.84375, 13.4140625, 14.984375, 16.5546875, 18.125, 19.6953125, 21.265625, 22.8359375, 24.40625, 25.9765625, 27.546875, 29.1171875, 30.6875, 32.2578125, 33.828125, 35.3984375, 36.96875, 38.5390625, 40.109375, 41.6796875, 43.25, 44.8203125, 46.390625, 47.9609375, 49.53125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [7.0, 11.0, 30.0, 154.0, 541.0, 228.0, 36.0, 10.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.45288848876953, -64.00987243652344, -46.56685256958008, -29.12383270263672, -11.680816650390625, 5.762199401855469, 23.205223083496094, 40.64823913574219, 58.09125518798828, 75.53427124023438, 92.977294921875, 110.4203109741211, 127.86332702636719, 145.30633544921875, 162.74935913085938, 180.1923828125, 197.63540649414062, 215.07843017578125, 232.5214385986328, 249.96446228027344, 267.407470703125, 284.8504943847656, 302.29351806640625, 319.7365417480469, 337.1795349121094, 354.62255859375, 372.0655822753906, 389.50860595703125, 406.95159912109375, 424.3946228027344, 441.837646484375, 459.2806701660156, 476.72369384765625, 494.1667175292969, 511.6097412109375, 529.052734375, 546.4957885742188, 563.9387817382812, 581.3818359375, 598.8248291015625, 616.267822265625, 633.7108154296875, 651.1538696289062, 668.5968627929688, 686.0399169921875, 703.48291015625, 720.9259033203125, 738.3689575195312, 755.81201171875, 773.2550048828125, 790.6980590820312, 808.1410522460938, 825.5841064453125, 843.027099609375, 860.4700927734375, 877.9131469726562, 895.3561401367188, 912.7991333007812, 930.2421875, 947.6851806640625, 965.1282348632812, 982.5712280273438, 1000.0142822265625, 1017.457275390625, 1034.9002685546875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 4.0, 6.0, 8.0, 14.0, 9.0, 13.0, 17.0, 18.0, 12.0, 21.0, 19.0, 35.0, 24.0, 30.0, 47.0, 36.0, 39.0, 41.0, 38.0, 44.0, 42.0, 40.0, 37.0, 39.0, 28.0, 30.0, 31.0, 32.0, 30.0, 33.0, 28.0, 21.0, 23.0, 13.0, 18.0, 15.0, 12.0, 7.0, 11.0, 11.0, 6.0, 5.0, 2.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-104.64703369140625, -101.5959701538086, -98.54490661621094, -95.49384307861328, -92.44277954101562, -89.39170837402344, -86.34064483642578, -83.28958129882812, -80.23851776123047, -77.18745422363281, -74.13639068603516, -71.0853271484375, -68.03425598144531, -64.98319244384766, -61.93212890625, -58.881065368652344, -55.83000183105469, -52.77893829345703, -49.727874755859375, -46.67680740356445, -43.6257438659668, -40.57468032836914, -37.52361297607422, -34.47254943847656, -31.421485900878906, -28.37042236328125, -25.31935691833496, -22.268291473388672, -19.217227935791016, -16.16616439819336, -13.11509895324707, -10.064033508300781, -7.012977600097656, -3.9619131088256836, -0.9108486175537109, 2.1402158737182617, 5.191280364990234, 8.242344856262207, 11.29340934753418, 14.344474792480469, 17.395538330078125, 20.44660186767578, 23.49766731262207, 26.54873275756836, 29.599796295166016, 32.65085983276367, 35.701927185058594, 38.75299072265625, 41.804054260253906, 44.85511779785156, 47.90618133544922, 50.95724868774414, 54.0083122253418, 57.05937576293945, 60.110443115234375, 63.16150665283203, 66.21257019042969, 69.26363372802734, 72.314697265625, 75.36576080322266, 78.41682434082031, 81.4678955078125, 84.51895904541016, 87.57002258300781, 90.62108612060547]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 13.0, 7.0, 11.0, 16.0, 12.0, 21.0, 25.0, 27.0, 34.0, 27.0, 27.0, 29.0, 46.0, 47.0, 54.0, 34.0, 40.0, 43.0, 34.0, 42.0, 41.0, 45.0, 31.0, 27.0, 29.0, 35.0, 28.0, 14.0, 20.0, 18.0, 16.0, 22.0, 12.0, 13.0, 7.0, 11.0, 6.0, 5.0, 7.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0], "bins": [-16.484375, -16.031982421875, -15.57958984375, -15.127197265625, -14.6748046875, -14.222412109375, -13.77001953125, -13.317626953125, -12.865234375, -12.412841796875, -11.96044921875, -11.508056640625, -11.0556640625, -10.603271484375, -10.15087890625, -9.698486328125, -9.24609375, -8.793701171875, -8.34130859375, -7.888916015625, -7.4365234375, -6.984130859375, -6.53173828125, -6.079345703125, -5.626953125, -5.174560546875, -4.72216796875, -4.269775390625, -3.8173828125, -3.364990234375, -2.91259765625, -2.460205078125, -2.0078125, -1.555419921875, -1.10302734375, -0.650634765625, -0.1982421875, 0.254150390625, 0.70654296875, 1.158935546875, 1.611328125, 2.063720703125, 2.51611328125, 2.968505859375, 3.4208984375, 3.873291015625, 4.32568359375, 4.778076171875, 5.23046875, 5.682861328125, 6.13525390625, 6.587646484375, 7.0400390625, 7.492431640625, 7.94482421875, 8.397216796875, 8.849609375, 9.302001953125, 9.75439453125, 10.206787109375, 10.6591796875, 11.111572265625, 11.56396484375, 12.016357421875, 12.46875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 9.0, 9.0, 16.0, 23.0, 32.0, 43.0, 64.0, 69.0, 106.0, 158.0, 220.0, 336.0, 401.0, 636.0, 868.0, 1219.0, 1773.0, 2450.0, 3421.0, 4995.0, 7503.0, 10808.0, 16294.0, 25545.0, 40969.0, 68014.0, 115877.0, 190097.0, 208026.0, 135451.0, 79268.0, 47248.0, 28878.0, 18615.0, 12172.0, 8079.0, 5680.0, 3843.0, 2708.0, 1916.0, 1384.0, 975.0, 712.0, 462.0, 340.0, 242.0, 152.0, 115.0, 92.0, 74.0, 67.0, 31.0, 35.0, 18.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0], "bins": [-1.1904296875, -1.1522064208984375, -1.113983154296875, -1.0757598876953125, -1.03753662109375, -0.9993133544921875, -0.961090087890625, -0.9228668212890625, -0.8846435546875, -0.8464202880859375, -0.808197021484375, -0.7699737548828125, -0.73175048828125, -0.6935272216796875, -0.655303955078125, -0.6170806884765625, -0.578857421875, -0.5406341552734375, -0.502410888671875, -0.4641876220703125, -0.42596435546875, -0.3877410888671875, -0.349517822265625, -0.3112945556640625, -0.2730712890625, -0.2348480224609375, -0.196624755859375, -0.1584014892578125, -0.12017822265625, -0.0819549560546875, -0.043731689453125, -0.0055084228515625, 0.03271484375, 0.0709381103515625, 0.109161376953125, 0.1473846435546875, 0.18560791015625, 0.2238311767578125, 0.262054443359375, 0.3002777099609375, 0.3385009765625, 0.3767242431640625, 0.414947509765625, 0.4531707763671875, 0.49139404296875, 0.5296173095703125, 0.567840576171875, 0.6060638427734375, 0.644287109375, 0.6825103759765625, 0.720733642578125, 0.7589569091796875, 0.79718017578125, 0.8354034423828125, 0.873626708984375, 0.9118499755859375, 0.9500732421875, 0.9882965087890625, 1.026519775390625, 1.0647430419921875, 1.10296630859375, 1.1411895751953125, 1.179412841796875, 1.2176361083984375, 1.255859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 9.0, 15.0, 16.0, 16.0, 18.0, 25.0, 30.0, 19.0, 30.0, 20.0, 40.0, 29.0, 41.0, 44.0, 38.0, 35.0, 36.0, 1067.0, 32.0, 40.0, 38.0, 32.0, 35.0, 27.0, 28.0, 27.0, 31.0, 29.0, 26.0, 24.0, 18.0, 14.0, 20.0, 13.0, 6.0, 5.0, 8.0, 7.0, 4.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.61505126953125, -7.3355712890625, -7.05609130859375, -6.776611328125, -6.49713134765625, -6.2176513671875, -5.93817138671875, -5.65869140625, -5.37921142578125, -5.0997314453125, -4.82025146484375, -4.540771484375, -4.26129150390625, -3.9818115234375, -3.70233154296875, -3.4228515625, -3.14337158203125, -2.8638916015625, -2.58441162109375, -2.304931640625, -2.02545166015625, -1.7459716796875, -1.46649169921875, -1.18701171875, -0.90753173828125, -0.6280517578125, -0.34857177734375, -0.069091796875, 0.21038818359375, 0.4898681640625, 0.76934814453125, 1.048828125, 1.32830810546875, 1.6077880859375, 1.88726806640625, 2.166748046875, 2.44622802734375, 2.7257080078125, 3.00518798828125, 3.28466796875, 3.56414794921875, 3.8436279296875, 4.12310791015625, 4.402587890625, 4.68206787109375, 4.9615478515625, 5.24102783203125, 5.5205078125, 5.79998779296875, 6.0794677734375, 6.35894775390625, 6.638427734375, 6.91790771484375, 7.1973876953125, 7.47686767578125, 7.75634765625, 8.03582763671875, 8.3153076171875, 8.59478759765625, 8.874267578125, 9.15374755859375, 9.4332275390625, 9.71270751953125, 9.9921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 9.0, 12.0, 29.0, 43.0, 85.0, 86.0, 176.0, 237.0, 347.0, 554.0, 869.0, 1271.0, 1965.0, 2933.0, 4677.0, 7070.0, 11015.0, 17273.0, 27320.0, 44258.0, 75096.0, 128919.0, 991983.0, 463480.0, 125859.0, 73787.0, 43609.0, 26605.0, 16813.0, 10748.0, 6813.0, 4598.0, 3052.0, 1876.0, 1256.0, 806.0, 603.0, 323.0, 219.0, 158.0, 101.0, 59.0, 44.0, 31.0, 26.0, 7.0, 12.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-1.029296875, -0.9998703002929688, -0.9704437255859375, -0.9410171508789062, -0.911590576171875, -0.8821640014648438, -0.8527374267578125, -0.8233108520507812, -0.79388427734375, -0.7644577026367188, -0.7350311279296875, -0.7056045532226562, -0.676177978515625, -0.6467514038085938, -0.6173248291015625, -0.5878982543945312, -0.5584716796875, -0.5290451049804688, -0.4996185302734375, -0.47019195556640625, -0.440765380859375, -0.41133880615234375, -0.3819122314453125, -0.35248565673828125, -0.32305908203125, -0.29363250732421875, -0.2642059326171875, -0.23477935791015625, -0.205352783203125, -0.17592620849609375, -0.1464996337890625, -0.11707305908203125, -0.087646484375, -0.05821990966796875, -0.0287933349609375, 0.00063323974609375, 0.030059814453125, 0.05948638916015625, 0.0889129638671875, 0.11833953857421875, 0.14776611328125, 0.17719268798828125, 0.2066192626953125, 0.23604583740234375, 0.265472412109375, 0.29489898681640625, 0.3243255615234375, 0.35375213623046875, 0.3831787109375, 0.41260528564453125, 0.4420318603515625, 0.47145843505859375, 0.500885009765625, 0.5303115844726562, 0.5597381591796875, 0.5891647338867188, 0.61859130859375, 0.6480178833007812, 0.6774444580078125, 0.7068710327148438, 0.736297607421875, 0.7657241821289062, 0.7951507568359375, 0.8245773315429688, 0.85400390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 4.0, 10.0, 8.0, 9.0, 17.0, 16.0, 19.0, 29.0, 53.0, 67.0, 94.0, 121.0, 128.0, 99.0, 82.0, 65.0, 38.0, 33.0, 19.0, 13.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031494140625, -0.03055095672607422, -0.029607772827148438, -0.028664588928222656, -0.027721405029296875, -0.026778221130371094, -0.025835037231445312, -0.02489185333251953, -0.02394866943359375, -0.02300548553466797, -0.022062301635742188, -0.021119117736816406, -0.020175933837890625, -0.019232749938964844, -0.018289566040039062, -0.01734638214111328, -0.0164031982421875, -0.015460014343261719, -0.014516830444335938, -0.013573646545410156, -0.012630462646484375, -0.011687278747558594, -0.010744094848632812, -0.009800910949707031, -0.00885772705078125, -0.007914543151855469, -0.0069713592529296875, -0.006028175354003906, -0.005084991455078125, -0.004141807556152344, -0.0031986236572265625, -0.0022554397583007812, -0.001312255859375, -0.00036907196044921875, 0.0005741119384765625, 0.0015172958374023438, 0.002460479736328125, 0.0034036636352539062, 0.0043468475341796875, 0.005290031433105469, 0.00623321533203125, 0.007176399230957031, 0.008119583129882812, 0.009062767028808594, 0.010005950927734375, 0.010949134826660156, 0.011892318725585938, 0.012835502624511719, 0.0137786865234375, 0.014721870422363281, 0.015665054321289062, 0.016608238220214844, 0.017551422119140625, 0.018494606018066406, 0.019437789916992188, 0.02038097381591797, 0.02132415771484375, 0.02226734161376953, 0.023210525512695312, 0.024153709411621094, 0.025096893310546875, 0.026040077209472656, 0.026983261108398438, 0.02792644500732422, 0.02886962890625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 5.0, 5.0, 7.0, 8.0, 5.0, 11.0, 8.0, 11.0, 13.0, 21.0, 27.0, 40.0, 65.0, 120.0, 178.0, 361.0, 1271.0, 187414.0, 855840.0, 2070.0, 431.0, 218.0, 104.0, 63.0, 51.0, 48.0, 33.0, 21.0, 14.0, 17.0, 13.0, 8.0, 7.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.591796875, -0.5727615356445312, -0.5537261962890625, -0.5346908569335938, -0.515655517578125, -0.49662017822265625, -0.4775848388671875, -0.45854949951171875, -0.43951416015625, -0.42047882080078125, -0.4014434814453125, -0.38240814208984375, -0.363372802734375, -0.34433746337890625, -0.3253021240234375, -0.30626678466796875, -0.2872314453125, -0.26819610595703125, -0.2491607666015625, -0.23012542724609375, -0.211090087890625, -0.19205474853515625, -0.1730194091796875, -0.15398406982421875, -0.13494873046875, -0.11591339111328125, -0.0968780517578125, -0.07784271240234375, -0.058807373046875, -0.03977203369140625, -0.0207366943359375, -0.00170135498046875, 0.017333984375, 0.03636932373046875, 0.0554046630859375, 0.07444000244140625, 0.093475341796875, 0.11251068115234375, 0.1315460205078125, 0.15058135986328125, 0.16961669921875, 0.18865203857421875, 0.2076873779296875, 0.22672271728515625, 0.245758056640625, 0.26479339599609375, 0.2838287353515625, 0.30286407470703125, 0.3218994140625, 0.34093475341796875, 0.3599700927734375, 0.37900543212890625, 0.398040771484375, 0.41707611083984375, 0.4361114501953125, 0.45514678955078125, 0.47418212890625, 0.49321746826171875, 0.5122528076171875, 0.5312881469726562, 0.550323486328125, 0.5693588256835938, 0.5883941650390625, 0.6074295043945312, 0.62646484375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 18.0, 88.0, 633.0, 237.0, 29.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15334580838680267, -0.14595602452754974, -0.138566255569458, -0.13117647171020508, -0.12378668785095215, -0.11639690399169922, -0.10900712758302689, -0.10161735117435455, -0.09422756731510162, -0.0868377834558487, -0.07944800704717636, -0.07205823063850403, -0.0646684467792511, -0.05727866664528847, -0.049888886511325836, -0.042499106377363205, -0.035109326243400574, -0.027719546109437943, -0.02032976597547531, -0.01293998584151268, -0.005550205707550049, 0.0018395744264125824, 0.009229354560375214, 0.016619134694337845, 0.024008914828300476, 0.03139869496226311, 0.03878847509622574, 0.04617825523018837, 0.053568035364151, 0.06095781549811363, 0.06834759563207626, 0.0757373720407486, 0.08312717080116272, 0.09051695466041565, 0.09790673106908798, 0.10529650747776031, 0.11268629133701324, 0.12007607519626617, 0.1274658441543579, 0.13485562801361084, 0.14224541187286377, 0.1496351957321167, 0.15702497959136963, 0.16441474854946136, 0.1718045324087143, 0.17919431626796722, 0.18658408522605896, 0.1939738690853119, 0.20136365294456482, 0.20875343680381775, 0.21614322066307068, 0.22353298962116241, 0.23092277348041534, 0.23831255733966827, 0.24570232629776, 0.25309211015701294, 0.26048189401626587, 0.2678716778755188, 0.27526146173477173, 0.28265124559402466, 0.2900410294532776, 0.29743078351020813, 0.30482056736946106, 0.312210351228714, 0.3196001350879669]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 5.0, 11.0, 5.0, 9.0, 11.0, 15.0, 20.0, 14.0, 17.0, 23.0, 25.0, 32.0, 30.0, 37.0, 40.0, 47.0, 53.0, 50.0, 32.0, 50.0, 36.0, 35.0, 45.0, 44.0, 38.0, 31.0, 28.0, 32.0, 34.0, 30.0, 19.0, 15.0, 15.0, 19.0, 13.0, 9.0, 4.0, 11.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.03445249795913696, -0.033480700105428696, -0.03250890225172043, -0.03153710812330246, -0.030565310269594193, -0.029593512415885925, -0.028621716424822807, -0.02764992043375969, -0.026678122580051422, -0.025706324726343155, -0.024734528735280037, -0.02376273274421692, -0.02279093489050865, -0.021819137036800385, -0.020847341045737267, -0.01987554505467415, -0.01890374720096588, -0.017931949347257614, -0.016960153356194496, -0.015988357365131378, -0.015016559511423111, -0.014044762589037418, -0.013072965666651726, -0.012101168744266033, -0.01112937182188034, -0.010157574899494648, -0.009185777977108955, -0.008213981054723263, -0.00724218413233757, -0.006270387209951878, -0.005298590287566185, -0.004326793365180492, -0.0033549964427948, -0.002383199520409107, -0.0014114025980234146, -0.000439605675637722, 0.0005321912467479706, 0.0015039881691336632, 0.0024757850915193558, 0.0034475820139050484, 0.004419378936290741, 0.0053911758586764336, 0.006362972781062126, 0.007334769703447819, 0.008306566625833511, 0.009278363548219204, 0.010250160470604897, 0.01122195739299059, 0.012193754315376282, 0.013165551237761974, 0.014137348160147667, 0.01510914508253336, 0.016080942004919052, 0.01705273985862732, 0.018024535849690437, 0.018996331840753555, 0.019968129694461823, 0.02093992754817009, 0.021911723539233208, 0.022883519530296326, 0.023855317384004593, 0.02482711523771286, 0.025798911228775978, 0.026770707219839096, 0.027742505073547363]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 13.0, 7.0, 11.0, 16.0, 12.0, 21.0, 25.0, 28.0, 35.0, 25.0, 29.0, 28.0, 46.0, 47.0, 54.0, 33.0, 40.0, 43.0, 34.0, 42.0, 41.0, 46.0, 30.0, 27.0, 29.0, 36.0, 27.0, 14.0, 20.0, 18.0, 16.0, 22.0, 12.0, 13.0, 7.0, 11.0, 6.0, 5.0, 7.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0], "bins": [-16.46875, -16.0166015625, -15.564453125, -15.1123046875, -14.66015625, -14.2080078125, -13.755859375, -13.3037109375, -12.8515625, -12.3994140625, -11.947265625, -11.4951171875, -11.04296875, -10.5908203125, -10.138671875, -9.6865234375, -9.234375, -8.7822265625, -8.330078125, -7.8779296875, -7.42578125, -6.9736328125, -6.521484375, -6.0693359375, -5.6171875, -5.1650390625, -4.712890625, -4.2607421875, -3.80859375, -3.3564453125, -2.904296875, -2.4521484375, -2.0, -1.5478515625, -1.095703125, -0.6435546875, -0.19140625, 0.2607421875, 0.712890625, 1.1650390625, 1.6171875, 2.0693359375, 2.521484375, 2.9736328125, 3.42578125, 3.8779296875, 4.330078125, 4.7822265625, 5.234375, 5.6865234375, 6.138671875, 6.5908203125, 7.04296875, 7.4951171875, 7.947265625, 8.3994140625, 8.8515625, 9.3037109375, 9.755859375, 10.2080078125, 10.66015625, 11.1123046875, 11.564453125, 12.0166015625, 12.46875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 4.0, 13.0, 17.0, 23.0, 19.0, 39.0, 44.0, 70.0, 106.0, 162.0, 163.0, 290.0, 403.0, 596.0, 922.0, 1416.0, 2101.0, 3629.0, 6746.0, 16619.0, 97672.0, 787589.0, 96610.0, 16574.0, 6632.0, 3565.0, 2215.0, 1434.0, 919.0, 602.0, 418.0, 264.0, 198.0, 136.0, 101.0, 66.0, 38.0, 33.0, 22.0, 29.0, 15.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.47998046875, -33.1787109375, -31.87744140625, -30.576171875, -29.27490234375, -27.9736328125, -26.67236328125, -25.37109375, -24.06982421875, -22.7685546875, -21.46728515625, -20.166015625, -18.86474609375, -17.5634765625, -16.26220703125, -14.9609375, -13.65966796875, -12.3583984375, -11.05712890625, -9.755859375, -8.45458984375, -7.1533203125, -5.85205078125, -4.55078125, -3.24951171875, -1.9482421875, -0.64697265625, 0.654296875, 1.95556640625, 3.2568359375, 4.55810546875, 5.859375, 7.16064453125, 8.4619140625, 9.76318359375, 11.064453125, 12.36572265625, 13.6669921875, 14.96826171875, 16.26953125, 17.57080078125, 18.8720703125, 20.17333984375, 21.474609375, 22.77587890625, 24.0771484375, 25.37841796875, 26.6796875, 27.98095703125, 29.2822265625, 30.58349609375, 31.884765625, 33.18603515625, 34.4873046875, 35.78857421875, 37.08984375, 38.39111328125, 39.6923828125, 40.99365234375, 42.294921875, 43.59619140625, 44.8974609375, 46.19873046875, 47.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 10.0, 5.0, 19.0, 14.0, 19.0, 19.0, 29.0, 29.0, 34.0, 42.0, 54.0, 61.0, 63.0, 98.0, 142.0, 367.0, 1395.0, 132.0, 81.0, 59.0, 72.0, 46.0, 43.0, 40.0, 30.0, 17.0, 22.0, 22.0, 11.0, 11.0, 5.0, 8.0, 1.0, 5.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.303955078125, -29.32666015625, -28.349365234375, -27.3720703125, -26.394775390625, -25.41748046875, -24.440185546875, -23.462890625, -22.485595703125, -21.50830078125, -20.531005859375, -19.5537109375, -18.576416015625, -17.59912109375, -16.621826171875, -15.64453125, -14.667236328125, -13.68994140625, -12.712646484375, -11.7353515625, -10.758056640625, -9.78076171875, -8.803466796875, -7.826171875, -6.848876953125, -5.87158203125, -4.894287109375, -3.9169921875, -2.939697265625, -1.96240234375, -0.985107421875, -0.0078125, 0.969482421875, 1.94677734375, 2.924072265625, 3.9013671875, 4.878662109375, 5.85595703125, 6.833251953125, 7.810546875, 8.787841796875, 9.76513671875, 10.742431640625, 11.7197265625, 12.697021484375, 13.67431640625, 14.651611328125, 15.62890625, 16.606201171875, 17.58349609375, 18.560791015625, 19.5380859375, 20.515380859375, 21.49267578125, 22.469970703125, 23.447265625, 24.424560546875, 25.40185546875, 26.379150390625, 27.3564453125, 28.333740234375, 29.31103515625, 30.288330078125, 31.265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 1.0, 2.0, 14.0, 5.0, 13.0, 20.0, 35.0, 58.0, 55.0, 90.0, 137.0, 300.0, 739.0, 3143.0, 3055820.0, 82441.0, 1569.0, 564.0, 261.0, 138.0, 85.0, 53.0, 44.0, 25.0, 21.0, 16.0, 9.0, 8.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.75, -128.943359375, -124.13671875, -119.330078125, -114.5234375, -109.716796875, -104.91015625, -100.103515625, -95.296875, -90.490234375, -85.68359375, -80.876953125, -76.0703125, -71.263671875, -66.45703125, -61.650390625, -56.84375, -52.037109375, -47.23046875, -42.423828125, -37.6171875, -32.810546875, -28.00390625, -23.197265625, -18.390625, -13.583984375, -8.77734375, -3.970703125, 0.8359375, 5.642578125, 10.44921875, 15.255859375, 20.0625, 24.869140625, 29.67578125, 34.482421875, 39.2890625, 44.095703125, 48.90234375, 53.708984375, 58.515625, 63.322265625, 68.12890625, 72.935546875, 77.7421875, 82.548828125, 87.35546875, 92.162109375, 96.96875, 101.775390625, 106.58203125, 111.388671875, 116.1953125, 121.001953125, 125.80859375, 130.615234375, 135.421875, 140.228515625, 145.03515625, 149.841796875, 154.6484375, 159.455078125, 164.26171875, 169.068359375, 173.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 21.0, 32.0, 70.0, 208.0, 307.0, 224.0, 83.0, 37.0, 15.0, 4.0, 7.0], "bins": [-392.7497253417969, -385.93365478515625, -379.11761474609375, -372.3015441894531, -365.4854736328125, -358.66943359375, -351.8533630371094, -345.03729248046875, -338.22125244140625, -331.4051818847656, -324.5891418457031, -317.7730712890625, -310.9570007324219, -304.1409606933594, -297.32489013671875, -290.50885009765625, -283.6927795410156, -276.876708984375, -270.0606689453125, -263.2445983886719, -256.42852783203125, -249.61248779296875, -242.79641723632812, -235.98036193847656, -229.16429138183594, -222.34823608398438, -215.53216552734375, -208.7161102294922, -201.90005493164062, -195.083984375, -188.26792907714844, -181.45187377929688, -174.63580322265625, -167.8197479248047, -161.00367736816406, -154.1876220703125, -147.37156677246094, -140.55551147460938, -133.73944091796875, -126.92338562011719, -120.10733032226562, -113.29126739501953, -106.47521209716797, -99.65914916992188, -92.84309387207031, -86.02703094482422, -79.21096801757812, -72.39491271972656, -65.578857421875, -58.76279830932617, -51.946739196777344, -45.13067626953125, -38.31462097167969, -31.498558044433594, -24.682498931884766, -17.866439819335938, -11.050376892089844, -4.234317302703857, 2.581742286682129, 9.397802352905273, 16.2138614654541, 23.029922485351562, 29.84598159790039, 36.66204071044922, 43.47809982299805]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 11.0, 20.0, 17.0, 16.0, 13.0, 19.0, 24.0, 30.0, 29.0, 39.0, 32.0, 39.0, 43.0, 32.0, 46.0, 41.0, 42.0, 38.0, 49.0, 38.0, 43.0, 45.0, 37.0, 26.0, 31.0, 25.0, 17.0, 17.0, 25.0, 17.0, 11.0, 9.0, 10.0, 11.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.37979888916016, -83.68284606933594, -80.98590087890625, -78.28894805908203, -75.59200286865234, -72.89505004882812, -70.19810485839844, -67.50115203857422, -64.80419921875, -62.10725021362305, -59.410301208496094, -56.713348388671875, -54.01640319824219, -51.31945037841797, -48.622501373291016, -45.92555236816406, -43.228607177734375, -40.53165817260742, -37.83470916748047, -35.13775634765625, -32.44081115722656, -29.743860244750977, -27.04690933227539, -24.349960327148438, -21.653011322021484, -18.95606231689453, -16.259113311767578, -13.562162399291992, -10.865213394165039, -8.168264389038086, -5.4713134765625, -2.774364471435547, -0.077423095703125, 2.6195263862609863, 5.316475868225098, 8.013425827026367, 10.71037483215332, 13.407323837280273, 16.10427474975586, 18.801223754882812, 21.498172760009766, 24.19512176513672, 26.892070770263672, 29.589021682739258, 32.285972595214844, 34.98291778564453, 37.67987060546875, 40.3768196105957, 43.073768615722656, 45.77071762084961, 48.46766662597656, 51.16461944580078, 53.86156463623047, 56.55851745605469, 59.25546646118164, 61.952415466308594, 64.64936828613281, 67.34632110595703, 70.04326629638672, 72.74021911621094, 75.43716430664062, 78.13411712646484, 80.83106994628906, 83.52801513671875, 86.22496032714844]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 11.0, 15.0, 26.0, 19.0, 13.0, 22.0, 25.0, 29.0, 35.0, 43.0, 33.0, 31.0, 39.0, 42.0, 44.0, 35.0, 55.0, 37.0, 47.0, 51.0, 32.0, 33.0, 31.0, 30.0, 24.0, 28.0, 26.0, 27.0, 24.0, 19.0, 17.0, 5.0, 6.0, 8.0, 4.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.5501708984375, -15.053466796875, -14.5567626953125, -14.06005859375, -13.5633544921875, -13.066650390625, -12.5699462890625, -12.0732421875, -11.5765380859375, -11.079833984375, -10.5831298828125, -10.08642578125, -9.5897216796875, -9.093017578125, -8.5963134765625, -8.099609375, -7.6029052734375, -7.106201171875, -6.6094970703125, -6.11279296875, -5.6160888671875, -5.119384765625, -4.6226806640625, -4.1259765625, -3.6292724609375, -3.132568359375, -2.6358642578125, -2.13916015625, -1.6424560546875, -1.145751953125, -0.6490478515625, -0.15234375, 0.3443603515625, 0.841064453125, 1.3377685546875, 1.83447265625, 2.3311767578125, 2.827880859375, 3.3245849609375, 3.8212890625, 4.3179931640625, 4.814697265625, 5.3114013671875, 5.80810546875, 6.3048095703125, 6.801513671875, 7.2982177734375, 7.794921875, 8.2916259765625, 8.788330078125, 9.2850341796875, 9.78173828125, 10.2784423828125, 10.775146484375, 11.2718505859375, 11.7685546875, 12.2652587890625, 12.761962890625, 13.2586669921875, 13.75537109375, 14.2520751953125, 14.748779296875, 15.2454833984375, 15.7421875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 10.0, 8.0, 18.0, 20.0, 15.0, 33.0, 38.0, 31.0, 60.0, 64.0, 97.0, 113.0, 153.0, 192.0, 290.0, 424.0, 725.0, 1456.0, 4214.0, 35970.0, 3367529.0, 765848.0, 11419.0, 2571.0, 1054.0, 583.0, 354.0, 240.0, 178.0, 133.0, 92.0, 88.0, 43.0, 46.0, 36.0, 30.0, 30.0, 5.0, 13.0, 14.0, 6.0, 10.0, 6.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-73.625, -71.380859375, -69.13671875, -66.892578125, -64.6484375, -62.404296875, -60.16015625, -57.916015625, -55.671875, -53.427734375, -51.18359375, -48.939453125, -46.6953125, -44.451171875, -42.20703125, -39.962890625, -37.71875, -35.474609375, -33.23046875, -30.986328125, -28.7421875, -26.498046875, -24.25390625, -22.009765625, -19.765625, -17.521484375, -15.27734375, -13.033203125, -10.7890625, -8.544921875, -6.30078125, -4.056640625, -1.8125, 0.431640625, 2.67578125, 4.919921875, 7.1640625, 9.408203125, 11.65234375, 13.896484375, 16.140625, 18.384765625, 20.62890625, 22.873046875, 25.1171875, 27.361328125, 29.60546875, 31.849609375, 34.09375, 36.337890625, 38.58203125, 40.826171875, 43.0703125, 45.314453125, 47.55859375, 49.802734375, 52.046875, 54.291015625, 56.53515625, 58.779296875, 61.0234375, 63.267578125, 65.51171875, 67.755859375, 70.0]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 13.0, 24.0, 34.0, 66.0, 101.0, 182.0, 302.0, 579.0, 1024.0, 740.0, 417.0, 222.0, 122.0, 78.0, 51.0, 32.0, 23.0, 13.0, 9.0, 3.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.54638671875, -39.3427734375, -38.13916015625, -36.935546875, -35.73193359375, -34.5283203125, -33.32470703125, -32.12109375, -30.91748046875, -29.7138671875, -28.51025390625, -27.306640625, -26.10302734375, -24.8994140625, -23.69580078125, -22.4921875, -21.28857421875, -20.0849609375, -18.88134765625, -17.677734375, -16.47412109375, -15.2705078125, -14.06689453125, -12.86328125, -11.65966796875, -10.4560546875, -9.25244140625, -8.048828125, -6.84521484375, -5.6416015625, -4.43798828125, -3.234375, -2.03076171875, -0.8271484375, 0.37646484375, 1.580078125, 2.78369140625, 3.9873046875, 5.19091796875, 6.39453125, 7.59814453125, 8.8017578125, 10.00537109375, 11.208984375, 12.41259765625, 13.6162109375, 14.81982421875, 16.0234375, 17.22705078125, 18.4306640625, 19.63427734375, 20.837890625, 22.04150390625, 23.2451171875, 24.44873046875, 25.65234375, 26.85595703125, 28.0595703125, 29.26318359375, 30.466796875, 31.67041015625, 32.8740234375, 34.07763671875, 35.28125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 8.0, 14.0, 21.0, 45.0, 69.0, 100.0, 224.0, 544.0, 1699.0, 8714.0, 174263.0, 3954268.0, 47831.0, 4588.0, 1149.0, 368.0, 164.0, 77.0, 51.0, 26.0, 13.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5, -80.6533203125, -77.806640625, -74.9599609375, -72.11328125, -69.2666015625, -66.419921875, -63.5732421875, -60.7265625, -57.8798828125, -55.033203125, -52.1865234375, -49.33984375, -46.4931640625, -43.646484375, -40.7998046875, -37.953125, -35.1064453125, -32.259765625, -29.4130859375, -26.56640625, -23.7197265625, -20.873046875, -18.0263671875, -15.1796875, -12.3330078125, -9.486328125, -6.6396484375, -3.79296875, -0.9462890625, 1.900390625, 4.7470703125, 7.59375, 10.4404296875, 13.287109375, 16.1337890625, 18.98046875, 21.8271484375, 24.673828125, 27.5205078125, 30.3671875, 33.2138671875, 36.060546875, 38.9072265625, 41.75390625, 44.6005859375, 47.447265625, 50.2939453125, 53.140625, 55.9873046875, 58.833984375, 61.6806640625, 64.52734375, 67.3740234375, 70.220703125, 73.0673828125, 75.9140625, 78.7607421875, 81.607421875, 84.4541015625, 87.30078125, 90.1474609375, 92.994140625, 95.8408203125, 98.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 11.0, 266.0, 696.0, 35.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1320.40576171875, -1294.0941162109375, -1267.7823486328125, -1241.470703125, -1215.158935546875, -1188.8472900390625, -1162.5355224609375, -1136.223876953125, -1109.912109375, -1083.6004638671875, -1057.2886962890625, -1030.97705078125, -1004.665283203125, -978.3535766601562, -952.0418701171875, -925.7301635742188, -899.41845703125, -873.1067504882812, -846.7950439453125, -820.4833374023438, -794.171630859375, -767.8599243164062, -741.5482177734375, -715.2365112304688, -688.9248657226562, -662.6131591796875, -636.3014526367188, -609.98974609375, -583.6780395507812, -557.3663330078125, -531.0546264648438, -504.742919921875, -478.4312438964844, -452.1195373535156, -425.8078308105469, -399.4961242675781, -373.1844177246094, -346.87274169921875, -320.56103515625, -294.24932861328125, -267.9376220703125, -241.62591552734375, -215.314208984375, -189.00250244140625, -162.6907958984375, -136.3791046142578, -110.06739807128906, -83.75569152832031, -57.4439697265625, -31.132265090942383, -4.820560455322266, 21.49114227294922, 47.80284881591797, 74.11454772949219, 100.42625427246094, 126.73796081542969, 153.04966735839844, 179.3613739013672, 205.67308044433594, 231.98477172851562, 258.2964782714844, 284.6081848144531, 310.9198913574219, 337.2315979003906, 363.5433044433594]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 8.0, 8.0, 15.0, 16.0, 12.0, 29.0, 23.0, 24.0, 27.0, 25.0, 32.0, 40.0, 33.0, 43.0, 37.0, 44.0, 36.0, 41.0, 39.0, 48.0, 37.0, 49.0, 32.0, 43.0, 28.0, 21.0, 29.0, 26.0, 26.0, 13.0, 18.0, 16.0, 18.0, 11.0, 10.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-85.37924194335938, -82.60194396972656, -79.82464599609375, -77.04734802246094, -74.27005004882812, -71.49275207519531, -68.7154541015625, -65.93815612792969, -63.160858154296875, -60.38356018066406, -57.60626220703125, -54.82896423339844, -52.051666259765625, -49.27436828613281, -46.4970703125, -43.71977233886719, -40.942474365234375, -38.16517639160156, -35.38787841796875, -32.61058044433594, -29.833282470703125, -27.055984497070312, -24.2786865234375, -21.501388549804688, -18.724090576171875, -15.946792602539062, -13.16949462890625, -10.392196655273438, -7.614898681640625, -4.8376007080078125, -2.060302734375, 0.7169952392578125, 3.4942855834960938, 6.271583557128906, 9.048881530761719, 11.826179504394531, 14.603477478027344, 17.380775451660156, 20.15807342529297, 22.93537139892578, 25.712669372558594, 28.489967346191406, 31.26726531982422, 34.04456329345703, 36.821861267089844, 39.599159240722656, 42.37645721435547, 45.15375518798828, 47.931053161621094, 50.708351135253906, 53.48564910888672, 56.26294708251953, 59.040245056152344, 61.817543029785156, 64.59484100341797, 67.37213897705078, 70.1494369506836, 72.9267349243164, 75.70403289794922, 78.48133087158203, 81.25862884521484, 84.03592681884766, 86.81322479248047, 89.59052276611328, 92.3678207397461]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 7.0, 10.0, 6.0, 11.0, 12.0, 14.0, 12.0, 20.0, 18.0, 21.0, 22.0, 14.0, 21.0, 39.0, 38.0, 37.0, 29.0, 36.0, 39.0, 36.0, 46.0, 39.0, 33.0, 22.0, 36.0, 35.0, 30.0, 22.0, 30.0, 35.0, 31.0, 16.0, 24.0, 24.0, 15.0, 17.0, 19.0, 8.0, 10.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.5, -11.15380859375, -10.8076171875, -10.46142578125, -10.115234375, -9.76904296875, -9.4228515625, -9.07666015625, -8.73046875, -8.38427734375, -8.0380859375, -7.69189453125, -7.345703125, -6.99951171875, -6.6533203125, -6.30712890625, -5.9609375, -5.61474609375, -5.2685546875, -4.92236328125, -4.576171875, -4.22998046875, -3.8837890625, -3.53759765625, -3.19140625, -2.84521484375, -2.4990234375, -2.15283203125, -1.806640625, -1.46044921875, -1.1142578125, -0.76806640625, -0.421875, -0.07568359375, 0.2705078125, 0.61669921875, 0.962890625, 1.30908203125, 1.6552734375, 2.00146484375, 2.34765625, 2.69384765625, 3.0400390625, 3.38623046875, 3.732421875, 4.07861328125, 4.4248046875, 4.77099609375, 5.1171875, 5.46337890625, 5.8095703125, 6.15576171875, 6.501953125, 6.84814453125, 7.1943359375, 7.54052734375, 7.88671875, 8.23291015625, 8.5791015625, 8.92529296875, 9.271484375, 9.61767578125, 9.9638671875, 10.31005859375, 10.65625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 5.0, 17.0, 19.0, 33.0, 37.0, 64.0, 59.0, 118.0, 162.0, 236.0, 345.0, 575.0, 768.0, 1061.0, 1571.0, 2426.0, 3478.0, 5184.0, 7708.0, 11616.0, 17659.0, 27557.0, 43728.0, 72365.0, 123112.0, 199415.0, 201466.0, 126433.0, 74051.0, 44815.0, 27941.0, 18318.0, 11786.0, 7727.0, 5460.0, 3555.0, 2446.0, 1709.0, 1075.0, 745.0, 520.0, 388.0, 227.0, 192.0, 139.0, 85.0, 54.0, 35.0, 21.0, 15.0, 13.0, 9.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9560546875, -0.9262008666992188, -0.8963470458984375, -0.8664932250976562, -0.836639404296875, -0.8067855834960938, -0.7769317626953125, -0.7470779418945312, -0.71722412109375, -0.6873703002929688, -0.6575164794921875, -0.6276626586914062, -0.597808837890625, -0.5679550170898438, -0.5381011962890625, -0.5082473754882812, -0.4783935546875, -0.44853973388671875, -0.4186859130859375, -0.38883209228515625, -0.358978271484375, -0.32912445068359375, -0.2992706298828125, -0.26941680908203125, -0.23956298828125, -0.20970916748046875, -0.1798553466796875, -0.15000152587890625, -0.120147705078125, -0.09029388427734375, -0.0604400634765625, -0.03058624267578125, -0.000732421875, 0.02912139892578125, 0.0589752197265625, 0.08882904052734375, 0.118682861328125, 0.14853668212890625, 0.1783905029296875, 0.20824432373046875, 0.23809814453125, 0.26795196533203125, 0.2978057861328125, 0.32765960693359375, 0.357513427734375, 0.38736724853515625, 0.4172210693359375, 0.44707489013671875, 0.4769287109375, 0.5067825317382812, 0.5366363525390625, 0.5664901733398438, 0.596343994140625, 0.6261978149414062, 0.6560516357421875, 0.6859054565429688, 0.71575927734375, 0.7456130981445312, 0.7754669189453125, 0.8053207397460938, 0.835174560546875, 0.8650283813476562, 0.8948822021484375, 0.9247360229492188, 0.95458984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 5.0, 6.0, 17.0, 12.0, 12.0, 17.0, 15.0, 30.0, 30.0, 37.0, 34.0, 35.0, 24.0, 26.0, 49.0, 37.0, 50.0, 40.0, 1063.0, 42.0, 50.0, 40.0, 20.0, 35.0, 36.0, 30.0, 23.0, 22.0, 29.0, 20.0, 18.0, 20.0, 17.0, 13.0, 10.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.07720947265625, -7.8262939453125, -7.57537841796875, -7.324462890625, -7.07354736328125, -6.8226318359375, -6.57171630859375, -6.32080078125, -6.06988525390625, -5.8189697265625, -5.56805419921875, -5.317138671875, -5.06622314453125, -4.8153076171875, -4.56439208984375, -4.3134765625, -4.06256103515625, -3.8116455078125, -3.56072998046875, -3.309814453125, -3.05889892578125, -2.8079833984375, -2.55706787109375, -2.30615234375, -2.05523681640625, -1.8043212890625, -1.55340576171875, -1.302490234375, -1.05157470703125, -0.8006591796875, -0.54974365234375, -0.298828125, -0.04791259765625, 0.2030029296875, 0.45391845703125, 0.704833984375, 0.95574951171875, 1.2066650390625, 1.45758056640625, 1.70849609375, 1.95941162109375, 2.2103271484375, 2.46124267578125, 2.712158203125, 2.96307373046875, 3.2139892578125, 3.46490478515625, 3.7158203125, 3.96673583984375, 4.2176513671875, 4.46856689453125, 4.719482421875, 4.97039794921875, 5.2213134765625, 5.47222900390625, 5.72314453125, 5.97406005859375, 6.2249755859375, 6.47589111328125, 6.726806640625, 6.97772216796875, 7.2286376953125, 7.47955322265625, 7.73046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 17.0, 24.0, 38.0, 53.0, 86.0, 160.0, 204.0, 325.0, 407.0, 739.0, 1075.0, 1566.0, 2420.0, 3554.0, 5319.0, 8284.0, 12411.0, 18667.0, 29423.0, 47370.0, 80212.0, 137386.0, 1251425.0, 200020.0, 114381.0, 66735.0, 41130.0, 25567.0, 16204.0, 10771.0, 7063.0, 4578.0, 3190.0, 2105.0, 1461.0, 925.0, 615.0, 447.0, 276.0, 158.0, 119.0, 76.0, 44.0, 37.0, 18.0, 11.0, 8.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.714813232421875, -0.69085693359375, -0.666900634765625, -0.6429443359375, -0.618988037109375, -0.59503173828125, -0.571075439453125, -0.547119140625, -0.523162841796875, -0.49920654296875, -0.475250244140625, -0.4512939453125, -0.427337646484375, -0.40338134765625, -0.379425048828125, -0.35546875, -0.331512451171875, -0.30755615234375, -0.283599853515625, -0.2596435546875, -0.235687255859375, -0.21173095703125, -0.187774658203125, -0.163818359375, -0.139862060546875, -0.11590576171875, -0.091949462890625, -0.0679931640625, -0.044036865234375, -0.02008056640625, 0.003875732421875, 0.02783203125, 0.051788330078125, 0.07574462890625, 0.099700927734375, 0.1236572265625, 0.147613525390625, 0.17156982421875, 0.195526123046875, 0.219482421875, 0.243438720703125, 0.26739501953125, 0.291351318359375, 0.3153076171875, 0.339263916015625, 0.36322021484375, 0.387176513671875, 0.4111328125, 0.435089111328125, 0.45904541015625, 0.483001708984375, 0.5069580078125, 0.530914306640625, 0.55487060546875, 0.578826904296875, 0.602783203125, 0.626739501953125, 0.65069580078125, 0.674652099609375, 0.6986083984375, 0.722564697265625, 0.74652099609375, 0.770477294921875, 0.79443359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 14.0, 10.0, 23.0, 18.0, 55.0, 108.0, 206.0, 273.0, 111.0, 66.0, 32.0, 15.0, 13.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033782958984375, -0.032663822174072266, -0.03154468536376953, -0.030425548553466797, -0.029306411743164062, -0.028187274932861328, -0.027068138122558594, -0.02594900131225586, -0.024829864501953125, -0.02371072769165039, -0.022591590881347656, -0.021472454071044922, -0.020353317260742188, -0.019234180450439453, -0.01811504364013672, -0.016995906829833984, -0.01587677001953125, -0.014757633209228516, -0.013638496398925781, -0.012519359588623047, -0.011400222778320312, -0.010281085968017578, -0.009161949157714844, -0.00804281234741211, -0.006923675537109375, -0.005804538726806641, -0.004685401916503906, -0.003566265106201172, -0.0024471282958984375, -0.0013279914855957031, -0.00020885467529296875, 0.0009102821350097656, 0.0020294189453125, 0.0031485557556152344, 0.004267692565917969, 0.005386829376220703, 0.0065059661865234375, 0.007625102996826172, 0.008744239807128906, 0.00986337661743164, 0.010982513427734375, 0.01210165023803711, 0.013220787048339844, 0.014339923858642578, 0.015459060668945312, 0.016578197479248047, 0.01769733428955078, 0.018816471099853516, 0.01993560791015625, 0.021054744720458984, 0.02217388153076172, 0.023293018341064453, 0.024412155151367188, 0.025531291961669922, 0.026650428771972656, 0.02776956558227539, 0.028888702392578125, 0.03000783920288086, 0.031126976013183594, 0.03224611282348633, 0.03336524963378906, 0.0344843864440918, 0.03560352325439453, 0.036722660064697266, 0.037841796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 3.0, 6.0, 14.0, 20.0, 21.0, 33.0, 55.0, 114.0, 267.0, 1041.0, 1030052.0, 15914.0, 497.0, 197.0, 90.0, 62.0, 41.0, 24.0, 20.0, 11.0, 6.0, 12.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.744140625, -0.7221145629882812, -0.7000885009765625, -0.6780624389648438, -0.656036376953125, -0.6340103149414062, -0.6119842529296875, -0.5899581909179688, -0.56793212890625, -0.5459060668945312, -0.5238800048828125, -0.5018539428710938, -0.479827880859375, -0.45780181884765625, -0.4357757568359375, -0.41374969482421875, -0.3917236328125, -0.36969757080078125, -0.3476715087890625, -0.32564544677734375, -0.303619384765625, -0.28159332275390625, -0.2595672607421875, -0.23754119873046875, -0.21551513671875, -0.19348907470703125, -0.1714630126953125, -0.14943695068359375, -0.127410888671875, -0.10538482666015625, -0.0833587646484375, -0.06133270263671875, -0.039306640625, -0.01728057861328125, 0.0047454833984375, 0.02677154541015625, 0.048797607421875, 0.07082366943359375, 0.0928497314453125, 0.11487579345703125, 0.13690185546875, 0.15892791748046875, 0.1809539794921875, 0.20298004150390625, 0.225006103515625, 0.24703216552734375, 0.2690582275390625, 0.29108428955078125, 0.3131103515625, 0.33513641357421875, 0.3571624755859375, 0.37918853759765625, 0.401214599609375, 0.42324066162109375, 0.4452667236328125, 0.46729278564453125, 0.48931884765625, 0.5113449096679688, 0.5333709716796875, 0.5553970336914062, 0.577423095703125, 0.5994491577148438, 0.6214752197265625, 0.6435012817382812, 0.66552734375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 1000.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177730530500412, -0.16547609865665436, -0.15322166681289673, -0.1409672349691391, -0.12871280312538147, -0.11645837128162384, -0.10420393943786621, -0.09194950759410858, -0.07969507575035095, -0.06744064390659332, -0.05518621206283569, -0.042931780219078064, -0.030677348375320435, -0.018422916531562805, -0.006168484687805176, 0.006085947155952454, 0.018340378999710083, 0.030594810843467712, 0.04284924268722534, 0.05510367453098297, 0.0673581063747406, 0.07961253821849823, 0.09186697006225586, 0.10412140190601349, 0.11637583374977112, 0.12863026559352875, 0.14088469743728638, 0.153139129281044, 0.16539356112480164, 0.17764799296855927, 0.1899024248123169, 0.20215685665607452, 0.21441125869750977, 0.2266656905412674, 0.23892012238502502, 0.25117456912994385, 0.2634289860725403, 0.2756834030151367, 0.28793784976005554, 0.30019229650497437, 0.3124467134475708, 0.32470113039016724, 0.33695557713508606, 0.3492100238800049, 0.3614644408226013, 0.37371885776519775, 0.3859733045101166, 0.3982277512550354, 0.41048216819763184, 0.42273658514022827, 0.4349910318851471, 0.4472454786300659, 0.45949989557266235, 0.4717543125152588, 0.4840087592601776, 0.49626320600509644, 0.5085176229476929, 0.5207720398902893, 0.5330264568328857, 0.545280933380127, 0.5575353503227234, 0.5697897672653198, 0.582044243812561, 0.5942986607551575, 0.6065530776977539]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 19.0, 31.0, 33.0, 59.0, 68.0, 67.0, 68.0, 71.0, 91.0, 64.0, 71.0, 75.0, 60.0, 41.0, 47.0, 32.0, 25.0, 21.0, 12.0, 10.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027426540851593018, -0.026311088353395462, -0.025195635855197906, -0.02408018335700035, -0.022964730858802795, -0.02184927836060524, -0.020733825862407684, -0.01961837336421013, -0.018502920866012573, -0.017387468367815018, -0.016272015869617462, -0.015156563371419907, -0.014041110873222351, -0.012925658375024796, -0.01181020587682724, -0.010694753378629684, -0.009579300880432129, -0.008463848382234573, -0.007348395884037018, -0.006232943385839462, -0.005117490887641907, -0.004002038389444351, -0.0028865858912467957, -0.0017711333930492401, -0.0006556808948516846, 0.00045977160334587097, 0.0015752241015434265, 0.002690676599740982, 0.0038061290979385376, 0.004921581596136093, 0.006037034094333649, 0.007152486592531204, 0.00826793909072876, 0.009383391588926315, 0.01049884408712387, 0.011614296585321426, 0.012729749083518982, 0.013845201581716537, 0.014960654079914093, 0.01607610657811165, 0.017191559076309204, 0.01830701157450676, 0.019422464072704315, 0.02053791657090187, 0.021653369069099426, 0.022768821567296982, 0.023884274065494537, 0.024999726563692093, 0.02611517906188965, 0.027230631560087204, 0.02834608405828476, 0.029461536556482315, 0.03057698905467987, 0.031692441552877426, 0.03280789405107498, 0.03392334654927254, 0.03503879904747009, 0.03615425154566765, 0.037269704043865204, 0.03838515654206276, 0.039500609040260315, 0.04061606153845787, 0.041731514036655426, 0.04284696653485298, 0.04396241903305054]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 7.0, 10.0, 6.0, 11.0, 12.0, 14.0, 12.0, 20.0, 17.0, 22.0, 22.0, 14.0, 19.0, 41.0, 38.0, 36.0, 30.0, 35.0, 39.0, 36.0, 47.0, 38.0, 34.0, 22.0, 35.0, 36.0, 30.0, 22.0, 29.0, 36.0, 31.0, 15.0, 25.0, 24.0, 15.0, 17.0, 19.0, 8.0, 10.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.5078125, -11.1614990234375, -10.815185546875, -10.4688720703125, -10.12255859375, -9.7762451171875, -9.429931640625, -9.0836181640625, -8.7373046875, -8.3909912109375, -8.044677734375, -7.6983642578125, -7.35205078125, -7.0057373046875, -6.659423828125, -6.3131103515625, -5.966796875, -5.6204833984375, -5.274169921875, -4.9278564453125, -4.58154296875, -4.2352294921875, -3.888916015625, -3.5426025390625, -3.1962890625, -2.8499755859375, -2.503662109375, -2.1573486328125, -1.81103515625, -1.4647216796875, -1.118408203125, -0.7720947265625, -0.42578125, -0.0794677734375, 0.266845703125, 0.6131591796875, 0.95947265625, 1.3057861328125, 1.652099609375, 1.9984130859375, 2.3447265625, 2.6910400390625, 3.037353515625, 3.3836669921875, 3.72998046875, 4.0762939453125, 4.422607421875, 4.7689208984375, 5.115234375, 5.4615478515625, 5.807861328125, 6.1541748046875, 6.50048828125, 6.8468017578125, 7.193115234375, 7.5394287109375, 7.8857421875, 8.2320556640625, 8.578369140625, 8.9246826171875, 9.27099609375, 9.6173095703125, 9.963623046875, 10.3099365234375, 10.65625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 5.0, 8.0, 13.0, 13.0, 23.0, 30.0, 30.0, 42.0, 50.0, 75.0, 105.0, 123.0, 164.0, 205.0, 326.0, 389.0, 670.0, 944.0, 1500.0, 2559.0, 5138.0, 12417.0, 43865.0, 252024.0, 592589.0, 95843.0, 22281.0, 7774.0, 3511.0, 1981.0, 1140.0, 752.0, 534.0, 376.0, 262.0, 179.0, 140.0, 117.0, 101.0, 57.0, 45.0, 34.0, 37.0, 24.0, 19.0, 10.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-20.171875, -19.565185546875, -18.95849609375, -18.351806640625, -17.7451171875, -17.138427734375, -16.53173828125, -15.925048828125, -15.318359375, -14.711669921875, -14.10498046875, -13.498291015625, -12.8916015625, -12.284912109375, -11.67822265625, -11.071533203125, -10.46484375, -9.858154296875, -9.25146484375, -8.644775390625, -8.0380859375, -7.431396484375, -6.82470703125, -6.218017578125, -5.611328125, -5.004638671875, -4.39794921875, -3.791259765625, -3.1845703125, -2.577880859375, -1.97119140625, -1.364501953125, -0.7578125, -0.151123046875, 0.45556640625, 1.062255859375, 1.6689453125, 2.275634765625, 2.88232421875, 3.489013671875, 4.095703125, 4.702392578125, 5.30908203125, 5.915771484375, 6.5224609375, 7.129150390625, 7.73583984375, 8.342529296875, 8.94921875, 9.555908203125, 10.16259765625, 10.769287109375, 11.3759765625, 11.982666015625, 12.58935546875, 13.196044921875, 13.802734375, 14.409423828125, 15.01611328125, 15.622802734375, 16.2294921875, 16.836181640625, 17.44287109375, 18.049560546875, 18.65625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 5.0, 9.0, 6.0, 8.0, 16.0, 7.0, 17.0, 20.0, 17.0, 14.0, 36.0, 24.0, 30.0, 60.0, 47.0, 72.0, 87.0, 138.0, 1438.0, 387.0, 135.0, 87.0, 68.0, 49.0, 47.0, 26.0, 39.0, 23.0, 22.0, 16.0, 18.0, 11.0, 16.0, 9.0, 8.0, 9.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.34375, -24.468505859375, -23.59326171875, -22.718017578125, -21.8427734375, -20.967529296875, -20.09228515625, -19.217041015625, -18.341796875, -17.466552734375, -16.59130859375, -15.716064453125, -14.8408203125, -13.965576171875, -13.09033203125, -12.215087890625, -11.33984375, -10.464599609375, -9.58935546875, -8.714111328125, -7.8388671875, -6.963623046875, -6.08837890625, -5.213134765625, -4.337890625, -3.462646484375, -2.58740234375, -1.712158203125, -0.8369140625, 0.038330078125, 0.91357421875, 1.788818359375, 2.6640625, 3.539306640625, 4.41455078125, 5.289794921875, 6.1650390625, 7.040283203125, 7.91552734375, 8.790771484375, 9.666015625, 10.541259765625, 11.41650390625, 12.291748046875, 13.1669921875, 14.042236328125, 14.91748046875, 15.792724609375, 16.66796875, 17.543212890625, 18.41845703125, 19.293701171875, 20.1689453125, 21.044189453125, 21.91943359375, 22.794677734375, 23.669921875, 24.545166015625, 25.42041015625, 26.295654296875, 27.1708984375, 28.046142578125, 28.92138671875, 29.796630859375, 30.671875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 9.0, 9.0, 16.0, 19.0, 18.0, 26.0, 35.0, 34.0, 55.0, 80.0, 94.0, 157.0, 213.0, 419.0, 817.0, 2068.0, 32692.0, 3084225.0, 20926.0, 1850.0, 699.0, 418.0, 225.0, 142.0, 115.0, 65.0, 55.0, 48.0, 41.0, 20.0, 23.0, 12.0, 14.0, 15.0, 9.0, 3.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.6875, -59.89697265625, -58.1064453125, -56.31591796875, -54.525390625, -52.73486328125, -50.9443359375, -49.15380859375, -47.36328125, -45.57275390625, -43.7822265625, -41.99169921875, -40.201171875, -38.41064453125, -36.6201171875, -34.82958984375, -33.0390625, -31.24853515625, -29.4580078125, -27.66748046875, -25.876953125, -24.08642578125, -22.2958984375, -20.50537109375, -18.71484375, -16.92431640625, -15.1337890625, -13.34326171875, -11.552734375, -9.76220703125, -7.9716796875, -6.18115234375, -4.390625, -2.60009765625, -0.8095703125, 0.98095703125, 2.771484375, 4.56201171875, 6.3525390625, 8.14306640625, 9.93359375, 11.72412109375, 13.5146484375, 15.30517578125, 17.095703125, 18.88623046875, 20.6767578125, 22.46728515625, 24.2578125, 26.04833984375, 27.8388671875, 29.62939453125, 31.419921875, 33.21044921875, 35.0009765625, 36.79150390625, 38.58203125, 40.37255859375, 42.1630859375, 43.95361328125, 45.744140625, 47.53466796875, 49.3251953125, 51.11572265625, 52.90625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 47.0, 697.0, 254.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-653.3788452148438, -640.7673950195312, -628.1559448242188, -615.5444946289062, -602.9330444335938, -590.3215942382812, -577.7101440429688, -565.0986938476562, -552.4872436523438, -539.8757934570312, -527.2643432617188, -514.6528930664062, -502.04144287109375, -489.42999267578125, -476.81854248046875, -464.20709228515625, -451.59564208984375, -438.98419189453125, -426.37274169921875, -413.76129150390625, -401.14984130859375, -388.53839111328125, -375.92694091796875, -363.31549072265625, -350.70404052734375, -338.09259033203125, -325.48114013671875, -312.86968994140625, -300.25823974609375, -287.64678955078125, -275.03533935546875, -262.42388916015625, -249.81240844726562, -237.20095825195312, -224.58950805664062, -211.97805786132812, -199.36660766601562, -186.75515747070312, -174.14370727539062, -161.53225708007812, -148.92080688476562, -136.30935668945312, -123.69790649414062, -111.08645629882812, -98.47500610351562, -85.86355590820312, -73.25210571289062, -60.640655517578125, -48.029205322265625, -35.417755126953125, -22.806304931640625, -10.194854736328125, 2.416595458984375, 15.028045654296875, 27.639495849609375, 40.250946044921875, 52.862396240234375, 65.47384643554688, 78.08529663085938, 90.69674682617188, 103.30819702148438, 115.91964721679688, 128.53109741210938, 141.14254760742188, 153.75399780273438]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 5.0, 13.0, 8.0, 16.0, 10.0, 13.0, 21.0, 22.0, 20.0, 27.0, 22.0, 20.0, 23.0, 30.0, 35.0, 37.0, 32.0, 38.0, 35.0, 52.0, 38.0, 41.0, 32.0, 37.0, 32.0, 38.0, 27.0, 28.0, 21.0, 28.0, 30.0, 20.0, 22.0, 10.0, 18.0, 22.0, 13.0, 8.0, 9.0, 16.0, 9.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.07286071777344, -66.01931762695312, -63.96577835083008, -61.91223907470703, -59.85869598388672, -57.805152893066406, -55.75161361694336, -53.69807434082031, -51.64453125, -49.59098815917969, -47.53744888305664, -45.483909606933594, -43.43036651611328, -41.37682342529297, -39.32328414916992, -37.269744873046875, -35.21620178222656, -33.16265869140625, -31.109119415283203, -29.055578231811523, -27.002037048339844, -24.948495864868164, -22.894954681396484, -20.841413497924805, -18.787872314453125, -16.734331130981445, -14.680789947509766, -12.627248764038086, -10.573707580566406, -8.520166397094727, -6.466625213623047, -4.413084030151367, -2.3595352172851562, -0.30599403381347656, 1.7475471496582031, 3.801088333129883, 5.8546295166015625, 7.908170700073242, 9.961711883544922, 12.015253067016602, 14.068794250488281, 16.12233543395996, 18.17587661743164, 20.22941780090332, 22.282958984375, 24.33650016784668, 26.39004135131836, 28.44358253479004, 30.49712371826172, 32.55066680908203, 34.60420608520508, 36.657745361328125, 38.71128845214844, 40.76483154296875, 42.8183708190918, 44.871910095214844, 46.925453186035156, 48.97899627685547, 51.032535552978516, 53.08607482910156, 55.139617919921875, 57.19316101074219, 59.246700286865234, 61.30023956298828, 63.353782653808594]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 15.0, 11.0, 6.0, 13.0, 15.0, 18.0, 24.0, 20.0, 16.0, 27.0, 22.0, 38.0, 30.0, 33.0, 32.0, 41.0, 39.0, 32.0, 38.0, 46.0, 38.0, 30.0, 40.0, 39.0, 29.0, 33.0, 20.0, 36.0, 28.0, 25.0, 23.0, 17.0, 14.0, 11.0, 12.0, 6.0, 11.0, 7.0, 6.0, 11.0, 5.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.0703125, -11.6793212890625, -11.288330078125, -10.8973388671875, -10.50634765625, -10.1153564453125, -9.724365234375, -9.3333740234375, -8.9423828125, -8.5513916015625, -8.160400390625, -7.7694091796875, -7.37841796875, -6.9874267578125, -6.596435546875, -6.2054443359375, -5.814453125, -5.4234619140625, -5.032470703125, -4.6414794921875, -4.25048828125, -3.8594970703125, -3.468505859375, -3.0775146484375, -2.6865234375, -2.2955322265625, -1.904541015625, -1.5135498046875, -1.12255859375, -0.7315673828125, -0.340576171875, 0.0504150390625, 0.44140625, 0.8323974609375, 1.223388671875, 1.6143798828125, 2.00537109375, 2.3963623046875, 2.787353515625, 3.1783447265625, 3.5693359375, 3.9603271484375, 4.351318359375, 4.7423095703125, 5.13330078125, 5.5242919921875, 5.915283203125, 6.3062744140625, 6.697265625, 7.0882568359375, 7.479248046875, 7.8702392578125, 8.26123046875, 8.6522216796875, 9.043212890625, 9.4342041015625, 9.8251953125, 10.2161865234375, 10.607177734375, 10.9981689453125, 11.38916015625, 11.7801513671875, 12.171142578125, 12.5621337890625, 12.953125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 4.0, 3.0, 11.0, 15.0, 16.0, 13.0, 17.0, 25.0, 47.0, 63.0, 68.0, 119.0, 144.0, 225.0, 328.0, 508.0, 794.0, 1334.0, 2559.0, 5559.0, 14167.0, 106854.0, 3422785.0, 600437.0, 22613.0, 7833.0, 3291.0, 1732.0, 890.0, 571.0, 370.0, 241.0, 177.0, 130.0, 88.0, 62.0, 45.0, 32.0, 27.0, 19.0, 10.0, 15.0, 4.0, 6.0, 6.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-63.0625, -61.072265625, -59.08203125, -57.091796875, -55.1015625, -53.111328125, -51.12109375, -49.130859375, -47.140625, -45.150390625, -43.16015625, -41.169921875, -39.1796875, -37.189453125, -35.19921875, -33.208984375, -31.21875, -29.228515625, -27.23828125, -25.248046875, -23.2578125, -21.267578125, -19.27734375, -17.287109375, -15.296875, -13.306640625, -11.31640625, -9.326171875, -7.3359375, -5.345703125, -3.35546875, -1.365234375, 0.625, 2.615234375, 4.60546875, 6.595703125, 8.5859375, 10.576171875, 12.56640625, 14.556640625, 16.546875, 18.537109375, 20.52734375, 22.517578125, 24.5078125, 26.498046875, 28.48828125, 30.478515625, 32.46875, 34.458984375, 36.44921875, 38.439453125, 40.4296875, 42.419921875, 44.41015625, 46.400390625, 48.390625, 50.380859375, 52.37109375, 54.361328125, 56.3515625, 58.341796875, 60.33203125, 62.322265625, 64.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 7.0, 4.0, 12.0, 9.0, 14.0, 22.0, 42.0, 42.0, 67.0, 107.0, 203.0, 428.0, 888.0, 967.0, 579.0, 264.0, 136.0, 82.0, 52.0, 32.0, 33.0, 24.0, 19.0, 8.0, 11.0, 9.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.37939453125, -35.0400390625, -33.70068359375, -32.361328125, -31.02197265625, -29.6826171875, -28.34326171875, -27.00390625, -25.66455078125, -24.3251953125, -22.98583984375, -21.646484375, -20.30712890625, -18.9677734375, -17.62841796875, -16.2890625, -14.94970703125, -13.6103515625, -12.27099609375, -10.931640625, -9.59228515625, -8.2529296875, -6.91357421875, -5.57421875, -4.23486328125, -2.8955078125, -1.55615234375, -0.216796875, 1.12255859375, 2.4619140625, 3.80126953125, 5.140625, 6.47998046875, 7.8193359375, 9.15869140625, 10.498046875, 11.83740234375, 13.1767578125, 14.51611328125, 15.85546875, 17.19482421875, 18.5341796875, 19.87353515625, 21.212890625, 22.55224609375, 23.8916015625, 25.23095703125, 26.5703125, 27.90966796875, 29.2490234375, 30.58837890625, 31.927734375, 33.26708984375, 34.6064453125, 35.94580078125, 37.28515625, 38.62451171875, 39.9638671875, 41.30322265625, 42.642578125, 43.98193359375, 45.3212890625, 46.66064453125, 48.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 10.0, 5.0, 17.0, 18.0, 42.0, 51.0, 92.0, 118.0, 189.0, 252.0, 447.0, 806.0, 1493.0, 2918.0, 6039.0, 13054.0, 32025.0, 104986.0, 1057356.0, 2712195.0, 182830.0, 45878.0, 17612.0, 7819.0, 3687.0, 1875.0, 1014.0, 523.0, 309.0, 204.0, 108.0, 66.0, 69.0, 37.0, 37.0, 30.0, 18.0, 9.0, 9.0, 9.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-32.84375, -31.853515625, -30.86328125, -29.873046875, -28.8828125, -27.892578125, -26.90234375, -25.912109375, -24.921875, -23.931640625, -22.94140625, -21.951171875, -20.9609375, -19.970703125, -18.98046875, -17.990234375, -17.0, -16.009765625, -15.01953125, -14.029296875, -13.0390625, -12.048828125, -11.05859375, -10.068359375, -9.078125, -8.087890625, -7.09765625, -6.107421875, -5.1171875, -4.126953125, -3.13671875, -2.146484375, -1.15625, -0.166015625, 0.82421875, 1.814453125, 2.8046875, 3.794921875, 4.78515625, 5.775390625, 6.765625, 7.755859375, 8.74609375, 9.736328125, 10.7265625, 11.716796875, 12.70703125, 13.697265625, 14.6875, 15.677734375, 16.66796875, 17.658203125, 18.6484375, 19.638671875, 20.62890625, 21.619140625, 22.609375, 23.599609375, 24.58984375, 25.580078125, 26.5703125, 27.560546875, 28.55078125, 29.541015625, 30.53125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 13.0, 16.0, 15.0, 36.0, 35.0, 66.0, 74.0, 80.0, 112.0, 127.0, 103.0, 74.0, 70.0, 34.0, 29.0, 21.0, 20.0, 15.0, 12.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.45872497558594, -152.8987579345703, -146.33877563476562, -139.77880859375, -133.21884155273438, -126.65885925292969, -120.09889221191406, -113.5389175415039, -106.97894287109375, -100.4189682006836, -93.85899353027344, -87.29902648925781, -80.73905181884766, -74.1790771484375, -67.61911010742188, -61.05913543701172, -54.49916076660156, -47.939186096191406, -41.379215240478516, -34.819244384765625, -28.25926971435547, -21.699295043945312, -15.139324188232422, -8.579353332519531, -2.019378662109375, 4.540594100952148, 11.100566864013672, 17.660539627075195, 24.22051239013672, 30.780487060546875, 37.340457916259766, 43.900428771972656, 50.460418701171875, 57.02039337158203, 63.58036422729492, 70.14033508300781, 76.70030975341797, 83.26028442382812, 89.82025146484375, 96.3802261352539, 102.94020080566406, 109.50017547607422, 116.06015014648438, 122.6201171875, 129.18008422851562, 135.7400665283203, 142.30003356933594, 148.86001586914062, 155.41998291015625, 161.97994995117188, 168.53993225097656, 175.0998992919922, 181.65988159179688, 188.2198486328125, 194.77981567382812, 201.33978271484375, 207.89976501464844, 214.45973205566406, 221.01971435546875, 227.57968139648438, 234.1396484375, 240.6996307373047, 247.2595977783203, 253.819580078125, 260.3795471191406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 1.0, 3.0, 10.0, 7.0, 7.0, 16.0, 11.0, 15.0, 11.0, 14.0, 16.0, 24.0, 38.0, 24.0, 34.0, 39.0, 48.0, 34.0, 30.0, 42.0, 47.0, 39.0, 34.0, 34.0, 37.0, 34.0, 34.0, 32.0, 33.0, 32.0, 29.0, 30.0, 19.0, 22.0, 17.0, 22.0, 11.0, 15.0, 12.0, 7.0, 9.0, 8.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-123.80955505371094, -120.26142120361328, -116.71328735351562, -113.16515350341797, -109.61701965332031, -106.06888580322266, -102.520751953125, -98.97261810302734, -95.42448425292969, -91.87635040283203, -88.32821655273438, -84.78008270263672, -81.23194885253906, -77.6838150024414, -74.13568115234375, -70.5875473022461, -67.03941345214844, -63.49127960205078, -59.943145751953125, -56.39501190185547, -52.84687805175781, -49.298744201660156, -45.7506103515625, -42.202476501464844, -38.65434265136719, -35.10620880126953, -31.558074951171875, -28.00994110107422, -24.461807250976562, -20.913673400878906, -17.36553955078125, -13.817405700683594, -10.269271850585938, -6.721138000488281, -3.173004150390625, 0.37512969970703125, 3.9232635498046875, 7.471397399902344, 11.01953125, 14.567665100097656, 18.115798950195312, 21.66393280029297, 25.212066650390625, 28.76020050048828, 32.30833435058594, 35.856468200683594, 39.40460205078125, 42.952735900878906, 46.50086975097656, 50.04900360107422, 53.597137451171875, 57.14527130126953, 60.69340515136719, 64.24153900146484, 67.7896728515625, 71.33780670166016, 74.88594055175781, 78.43407440185547, 81.98220825195312, 85.53034210205078, 89.07847595214844, 92.6266098022461, 96.17474365234375, 99.7228775024414, 103.27101135253906]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 10.0, 6.0, 6.0, 8.0, 6.0, 16.0, 15.0, 16.0, 26.0, 13.0, 28.0, 29.0, 24.0, 38.0, 37.0, 44.0, 48.0, 43.0, 48.0, 41.0, 43.0, 41.0, 40.0, 45.0, 37.0, 33.0, 34.0, 29.0, 33.0, 20.0, 20.0, 27.0, 15.0, 16.0, 8.0, 14.0, 10.0, 9.0, 9.0, 10.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-223.75, -217.376953125, -211.00390625, -204.630859375, -198.2578125, -191.884765625, -185.51171875, -179.138671875, -172.765625, -166.392578125, -160.01953125, -153.646484375, -147.2734375, -140.900390625, -134.52734375, -128.154296875, -121.78125, -115.408203125, -109.03515625, -102.662109375, -96.2890625, -89.916015625, -83.54296875, -77.169921875, -70.796875, -64.423828125, -58.05078125, -51.677734375, -45.3046875, -38.931640625, -32.55859375, -26.185546875, -19.8125, -13.439453125, -7.06640625, -0.693359375, 5.6796875, 12.052734375, 18.42578125, 24.798828125, 31.171875, 37.544921875, 43.91796875, 50.291015625, 56.6640625, 63.037109375, 69.41015625, 75.783203125, 82.15625, 88.529296875, 94.90234375, 101.275390625, 107.6484375, 114.021484375, 120.39453125, 126.767578125, 133.140625, 139.513671875, 145.88671875, 152.259765625, 158.6328125, 165.005859375, 171.37890625, 177.751953125, 184.125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 10.0, 13.0, 16.0, 25.0, 36.0, 40.0, 51.0, 106.0, 160.0, 207.0, 302.0, 477.0, 686.0, 986.0, 1346.0, 2002.0, 3098.0, 4438.0, 6575.0, 9885.0, 14992.0, 23254.0, 37012.0, 61449.0, 109662.0, 196985.0, 230691.0, 139597.0, 77254.0, 45613.0, 28054.0, 17712.0, 11649.0, 7761.0, 5209.0, 3585.0, 2421.0, 1615.0, 1195.0, 786.0, 486.0, 350.0, 255.0, 180.0, 119.0, 68.0, 51.0, 35.0, 23.0, 19.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-12.015625, -11.6177978515625, -11.219970703125, -10.8221435546875, -10.42431640625, -10.0264892578125, -9.628662109375, -9.2308349609375, -8.8330078125, -8.4351806640625, -8.037353515625, -7.6395263671875, -7.24169921875, -6.8438720703125, -6.446044921875, -6.0482177734375, -5.650390625, -5.2525634765625, -4.854736328125, -4.4569091796875, -4.05908203125, -3.6612548828125, -3.263427734375, -2.8656005859375, -2.4677734375, -2.0699462890625, -1.672119140625, -1.2742919921875, -0.87646484375, -0.4786376953125, -0.080810546875, 0.3170166015625, 0.71484375, 1.1126708984375, 1.510498046875, 1.9083251953125, 2.30615234375, 2.7039794921875, 3.101806640625, 3.4996337890625, 3.8974609375, 4.2952880859375, 4.693115234375, 5.0909423828125, 5.48876953125, 5.8865966796875, 6.284423828125, 6.6822509765625, 7.080078125, 7.4779052734375, 7.875732421875, 8.2735595703125, 8.67138671875, 9.0692138671875, 9.467041015625, 9.8648681640625, 10.2626953125, 10.6605224609375, 11.058349609375, 11.4561767578125, 11.85400390625, 12.2518310546875, 12.649658203125, 13.0474853515625, 13.4453125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 5.0, 3.0, 5.0, 10.0, 12.0, 11.0, 14.0, 18.0, 18.0, 13.0, 23.0, 24.0, 22.0, 33.0, 28.0, 35.0, 30.0, 32.0, 47.0, 30.0, 34.0, 36.0, 1056.0, 30.0, 33.0, 28.0, 41.0, 36.0, 36.0, 30.0, 21.0, 33.0, 17.0, 22.0, 22.0, 20.0, 19.0, 8.0, 13.0, 13.0, 12.0, 12.0, 8.0, 6.0, 3.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-109.1875, -105.744140625, -102.30078125, -98.857421875, -95.4140625, -91.970703125, -88.52734375, -85.083984375, -81.640625, -78.197265625, -74.75390625, -71.310546875, -67.8671875, -64.423828125, -60.98046875, -57.537109375, -54.09375, -50.650390625, -47.20703125, -43.763671875, -40.3203125, -36.876953125, -33.43359375, -29.990234375, -26.546875, -23.103515625, -19.66015625, -16.216796875, -12.7734375, -9.330078125, -5.88671875, -2.443359375, 1.0, 4.443359375, 7.88671875, 11.330078125, 14.7734375, 18.216796875, 21.66015625, 25.103515625, 28.546875, 31.990234375, 35.43359375, 38.876953125, 42.3203125, 45.763671875, 49.20703125, 52.650390625, 56.09375, 59.537109375, 62.98046875, 66.423828125, 69.8671875, 73.310546875, 76.75390625, 80.197265625, 83.640625, 87.083984375, 90.52734375, 93.970703125, 97.4140625, 100.857421875, 104.30078125, 107.744140625, 111.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 13.0, 15.0, 17.0, 36.0, 70.0, 111.0, 127.0, 197.0, 297.0, 459.0, 732.0, 1142.0, 1793.0, 2666.0, 3924.0, 6093.0, 9155.0, 14557.0, 23135.0, 37010.0, 62570.0, 110490.0, 206754.0, 1266801.0, 143441.0, 80766.0, 46151.0, 28147.0, 17691.0, 11460.0, 7217.0, 4746.0, 3294.0, 2039.0, 1388.0, 868.0, 621.0, 400.0, 258.0, 161.0, 116.0, 74.0, 40.0, 32.0, 18.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.1043701171875, -10.724365234375, -10.3443603515625, -9.96435546875, -9.5843505859375, -9.204345703125, -8.8243408203125, -8.4443359375, -8.0643310546875, -7.684326171875, -7.3043212890625, -6.92431640625, -6.5443115234375, -6.164306640625, -5.7843017578125, -5.404296875, -5.0242919921875, -4.644287109375, -4.2642822265625, -3.88427734375, -3.5042724609375, -3.124267578125, -2.7442626953125, -2.3642578125, -1.9842529296875, -1.604248046875, -1.2242431640625, -0.84423828125, -0.4642333984375, -0.084228515625, 0.2957763671875, 0.67578125, 1.0557861328125, 1.435791015625, 1.8157958984375, 2.19580078125, 2.5758056640625, 2.955810546875, 3.3358154296875, 3.7158203125, 4.0958251953125, 4.475830078125, 4.8558349609375, 5.23583984375, 5.6158447265625, 5.995849609375, 6.3758544921875, 6.755859375, 7.1358642578125, 7.515869140625, 7.8958740234375, 8.27587890625, 8.6558837890625, 9.035888671875, 9.4158935546875, 9.7958984375, 10.1759033203125, 10.555908203125, 10.9359130859375, 11.31591796875, 11.6959228515625, 12.075927734375, 12.4559326171875, 12.8359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 11.0, 3.0, 8.0, 7.0, 7.0, 14.0, 21.0, 15.0, 32.0, 20.0, 30.0, 39.0, 52.0, 73.0, 103.0, 77.0, 86.0, 59.0, 59.0, 43.0, 41.0, 30.0, 30.0, 21.0, 20.0, 18.0, 8.0, 18.0, 8.0, 6.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.10626220703125, -0.10278892517089844, -0.09931564331054688, -0.09584236145019531, -0.09236907958984375, -0.08889579772949219, -0.08542251586914062, -0.08194923400878906, -0.0784759521484375, -0.07500267028808594, -0.07152938842773438, -0.06805610656738281, -0.06458282470703125, -0.06110954284667969, -0.057636260986328125, -0.05416297912597656, -0.050689697265625, -0.04721641540527344, -0.043743133544921875, -0.04026985168457031, -0.03679656982421875, -0.03332328796386719, -0.029850006103515625, -0.026376724243164062, -0.0229034423828125, -0.019430160522460938, -0.015956878662109375, -0.012483596801757812, -0.00901031494140625, -0.0055370330810546875, -0.002063751220703125, 0.0014095306396484375, 0.0048828125, 0.008356094360351562, 0.011829376220703125, 0.015302658081054688, 0.01877593994140625, 0.022249221801757812, 0.025722503662109375, 0.029195785522460938, 0.0326690673828125, 0.03614234924316406, 0.039615631103515625, 0.04308891296386719, 0.04656219482421875, 0.05003547668457031, 0.053508758544921875, 0.05698204040527344, 0.060455322265625, 0.06392860412597656, 0.06740188598632812, 0.07087516784667969, 0.07434844970703125, 0.07782173156738281, 0.08129501342773438, 0.08476829528808594, 0.0882415771484375, 0.09171485900878906, 0.09518814086914062, 0.09866142272949219, 0.10213470458984375, 0.10560798645019531, 0.10908126831054688, 0.11255455017089844, 0.11602783203125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 5.0, 9.0, 9.0, 12.0, 16.0, 21.0, 33.0, 37.0, 26.0, 62.0, 64.0, 81.0, 105.0, 188.0, 274.0, 449.0, 752.0, 1277.0, 2652.0, 5324.0, 12013.0, 30273.0, 90976.0, 393859.0, 371929.0, 86638.0, 28870.0, 11612.0, 5134.0, 2510.0, 1264.0, 761.0, 444.0, 263.0, 165.0, 108.0, 77.0, 64.0, 31.0, 38.0, 27.0, 26.0, 17.0, 14.0, 7.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.60986328125, -0.59136962890625, -0.5728759765625, -0.55438232421875, -0.535888671875, -0.51739501953125, -0.4989013671875, -0.48040771484375, -0.4619140625, -0.44342041015625, -0.4249267578125, -0.40643310546875, -0.387939453125, -0.36944580078125, -0.3509521484375, -0.33245849609375, -0.31396484375, -0.29547119140625, -0.2769775390625, -0.25848388671875, -0.239990234375, -0.22149658203125, -0.2030029296875, -0.18450927734375, -0.166015625, -0.14752197265625, -0.1290283203125, -0.11053466796875, -0.092041015625, -0.07354736328125, -0.0550537109375, -0.03656005859375, -0.01806640625, 0.00042724609375, 0.0189208984375, 0.03741455078125, 0.055908203125, 0.07440185546875, 0.0928955078125, 0.11138916015625, 0.1298828125, 0.14837646484375, 0.1668701171875, 0.18536376953125, 0.203857421875, 0.22235107421875, 0.2408447265625, 0.25933837890625, 0.27783203125, 0.29632568359375, 0.3148193359375, 0.33331298828125, 0.351806640625, 0.37030029296875, 0.3887939453125, 0.40728759765625, 0.42578125, 0.44427490234375, 0.4627685546875, 0.48126220703125, 0.499755859375, 0.51824951171875, 0.5367431640625, 0.55523681640625, 0.57373046875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 14.0, 41.0, 94.0, 205.0, 225.0, 155.0, 88.0, 52.0, 41.0, 22.0, 22.0, 7.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11078447103500366, -0.09978906810283661, -0.08879366517066956, -0.0777982547879219, -0.06680285185575485, -0.0558074489235878, -0.04481203854084015, -0.033816635608673096, -0.022821232676506042, -0.01182582788169384, -0.0008304230868816376, 0.010164983570575714, 0.021160386502742767, 0.03215578943490982, 0.04315119981765747, 0.054146602749824524, 0.06514200568199158, 0.07613740861415863, 0.08713281154632568, 0.09812822192907333, 0.10912362486124039, 0.12011902779340744, 0.1311144381761551, 0.14210984110832214, 0.1531052440404892, 0.16410064697265625, 0.1750960499048233, 0.18609145283699036, 0.1970868706703186, 0.20808225870132446, 0.2190776765346527, 0.23007307946681976, 0.24106848239898682, 0.25206390023231506, 0.2630592882633209, 0.27405470609664917, 0.28505009412765503, 0.2960455119609833, 0.3070409297943115, 0.3180363178253174, 0.32903170585632324, 0.3400271236896515, 0.35102251172065735, 0.3620179295539856, 0.37301331758499146, 0.3840087354183197, 0.39500415325164795, 0.4059995412826538, 0.41699495911598206, 0.4279903769493103, 0.43898576498031616, 0.4499811828136444, 0.46097657084465027, 0.4719719886779785, 0.4829673767089844, 0.4939627945423126, 0.5049582123756409, 0.5159536004066467, 0.5269490480422974, 0.5379444360733032, 0.5489398241043091, 0.5599352121353149, 0.5709306597709656, 0.5819260478019714, 0.5929214358329773]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 7.0, 7.0, 8.0, 12.0, 13.0, 14.0, 14.0, 14.0, 18.0, 39.0, 28.0, 19.0, 18.0, 34.0, 34.0, 39.0, 33.0, 34.0, 39.0, 36.0, 29.0, 36.0, 45.0, 39.0, 38.0, 33.0, 21.0, 28.0, 24.0, 32.0, 24.0, 28.0, 20.0, 18.0, 15.0, 13.0, 12.0, 8.0, 19.0, 16.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.11677920818328857, -0.11341586709022522, -0.11005252599716187, -0.10668918490409851, -0.10332584381103516, -0.0999625027179718, -0.09659916907548904, -0.09323582798242569, -0.08987248688936234, -0.08650914579629898, -0.08314580470323563, -0.07978246361017227, -0.07641912996768951, -0.07305578887462616, -0.0696924477815628, -0.06632910668849945, -0.0629657655954361, -0.05960242450237274, -0.05623908340930939, -0.05287574604153633, -0.04951240494847298, -0.04614906385540962, -0.042785726487636566, -0.03942238539457321, -0.03605904430150986, -0.0326957032084465, -0.029332363978028297, -0.025969024747610092, -0.022605683654546738, -0.019242342561483383, -0.015879003331065178, -0.012515664100646973, -0.009152323007583618, -0.005788982845842838, -0.0024256426841020584, 0.0009376974776387215, 0.004301037639379501, 0.007664378732442856, 0.011027717962861061, 0.014391057193279266, 0.01775439828634262, 0.021117739379405975, 0.02448107860982418, 0.027844417840242386, 0.03120775893330574, 0.034571100026369095, 0.03793443739414215, 0.041297778487205505, 0.04466111958026886, 0.048024460673332214, 0.05138780176639557, 0.054751139134168625, 0.05811448022723198, 0.061477821320295334, 0.06484115868806839, 0.06820449978113174, 0.0715678408741951, 0.07493118196725845, 0.07829452306032181, 0.08165786415338516, 0.08502119779586792, 0.08838453888893127, 0.09174787998199463, 0.09511122107505798, 0.09847456216812134]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 10.0, 5.0, 7.0, 8.0, 6.0, 16.0, 15.0, 16.0, 25.0, 14.0, 30.0, 27.0, 24.0, 38.0, 36.0, 44.0, 50.0, 42.0, 49.0, 40.0, 43.0, 43.0, 37.0, 46.0, 37.0, 32.0, 36.0, 27.0, 33.0, 21.0, 21.0, 27.0, 14.0, 17.0, 7.0, 14.0, 10.0, 9.0, 9.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-223.75, -217.376953125, -211.00390625, -204.630859375, -198.2578125, -191.884765625, -185.51171875, -179.138671875, -172.765625, -166.392578125, -160.01953125, -153.646484375, -147.2734375, -140.900390625, -134.52734375, -128.154296875, -121.78125, -115.408203125, -109.03515625, -102.662109375, -96.2890625, -89.916015625, -83.54296875, -77.169921875, -70.796875, -64.423828125, -58.05078125, -51.677734375, -45.3046875, -38.931640625, -32.55859375, -26.185546875, -19.8125, -13.439453125, -7.06640625, -0.693359375, 5.6796875, 12.052734375, 18.42578125, 24.798828125, 31.171875, 37.544921875, 43.91796875, 50.291015625, 56.6640625, 63.037109375, 69.41015625, 75.783203125, 82.15625, 88.529296875, 94.90234375, 101.275390625, 107.6484375, 114.021484375, 120.39453125, 126.767578125, 133.140625, 139.513671875, 145.88671875, 152.259765625, 158.6328125, 165.005859375, 171.37890625, 177.751953125, 184.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 11.0, 11.0, 10.0, 17.0, 25.0, 16.0, 37.0, 28.0, 34.0, 44.0, 52.0, 80.0, 111.0, 176.0, 304.0, 570.0, 1349.0, 3523.0, 11027.0, 44139.0, 279682.0, 586974.0, 91421.0, 19160.0, 5717.0, 2010.0, 819.0, 431.0, 232.0, 136.0, 74.0, 67.0, 51.0, 41.0, 26.0, 29.0, 25.0, 19.0, 19.0, 11.0, 14.0, 13.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-41.71875, -40.49951171875, -39.2802734375, -38.06103515625, -36.841796875, -35.62255859375, -34.4033203125, -33.18408203125, -31.96484375, -30.74560546875, -29.5263671875, -28.30712890625, -27.087890625, -25.86865234375, -24.6494140625, -23.43017578125, -22.2109375, -20.99169921875, -19.7724609375, -18.55322265625, -17.333984375, -16.11474609375, -14.8955078125, -13.67626953125, -12.45703125, -11.23779296875, -10.0185546875, -8.79931640625, -7.580078125, -6.36083984375, -5.1416015625, -3.92236328125, -2.703125, -1.48388671875, -0.2646484375, 0.95458984375, 2.173828125, 3.39306640625, 4.6123046875, 5.83154296875, 7.05078125, 8.27001953125, 9.4892578125, 10.70849609375, 11.927734375, 13.14697265625, 14.3662109375, 15.58544921875, 16.8046875, 18.02392578125, 19.2431640625, 20.46240234375, 21.681640625, 22.90087890625, 24.1201171875, 25.33935546875, 26.55859375, 27.77783203125, 28.9970703125, 30.21630859375, 31.435546875, 32.65478515625, 33.8740234375, 35.09326171875, 36.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 14.0, 14.0, 20.0, 35.0, 49.0, 38.0, 43.0, 67.0, 75.0, 60.0, 2101.0, 96.0, 67.0, 75.0, 57.0, 50.0, 34.0, 37.0, 25.0, 21.0, 9.0, 14.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-328.0, -316.15625, -304.3125, -292.46875, -280.625, -268.78125, -256.9375, -245.09375, -233.25, -221.40625, -209.5625, -197.71875, -185.875, -174.03125, -162.1875, -150.34375, -138.5, -126.65625, -114.8125, -102.96875, -91.125, -79.28125, -67.4375, -55.59375, -43.75, -31.90625, -20.0625, -8.21875, 3.625, 15.46875, 27.3125, 39.15625, 51.0, 62.84375, 74.6875, 86.53125, 98.375, 110.21875, 122.0625, 133.90625, 145.75, 157.59375, 169.4375, 181.28125, 193.125, 204.96875, 216.8125, 228.65625, 240.5, 252.34375, 264.1875, 276.03125, 287.875, 299.71875, 311.5625, 323.40625, 335.25, 347.09375, 358.9375, 370.78125, 382.625, 394.46875, 406.3125, 418.15625, 430.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 9.0, 15.0, 25.0, 29.0, 46.0, 79.0, 140.0, 236.0, 409.0, 1015.0, 2612.0, 17733.0, 2813542.0, 296379.0, 9680.0, 2055.0, 788.0, 389.0, 210.0, 90.0, 81.0, 40.0, 27.0, 22.0, 12.0, 12.0, 0.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-86.5, -84.154296875, -81.80859375, -79.462890625, -77.1171875, -74.771484375, -72.42578125, -70.080078125, -67.734375, -65.388671875, -63.04296875, -60.697265625, -58.3515625, -56.005859375, -53.66015625, -51.314453125, -48.96875, -46.623046875, -44.27734375, -41.931640625, -39.5859375, -37.240234375, -34.89453125, -32.548828125, -30.203125, -27.857421875, -25.51171875, -23.166015625, -20.8203125, -18.474609375, -16.12890625, -13.783203125, -11.4375, -9.091796875, -6.74609375, -4.400390625, -2.0546875, 0.291015625, 2.63671875, 4.982421875, 7.328125, 9.673828125, 12.01953125, 14.365234375, 16.7109375, 19.056640625, 21.40234375, 23.748046875, 26.09375, 28.439453125, 30.78515625, 33.130859375, 35.4765625, 37.822265625, 40.16796875, 42.513671875, 44.859375, 47.205078125, 49.55078125, 51.896484375, 54.2421875, 56.587890625, 58.93359375, 61.279296875, 63.625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 18.0, 16.0, 17.0, 67.0, 93.0, 184.0, 192.0, 174.0, 92.0, 49.0, 29.0, 15.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-541.301513671875, -526.8113403320312, -512.3211669921875, -497.83099365234375, -483.3407897949219, -468.8506164550781, -454.3604431152344, -439.8702697753906, -425.38006591796875, -410.889892578125, -396.39971923828125, -381.9095458984375, -367.4193420410156, -352.9291687011719, -338.4389953613281, -323.9488220214844, -309.4586486816406, -294.9684753417969, -280.4783020019531, -265.98809814453125, -251.4979248046875, -237.00775146484375, -222.517578125, -208.02740478515625, -193.53721618652344, -179.0470428466797, -164.55685424804688, -150.06668090820312, -135.57650756835938, -121.08631896972656, -106.59614562988281, -92.10596466064453, -77.61578369140625, -63.12560272216797, -48.63542556762695, -34.14524841308594, -19.655067443847656, -5.164886474609375, 9.325286865234375, 23.815467834472656, 38.30564880371094, 52.79582977294922, 67.2860107421875, 81.77618408203125, 96.26636505126953, 110.75654602050781, 125.24671936035156, 139.73690795898438, 154.22708129882812, 168.71725463867188, 183.2074432373047, 197.69761657714844, 212.18780517578125, 226.677978515625, 241.16815185546875, 255.6583251953125, 270.14849853515625, 284.638671875, 299.12884521484375, 313.6190185546875, 328.1092224121094, 342.5993957519531, 357.0895690917969, 371.5797424316406, 386.0699462890625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 8.0, 19.0, 24.0, 29.0, 32.0, 31.0, 30.0, 43.0, 44.0, 46.0, 39.0, 57.0, 57.0, 50.0, 43.0, 45.0, 57.0, 32.0, 41.0, 47.0, 26.0, 35.0, 23.0, 24.0, 19.0, 9.0, 13.0, 2.0, 8.0, 6.0, 5.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-411.3312072753906, -399.6236267089844, -387.9160461425781, -376.2084655761719, -364.5008850097656, -352.7933349609375, -341.08575439453125, -329.378173828125, -317.67059326171875, -305.9630126953125, -294.25543212890625, -282.5478515625, -270.84027099609375, -259.1326904296875, -247.4251251220703, -235.71755981445312, -224.0099639892578, -212.30238342285156, -200.5948028564453, -188.88723754882812, -177.17965698242188, -165.47207641601562, -153.76449584960938, -142.05691528320312, -130.34933471679688, -118.64175415039062, -106.9341812133789, -95.22660064697266, -83.51902770996094, -71.81144714355469, -60.10386657714844, -48.39629364013672, -36.688720703125, -24.981143951416016, -13.273565292358398, -1.5659866333007812, 10.141590118408203, 21.849166870117188, 33.55674743652344, 45.264320373535156, 56.971900939941406, 68.67948150634766, 80.38705444335938, 92.09463500976562, 103.80221557617188, 115.5097885131836, 127.21736907958984, 138.92494201660156, 150.6325225830078, 162.34010314941406, 174.0476837158203, 185.7552490234375, 197.46282958984375, 209.17041015625, 220.87799072265625, 232.5855712890625, 244.29315185546875, 256.000732421875, 267.70831298828125, 279.4158935546875, 291.12347412109375, 302.8310546875, 314.53863525390625, 326.2461853027344, 337.9537658691406]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 1.0, 8.0, 10.0, 12.0, 15.0, 9.0, 20.0, 24.0, 12.0, 28.0, 23.0, 34.0, 44.0, 55.0, 86.0, 153.0, 302.0, 612.0, 1125.0, 1041124.0, 2352.0, 1047.0, 616.0, 288.0, 151.0, 82.0, 49.0, 48.0, 35.0, 19.0, 26.0, 23.0, 20.0, 15.0, 17.0, 11.0, 8.0, 9.0, 10.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-183.59390258789062, -178.02786254882812, -172.46182250976562, -166.89578247070312, -161.32974243164062, -155.7637176513672, -150.1976776123047, -144.6316375732422, -139.0655975341797, -133.4995574951172, -127.93351745605469, -122.36748504638672, -116.80144500732422, -111.23540496826172, -105.66937255859375, -100.10333251953125, -94.53729248046875, -88.97125244140625, -83.40521240234375, -77.83917999267578, -72.27313995361328, -66.70709991455078, -61.14106369018555, -55.57502746582031, -50.00898742675781, -44.44294738769531, -38.87691116333008, -33.310874938964844, -27.744834899902344, -22.178796768188477, -16.61275863647461, -11.046722412109375, -5.4806976318359375, 0.08534049987792969, 5.651378631591797, 11.217416763305664, 16.78345489501953, 22.3494930267334, 27.915531158447266, 33.4815673828125, 39.047607421875, 44.6136474609375, 50.179683685302734, 55.74571990966797, 61.31175994873047, 66.87779998779297, 72.44383239746094, 78.00987243652344, 83.57591247558594, 89.14195251464844, 94.70799255371094, 100.2740249633789, 105.8400650024414, 111.4061050415039, 116.97213745117188, 122.53817749023438, 128.10421752929688, 133.67025756835938, 139.23629760742188, 144.80233764648438, 150.36837768554688, 155.9344024658203, 161.5004425048828, 167.0664825439453, 172.6325225830078]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 6.0, 8.0, 14.0, 13.0, 15.0, 28.0, 35.0, 78.0, 349.0, 51441860.0, 20352.0, 273.0, 50.0, 29.0, 17.0, 7.0, 7.0, 6.0, 9.0, 1.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2284.1474609375, -2216.785888671875, -2149.424072265625, -2082.0625, -2014.70068359375, -1947.339111328125, -1879.9774169921875, -1812.61572265625, -1745.2540283203125, -1677.892333984375, -1610.5306396484375, -1543.1689453125, -1475.807373046875, -1408.445556640625, -1341.083984375, -1273.7222900390625, -1206.360595703125, -1138.9989013671875, -1071.63720703125, -1004.2755737304688, -936.9138793945312, -869.5521850585938, -802.1905517578125, -734.828857421875, -667.4671630859375, -600.10546875, -532.7437744140625, -465.38214111328125, -398.02044677734375, -330.65875244140625, -263.2970886230469, -195.9354248046875, -128.57373046875, -61.21205139160156, 6.149627685546875, 73.51130676269531, 140.87298583984375, 208.23468017578125, 275.5963439941406, 342.9580078125, 410.3197021484375, 477.681396484375, 545.0430908203125, 612.4047241210938, 679.7664184570312, 747.1281127929688, 814.48974609375, 881.8514404296875, 949.213134765625, 1016.5748291015625, 1083.9365234375, 1151.2982177734375, 1218.659912109375, 1286.021484375, 1353.3831787109375, 1420.744873046875, 1488.1065673828125, 1555.46826171875, 1622.8299560546875, 1690.191650390625, 1757.55322265625, 1824.9150390625, 1892.276611328125, 1959.6383056640625, 2027.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 13.0, 29.0, 37.0, 47.0, 80.0, 153.0, 202.0, 307.0, 556.0, 870.0, 1315.0, 1966.0, 3094.0, 4846.0, 7423.0, 11045.0, 17809.0, 28319.0, 45431.0, 73579.0, 125278.0, 219306.0, 390510.0, 1635331.0, 2751805.0, 408674.0, 227935.0, 130027.0, 77588.0, 47348.0, 29040.0, 18273.0, 11620.0, 7698.0, 4893.0, 3057.0, 2082.0, 1341.0, 875.0, 560.0, 358.0, 258.0, 163.0, 105.0, 73.0, 39.0, 29.0, 19.0, 9.0, 9.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.525390625, -3.41180419921875, -3.2982177734375, -3.18463134765625, -3.071044921875, -2.95745849609375, -2.8438720703125, -2.73028564453125, -2.61669921875, -2.50311279296875, -2.3895263671875, -2.27593994140625, -2.162353515625, -2.04876708984375, -1.9351806640625, -1.82159423828125, -1.7080078125, -1.59442138671875, -1.4808349609375, -1.36724853515625, -1.253662109375, -1.14007568359375, -1.0264892578125, -0.91290283203125, -0.79931640625, -0.68572998046875, -0.5721435546875, -0.45855712890625, -0.344970703125, -0.23138427734375, -0.1177978515625, -0.00421142578125, 0.109375, 0.22296142578125, 0.3365478515625, 0.45013427734375, 0.563720703125, 0.67730712890625, 0.7908935546875, 0.90447998046875, 1.01806640625, 1.13165283203125, 1.2452392578125, 1.35882568359375, 1.472412109375, 1.58599853515625, 1.6995849609375, 1.81317138671875, 1.9267578125, 2.04034423828125, 2.1539306640625, 2.26751708984375, 2.381103515625, 2.49468994140625, 2.6082763671875, 2.72186279296875, 2.83544921875, 2.94903564453125, 3.0626220703125, 3.17620849609375, 3.289794921875, 3.40338134765625, 3.5169677734375, 3.63055419921875, 3.744140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 12.0, 10.0, 11.0, 10.0, 7.0, 11.0, 16.0, 17.0, 14.0, 22.0, 26.0, 30.0, 30.0, 36.0, 24.0, 35.0, 29.0, 41.0, 44.0, 120.0, 955.0, 83.0, 39.0, 28.0, 28.0, 33.0, 41.0, 31.0, 40.0, 29.0, 20.0, 17.0, 13.0, 23.0, 17.0, 13.0, 14.0, 15.0, 4.0, 5.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.71533203125, -31.4306640625, -30.14599609375, -28.861328125, -27.57666015625, -26.2919921875, -25.00732421875, -23.72265625, -22.43798828125, -21.1533203125, -19.86865234375, -18.583984375, -17.29931640625, -16.0146484375, -14.72998046875, -13.4453125, -12.16064453125, -10.8759765625, -9.59130859375, -8.306640625, -7.02197265625, -5.7373046875, -4.45263671875, -3.16796875, -1.88330078125, -0.5986328125, 0.68603515625, 1.970703125, 3.25537109375, 4.5400390625, 5.82470703125, 7.109375, 8.39404296875, 9.6787109375, 10.96337890625, 12.248046875, 13.53271484375, 14.8173828125, 16.10205078125, 17.38671875, 18.67138671875, 19.9560546875, 21.24072265625, 22.525390625, 23.81005859375, 25.0947265625, 26.37939453125, 27.6640625, 28.94873046875, 30.2333984375, 31.51806640625, 32.802734375, 34.08740234375, 35.3720703125, 36.65673828125, 37.94140625, 39.22607421875, 40.5107421875, 41.79541015625, 43.080078125, 44.36474609375, 45.6494140625, 46.93408203125, 48.21875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 20.0, 15.0, 30.0, 32.0, 64.0, 95.0, 170.0, 277.0, 479.0, 690.0, 1100.0, 1759.0, 2853.0, 4622.0, 7351.0, 11619.0, 18706.0, 30237.0, 48658.0, 79088.0, 131886.0, 218741.0, 340194.0, 506527.0, 3615205.0, 452069.0, 312398.0, 197273.0, 119950.0, 72053.0, 44687.0, 27303.0, 17087.0, 10303.0, 6690.0, 4244.0, 2609.0, 1678.0, 926.0, 654.0, 408.0, 220.0, 156.0, 109.0, 75.0, 39.0, 32.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0], "bins": [-2.775390625, -2.689727783203125, -2.60406494140625, -2.518402099609375, -2.4327392578125, -2.347076416015625, -2.26141357421875, -2.175750732421875, -2.090087890625, -2.004425048828125, -1.91876220703125, -1.833099365234375, -1.7474365234375, -1.661773681640625, -1.57611083984375, -1.490447998046875, -1.40478515625, -1.319122314453125, -1.23345947265625, -1.147796630859375, -1.0621337890625, -0.976470947265625, -0.89080810546875, -0.805145263671875, -0.719482421875, -0.633819580078125, -0.54815673828125, -0.462493896484375, -0.3768310546875, -0.291168212890625, -0.20550537109375, -0.119842529296875, -0.0341796875, 0.051483154296875, 0.13714599609375, 0.222808837890625, 0.3084716796875, 0.394134521484375, 0.47979736328125, 0.565460205078125, 0.651123046875, 0.736785888671875, 0.82244873046875, 0.908111572265625, 0.9937744140625, 1.079437255859375, 1.16510009765625, 1.250762939453125, 1.33642578125, 1.422088623046875, 1.50775146484375, 1.593414306640625, 1.6790771484375, 1.764739990234375, 1.85040283203125, 1.936065673828125, 2.021728515625, 2.107391357421875, 2.19305419921875, 2.278717041015625, 2.3643798828125, 2.450042724609375, 2.53570556640625, 2.621368408203125, 2.70703125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 4.0, 5.0, 5.0, 12.0, 9.0, 13.0, 18.0, 22.0, 23.0, 21.0, 28.0, 29.0, 25.0, 34.0, 44.0, 28.0, 33.0, 40.0, 34.0, 125.0, 966.0, 49.0, 36.0, 37.0, 39.0, 41.0, 27.0, 36.0, 25.0, 25.0, 29.0, 23.0, 15.0, 17.0, 12.0, 15.0, 11.0, 13.0, 15.0, 7.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-31.125, -30.165283203125, -29.20556640625, -28.245849609375, -27.2861328125, -26.326416015625, -25.36669921875, -24.406982421875, -23.447265625, -22.487548828125, -21.52783203125, -20.568115234375, -19.6083984375, -18.648681640625, -17.68896484375, -16.729248046875, -15.76953125, -14.809814453125, -13.85009765625, -12.890380859375, -11.9306640625, -10.970947265625, -10.01123046875, -9.051513671875, -8.091796875, -7.132080078125, -6.17236328125, -5.212646484375, -4.2529296875, -3.293212890625, -2.33349609375, -1.373779296875, -0.4140625, 0.545654296875, 1.50537109375, 2.465087890625, 3.4248046875, 4.384521484375, 5.34423828125, 6.303955078125, 7.263671875, 8.223388671875, 9.18310546875, 10.142822265625, 11.1025390625, 12.062255859375, 13.02197265625, 13.981689453125, 14.94140625, 15.901123046875, 16.86083984375, 17.820556640625, 18.7802734375, 19.739990234375, 20.69970703125, 21.659423828125, 22.619140625, 23.578857421875, 24.53857421875, 25.498291015625, 26.4580078125, 27.417724609375, 28.37744140625, 29.337158203125, 30.296875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 12.0, 9.0, 7.0, 12.0, 17.0, 25.0, 28.0, 28.0, 51.0, 93.0, 123.0, 188.0, 208.0, 270.0, 397.0, 577.0, 1012.0, 1630.0, 3041.0, 5997.0, 12029.0, 24706.0, 52903.0, 114482.0, 5659354.0, 243140.0, 88709.0, 41753.0, 19955.0, 9637.0, 4693.0, 2520.0, 1286.0, 774.0, 486.0, 364.0, 261.0, 164.0, 143.0, 98.0, 74.0, 52.0, 29.0, 25.0, 21.0, 13.0, 14.0, 14.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0], "bins": [-10.3984375, -10.0999755859375, -9.801513671875, -9.5030517578125, -9.20458984375, -8.9061279296875, -8.607666015625, -8.3092041015625, -8.0107421875, -7.7122802734375, -7.413818359375, -7.1153564453125, -6.81689453125, -6.5184326171875, -6.219970703125, -5.9215087890625, -5.623046875, -5.3245849609375, -5.026123046875, -4.7276611328125, -4.42919921875, -4.1307373046875, -3.832275390625, -3.5338134765625, -3.2353515625, -2.9368896484375, -2.638427734375, -2.3399658203125, -2.04150390625, -1.7430419921875, -1.444580078125, -1.1461181640625, -0.84765625, -0.5491943359375, -0.250732421875, 0.0477294921875, 0.34619140625, 0.6446533203125, 0.943115234375, 1.2415771484375, 1.5400390625, 1.8385009765625, 2.136962890625, 2.4354248046875, 2.73388671875, 3.0323486328125, 3.330810546875, 3.6292724609375, 3.927734375, 4.2261962890625, 4.524658203125, 4.8231201171875, 5.12158203125, 5.4200439453125, 5.718505859375, 6.0169677734375, 6.3154296875, 6.6138916015625, 6.912353515625, 7.2108154296875, 7.50927734375, 7.8077392578125, 8.106201171875, 8.4046630859375, 8.703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 4.0, 8.0, 10.0, 13.0, 12.0, 11.0, 15.0, 13.0, 20.0, 26.0, 28.0, 35.0, 33.0, 28.0, 20.0, 29.0, 36.0, 44.0, 35.0, 566.0, 556.0, 38.0, 32.0, 42.0, 38.0, 29.0, 43.0, 31.0, 35.0, 32.0, 21.0, 20.0, 23.0, 14.0, 14.0, 20.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671875, -21.801513671875, -20.93115234375, -20.060791015625, -19.1904296875, -18.320068359375, -17.44970703125, -16.579345703125, -15.708984375, -14.838623046875, -13.96826171875, -13.097900390625, -12.2275390625, -11.357177734375, -10.48681640625, -9.616455078125, -8.74609375, -7.875732421875, -7.00537109375, -6.135009765625, -5.2646484375, -4.394287109375, -3.52392578125, -2.653564453125, -1.783203125, -0.912841796875, -0.04248046875, 0.827880859375, 1.6982421875, 2.568603515625, 3.43896484375, 4.309326171875, 5.1796875, 6.050048828125, 6.92041015625, 7.790771484375, 8.6611328125, 9.531494140625, 10.40185546875, 11.272216796875, 12.142578125, 13.012939453125, 13.88330078125, 14.753662109375, 15.6240234375, 16.494384765625, 17.36474609375, 18.235107421875, 19.10546875, 19.975830078125, 20.84619140625, 21.716552734375, 22.5869140625, 23.457275390625, 24.32763671875, 25.197998046875, 26.068359375, 26.938720703125, 27.80908203125, 28.679443359375, 29.5498046875, 30.420166015625, 31.29052734375, 32.160888671875, 33.03125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 18.0, 34.0, 78.0, 238.0, 380.0, 157.0, 55.0, 26.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.63021850585938, -165.21250915527344, -160.79481506347656, -156.37710571289062, -151.9593963623047, -147.54168701171875, -143.12399291992188, -138.70628356933594, -134.28857421875, -129.87086486816406, -125.45316314697266, -121.03546142578125, -116.61775207519531, -112.2000503540039, -107.7823486328125, -103.36463928222656, -98.94693756103516, -94.52923583984375, -90.11152648925781, -85.6938247680664, -81.27611541748047, -76.85841369628906, -72.44070434570312, -68.02300262451172, -63.60529708862305, -59.187591552734375, -54.7698860168457, -50.35218048095703, -45.934478759765625, -41.51676940917969, -37.09906768798828, -32.68136215209961, -28.263656616210938, -23.845951080322266, -19.428245544433594, -15.010541915893555, -10.592836380004883, -6.175130844116211, -1.7574272155761719, 2.6602783203125, 7.077983856201172, 11.495689392089844, 15.9133939743042, 20.331098556518555, 24.748804092407227, 29.1665096282959, 33.58421325683594, 38.00191879272461, 42.41962432861328, 46.83732986450195, 51.255035400390625, 55.67273712158203, 60.09044647216797, 64.50814819335938, 68.92585754394531, 73.34355926513672, 77.76126098632812, 82.17896270751953, 86.59667205810547, 91.01437377929688, 95.43208312988281, 99.84978485107422, 104.26748657226562, 108.68519592285156, 113.1029052734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 14.0, 19.0, 27.0, 17.0, 29.0, 34.0, 39.0, 45.0, 52.0, 40.0, 57.0, 49.0, 55.0, 48.0, 47.0, 40.0, 45.0, 49.0, 29.0, 35.0, 40.0, 28.0, 21.0, 16.0, 11.0, 18.0, 9.0, 13.0, 6.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.93032836914062, -71.72845458984375, -69.5265884399414, -67.32471466064453, -65.12284851074219, -62.92097473144531, -60.71910095214844, -58.51723098754883, -56.31536102294922, -54.11349105834961, -51.91162109375, -49.709747314453125, -47.507877349853516, -45.306007385253906, -43.10413360595703, -40.90226364135742, -38.70039367675781, -36.4985237121582, -34.296653747558594, -32.09477996826172, -29.89291000366211, -27.6910400390625, -25.489168167114258, -23.287296295166016, -21.085426330566406, -18.883556365966797, -16.681684494018555, -14.479813575744629, -12.277942657470703, -10.076071739196777, -7.874200820922852, -5.672329902648926, -3.470458984375, -1.2685880661010742, 0.9332828521728516, 3.1351537704467773, 5.337024688720703, 7.538895606994629, 9.740766525268555, 11.94263744354248, 14.144508361816406, 16.346378326416016, 18.548250198364258, 20.7501220703125, 22.95199203491211, 25.15386199951172, 27.35573387145996, 29.557605743408203, 31.759475708007812, 33.96134567260742, 36.16321563720703, 38.365089416503906, 40.566959381103516, 42.768829345703125, 44.970703125, 47.17257308959961, 49.37444305419922, 51.57631301879883, 53.77818298339844, 55.98005676269531, 58.18192672729492, 60.38379669189453, 62.585670471191406, 64.78753662109375, 66.98941040039062]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 13.0, 11.0, 9.0, 24.0, 17.0, 17.0, 31.0, 54.0, 56.0, 94.0, 120.0, 153.0, 215.0, 302.0, 401.0, 614.0, 1117.0, 1989.0, 4024.0, 10613.0, 46441.0, 3963256.0, 131930.0, 18634.0, 6440.0, 2994.0, 1554.0, 956.0, 573.0, 434.0, 281.0, 196.0, 149.0, 101.0, 101.0, 78.0, 51.0, 56.0, 33.0, 27.0, 17.0, 25.0, 15.0, 10.0, 8.0, 8.0, 11.0, 9.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.56640625, -0.5473403930664062, -0.5282745361328125, -0.5092086791992188, -0.490142822265625, -0.47107696533203125, -0.4520111083984375, -0.43294525146484375, -0.41387939453125, -0.39481353759765625, -0.3757476806640625, -0.35668182373046875, -0.337615966796875, -0.31855010986328125, -0.2994842529296875, -0.28041839599609375, -0.2613525390625, -0.24228668212890625, -0.2232208251953125, -0.20415496826171875, -0.185089111328125, -0.16602325439453125, -0.1469573974609375, -0.12789154052734375, -0.10882568359375, -0.08975982666015625, -0.0706939697265625, -0.05162811279296875, -0.032562255859375, -0.01349639892578125, 0.0055694580078125, 0.02463531494140625, 0.043701171875, 0.06276702880859375, 0.0818328857421875, 0.10089874267578125, 0.119964599609375, 0.13903045654296875, 0.1580963134765625, 0.17716217041015625, 0.19622802734375, 0.21529388427734375, 0.2343597412109375, 0.25342559814453125, 0.272491455078125, 0.29155731201171875, 0.3106231689453125, 0.32968902587890625, 0.3487548828125, 0.36782073974609375, 0.3868865966796875, 0.40595245361328125, 0.425018310546875, 0.44408416748046875, 0.4631500244140625, 0.48221588134765625, 0.50128173828125, 0.5203475952148438, 0.5394134521484375, 0.5584793090820312, 0.577545166015625, 0.5966110229492188, 0.6156768798828125, 0.6347427368164062, 0.65380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 2.0, 10.0, 5.0, 7.0, 13.0, 17.0, 14.0, 23.0, 759.0, 24.0, 15.0, 11.0, 12.0, 6.0, 7.0, 8.0, 5.0, 5.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.25269317626953125, -0.2439117431640625, -0.23513031005859375, -0.226348876953125, -0.21756744384765625, -0.2087860107421875, -0.20000457763671875, -0.19122314453125, -0.18244171142578125, -0.1736602783203125, -0.16487884521484375, -0.156097412109375, -0.14731597900390625, -0.1385345458984375, -0.12975311279296875, -0.1209716796875, -0.11219024658203125, -0.1034088134765625, -0.09462738037109375, -0.085845947265625, -0.07706451416015625, -0.0682830810546875, -0.05950164794921875, -0.05072021484375, -0.04193878173828125, -0.0331573486328125, -0.02437591552734375, -0.015594482421875, -0.00681304931640625, 0.0019683837890625, 0.01074981689453125, 0.01953125, 0.02831268310546875, 0.0370941162109375, 0.04587554931640625, 0.054656982421875, 0.06343841552734375, 0.0722198486328125, 0.08100128173828125, 0.08978271484375, 0.09856414794921875, 0.1073455810546875, 0.11612701416015625, 0.124908447265625, 0.13368988037109375, 0.1424713134765625, 0.15125274658203125, 0.1600341796875, 0.16881561279296875, 0.1775970458984375, 0.18637847900390625, 0.195159912109375, 0.20394134521484375, 0.2127227783203125, 0.22150421142578125, 0.23028564453125, 0.23906707763671875, 0.2478485107421875, 0.25662994384765625, 0.265411376953125, 0.27419281005859375, 0.2829742431640625, 0.29175567626953125, 0.300537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 1.0, 5.0, 9.0, 17.0, 11.0, 16.0, 34.0, 36.0, 71.0, 100.0, 145.0, 228.0, 303.0, 549.0, 892.0, 1734.0, 3424.0, 8993.0, 32504.0, 379314.0, 3632159.0, 103446.0, 18123.0, 5969.0, 2522.0, 1382.0, 795.0, 498.0, 333.0, 221.0, 154.0, 81.0, 55.0, 43.0, 34.0, 19.0, 13.0, 10.0, 7.0, 10.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6402511596679688, -0.6183929443359375, -0.5965347290039062, -0.574676513671875, -0.5528182983398438, -0.5309600830078125, -0.5091018676757812, -0.48724365234375, -0.46538543701171875, -0.4435272216796875, -0.42166900634765625, -0.399810791015625, -0.37795257568359375, -0.3560943603515625, -0.33423614501953125, -0.3123779296875, -0.29051971435546875, -0.2686614990234375, -0.24680328369140625, -0.224945068359375, -0.20308685302734375, -0.1812286376953125, -0.15937042236328125, -0.13751220703125, -0.11565399169921875, -0.0937957763671875, -0.07193756103515625, -0.050079345703125, -0.02822113037109375, -0.0063629150390625, 0.01549530029296875, 0.037353515625, 0.05921173095703125, 0.0810699462890625, 0.10292816162109375, 0.124786376953125, 0.14664459228515625, 0.1685028076171875, 0.19036102294921875, 0.21221923828125, 0.23407745361328125, 0.2559356689453125, 0.27779388427734375, 0.299652099609375, 0.32151031494140625, 0.3433685302734375, 0.36522674560546875, 0.3870849609375, 0.40894317626953125, 0.4308013916015625, 0.45265960693359375, 0.474517822265625, 0.49637603759765625, 0.5182342529296875, 0.5400924682617188, 0.56195068359375, 0.5838088989257812, 0.6056671142578125, 0.6275253295898438, 0.649383544921875, 0.6712417602539062, 0.6930999755859375, 0.7149581909179688, 0.73681640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 9.0, 5.0, 13.0, 9.0, 22.0, 45.0, 62.0, 162.0, 797.0, 2140.0, 514.0, 130.0, 58.0, 37.0, 19.0, 12.0, 6.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.4912109375, -0.4760284423828125, -0.460845947265625, -0.4456634521484375, -0.43048095703125, -0.4152984619140625, -0.400115966796875, -0.3849334716796875, -0.3697509765625, -0.3545684814453125, -0.339385986328125, -0.3242034912109375, -0.30902099609375, -0.2938385009765625, -0.278656005859375, -0.2634735107421875, -0.248291015625, -0.2331085205078125, -0.217926025390625, -0.2027435302734375, -0.18756103515625, -0.1723785400390625, -0.157196044921875, -0.1420135498046875, -0.1268310546875, -0.1116485595703125, -0.096466064453125, -0.0812835693359375, -0.06610107421875, -0.0509185791015625, -0.035736083984375, -0.0205535888671875, -0.00537109375, 0.0098114013671875, 0.024993896484375, 0.0401763916015625, 0.05535888671875, 0.0705413818359375, 0.085723876953125, 0.1009063720703125, 0.1160888671875, 0.1312713623046875, 0.146453857421875, 0.1616363525390625, 0.17681884765625, 0.1920013427734375, 0.207183837890625, 0.2223663330078125, 0.237548828125, 0.2527313232421875, 0.267913818359375, 0.2830963134765625, 0.29827880859375, 0.3134613037109375, 0.328643798828125, 0.3438262939453125, 0.3590087890625, 0.3741912841796875, 0.389373779296875, 0.4045562744140625, 0.41973876953125, 0.4349212646484375, 0.450103759765625, 0.4652862548828125, 0.48046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 14.0, 39.0, 115.0, 316.0, 324.0, 117.0, 39.0, 14.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6542479991912842, -1.5881787538528442, -1.5221095085144043, -1.4560402631759644, -1.3899710178375244, -1.3239017724990845, -1.2578325271606445, -1.1917634010314941, -1.1256940364837646, -1.0596247911453247, -0.9935555458068848, -0.9274863004684448, -0.8614170551300049, -0.7953478097915649, -0.7292786240577698, -0.6632093787193298, -0.5971401929855347, -0.5310709476470947, -0.4650017023086548, -0.39893248677253723, -0.3328632414340973, -0.26679399609565735, -0.2007247805595398, -0.13465553522109985, -0.06858628988265991, -0.0025170519948005676, 0.06355218589305878, 0.12962141633033752, 0.19569066166877747, 0.2617599070072174, 0.32782912254333496, 0.3938983678817749, 0.45996761322021484, 0.5260368585586548, 0.5921061038970947, 0.6581753492355347, 0.7242445945739746, 0.7903138399124146, 0.8563830256462097, 0.9224522709846497, 0.9885215163230896, 1.0545907020568848, 1.1206599473953247, 1.1867291927337646, 1.2527984380722046, 1.3188676834106445, 1.3849369287490845, 1.4510061740875244, 1.5170754194259644, 1.5831446647644043, 1.6492139101028442, 1.7152831554412842, 1.7813524007797241, 1.847421646118164, 1.9134907722473145, 1.979560136795044, 2.0456292629241943, 2.1116983890533447, 2.177767753601074, 2.2438368797302246, 2.309906244277954, 2.3759753704071045, 2.442044734954834, 2.5081138610839844, 2.574183225631714]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 5.0, 6.0, 17.0, 7.0, 21.0, 22.0, 24.0, 38.0, 36.0, 48.0, 55.0, 79.0, 64.0, 59.0, 66.0, 77.0, 61.0, 49.0, 43.0, 40.0, 29.0, 18.0, 18.0, 20.0, 14.0, 10.0, 14.0, 13.0, 7.0, 3.0, 11.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0924677848815918, -1.0598351955413818, -1.0272026062011719, -0.9945700764656067, -0.9619375467300415, -0.9293049573898315, -0.8966723680496216, -0.8640397787094116, -0.8314072489738464, -0.7987746596336365, -0.7661421298980713, -0.7335095405578613, -0.7008769512176514, -0.6682444214820862, -0.6356118321418762, -0.602979302406311, -0.5703467130661011, -0.5377141237258911, -0.5050815939903259, -0.47244900465011597, -0.4398164451122284, -0.4071838855743408, -0.37455129623413086, -0.3419187366962433, -0.3092861771583557, -0.27665361762046814, -0.24402104318141937, -0.2113884687423706, -0.17875590920448303, -0.14612334966659546, -0.11349077522754669, -0.08085820078849792, -0.0482257604598999, -0.015593193471431732, 0.017039373517036438, 0.04967194050550461, 0.08230450749397278, 0.11493706703186035, 0.14756964147090912, 0.18020221590995789, 0.21283477544784546, 0.24546733498573303, 0.2780998945236206, 0.31073248386383057, 0.34336504340171814, 0.3759976029396057, 0.4086301922798157, 0.44126275181770325, 0.4738953113555908, 0.5065279006958008, 0.539160430431366, 0.5717930197715759, 0.6044255495071411, 0.6370581388473511, 0.669690728187561, 0.702323317527771, 0.7349558472633362, 0.7675884366035461, 0.8002209663391113, 0.8328535556793213, 0.8654861450195312, 0.8981186747550964, 0.9307512640953064, 0.9633837938308716, 0.9960163831710815]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 1.0, 8.0, 11.0, 12.0, 19.0, 20.0, 45.0, 55.0, 94.0, 132.0, 225.0, 301.0, 412.0, 610.0, 884.0, 1380.0, 2053.0, 3015.0, 4951.0, 8374.0, 16038.0, 35675.0, 857250.0, 64900.0, 22650.0, 11574.0, 6562.0, 3926.0, 2469.0, 1567.0, 1032.0, 740.0, 499.0, 352.0, 236.0, 166.0, 87.0, 70.0, 53.0, 41.0, 25.0, 11.0, 14.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.337738037109375, -1.29559326171875, -1.253448486328125, -1.2113037109375, -1.169158935546875, -1.12701416015625, -1.084869384765625, -1.042724609375, -1.000579833984375, -0.95843505859375, -0.916290283203125, -0.8741455078125, -0.832000732421875, -0.78985595703125, -0.747711181640625, -0.70556640625, -0.663421630859375, -0.62127685546875, -0.579132080078125, -0.5369873046875, -0.494842529296875, -0.45269775390625, -0.410552978515625, -0.368408203125, -0.326263427734375, -0.28411865234375, -0.241973876953125, -0.1998291015625, -0.157684326171875, -0.11553955078125, -0.073394775390625, -0.03125, 0.010894775390625, 0.05303955078125, 0.095184326171875, 0.1373291015625, 0.179473876953125, 0.22161865234375, 0.263763427734375, 0.305908203125, 0.348052978515625, 0.39019775390625, 0.432342529296875, 0.4744873046875, 0.516632080078125, 0.55877685546875, 0.600921630859375, 0.64306640625, 0.685211181640625, 0.72735595703125, 0.769500732421875, 0.8116455078125, 0.853790283203125, 0.89593505859375, 0.938079833984375, 0.980224609375, 1.022369384765625, 1.06451416015625, 1.106658935546875, 1.1488037109375, 1.190948486328125, 1.23309326171875, 1.275238037109375, 1.3173828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 4.0, 2.0, 5.0, 9.0, 4.0, 5.0, 10.0, 13.0, 14.0, 20.0, 162.0, 616.0, 25.0, 16.0, 8.0, 14.0, 7.0, 3.0, 10.0, 4.0, 3.0, 6.0, 10.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.2333087921142578, -0.22479629516601562, -0.21628379821777344, -0.20777130126953125, -0.19925880432128906, -0.19074630737304688, -0.1822338104248047, -0.1737213134765625, -0.1652088165283203, -0.15669631958007812, -0.14818382263183594, -0.13967132568359375, -0.13115882873535156, -0.12264633178710938, -0.11413383483886719, -0.105621337890625, -0.09710884094238281, -0.08859634399414062, -0.08008384704589844, -0.07157135009765625, -0.06305885314941406, -0.054546356201171875, -0.04603385925292969, -0.0375213623046875, -0.029008865356445312, -0.020496368408203125, -0.011983871459960938, -0.00347137451171875, 0.0050411224365234375, 0.013553619384765625, 0.022066116333007812, 0.03057861328125, 0.03909111022949219, 0.047603607177734375, 0.05611610412597656, 0.06462860107421875, 0.07314109802246094, 0.08165359497070312, 0.09016609191894531, 0.0986785888671875, 0.10719108581542969, 0.11570358276367188, 0.12421607971191406, 0.13272857666015625, 0.14124107360839844, 0.14975357055664062, 0.1582660675048828, 0.166778564453125, 0.1752910614013672, 0.18380355834960938, 0.19231605529785156, 0.20082855224609375, 0.20934104919433594, 0.21785354614257812, 0.2263660430908203, 0.2348785400390625, 0.2433910369873047, 0.2519035339355469, 0.26041603088378906, 0.26892852783203125, 0.27744102478027344, 0.2859535217285156, 0.2944660186767578, 0.302978515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 10.0, 14.0, 17.0, 25.0, 30.0, 33.0, 48.0, 63.0, 92.0, 127.0, 196.0, 260.0, 436.0, 636.0, 1249.0, 2555.0, 5588.0, 13293.0, 35240.0, 106623.0, 366738.0, 353034.0, 103668.0, 34334.0, 13083.0, 5448.0, 2427.0, 1256.0, 707.0, 434.0, 247.0, 156.0, 118.0, 95.0, 68.0, 67.0, 41.0, 26.0, 21.0, 14.0, 16.0, 8.0, 2.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.71234130859375, -0.6868896484375, -0.66143798828125, -0.635986328125, -0.61053466796875, -0.5850830078125, -0.55963134765625, -0.5341796875, -0.50872802734375, -0.4832763671875, -0.45782470703125, -0.432373046875, -0.40692138671875, -0.3814697265625, -0.35601806640625, -0.33056640625, -0.30511474609375, -0.2796630859375, -0.25421142578125, -0.228759765625, -0.20330810546875, -0.1778564453125, -0.15240478515625, -0.126953125, -0.10150146484375, -0.0760498046875, -0.05059814453125, -0.025146484375, 0.00030517578125, 0.0257568359375, 0.05120849609375, 0.07666015625, 0.10211181640625, 0.1275634765625, 0.15301513671875, 0.178466796875, 0.20391845703125, 0.2293701171875, 0.25482177734375, 0.2802734375, 0.30572509765625, 0.3311767578125, 0.35662841796875, 0.382080078125, 0.40753173828125, 0.4329833984375, 0.45843505859375, 0.48388671875, 0.50933837890625, 0.5347900390625, 0.56024169921875, 0.585693359375, 0.61114501953125, 0.6365966796875, 0.66204833984375, 0.6875, 0.71295166015625, 0.7384033203125, 0.76385498046875, 0.789306640625, 0.81475830078125, 0.8402099609375, 0.86566162109375, 0.89111328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 4.0, 4.0, 9.0, 9.0, 22.0, 15.0, 8.0, 16.0, 14.0, 20.0, 31.0, 26.0, 26.0, 31.0, 25.0, 33.0, 32.0, 31.0, 39.0, 29.0, 34.0, 37.0, 33.0, 38.0, 34.0, 35.0, 26.0, 34.0, 21.0, 33.0, 36.0, 30.0, 24.0, 20.0, 28.0, 18.0, 9.0, 14.0, 9.0, 11.0, 8.0, 6.0, 8.0, 6.0, 8.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.8380355834960938, -0.8098602294921875, -0.7816848754882812, -0.753509521484375, -0.7253341674804688, -0.6971588134765625, -0.6689834594726562, -0.64080810546875, -0.6126327514648438, -0.5844573974609375, -0.5562820434570312, -0.528106689453125, -0.49993133544921875, -0.4717559814453125, -0.44358062744140625, -0.4154052734375, -0.38722991943359375, -0.3590545654296875, -0.33087921142578125, -0.302703857421875, -0.27452850341796875, -0.2463531494140625, -0.21817779541015625, -0.19000244140625, -0.16182708740234375, -0.1336517333984375, -0.10547637939453125, -0.077301025390625, -0.04912567138671875, -0.0209503173828125, 0.00722503662109375, 0.035400390625, 0.06357574462890625, 0.0917510986328125, 0.11992645263671875, 0.148101806640625, 0.17627716064453125, 0.2044525146484375, 0.23262786865234375, 0.26080322265625, 0.28897857666015625, 0.3171539306640625, 0.34532928466796875, 0.373504638671875, 0.40167999267578125, 0.4298553466796875, 0.45803070068359375, 0.4862060546875, 0.5143814086914062, 0.5425567626953125, 0.5707321166992188, 0.598907470703125, 0.6270828247070312, 0.6552581787109375, 0.6834335327148438, 0.71160888671875, 0.7397842407226562, 0.7679595947265625, 0.7961349487304688, 0.824310302734375, 0.8524856567382812, 0.8806610107421875, 0.9088363647460938, 0.93701171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 2.0, 5.0, 4.0, 6.0, 13.0, 15.0, 18.0, 24.0, 39.0, 56.0, 52.0, 103.0, 138.0, 212.0, 374.0, 641.0, 1137.0, 2883.0, 8051.0, 41367.0, 814926.0, 154539.0, 15740.0, 4335.0, 1757.0, 826.0, 467.0, 286.0, 188.0, 95.0, 76.0, 42.0, 36.0, 22.0, 22.0, 13.0, 12.0, 6.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.99560546875, -0.9597091674804688, -0.9238128662109375, -0.8879165649414062, -0.852020263671875, -0.8161239624023438, -0.7802276611328125, -0.7443313598632812, -0.70843505859375, -0.6725387573242188, -0.6366424560546875, -0.6007461547851562, -0.564849853515625, -0.5289535522460938, -0.4930572509765625, -0.45716094970703125, -0.4212646484375, -0.38536834716796875, -0.3494720458984375, -0.31357574462890625, -0.277679443359375, -0.24178314208984375, -0.2058868408203125, -0.16999053955078125, -0.13409423828125, -0.09819793701171875, -0.0623016357421875, -0.02640533447265625, 0.009490966796875, 0.04538726806640625, 0.0812835693359375, 0.11717987060546875, 0.153076171875, 0.18897247314453125, 0.2248687744140625, 0.26076507568359375, 0.296661376953125, 0.33255767822265625, 0.3684539794921875, 0.40435028076171875, 0.44024658203125, 0.47614288330078125, 0.5120391845703125, 0.5479354858398438, 0.583831787109375, 0.6197280883789062, 0.6556243896484375, 0.6915206909179688, 0.7274169921875, 0.7633132934570312, 0.7992095947265625, 0.8351058959960938, 0.871002197265625, 0.9068984985351562, 0.9427947998046875, 0.9786911010742188, 1.01458740234375, 1.0504837036132812, 1.0863800048828125, 1.1222763061523438, 1.158172607421875, 1.1940689086914062, 1.2299652099609375, 1.2658615112304688, 1.3017578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 10.0, 18.0, 15.0, 27.0, 33.0, 56.0, 66.0, 83.0, 93.0, 96.0, 120.0, 98.0, 85.0, 55.0, 33.0, 27.0, 23.0, 15.0, 6.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.765127182006836e-05, -6.594602018594742e-05, -6.424076855182648e-05, -6.253551691770554e-05, -6.0830265283584595e-05, -5.9125013649463654e-05, -5.741976201534271e-05, -5.571451038122177e-05, -5.400925874710083e-05, -5.230400711297989e-05, -5.059875547885895e-05, -4.8893503844738007e-05, -4.7188252210617065e-05, -4.5483000576496124e-05, -4.377774894237518e-05, -4.207249730825424e-05, -4.03672456741333e-05, -3.866199404001236e-05, -3.695674240589142e-05, -3.525149077177048e-05, -3.3546239137649536e-05, -3.1840987503528595e-05, -3.0135735869407654e-05, -2.8430484235286713e-05, -2.672523260116577e-05, -2.501998096704483e-05, -2.331472933292389e-05, -2.1609477698802948e-05, -1.9904226064682007e-05, -1.8198974430561066e-05, -1.6493722796440125e-05, -1.4788471162319183e-05, -1.3083219528198242e-05, -1.1377967894077301e-05, -9.67271625995636e-06, -7.967464625835419e-06, -6.2622129917144775e-06, -4.556961357593536e-06, -2.8517097234725952e-06, -1.146458089351654e-06, 5.587935447692871e-07, 2.2640451788902283e-06, 3.9692968130111694e-06, 5.674548447132111e-06, 7.379800081253052e-06, 9.085051715373993e-06, 1.0790303349494934e-05, 1.2495554983615875e-05, 1.4200806617736816e-05, 1.5906058251857758e-05, 1.76113098859787e-05, 1.931656152009964e-05, 2.102181315422058e-05, 2.2727064788341522e-05, 2.4432316422462463e-05, 2.6137568056583405e-05, 2.7842819690704346e-05, 2.9548071324825287e-05, 3.125332295894623e-05, 3.295857459306717e-05, 3.466382622718811e-05, 3.636907786130905e-05, 3.807432949542999e-05, 3.9779581129550934e-05, 4.1484832763671875e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 6.0, 5.0, 18.0, 34.0, 19.0, 66.0, 83.0, 131.0, 216.0, 338.0, 667.0, 1204.0, 2546.0, 5680.0, 16447.0, 93561.0, 799687.0, 99189.0, 17108.0, 5954.0, 2554.0, 1338.0, 679.0, 359.0, 219.0, 149.0, 93.0, 61.0, 29.0, 20.0, 14.0, 19.0, 11.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.158203125, -1.1161041259765625, -1.074005126953125, -1.0319061279296875, -0.98980712890625, -0.9477081298828125, -0.905609130859375, -0.8635101318359375, -0.8214111328125, -0.7793121337890625, -0.737213134765625, -0.6951141357421875, -0.65301513671875, -0.6109161376953125, -0.568817138671875, -0.5267181396484375, -0.484619140625, -0.4425201416015625, -0.400421142578125, -0.3583221435546875, -0.31622314453125, -0.2741241455078125, -0.232025146484375, -0.1899261474609375, -0.1478271484375, -0.1057281494140625, -0.063629150390625, -0.0215301513671875, 0.02056884765625, 0.0626678466796875, 0.104766845703125, 0.1468658447265625, 0.18896484375, 0.2310638427734375, 0.273162841796875, 0.3152618408203125, 0.35736083984375, 0.3994598388671875, 0.441558837890625, 0.4836578369140625, 0.5257568359375, 0.5678558349609375, 0.609954833984375, 0.6520538330078125, 0.69415283203125, 0.7362518310546875, 0.778350830078125, 0.8204498291015625, 0.862548828125, 0.9046478271484375, 0.946746826171875, 0.9888458251953125, 1.03094482421875, 1.0730438232421875, 1.115142822265625, 1.1572418212890625, 1.1993408203125, 1.2414398193359375, 1.283538818359375, 1.3256378173828125, 1.36773681640625, 1.4098358154296875, 1.451934814453125, 1.4940338134765625, 1.5361328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 6.0, 8.0, 8.0, 7.0, 12.0, 26.0, 21.0, 44.0, 66.0, 63.0, 102.0, 115.0, 104.0, 114.0, 60.0, 49.0, 39.0, 39.0, 16.0, 17.0, 19.0, 5.0, 11.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4140625, -1.3710784912109375, -1.328094482421875, -1.2851104736328125, -1.24212646484375, -1.1991424560546875, -1.156158447265625, -1.1131744384765625, -1.0701904296875, -1.0272064208984375, -0.984222412109375, -0.9412384033203125, -0.89825439453125, -0.8552703857421875, -0.812286376953125, -0.7693023681640625, -0.726318359375, -0.6833343505859375, -0.640350341796875, -0.5973663330078125, -0.55438232421875, -0.5113983154296875, -0.468414306640625, -0.4254302978515625, -0.3824462890625, -0.3394622802734375, -0.296478271484375, -0.2534942626953125, -0.21051025390625, -0.1675262451171875, -0.124542236328125, -0.0815582275390625, -0.03857421875, 0.0044097900390625, 0.047393798828125, 0.0903778076171875, 0.13336181640625, 0.1763458251953125, 0.219329833984375, 0.2623138427734375, 0.3052978515625, 0.3482818603515625, 0.391265869140625, 0.4342498779296875, 0.47723388671875, 0.5202178955078125, 0.563201904296875, 0.6061859130859375, 0.649169921875, 0.6921539306640625, 0.735137939453125, 0.7781219482421875, 0.82110595703125, 0.8640899658203125, 0.907073974609375, 0.9500579833984375, 0.9930419921875, 1.0360260009765625, 1.079010009765625, 1.1219940185546875, 1.16497802734375, 1.2079620361328125, 1.250946044921875, 1.2939300537109375, 1.3369140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 16.0, 28.0, 144.0, 483.0, 228.0, 59.0, 20.0, 9.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.70941925048828, -16.927597045898438, -16.145774841308594, -15.363953590393066, -14.582131385803223, -13.800310134887695, -13.018487930297852, -12.236665725708008, -11.454843521118164, -10.67302131652832, -9.891200065612793, -9.10937786102295, -8.327555656433105, -7.54573392868042, -6.763912200927734, -5.982089996337891, -5.200268745422363, -4.418447017669678, -3.636624813079834, -2.8548030853271484, -2.072981119155884, -1.2911591529846191, -0.5093374252319336, 0.27248477935791016, 1.0543065071105957, 1.8361284732818604, 2.617950439453125, 3.3997721672058105, 4.181593894958496, 4.96341609954834, 5.745237827301025, 6.527060031890869, 7.308881759643555, 8.090703964233398, 8.872525215148926, 9.65434741973877, 10.436169624328613, 11.21799087524414, 11.999813079833984, 12.781635284423828, 13.563457489013672, 14.345279693603516, 15.127100944519043, 15.908923149108887, 16.690744400024414, 17.472566604614258, 18.2543888092041, 19.036211013793945, 19.818031311035156, 20.599853515625, 21.381675720214844, 22.163497924804688, 22.9453182220459, 23.727140426635742, 24.508962631225586, 25.29078483581543, 26.072607040405273, 26.854429244995117, 27.63625144958496, 28.418071746826172, 29.199893951416016, 29.98171615600586, 30.763538360595703, 31.545360565185547, 32.32718276977539]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 10.0, 6.0, 6.0, 12.0, 17.0, 24.0, 43.0, 71.0, 73.0, 121.0, 111.0, 95.0, 97.0, 73.0, 61.0, 39.0, 15.0, 25.0, 11.0, 10.0, 6.0, 4.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-15.543840408325195, -15.022405624389648, -14.500970840454102, -13.979536056518555, -13.458101272583008, -12.936666488647461, -12.415230751037598, -11.89379596710205, -11.372361183166504, -10.850926399230957, -10.32949161529541, -9.808056831359863, -9.28662109375, -8.765186309814453, -8.243751525878906, -7.722316741943359, -7.2008819580078125, -6.679447174072266, -6.158012390136719, -5.636577129364014, -5.115142345428467, -4.59370756149292, -4.072272300720215, -3.550837516784668, -3.029402732849121, -2.507967948913574, -1.9865329265594482, -1.4650980234146118, -0.9436631202697754, -0.4222283363342285, 0.09920668601989746, 0.6206417083740234, 1.1420783996582031, 1.6635133028030396, 2.184948205947876, 2.706383228302002, 3.227818012237549, 3.7492527961730957, 4.270688056945801, 4.792122840881348, 5.3135576248168945, 5.834992408752441, 6.356427192687988, 6.877862453460693, 7.39929723739624, 7.920732021331787, 8.442167282104492, 8.963602066040039, 9.485036849975586, 10.006471633911133, 10.52790641784668, 11.049341201782227, 11.570775985717773, 12.09221076965332, 12.613646507263184, 13.13508129119873, 13.656516075134277, 14.177950859069824, 14.699385643005371, 15.220820426940918, 15.742256164550781, 16.263690948486328, 16.785125732421875, 17.306560516357422, 17.82799530029297]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 10.0, 14.0, 21.0, 20.0, 40.0, 54.0, 86.0, 98.0, 172.0, 278.0, 393.0, 718.0, 1172.0, 2013.0, 3684.0, 7468.0, 18054.0, 66999.0, 3765508.0, 261350.0, 36599.0, 13686.0, 6860.0, 3580.0, 2055.0, 1211.0, 821.0, 450.0, 281.0, 198.0, 120.0, 93.0, 47.0, 42.0, 25.0, 23.0, 12.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.9609375, -1.9028778076171875, -1.844818115234375, -1.7867584228515625, -1.72869873046875, -1.6706390380859375, -1.612579345703125, -1.5545196533203125, -1.4964599609375, -1.4384002685546875, -1.380340576171875, -1.3222808837890625, -1.26422119140625, -1.2061614990234375, -1.148101806640625, -1.0900421142578125, -1.031982421875, -0.9739227294921875, -0.915863037109375, -0.8578033447265625, -0.79974365234375, -0.7416839599609375, -0.683624267578125, -0.6255645751953125, -0.5675048828125, -0.5094451904296875, -0.451385498046875, -0.3933258056640625, -0.33526611328125, -0.2772064208984375, -0.219146728515625, -0.1610870361328125, -0.10302734375, -0.0449676513671875, 0.013092041015625, 0.0711517333984375, 0.12921142578125, 0.1872711181640625, 0.245330810546875, 0.3033905029296875, 0.3614501953125, 0.4195098876953125, 0.477569580078125, 0.5356292724609375, 0.59368896484375, 0.6517486572265625, 0.709808349609375, 0.7678680419921875, 0.825927734375, 0.8839874267578125, 0.942047119140625, 1.0001068115234375, 1.05816650390625, 1.1162261962890625, 1.174285888671875, 1.2323455810546875, 1.2904052734375, 1.3484649658203125, 1.406524658203125, 1.4645843505859375, 1.52264404296875, 1.5807037353515625, 1.638763427734375, 1.6968231201171875, 1.7548828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 7.0, 4.0, 0.0, 4.0, 9.0, 10.0, 9.0, 9.0, 12.0, 28.0, 51.0, 145.0, 270.0, 214.0, 77.0, 37.0, 20.0, 10.0, 7.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2041015625, -0.1980915069580078, -0.19208145141601562, -0.18607139587402344, -0.18006134033203125, -0.17405128479003906, -0.16804122924804688, -0.1620311737060547, -0.1560211181640625, -0.1500110626220703, -0.14400100708007812, -0.13799095153808594, -0.13198089599609375, -0.12597084045410156, -0.11996078491210938, -0.11395072937011719, -0.107940673828125, -0.10193061828613281, -0.09592056274414062, -0.08991050720214844, -0.08390045166015625, -0.07789039611816406, -0.07188034057617188, -0.06587028503417969, -0.0598602294921875, -0.05385017395019531, -0.047840118408203125, -0.04183006286621094, -0.03582000732421875, -0.029809951782226562, -0.023799896240234375, -0.017789840698242188, -0.01177978515625, -0.0057697296142578125, 0.000240325927734375, 0.0062503814697265625, 0.01226043701171875, 0.018270492553710938, 0.024280548095703125, 0.030290603637695312, 0.0363006591796875, 0.04231071472167969, 0.048320770263671875, 0.05433082580566406, 0.06034088134765625, 0.06635093688964844, 0.07236099243164062, 0.07837104797363281, 0.084381103515625, 0.09039115905761719, 0.09640121459960938, 0.10241127014160156, 0.10842132568359375, 0.11443138122558594, 0.12044143676757812, 0.1264514923095703, 0.1324615478515625, 0.1384716033935547, 0.14448165893554688, 0.15049171447753906, 0.15650177001953125, 0.16251182556152344, 0.16852188110351562, 0.1745319366455078, 0.1805419921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 13.0, 12.0, 24.0, 33.0, 45.0, 55.0, 96.0, 132.0, 185.0, 340.0, 601.0, 1042.0, 2229.0, 5329.0, 15178.0, 57765.0, 580572.0, 3356868.0, 131879.0, 26991.0, 8156.0, 3301.0, 1484.0, 788.0, 404.0, 235.0, 161.0, 108.0, 60.0, 45.0, 33.0, 30.0, 17.0, 11.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0531158447265625, -1.014434814453125, -0.9757537841796875, -0.93707275390625, -0.8983917236328125, -0.859710693359375, -0.8210296630859375, -0.7823486328125, -0.7436676025390625, -0.704986572265625, -0.6663055419921875, -0.62762451171875, -0.5889434814453125, -0.550262451171875, -0.5115814208984375, -0.472900390625, -0.4342193603515625, -0.395538330078125, -0.3568572998046875, -0.31817626953125, -0.2794952392578125, -0.240814208984375, -0.2021331787109375, -0.1634521484375, -0.1247711181640625, -0.086090087890625, -0.0474090576171875, -0.00872802734375, 0.0299530029296875, 0.068634033203125, 0.1073150634765625, 0.14599609375, 0.1846771240234375, 0.223358154296875, 0.2620391845703125, 0.30072021484375, 0.3394012451171875, 0.378082275390625, 0.4167633056640625, 0.4554443359375, 0.4941253662109375, 0.532806396484375, 0.5714874267578125, 0.61016845703125, 0.6488494873046875, 0.687530517578125, 0.7262115478515625, 0.764892578125, 0.8035736083984375, 0.842254638671875, 0.8809356689453125, 0.91961669921875, 0.9582977294921875, 0.996978759765625, 1.0356597900390625, 1.0743408203125, 1.1130218505859375, 1.151702880859375, 1.1903839111328125, 1.22906494140625, 1.2677459716796875, 1.306427001953125, 1.3451080322265625, 1.3837890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 7.0, 11.0, 14.0, 15.0, 31.0, 28.0, 41.0, 56.0, 92.0, 150.0, 462.0, 1523.0, 806.0, 331.0, 161.0, 85.0, 56.0, 36.0, 41.0, 23.0, 21.0, 10.0, 15.0, 10.0, 4.0, 3.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2669963836669922, -0.2588462829589844, -0.25069618225097656, -0.24254608154296875, -0.23439598083496094, -0.22624588012695312, -0.2180957794189453, -0.2099456787109375, -0.2017955780029297, -0.19364547729492188, -0.18549537658691406, -0.17734527587890625, -0.16919517517089844, -0.16104507446289062, -0.1528949737548828, -0.144744873046875, -0.1365947723388672, -0.12844467163085938, -0.12029457092285156, -0.11214447021484375, -0.10399436950683594, -0.09584426879882812, -0.08769416809082031, -0.0795440673828125, -0.07139396667480469, -0.06324386596679688, -0.05509376525878906, -0.04694366455078125, -0.03879356384277344, -0.030643463134765625, -0.022493362426757812, -0.01434326171875, -0.0061931610107421875, 0.001956939697265625, 0.010107040405273438, 0.01825714111328125, 0.026407241821289062, 0.034557342529296875, 0.04270744323730469, 0.0508575439453125, 0.05900764465332031, 0.06715774536132812, 0.07530784606933594, 0.08345794677734375, 0.09160804748535156, 0.09975814819335938, 0.10790824890136719, 0.116058349609375, 0.12420845031738281, 0.13235855102539062, 0.14050865173339844, 0.14865875244140625, 0.15680885314941406, 0.16495895385742188, 0.1731090545654297, 0.1812591552734375, 0.1894092559814453, 0.19755935668945312, 0.20570945739746094, 0.21385955810546875, 0.22200965881347656, 0.23015975952148438, 0.2383098602294922, 0.2464599609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 32.0, 344.0, 486.0, 92.0, 14.0, 9.0, 8.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.371602535247803, -5.226481914520264, -5.081361293792725, -4.936240196228027, -4.791119575500488, -4.645998954772949, -4.50087833404541, -4.355757713317871, -4.210637092590332, -4.065516471862793, -3.920395612716675, -3.7752749919891357, -3.6301541328430176, -3.4850335121154785, -3.3399128913879395, -3.1947922706604004, -3.049671173095703, -2.904550552368164, -2.759429693222046, -2.614309072494507, -2.4691882133483887, -2.3240675926208496, -2.1789469718933105, -2.0338263511657715, -1.8887054920196533, -1.7435847520828247, -1.598464012145996, -1.453343391418457, -1.3082226514816284, -1.1631019115447998, -1.0179812908172607, -0.8728605508804321, -0.7277393341064453, -0.5826185941696167, -0.43749791383743286, -0.29237720370292664, -0.1472564935684204, -0.002135753631591797, 0.14298492670059204, 0.2881056070327759, 0.4332263469696045, 0.5783470869064331, 0.7234677672386169, 0.8685884475708008, 1.0137091875076294, 1.158829927444458, 1.303950548171997, 1.4490712881088257, 1.5941920280456543, 1.739312767982483, 1.8844335079193115, 2.0295541286468506, 2.1746749877929688, 2.319795608520508, 2.464916229248047, 2.610036849975586, 2.755157709121704, 2.900278329849243, 3.0453991889953613, 3.1905198097229004, 3.3356404304504395, 3.4807612895965576, 3.6258819103240967, 3.771002769470215, 3.916123390197754]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 13.0, 9.0, 8.0, 25.0, 17.0, 28.0, 30.0, 43.0, 60.0, 63.0, 69.0, 66.0, 79.0, 75.0, 64.0, 56.0, 60.0, 39.0, 49.0, 31.0, 28.0, 22.0, 13.0, 14.0, 9.0, 5.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4345269203186035, -1.3878427743911743, -1.3411585092544556, -1.2944743633270264, -1.2477902173995972, -1.201106071472168, -1.1544218063354492, -1.10773766040802, -1.0610535144805908, -1.0143693685531616, -0.9676851630210876, -0.9210009574890137, -0.8743168115615845, -0.8276326060295105, -0.7809484004974365, -0.7342642545700073, -0.6875800490379333, -0.6408958435058594, -0.5942116975784302, -0.5475274920463562, -0.500843346118927, -0.454159140586853, -0.40747496485710144, -0.36079078912734985, -0.31410661339759827, -0.2674224376678467, -0.2207382619380951, -0.1740540713071823, -0.12736989557743073, -0.08068571984767914, -0.03400152921676636, 0.01268264651298523, 0.059366822242736816, 0.1060509979724884, 0.15273517370224, 0.19941936433315277, 0.24610354006290436, 0.29278773069381714, 0.3394719064235687, 0.3861560821533203, 0.4328402578830719, 0.4795244336128235, 0.5262086391448975, 0.5728927850723267, 0.6195769906044006, 0.6662611365318298, 0.7129453420639038, 0.759629487991333, 0.806313693523407, 0.852997899055481, 0.8996820449829102, 0.9463662505149841, 0.9930503964424133, 1.0397346019744873, 1.0864187479019165, 1.1331028938293457, 1.1797871589660645, 1.2264713048934937, 1.2731555700302124, 1.3198397159576416, 1.3665238618850708, 1.4132080078125, 1.4598922729492188, 1.506576418876648, 1.5532605648040771]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 11.0, 22.0, 36.0, 47.0, 65.0, 91.0, 149.0, 205.0, 339.0, 487.0, 662.0, 1020.0, 1659.0, 2344.0, 3585.0, 5686.0, 9206.0, 17101.0, 41404.0, 332349.0, 528745.0, 55804.0, 19354.0, 10292.0, 6136.0, 3869.0, 2615.0, 1760.0, 1158.0, 736.0, 497.0, 373.0, 220.0, 176.0, 112.0, 70.0, 47.0, 39.0, 18.0, 12.0, 6.0, 9.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0227813720703125, -0.989898681640625, -0.9570159912109375, -0.92413330078125, -0.8912506103515625, -0.858367919921875, -0.8254852294921875, -0.7926025390625, -0.7597198486328125, -0.726837158203125, -0.6939544677734375, -0.66107177734375, -0.6281890869140625, -0.595306396484375, -0.5624237060546875, -0.529541015625, -0.4966583251953125, -0.463775634765625, -0.4308929443359375, -0.39801025390625, -0.3651275634765625, -0.332244873046875, -0.2993621826171875, -0.2664794921875, -0.2335968017578125, -0.200714111328125, -0.1678314208984375, -0.13494873046875, -0.1020660400390625, -0.069183349609375, -0.0363006591796875, -0.00341796875, 0.0294647216796875, 0.062347412109375, 0.0952301025390625, 0.12811279296875, 0.1609954833984375, 0.193878173828125, 0.2267608642578125, 0.2596435546875, 0.2925262451171875, 0.325408935546875, 0.3582916259765625, 0.39117431640625, 0.4240570068359375, 0.456939697265625, 0.4898223876953125, 0.522705078125, 0.5555877685546875, 0.588470458984375, 0.6213531494140625, 0.65423583984375, 0.6871185302734375, 0.720001220703125, 0.7528839111328125, 0.7857666015625, 0.8186492919921875, 0.851531982421875, 0.8844146728515625, 0.91729736328125, 0.9501800537109375, 0.983062744140625, 1.0159454345703125, 1.048828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 7.0, 13.0, 3.0, 12.0, 17.0, 19.0, 49.0, 132.0, 192.0, 188.0, 140.0, 77.0, 36.0, 16.0, 17.0, 6.0, 8.0, 3.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1898193359375, -0.18430709838867188, -0.17879486083984375, -0.17328262329101562, -0.1677703857421875, -0.16225814819335938, -0.15674591064453125, -0.15123367309570312, -0.145721435546875, -0.14020919799804688, -0.13469696044921875, -0.12918472290039062, -0.1236724853515625, -0.11816024780273438, -0.11264801025390625, -0.10713577270507812, -0.10162353515625, -0.09611129760742188, -0.09059906005859375, -0.08508682250976562, -0.0795745849609375, -0.07406234741210938, -0.06855010986328125, -0.06303787231445312, -0.057525634765625, -0.052013397216796875, -0.04650115966796875, -0.040988922119140625, -0.0354766845703125, -0.029964447021484375, -0.02445220947265625, -0.018939971923828125, -0.013427734375, -0.007915496826171875, -0.00240325927734375, 0.003108978271484375, 0.0086212158203125, 0.014133453369140625, 0.01964569091796875, 0.025157928466796875, 0.030670166015625, 0.036182403564453125, 0.04169464111328125, 0.047206878662109375, 0.0527191162109375, 0.058231353759765625, 0.06374359130859375, 0.06925582885742188, 0.07476806640625, 0.08028030395507812, 0.08579254150390625, 0.09130477905273438, 0.0968170166015625, 0.10232925415039062, 0.10784149169921875, 0.11335372924804688, 0.118865966796875, 0.12437820434570312, 0.12989044189453125, 0.13540267944335938, 0.1409149169921875, 0.14642715454101562, 0.15193939208984375, 0.15745162963867188, 0.1629638671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 6.0, 19.0, 41.0, 92.0, 402.0, 1458.0, 15261.0, 596680.0, 422476.0, 10426.0, 1197.0, 319.0, 106.0, 30.0, 19.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.876953125, -2.789642333984375, -2.70233154296875, -2.615020751953125, -2.5277099609375, -2.440399169921875, -2.35308837890625, -2.265777587890625, -2.178466796875, -2.091156005859375, -2.00384521484375, -1.916534423828125, -1.8292236328125, -1.741912841796875, -1.65460205078125, -1.567291259765625, -1.47998046875, -1.392669677734375, -1.30535888671875, -1.218048095703125, -1.1307373046875, -1.043426513671875, -0.95611572265625, -0.868804931640625, -0.781494140625, -0.694183349609375, -0.60687255859375, -0.519561767578125, -0.4322509765625, -0.344940185546875, -0.25762939453125, -0.170318603515625, -0.0830078125, 0.004302978515625, 0.09161376953125, 0.178924560546875, 0.2662353515625, 0.353546142578125, 0.44085693359375, 0.528167724609375, 0.615478515625, 0.702789306640625, 0.79010009765625, 0.877410888671875, 0.9647216796875, 1.052032470703125, 1.13934326171875, 1.226654052734375, 1.31396484375, 1.401275634765625, 1.48858642578125, 1.575897216796875, 1.6632080078125, 1.750518798828125, 1.83782958984375, 1.925140380859375, 2.012451171875, 2.099761962890625, 2.18707275390625, 2.274383544921875, 2.3616943359375, 2.449005126953125, 2.53631591796875, 2.623626708984375, 2.7109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 9.0, 14.0, 12.0, 15.0, 13.0, 26.0, 20.0, 24.0, 31.0, 25.0, 22.0, 32.0, 37.0, 35.0, 31.0, 48.0, 36.0, 48.0, 38.0, 53.0, 35.0, 51.0, 31.0, 40.0, 27.0, 45.0, 25.0, 22.0, 19.0, 15.0, 17.0, 17.0, 9.0, 10.0, 14.0, 11.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5877609252929688, -0.5685882568359375, -0.5494155883789062, -0.530242919921875, -0.5110702514648438, -0.4918975830078125, -0.47272491455078125, -0.45355224609375, -0.43437957763671875, -0.4152069091796875, -0.39603424072265625, -0.376861572265625, -0.35768890380859375, -0.3385162353515625, -0.31934356689453125, -0.3001708984375, -0.28099822998046875, -0.2618255615234375, -0.24265289306640625, -0.223480224609375, -0.20430755615234375, -0.1851348876953125, -0.16596221923828125, -0.14678955078125, -0.12761688232421875, -0.1084442138671875, -0.08927154541015625, -0.070098876953125, -0.05092620849609375, -0.0317535400390625, -0.01258087158203125, 0.006591796875, 0.02576446533203125, 0.0449371337890625, 0.06410980224609375, 0.083282470703125, 0.10245513916015625, 0.1216278076171875, 0.14080047607421875, 0.15997314453125, 0.17914581298828125, 0.1983184814453125, 0.21749114990234375, 0.236663818359375, 0.25583648681640625, 0.2750091552734375, 0.29418182373046875, 0.3133544921875, 0.33252716064453125, 0.3516998291015625, 0.37087249755859375, 0.390045166015625, 0.40921783447265625, 0.4283905029296875, 0.44756317138671875, 0.46673583984375, 0.48590850830078125, 0.5050811767578125, 0.5242538452148438, 0.543426513671875, 0.5625991821289062, 0.5817718505859375, 0.6009445190429688, 0.6201171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 16.0, 18.0, 23.0, 38.0, 50.0, 53.0, 109.0, 215.0, 418.0, 949.0, 2604.0, 12306.0, 383541.0, 627735.0, 15453.0, 2916.0, 996.0, 449.0, 237.0, 136.0, 84.0, 59.0, 28.0, 27.0, 16.0, 12.0, 12.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.146484375, -2.0834503173828125, -2.020416259765625, -1.9573822021484375, -1.89434814453125, -1.8313140869140625, -1.768280029296875, -1.7052459716796875, -1.6422119140625, -1.5791778564453125, -1.516143798828125, -1.4531097412109375, -1.39007568359375, -1.3270416259765625, -1.264007568359375, -1.2009735107421875, -1.137939453125, -1.0749053955078125, -1.011871337890625, -0.9488372802734375, -0.88580322265625, -0.8227691650390625, -0.759735107421875, -0.6967010498046875, -0.6336669921875, -0.5706329345703125, -0.507598876953125, -0.4445648193359375, -0.38153076171875, -0.3184967041015625, -0.255462646484375, -0.1924285888671875, -0.12939453125, -0.0663604736328125, -0.003326416015625, 0.0597076416015625, 0.12274169921875, 0.1857757568359375, 0.248809814453125, 0.3118438720703125, 0.3748779296875, 0.4379119873046875, 0.500946044921875, 0.5639801025390625, 0.62701416015625, 0.6900482177734375, 0.753082275390625, 0.8161163330078125, 0.879150390625, 0.9421844482421875, 1.005218505859375, 1.0682525634765625, 1.13128662109375, 1.1943206787109375, 1.257354736328125, 1.3203887939453125, 1.3834228515625, 1.4464569091796875, 1.509490966796875, 1.5725250244140625, 1.63555908203125, 1.6985931396484375, 1.761627197265625, 1.8246612548828125, 1.8876953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 14.0, 11.0, 16.0, 23.0, 36.0, 49.0, 81.0, 134.0, 159.0, 147.0, 112.0, 67.0, 46.0, 37.0, 16.0, 20.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.791685104370117e-05, -8.463207632303238e-05, -8.134730160236359e-05, -7.80625268816948e-05, -7.4777752161026e-05, -7.149297744035721e-05, -6.820820271968842e-05, -6.492342799901962e-05, -6.163865327835083e-05, -5.835387855768204e-05, -5.5069103837013245e-05, -5.178432911634445e-05, -4.849955439567566e-05, -4.5214779675006866e-05, -4.1930004954338074e-05, -3.864523023366928e-05, -3.536045551300049e-05, -3.2075680792331696e-05, -2.8790906071662903e-05, -2.550613135099411e-05, -2.2221356630325317e-05, -1.8936581909656525e-05, -1.5651807188987732e-05, -1.236703246831894e-05, -9.082257747650146e-06, -5.797483026981354e-06, -2.512708306312561e-06, 7.720664143562317e-07, 4.056841135025024e-06, 7.341615855693817e-06, 1.062639057636261e-05, 1.3911165297031403e-05, 1.7195940017700195e-05, 2.0480714738368988e-05, 2.376548945903778e-05, 2.7050264179706573e-05, 3.0335038900375366e-05, 3.361981362104416e-05, 3.690458834171295e-05, 4.0189363062381744e-05, 4.347413778305054e-05, 4.675891250371933e-05, 5.004368722438812e-05, 5.3328461945056915e-05, 5.661323666572571e-05, 5.98980113863945e-05, 6.31827861070633e-05, 6.646756082773209e-05, 6.975233554840088e-05, 7.303711026906967e-05, 7.632188498973846e-05, 7.960665971040726e-05, 8.289143443107605e-05, 8.617620915174484e-05, 8.946098387241364e-05, 9.274575859308243e-05, 9.603053331375122e-05, 9.931530803442001e-05, 0.0001026000827550888, 0.0001058848574757576, 0.00010916963219642639, 0.00011245440691709518, 0.00011573918163776398, 0.00011902395635843277, 0.00012230873107910156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 15.0, 26.0, 18.0, 50.0, 74.0, 108.0, 178.0, 281.0, 569.0, 1318.0, 3701.0, 13090.0, 87029.0, 793038.0, 125490.0, 16202.0, 4440.0, 1517.0, 640.0, 321.0, 153.0, 105.0, 58.0, 46.0, 17.0, 20.0, 11.0, 8.0, 3.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.40087890625, -1.3603515625, -1.31982421875, -1.279296875, -1.23876953125, -1.1982421875, -1.15771484375, -1.1171875, -1.07666015625, -1.0361328125, -0.99560546875, -0.955078125, -0.91455078125, -0.8740234375, -0.83349609375, -0.79296875, -0.75244140625, -0.7119140625, -0.67138671875, -0.630859375, -0.59033203125, -0.5498046875, -0.50927734375, -0.46875, -0.42822265625, -0.3876953125, -0.34716796875, -0.306640625, -0.26611328125, -0.2255859375, -0.18505859375, -0.14453125, -0.10400390625, -0.0634765625, -0.02294921875, 0.017578125, 0.05810546875, 0.0986328125, 0.13916015625, 0.1796875, 0.22021484375, 0.2607421875, 0.30126953125, 0.341796875, 0.38232421875, 0.4228515625, 0.46337890625, 0.50390625, 0.54443359375, 0.5849609375, 0.62548828125, 0.666015625, 0.70654296875, 0.7470703125, 0.78759765625, 0.828125, 0.86865234375, 0.9091796875, 0.94970703125, 0.990234375, 1.03076171875, 1.0712890625, 1.11181640625, 1.15234375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 9.0, 9.0, 6.0, 17.0, 18.0, 24.0, 50.0, 70.0, 118.0, 120.0, 135.0, 114.0, 90.0, 69.0, 47.0, 30.0, 17.0, 18.0, 6.0, 8.0, 10.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.2306365966796875, -1.198577880859375, -1.1665191650390625, -1.13446044921875, -1.1024017333984375, -1.070343017578125, -1.0382843017578125, -1.0062255859375, -0.9741668701171875, -0.942108154296875, -0.9100494384765625, -0.87799072265625, -0.8459320068359375, -0.813873291015625, -0.7818145751953125, -0.749755859375, -0.7176971435546875, -0.685638427734375, -0.6535797119140625, -0.62152099609375, -0.5894622802734375, -0.557403564453125, -0.5253448486328125, -0.4932861328125, -0.4612274169921875, -0.429168701171875, -0.3971099853515625, -0.36505126953125, -0.3329925537109375, -0.300933837890625, -0.2688751220703125, -0.23681640625, -0.2047576904296875, -0.172698974609375, -0.1406402587890625, -0.10858154296875, -0.0765228271484375, -0.044464111328125, -0.0124053955078125, 0.0196533203125, 0.0517120361328125, 0.083770751953125, 0.1158294677734375, 0.14788818359375, 0.1799468994140625, 0.212005615234375, 0.2440643310546875, 0.276123046875, 0.3081817626953125, 0.340240478515625, 0.3722991943359375, 0.40435791015625, 0.4364166259765625, 0.468475341796875, 0.5005340576171875, 0.5325927734375, 0.5646514892578125, 0.596710205078125, 0.6287689208984375, 0.66082763671875, 0.6928863525390625, 0.724945068359375, 0.7570037841796875, 0.7890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 12.0, 59.0, 433.0, 399.0, 59.0, 15.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.027870178222656, -20.369081497192383, -19.71029281616211, -19.051504135131836, -18.392715454101562, -17.73392677307129, -17.075138092041016, -16.416349411010742, -15.757560729980469, -15.098772048950195, -14.439983367919922, -13.781194686889648, -13.122406005859375, -12.463617324829102, -11.804828643798828, -11.146039962768555, -10.487252235412598, -9.828463554382324, -9.16967487335205, -8.510886192321777, -7.852097511291504, -7.1933088302612305, -6.534520626068115, -5.875731945037842, -5.216943264007568, -4.558154582977295, -3.8993659019470215, -3.240577459335327, -2.5817887783050537, -1.9230000972747803, -1.264211654663086, -0.6054229736328125, 0.05336570739746094, 0.7121543288230896, 1.3709429502487183, 2.029731512069702, 2.6885201930999756, 3.347308874130249, 4.006097316741943, 4.664885997772217, 5.32367467880249, 5.982463359832764, 6.641252040863037, 7.300040245056152, 7.958828926086426, 8.6176176071167, 9.276406288146973, 9.935194969177246, 10.59398365020752, 11.252772331237793, 11.911561012268066, 12.57034969329834, 13.229138374328613, 13.887927055358887, 14.546714782714844, 15.205503463745117, 15.86429214477539, 16.523080825805664, 17.181869506835938, 17.84065818786621, 18.499446868896484, 19.158235549926758, 19.81702423095703, 20.475812911987305, 21.134601593017578]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 4.0, 2.0, 5.0, 8.0, 8.0, 20.0, 19.0, 41.0, 61.0, 61.0, 92.0, 96.0, 109.0, 98.0, 68.0, 65.0, 59.0, 46.0, 32.0, 17.0, 14.0, 19.0, 8.0, 5.0, 12.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-9.805558204650879, -9.537004470825195, -9.268450736999512, -8.999897003173828, -8.731342315673828, -8.462788581848145, -8.194234848022461, -7.925681114196777, -7.657127380371094, -7.38857364654541, -7.120019912719727, -6.851465702056885, -6.582911968231201, -6.314358234405518, -6.045804023742676, -5.777250289916992, -5.508696556091309, -5.240142822265625, -4.971589088439941, -4.7030348777771, -4.434481143951416, -4.165927410125732, -3.8973734378814697, -3.628819465637207, -3.3602657318115234, -3.09171199798584, -2.823158025741577, -2.5546040534973145, -2.286050319671631, -2.0174965858459473, -1.7489426136016846, -1.4803887605667114, -1.2118349075317383, -0.9432810544967651, -0.674727201461792, -0.40617334842681885, -0.1376194953918457, 0.13093435764312744, 0.3994882106781006, 0.6680420637130737, 0.9365959167480469, 1.20514976978302, 1.4737036228179932, 1.7422574758529663, 2.0108113288879395, 2.279365062713623, 2.5479190349578857, 2.8164730072021484, 3.085026741027832, 3.3535804748535156, 3.6221344470977783, 3.890688419342041, 4.159242153167725, 4.427795886993408, 4.69635009765625, 4.964903831481934, 5.233457565307617, 5.502011299133301, 5.770565032958984, 6.039119243621826, 6.30767297744751, 6.576226711273193, 6.844780921936035, 7.113334655761719, 7.381888389587402]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 4.0, 12.0, 14.0, 14.0, 17.0, 32.0, 32.0, 38.0, 64.0, 72.0, 120.0, 165.0, 247.0, 459.0, 792.0, 1626.0, 4307.0, 21349.0, 4037364.0, 112071.0, 9387.0, 3026.0, 1250.0, 688.0, 393.0, 231.0, 172.0, 99.0, 54.0, 60.0, 37.0, 20.0, 19.0, 11.0, 7.0, 8.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.26971435546875, -5.1136474609375, -4.95758056640625, -4.801513671875, -4.64544677734375, -4.4893798828125, -4.33331298828125, -4.17724609375, -4.02117919921875, -3.8651123046875, -3.70904541015625, -3.552978515625, -3.39691162109375, -3.2408447265625, -3.08477783203125, -2.9287109375, -2.77264404296875, -2.6165771484375, -2.46051025390625, -2.304443359375, -2.14837646484375, -1.9923095703125, -1.83624267578125, -1.68017578125, -1.52410888671875, -1.3680419921875, -1.21197509765625, -1.055908203125, -0.89984130859375, -0.7437744140625, -0.58770751953125, -0.431640625, -0.27557373046875, -0.1195068359375, 0.03656005859375, 0.192626953125, 0.34869384765625, 0.5047607421875, 0.66082763671875, 0.81689453125, 0.97296142578125, 1.1290283203125, 1.28509521484375, 1.441162109375, 1.59722900390625, 1.7532958984375, 1.90936279296875, 2.0654296875, 2.22149658203125, 2.3775634765625, 2.53363037109375, 2.689697265625, 2.84576416015625, 3.0018310546875, 3.15789794921875, 3.31396484375, 3.47003173828125, 3.6260986328125, 3.78216552734375, 3.938232421875, 4.09429931640625, 4.2503662109375, 4.40643310546875, 4.5625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 14.0, 17.0, 26.0, 69.0, 125.0, 178.0, 187.0, 144.0, 79.0, 44.0, 19.0, 17.0, 19.0, 5.0, 5.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.22590065002441406, -0.21950149536132812, -0.2131023406982422, -0.20670318603515625, -0.2003040313720703, -0.19390487670898438, -0.18750572204589844, -0.1811065673828125, -0.17470741271972656, -0.16830825805664062, -0.1619091033935547, -0.15550994873046875, -0.1491107940673828, -0.14271163940429688, -0.13631248474121094, -0.129913330078125, -0.12351417541503906, -0.11711502075195312, -0.11071586608886719, -0.10431671142578125, -0.09791755676269531, -0.09151840209960938, -0.08511924743652344, -0.0787200927734375, -0.07232093811035156, -0.06592178344726562, -0.05952262878417969, -0.05312347412109375, -0.04672431945800781, -0.040325164794921875, -0.03392601013183594, -0.02752685546875, -0.021127700805664062, -0.014728546142578125, -0.008329391479492188, -0.00193023681640625, 0.0044689178466796875, 0.010868072509765625, 0.017267227172851562, 0.0236663818359375, 0.030065536499023438, 0.036464691162109375, 0.04286384582519531, 0.04926300048828125, 0.05566215515136719, 0.062061309814453125, 0.06846046447753906, 0.074859619140625, 0.08125877380371094, 0.08765792846679688, 0.09405708312988281, 0.10045623779296875, 0.10685539245605469, 0.11325454711914062, 0.11965370178222656, 0.1260528564453125, 0.13245201110839844, 0.13885116577148438, 0.1452503204345703, 0.15164947509765625, 0.1580486297607422, 0.16444778442382812, 0.17084693908691406, 0.17724609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 6.0, 10.0, 14.0, 18.0, 24.0, 32.0, 67.0, 116.0, 442.0, 2888.0, 136169.0, 4044204.0, 8973.0, 853.0, 177.0, 101.0, 51.0, 29.0, 19.0, 9.0, 16.0, 9.0, 10.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.07421875, -5.8912353515625, -5.708251953125, -5.5252685546875, -5.34228515625, -5.1593017578125, -4.976318359375, -4.7933349609375, -4.6103515625, -4.4273681640625, -4.244384765625, -4.0614013671875, -3.87841796875, -3.6954345703125, -3.512451171875, -3.3294677734375, -3.146484375, -2.9635009765625, -2.780517578125, -2.5975341796875, -2.41455078125, -2.2315673828125, -2.048583984375, -1.8656005859375, -1.6826171875, -1.4996337890625, -1.316650390625, -1.1336669921875, -0.95068359375, -0.7677001953125, -0.584716796875, -0.4017333984375, -0.21875, -0.0357666015625, 0.147216796875, 0.3302001953125, 0.51318359375, 0.6961669921875, 0.879150390625, 1.0621337890625, 1.2451171875, 1.4281005859375, 1.611083984375, 1.7940673828125, 1.97705078125, 2.1600341796875, 2.343017578125, 2.5260009765625, 2.708984375, 2.8919677734375, 3.074951171875, 3.2579345703125, 3.44091796875, 3.6239013671875, 3.806884765625, 3.9898681640625, 4.1728515625, 4.3558349609375, 4.538818359375, 4.7218017578125, 4.90478515625, 5.0877685546875, 5.270751953125, 5.4537353515625, 5.63671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 7.0, 4.0, 9.0, 13.0, 11.0, 16.0, 22.0, 39.0, 60.0, 90.0, 167.0, 368.0, 964.0, 1480.0, 360.0, 152.0, 92.0, 59.0, 35.0, 21.0, 14.0, 22.0, 11.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2315673828125, -0.22388267517089844, -0.21619796752929688, -0.2085132598876953, -0.20082855224609375, -0.1931438446044922, -0.18545913696289062, -0.17777442932128906, -0.1700897216796875, -0.16240501403808594, -0.15472030639648438, -0.1470355987548828, -0.13935089111328125, -0.1316661834716797, -0.12398147583007812, -0.11629676818847656, -0.108612060546875, -0.10092735290527344, -0.09324264526367188, -0.08555793762207031, -0.07787322998046875, -0.07018852233886719, -0.06250381469726562, -0.05481910705566406, -0.0471343994140625, -0.03944969177246094, -0.031764984130859375, -0.024080276489257812, -0.01639556884765625, -0.008710861206054688, -0.001026153564453125, 0.0066585540771484375, 0.01434326171875, 0.022027969360351562, 0.029712677001953125, 0.03739738464355469, 0.04508209228515625, 0.05276679992675781, 0.060451507568359375, 0.06813621520996094, 0.0758209228515625, 0.08350563049316406, 0.09119033813476562, 0.09887504577636719, 0.10655975341796875, 0.11424446105957031, 0.12192916870117188, 0.12961387634277344, 0.137298583984375, 0.14498329162597656, 0.15266799926757812, 0.1603527069091797, 0.16803741455078125, 0.1757221221923828, 0.18340682983398438, 0.19109153747558594, 0.1987762451171875, 0.20646095275878906, 0.21414566040039062, 0.2218303680419922, 0.22951507568359375, 0.2371997833251953, 0.24488449096679688, 0.25256919860839844, 0.26025390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 9.0, 11.0, 29.0, 175.0, 540.0, 195.0, 31.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.672968864440918, -3.5300850868225098, -3.3872010707855225, -3.2443172931671143, -3.101433277130127, -2.9585494995117188, -2.8156657218933105, -2.6727819442749023, -2.529897928237915, -2.387014150619507, -2.2441301345825195, -2.1012463569641113, -1.9583624601364136, -1.8154785633087158, -1.6725947856903076, -1.5297108888626099, -1.386826992034912, -1.2439430952072144, -1.1010591983795166, -0.9581754207611084, -0.8152915239334106, -0.6724076271057129, -0.5295237898826599, -0.38663995265960693, -0.24375605583190918, -0.10087218880653381, 0.04201167821884155, 0.18489554524421692, 0.3277794122695923, 0.47066330909729004, 0.613547146320343, 0.756430983543396, 0.899315357208252, 1.0421992540359497, 1.1850831508636475, 1.3279669284820557, 1.4708508253097534, 1.6137347221374512, 1.7566184997558594, 1.8995023965835571, 2.042386293411255, 2.185270071029663, 2.3281540870666504, 2.4710378646850586, 2.613921642303467, 2.756805658340454, 2.8996894359588623, 3.0425734519958496, 3.185457229614258, 3.328341007232666, 3.4712250232696533, 3.6141088008880615, 3.756992816925049, 3.899876594543457, 4.042760372161865, 4.185644149780273, 4.32852840423584, 4.471412181854248, 4.614295959472656, 4.757180213928223, 4.900063991546631, 5.042947769165039, 5.185831546783447, 5.3287153244018555, 5.471599102020264]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 9.0, 25.0, 28.0, 31.0, 49.0, 59.0, 60.0, 70.0, 83.0, 102.0, 96.0, 71.0, 59.0, 58.0, 52.0, 29.0, 29.0, 17.0, 15.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.363701343536377, -1.3197206258773804, -1.2757399082183838, -1.2317591905593872, -1.1877784729003906, -1.143797755241394, -1.0998170375823975, -1.0558363199234009, -1.0118556022644043, -0.9678748846054077, -0.9238941669464111, -0.8799134492874146, -0.835932731628418, -0.7919520139694214, -0.7479712963104248, -0.7039905786514282, -0.6600098609924316, -0.6160291433334351, -0.5720484256744385, -0.5280677080154419, -0.4840869903564453, -0.44010627269744873, -0.39612555503845215, -0.35214483737945557, -0.308164119720459, -0.2641834020614624, -0.22020268440246582, -0.17622196674346924, -0.13224124908447266, -0.08826053142547607, -0.04427981376647949, -0.00029909610748291016, 0.04368162155151367, 0.08766233921051025, 0.13164305686950684, 0.17562377452850342, 0.2196044921875, 0.2635852098464966, 0.30756592750549316, 0.35154664516448975, 0.39552736282348633, 0.4395080804824829, 0.4834887981414795, 0.5274695158004761, 0.5714502334594727, 0.6154309511184692, 0.6594116687774658, 0.7033923864364624, 0.747373104095459, 0.7913538217544556, 0.8353345394134521, 0.8793152570724487, 0.9232959747314453, 0.9672766923904419, 1.0112574100494385, 1.055238127708435, 1.0992188453674316, 1.1431995630264282, 1.1871802806854248, 1.2311609983444214, 1.275141716003418, 1.3191224336624146, 1.3631031513214111, 1.4070838689804077, 1.4510645866394043]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 3.0, 4.0, 6.0, 7.0, 15.0, 31.0, 27.0, 40.0, 60.0, 119.0, 228.0, 398.0, 957.0, 2472.0, 11183.0, 380327.0, 634140.0, 13606.0, 2883.0, 996.0, 459.0, 231.0, 125.0, 72.0, 52.0, 37.0, 13.0, 12.0, 16.0, 5.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.275390625, -3.169921875, -3.064453125, -2.958984375, -2.853515625, -2.748046875, -2.642578125, -2.537109375, -2.431640625, -2.326171875, -2.220703125, -2.115234375, -2.009765625, -1.904296875, -1.798828125, -1.693359375, -1.587890625, -1.482421875, -1.376953125, -1.271484375, -1.166015625, -1.060546875, -0.955078125, -0.849609375, -0.744140625, -0.638671875, -0.533203125, -0.427734375, -0.322265625, -0.216796875, -0.111328125, -0.005859375, 0.099609375, 0.205078125, 0.310546875, 0.416015625, 0.521484375, 0.626953125, 0.732421875, 0.837890625, 0.943359375, 1.048828125, 1.154296875, 1.259765625, 1.365234375, 1.470703125, 1.576171875, 1.681640625, 1.787109375, 1.892578125, 1.998046875, 2.103515625, 2.208984375, 2.314453125, 2.419921875, 2.525390625, 2.630859375, 2.736328125, 2.841796875, 2.947265625, 3.052734375, 3.158203125, 3.263671875, 3.369140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 8.0, 10.0, 25.0, 66.0, 162.0, 227.0, 234.0, 130.0, 56.0, 34.0, 16.0, 4.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2188720703125, -0.2107715606689453, -0.20267105102539062, -0.19457054138183594, -0.18647003173828125, -0.17836952209472656, -0.17026901245117188, -0.1621685028076172, -0.1540679931640625, -0.1459674835205078, -0.13786697387695312, -0.12976646423339844, -0.12166595458984375, -0.11356544494628906, -0.10546493530273438, -0.09736442565917969, -0.089263916015625, -0.08116340637207031, -0.07306289672851562, -0.06496238708496094, -0.05686187744140625, -0.04876136779785156, -0.040660858154296875, -0.03256034851074219, -0.0244598388671875, -0.016359329223632812, -0.008258819580078125, -0.0001583099365234375, 0.00794219970703125, 0.016042709350585938, 0.024143218994140625, 0.03224372863769531, 0.04034423828125, 0.04844474792480469, 0.056545257568359375, 0.06464576721191406, 0.07274627685546875, 0.08084678649902344, 0.08894729614257812, 0.09704780578613281, 0.1051483154296875, 0.11324882507324219, 0.12134933471679688, 0.12944984436035156, 0.13755035400390625, 0.14565086364746094, 0.15375137329101562, 0.1618518829345703, 0.169952392578125, 0.1780529022216797, 0.18615341186523438, 0.19425392150878906, 0.20235443115234375, 0.21045494079589844, 0.21855545043945312, 0.2266559600830078, 0.2347564697265625, 0.2428569793701172, 0.2509574890136719, 0.25905799865722656, 0.26715850830078125, 0.27525901794433594, 0.2833595275878906, 0.2914600372314453, 0.299560546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 11.0, 13.0, 20.0, 14.0, 24.0, 23.0, 48.0, 55.0, 70.0, 97.0, 152.0, 209.0, 331.0, 617.0, 1320.0, 3335.0, 10852.0, 44925.0, 242481.0, 550616.0, 151407.0, 29387.0, 7594.0, 2496.0, 992.0, 494.0, 284.0, 187.0, 134.0, 84.0, 71.0, 47.0, 37.0, 36.0, 19.0, 24.0, 18.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.345703125, -1.30279541015625, -1.2598876953125, -1.21697998046875, -1.174072265625, -1.13116455078125, -1.0882568359375, -1.04534912109375, -1.00244140625, -0.95953369140625, -0.9166259765625, -0.87371826171875, -0.830810546875, -0.78790283203125, -0.7449951171875, -0.70208740234375, -0.6591796875, -0.61627197265625, -0.5733642578125, -0.53045654296875, -0.487548828125, -0.44464111328125, -0.4017333984375, -0.35882568359375, -0.31591796875, -0.27301025390625, -0.2301025390625, -0.18719482421875, -0.144287109375, -0.10137939453125, -0.0584716796875, -0.01556396484375, 0.02734375, 0.07025146484375, 0.1131591796875, 0.15606689453125, 0.198974609375, 0.24188232421875, 0.2847900390625, 0.32769775390625, 0.37060546875, 0.41351318359375, 0.4564208984375, 0.49932861328125, 0.542236328125, 0.58514404296875, 0.6280517578125, 0.67095947265625, 0.7138671875, 0.75677490234375, 0.7996826171875, 0.84259033203125, 0.885498046875, 0.92840576171875, 0.9713134765625, 1.01422119140625, 1.05712890625, 1.10003662109375, 1.1429443359375, 1.18585205078125, 1.228759765625, 1.27166748046875, 1.3145751953125, 1.35748291015625, 1.400390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 9.0, 14.0, 17.0, 19.0, 23.0, 16.0, 33.0, 38.0, 35.0, 46.0, 48.0, 51.0, 51.0, 46.0, 54.0, 55.0, 56.0, 51.0, 41.0, 47.0, 37.0, 45.0, 26.0, 21.0, 22.0, 18.0, 14.0, 11.0, 9.0, 7.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6233596801757812, -0.6007232666015625, -0.5780868530273438, -0.555450439453125, -0.5328140258789062, -0.5101776123046875, -0.48754119873046875, -0.46490478515625, -0.44226837158203125, -0.4196319580078125, -0.39699554443359375, -0.374359130859375, -0.35172271728515625, -0.3290863037109375, -0.30644989013671875, -0.2838134765625, -0.26117706298828125, -0.2385406494140625, -0.21590423583984375, -0.193267822265625, -0.17063140869140625, -0.1479949951171875, -0.12535858154296875, -0.10272216796875, -0.08008575439453125, -0.0574493408203125, -0.03481292724609375, -0.012176513671875, 0.01045989990234375, 0.0330963134765625, 0.05573272705078125, 0.078369140625, 0.10100555419921875, 0.1236419677734375, 0.14627838134765625, 0.168914794921875, 0.19155120849609375, 0.2141876220703125, 0.23682403564453125, 0.25946044921875, 0.28209686279296875, 0.3047332763671875, 0.32736968994140625, 0.350006103515625, 0.37264251708984375, 0.3952789306640625, 0.41791534423828125, 0.4405517578125, 0.46318817138671875, 0.4858245849609375, 0.5084609985351562, 0.531097412109375, 0.5537338256835938, 0.5763702392578125, 0.5990066528320312, 0.62164306640625, 0.6442794799804688, 0.6669158935546875, 0.6895523071289062, 0.712188720703125, 0.7348251342773438, 0.7574615478515625, 0.7800979614257812, 0.802734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 12.0, 11.0, 30.0, 35.0, 57.0, 109.0, 208.0, 509.0, 1594.0, 6596.0, 56877.0, 893023.0, 78706.0, 7720.0, 1923.0, 612.0, 242.0, 105.0, 67.0, 30.0, 20.0, 19.0, 12.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.26446533203125, -2.2086181640625, -2.15277099609375, -2.096923828125, -2.04107666015625, -1.9852294921875, -1.92938232421875, -1.87353515625, -1.81768798828125, -1.7618408203125, -1.70599365234375, -1.650146484375, -1.59429931640625, -1.5384521484375, -1.48260498046875, -1.4267578125, -1.37091064453125, -1.3150634765625, -1.25921630859375, -1.203369140625, -1.14752197265625, -1.0916748046875, -1.03582763671875, -0.97998046875, -0.92413330078125, -0.8682861328125, -0.81243896484375, -0.756591796875, -0.70074462890625, -0.6448974609375, -0.58905029296875, -0.533203125, -0.47735595703125, -0.4215087890625, -0.36566162109375, -0.309814453125, -0.25396728515625, -0.1981201171875, -0.14227294921875, -0.08642578125, -0.03057861328125, 0.0252685546875, 0.08111572265625, 0.136962890625, 0.19281005859375, 0.2486572265625, 0.30450439453125, 0.3603515625, 0.41619873046875, 0.4720458984375, 0.52789306640625, 0.583740234375, 0.63958740234375, 0.6954345703125, 0.75128173828125, 0.80712890625, 0.86297607421875, 0.9188232421875, 0.97467041015625, 1.030517578125, 1.08636474609375, 1.1422119140625, 1.19805908203125, 1.25390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 7.0, 15.0, 20.0, 15.0, 41.0, 53.0, 92.0, 154.0, 157.0, 131.0, 99.0, 70.0, 46.0, 28.0, 15.0, 11.0, 12.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001633167266845703, -0.00015886686742305756, -0.0001544170081615448, -0.00014996714890003204, -0.0001455172896385193, -0.00014106743037700653, -0.00013661757111549377, -0.00013216771185398102, -0.00012771785259246826, -0.0001232679933309555, -0.00011881813406944275, -0.00011436827480792999, -0.00010991841554641724, -0.00010546855628490448, -0.00010101869702339172, -9.656883776187897e-05, -9.211897850036621e-05, -8.766911923885345e-05, -8.32192599773407e-05, -7.876940071582794e-05, -7.431954145431519e-05, -6.986968219280243e-05, -6.541982293128967e-05, -6.0969963669776917e-05, -5.652010440826416e-05, -5.2070245146751404e-05, -4.762038588523865e-05, -4.317052662372589e-05, -3.8720667362213135e-05, -3.427080810070038e-05, -2.9820948839187622e-05, -2.5371089577674866e-05, -2.092123031616211e-05, -1.6471371054649353e-05, -1.2021511793136597e-05, -7.57165253162384e-06, -3.121793270111084e-06, 1.3280659914016724e-06, 5.777925252914429e-06, 1.0227784514427185e-05, 1.4677643775939941e-05, 1.9127503037452698e-05, 2.3577362298965454e-05, 2.802722156047821e-05, 3.247708082199097e-05, 3.692694008350372e-05, 4.137679934501648e-05, 4.5826658606529236e-05, 5.027651786804199e-05, 5.472637712955475e-05, 5.9176236391067505e-05, 6.362609565258026e-05, 6.807595491409302e-05, 7.252581417560577e-05, 7.697567343711853e-05, 8.142553269863129e-05, 8.587539196014404e-05, 9.03252512216568e-05, 9.477511048316956e-05, 9.922496974468231e-05, 0.00010367482900619507, 0.00010812468826770782, 0.00011257454752922058, 0.00011702440679073334, 0.0001214742660522461]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 9.0, 3.0, 11.0, 21.0, 19.0, 28.0, 55.0, 80.0, 142.0, 287.0, 550.0, 1240.0, 3328.0, 10246.0, 69096.0, 842185.0, 102637.0, 12274.0, 3658.0, 1414.0, 587.0, 282.0, 164.0, 76.0, 51.0, 36.0, 21.0, 15.0, 7.0, 12.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.826171875, -1.7762298583984375, -1.726287841796875, -1.6763458251953125, -1.62640380859375, -1.5764617919921875, -1.526519775390625, -1.4765777587890625, -1.4266357421875, -1.3766937255859375, -1.326751708984375, -1.2768096923828125, -1.22686767578125, -1.1769256591796875, -1.126983642578125, -1.0770416259765625, -1.027099609375, -0.9771575927734375, -0.927215576171875, -0.8772735595703125, -0.82733154296875, -0.7773895263671875, -0.727447509765625, -0.6775054931640625, -0.6275634765625, -0.5776214599609375, -0.527679443359375, -0.4777374267578125, -0.42779541015625, -0.3778533935546875, -0.327911376953125, -0.2779693603515625, -0.22802734375, -0.1780853271484375, -0.128143310546875, -0.0782012939453125, -0.02825927734375, 0.0216827392578125, 0.071624755859375, 0.1215667724609375, 0.1715087890625, 0.2214508056640625, 0.271392822265625, 0.3213348388671875, 0.37127685546875, 0.4212188720703125, 0.471160888671875, 0.5211029052734375, 0.571044921875, 0.6209869384765625, 0.670928955078125, 0.7208709716796875, 0.77081298828125, 0.8207550048828125, 0.870697021484375, 0.9206390380859375, 0.9705810546875, 1.0205230712890625, 1.070465087890625, 1.1204071044921875, 1.17034912109375, 1.2202911376953125, 1.270233154296875, 1.3201751708984375, 1.3701171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 6.0, 13.0, 11.0, 14.0, 16.0, 21.0, 30.0, 49.0, 48.0, 73.0, 85.0, 106.0, 89.0, 82.0, 78.0, 68.0, 58.0, 33.0, 28.0, 23.0, 11.0, 13.0, 8.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.443359375, -0.428192138671875, -0.41302490234375, -0.397857666015625, -0.3826904296875, -0.367523193359375, -0.35235595703125, -0.337188720703125, -0.322021484375, -0.306854248046875, -0.29168701171875, -0.276519775390625, -0.2613525390625, -0.246185302734375, -0.23101806640625, -0.215850830078125, -0.20068359375, -0.185516357421875, -0.17034912109375, -0.155181884765625, -0.1400146484375, -0.124847412109375, -0.10968017578125, -0.094512939453125, -0.079345703125, -0.064178466796875, -0.04901123046875, -0.033843994140625, -0.0186767578125, -0.003509521484375, 0.01165771484375, 0.026824951171875, 0.0419921875, 0.057159423828125, 0.07232666015625, 0.087493896484375, 0.1026611328125, 0.117828369140625, 0.13299560546875, 0.148162841796875, 0.163330078125, 0.178497314453125, 0.19366455078125, 0.208831787109375, 0.2239990234375, 0.239166259765625, 0.25433349609375, 0.269500732421875, 0.28466796875, 0.299835205078125, 0.31500244140625, 0.330169677734375, 0.3453369140625, 0.360504150390625, 0.37567138671875, 0.390838623046875, 0.406005859375, 0.421173095703125, 0.43634033203125, 0.451507568359375, 0.4666748046875, 0.481842041015625, 0.49700927734375, 0.512176513671875, 0.52734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 12.0, 41.0, 159.0, 469.0, 232.0, 67.0, 13.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.33147621154785, -15.641979217529297, -14.952482223510742, -14.262985229492188, -13.573487281799316, -12.883990287780762, -12.194493293762207, -11.504995346069336, -10.815498352050781, -10.126001358032227, -9.436504364013672, -8.747007369995117, -8.057509422302246, -7.368012428283691, -6.678515434265137, -5.989017963409424, -5.299521446228027, -4.610024452209473, -3.9205269813537598, -3.231029987335205, -2.5415327548980713, -1.8520355224609375, -1.1625385284423828, -0.4730410575866699, 0.21645593643188477, 0.9059531092643738, 1.5954502820968628, 2.284947395324707, 2.974444627761841, 3.6639418601989746, 4.353438854217529, 5.042936325073242, 5.732433319091797, 6.421930313110352, 7.1114277839660645, 7.800924777984619, 8.490422248840332, 9.179919242858887, 9.869416236877441, 10.558914184570312, 11.248411178588867, 11.937908172607422, 12.627405166625977, 13.316902160644531, 14.006400108337402, 14.695897102355957, 15.385394096374512, 16.074892044067383, 16.764389038085938, 17.453886032104492, 18.143383026123047, 18.8328800201416, 19.522377014160156, 20.211875915527344, 20.901371002197266, 21.590869903564453, 22.280364990234375, 22.96986198425293, 23.659358978271484, 24.34885597229004, 25.038352966308594, 25.72785186767578, 26.417346954345703, 27.10684585571289, 27.796342849731445]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 9.0, 12.0, 18.0, 24.0, 36.0, 40.0, 46.0, 37.0, 60.0, 61.0, 78.0, 58.0, 59.0, 64.0, 66.0, 57.0, 46.0, 34.0, 40.0, 38.0, 26.0, 17.0, 9.0, 11.0, 11.0, 6.0, 11.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.256053924560547, -5.034274101257324, -4.812494277954102, -4.590714454650879, -4.3689351081848145, -4.147155284881592, -3.925375461578369, -3.7035956382751465, -3.481815814971924, -3.260035991668701, -3.0382564067840576, -2.816476583480835, -2.5946967601776123, -2.3729171752929688, -2.151137351989746, -1.9293575286865234, -1.7075779438018799, -1.4857982397079468, -1.2640184164047241, -1.042238712310791, -0.8204589486122131, -0.5986791849136353, -0.37689948081970215, -0.1551196575164795, 0.06666004657745361, 0.2884398102760315, 0.5102195739746094, 0.7319992780685425, 0.9537790417671204, 1.1755588054656982, 1.3973385095596313, 1.619118332862854, 1.840898036956787, 2.0626778602600098, 2.2844574451446533, 2.506237268447876, 2.7280170917510986, 2.949796676635742, 3.171576499938965, 3.3933563232421875, 3.61513614654541, 3.836915969848633, 4.0586957931518555, 4.280475616455078, 4.502254962921143, 4.724034786224365, 4.945814609527588, 5.1675944328308105, 5.389373779296875, 5.611153602600098, 5.83293342590332, 6.054713249206543, 6.276492595672607, 6.49827241897583, 6.720052242279053, 6.941832065582275, 7.163611888885498, 7.385391712188721, 7.607171535491943, 7.828950881958008, 8.05073070526123, 8.272510528564453, 8.494290351867676, 8.716070175170898, 8.937849998474121]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 20.0, 31.0, 93.0, 201.0, 563.0, 4911.0, 4160226.0, 26140.0, 1261.0, 393.0, 177.0, 100.0, 59.0, 30.0, 16.0, 11.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.4901123046875, -11.089599609375, -10.6890869140625, -10.28857421875, -9.8880615234375, -9.487548828125, -9.0870361328125, -8.6865234375, -8.2860107421875, -7.885498046875, -7.4849853515625, -7.08447265625, -6.6839599609375, -6.283447265625, -5.8829345703125, -5.482421875, -5.0819091796875, -4.681396484375, -4.2808837890625, -3.88037109375, -3.4798583984375, -3.079345703125, -2.6788330078125, -2.2783203125, -1.8778076171875, -1.477294921875, -1.0767822265625, -0.67626953125, -0.2757568359375, 0.124755859375, 0.5252685546875, 0.92578125, 1.3262939453125, 1.726806640625, 2.1273193359375, 2.52783203125, 2.9283447265625, 3.328857421875, 3.7293701171875, 4.1298828125, 4.5303955078125, 4.930908203125, 5.3314208984375, 5.73193359375, 6.1324462890625, 6.532958984375, 6.9334716796875, 7.333984375, 7.7344970703125, 8.135009765625, 8.5355224609375, 8.93603515625, 9.3365478515625, 9.737060546875, 10.1375732421875, 10.5380859375, 10.9385986328125, 11.339111328125, 11.7396240234375, 12.14013671875, 12.5406494140625, 12.941162109375, 13.3416748046875, 13.7421875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 12.0, 14.0, 39.0, 62.0, 114.0, 143.0, 155.0, 160.0, 102.0, 80.0, 37.0, 29.0, 14.0, 12.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26171875, -0.252593994140625, -0.24346923828125, -0.234344482421875, -0.2252197265625, -0.216094970703125, -0.20697021484375, -0.197845458984375, -0.188720703125, -0.179595947265625, -0.17047119140625, -0.161346435546875, -0.1522216796875, -0.143096923828125, -0.13397216796875, -0.124847412109375, -0.11572265625, -0.106597900390625, -0.09747314453125, -0.088348388671875, -0.0792236328125, -0.070098876953125, -0.06097412109375, -0.051849365234375, -0.042724609375, -0.033599853515625, -0.02447509765625, -0.015350341796875, -0.0062255859375, 0.002899169921875, 0.01202392578125, 0.021148681640625, 0.0302734375, 0.039398193359375, 0.04852294921875, 0.057647705078125, 0.0667724609375, 0.075897216796875, 0.08502197265625, 0.094146728515625, 0.103271484375, 0.112396240234375, 0.12152099609375, 0.130645751953125, 0.1397705078125, 0.148895263671875, 0.15802001953125, 0.167144775390625, 0.17626953125, 0.185394287109375, 0.19451904296875, 0.203643798828125, 0.2127685546875, 0.221893310546875, 0.23101806640625, 0.240142822265625, 0.249267578125, 0.258392333984375, 0.26751708984375, 0.276641845703125, 0.2857666015625, 0.294891357421875, 0.30401611328125, 0.313140869140625, 0.322265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 14.0, 15.0, 30.0, 37.0, 34.0, 44.0, 73.0, 87.0, 109.0, 119.0, 163.0, 1075.0, 463141.0, 3726703.0, 1601.0, 267.0, 142.0, 107.0, 85.0, 70.0, 76.0, 52.0, 57.0, 39.0, 35.0, 26.0, 21.0, 15.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.6953125, -12.3331298828125, -11.970947265625, -11.6087646484375, -11.24658203125, -10.8843994140625, -10.522216796875, -10.1600341796875, -9.7978515625, -9.4356689453125, -9.073486328125, -8.7113037109375, -8.34912109375, -7.9869384765625, -7.624755859375, -7.2625732421875, -6.900390625, -6.5382080078125, -6.176025390625, -5.8138427734375, -5.45166015625, -5.0894775390625, -4.727294921875, -4.3651123046875, -4.0029296875, -3.6407470703125, -3.278564453125, -2.9163818359375, -2.55419921875, -2.1920166015625, -1.829833984375, -1.4676513671875, -1.10546875, -0.7432861328125, -0.381103515625, -0.0189208984375, 0.34326171875, 0.7054443359375, 1.067626953125, 1.4298095703125, 1.7919921875, 2.1541748046875, 2.516357421875, 2.8785400390625, 3.24072265625, 3.6029052734375, 3.965087890625, 4.3272705078125, 4.689453125, 5.0516357421875, 5.413818359375, 5.7760009765625, 6.13818359375, 6.5003662109375, 6.862548828125, 7.2247314453125, 7.5869140625, 7.9490966796875, 8.311279296875, 8.6734619140625, 9.03564453125, 9.3978271484375, 9.760009765625, 10.1221923828125, 10.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 8.0, 10.0, 34.0, 78.0, 319.0, 2847.0, 609.0, 113.0, 35.0, 11.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.3125762939453125, -0.276519775390625, -0.2404632568359375, -0.20440673828125, -0.1683502197265625, -0.132293701171875, -0.0962371826171875, -0.0601806640625, -0.0241241455078125, 0.011932373046875, 0.0479888916015625, 0.08404541015625, 0.1201019287109375, 0.156158447265625, 0.1922149658203125, 0.228271484375, 0.2643280029296875, 0.300384521484375, 0.3364410400390625, 0.37249755859375, 0.4085540771484375, 0.444610595703125, 0.4806671142578125, 0.5167236328125, 0.5527801513671875, 0.588836669921875, 0.6248931884765625, 0.66094970703125, 0.6970062255859375, 0.733062744140625, 0.7691192626953125, 0.80517578125, 0.8412322998046875, 0.877288818359375, 0.9133453369140625, 0.94940185546875, 0.9854583740234375, 1.021514892578125, 1.0575714111328125, 1.0936279296875, 1.1296844482421875, 1.165740966796875, 1.2017974853515625, 1.23785400390625, 1.2739105224609375, 1.309967041015625, 1.3460235595703125, 1.382080078125, 1.4181365966796875, 1.454193115234375, 1.4902496337890625, 1.52630615234375, 1.5623626708984375, 1.598419189453125, 1.6344757080078125, 1.6705322265625, 1.7065887451171875, 1.742645263671875, 1.7787017822265625, 1.81475830078125, 1.8508148193359375, 1.886871337890625, 1.9229278564453125, 1.958984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 13.0, 35.0, 88.0, 542.0, 248.0, 53.0, 15.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.062538146972656, -11.574601173400879, -11.086664199829102, -10.598726272583008, -10.11078929901123, -9.622852325439453, -9.134915351867676, -8.646978378295898, -8.159040451049805, -7.671103477478027, -7.183166027069092, -6.6952290534973145, -6.207291603088379, -5.719354629516602, -5.231417655944824, -4.743480682373047, -4.2555437088012695, -3.767606496810913, -3.2796692848205566, -2.7917323112487793, -2.303795099258423, -1.8158578872680664, -1.327920913696289, -0.8399837017059326, -0.35204648971557617, 0.1358906626701355, 0.6238278150558472, 1.111764907836914, 1.5997021198272705, 2.087639331817627, 2.5755763053894043, 3.0635135173797607, 3.551450729370117, 4.0393877029418945, 4.52732515335083, 5.015262126922607, 5.503199577331543, 5.99113655090332, 6.479073524475098, 6.967010498046875, 7.4549479484558105, 7.942884922027588, 8.430822372436523, 8.9187593460083, 9.406696319580078, 9.894634246826172, 10.382570266723633, 10.870508193969727, 11.358445167541504, 11.846382141113281, 12.334319114685059, 12.822256088256836, 13.31019401550293, 13.798130989074707, 14.286067962646484, 14.774004936218262, 15.261941909790039, 15.749878883361816, 16.237815856933594, 16.725753784179688, 17.21368980407715, 17.701627731323242, 18.189563751220703, 18.677501678466797, 19.16543960571289]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 14.0, 25.0, 53.0, 88.0, 75.0, 117.0, 128.0, 134.0, 126.0, 94.0, 59.0, 37.0, 22.0, 14.0, 8.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.903992652893066, -5.729015827178955, -5.554039001464844, -5.379061698913574, -5.204084873199463, -5.029108047485352, -4.85413122177124, -4.679154396057129, -4.504177570343018, -4.329200744628906, -4.154223918914795, -3.9792468547821045, -3.804270029067993, -3.6292929649353027, -3.4543161392211914, -3.27933931350708, -3.1043622493743896, -2.9293854236602783, -2.754408359527588, -2.5794315338134766, -2.4044547080993652, -2.229477882385254, -2.0545008182525635, -1.8795239925384521, -1.7045470476150513, -1.5295701026916504, -1.354593276977539, -1.1796163320541382, -1.0046393871307373, -0.829662561416626, -0.6546856164932251, -0.47970879077911377, -0.3047318458557129, -0.1297549456357956, 0.045221954584121704, 0.2201988697052002, 0.3951757550239563, 0.5701526403427124, 0.7451295852661133, 0.9201064109802246, 1.0950833559036255, 1.2700603008270264, 1.4450371265411377, 1.6200140714645386, 1.7949910163879395, 1.9699678421020508, 2.144944667816162, 2.3199214935302734, 2.494898557662964, 2.669875383377075, 2.8448524475097656, 3.019829273223877, 3.1948060989379883, 3.3697829246520996, 3.54475998878479, 3.7197368144989014, 3.894713878631592, 4.069690704345703, 4.2446675300598145, 4.419644355773926, 4.594621658325195, 4.769598484039307, 4.944575309753418, 5.119552135467529, 5.294528961181641]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 11.0, 3.0, 9.0, 5.0, 10.0, 15.0, 10.0, 33.0, 49.0, 71.0, 92.0, 199.0, 413.0, 938.0, 2667.0, 11728.0, 134652.0, 818723.0, 67396.0, 7918.0, 2032.0, 752.0, 337.0, 184.0, 103.0, 61.0, 34.0, 31.0, 19.0, 16.0, 12.0, 8.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.62890625, -4.505096435546875, -4.38128662109375, -4.257476806640625, -4.1336669921875, -4.009857177734375, -3.88604736328125, -3.762237548828125, -3.638427734375, -3.514617919921875, -3.39080810546875, -3.266998291015625, -3.1431884765625, -3.019378662109375, -2.89556884765625, -2.771759033203125, -2.64794921875, -2.524139404296875, -2.40032958984375, -2.276519775390625, -2.1527099609375, -2.028900146484375, -1.90509033203125, -1.781280517578125, -1.657470703125, -1.533660888671875, -1.40985107421875, -1.286041259765625, -1.1622314453125, -1.038421630859375, -0.91461181640625, -0.790802001953125, -0.6669921875, -0.543182373046875, -0.41937255859375, -0.295562744140625, -0.1717529296875, -0.047943115234375, 0.07586669921875, 0.199676513671875, 0.323486328125, 0.447296142578125, 0.57110595703125, 0.694915771484375, 0.8187255859375, 0.942535400390625, 1.06634521484375, 1.190155029296875, 1.31396484375, 1.437774658203125, 1.56158447265625, 1.685394287109375, 1.8092041015625, 1.933013916015625, 2.05682373046875, 2.180633544921875, 2.304443359375, 2.428253173828125, 2.55206298828125, 2.675872802734375, 2.7996826171875, 2.923492431640625, 3.04730224609375, 3.171112060546875, 3.294921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 21.0, 42.0, 64.0, 107.0, 119.0, 161.0, 120.0, 108.0, 87.0, 66.0, 35.0, 17.0, 13.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.27957916259765625, -0.2683868408203125, -0.25719451904296875, -0.246002197265625, -0.23480987548828125, -0.2236175537109375, -0.21242523193359375, -0.20123291015625, -0.19004058837890625, -0.1788482666015625, -0.16765594482421875, -0.156463623046875, -0.14527130126953125, -0.1340789794921875, -0.12288665771484375, -0.1116943359375, -0.10050201416015625, -0.0893096923828125, -0.07811737060546875, -0.066925048828125, -0.05573272705078125, -0.0445404052734375, -0.03334808349609375, -0.02215576171875, -0.01096343994140625, 0.0002288818359375, 0.01142120361328125, 0.022613525390625, 0.03380584716796875, 0.0449981689453125, 0.05619049072265625, 0.0673828125, 0.07857513427734375, 0.0897674560546875, 0.10095977783203125, 0.112152099609375, 0.12334442138671875, 0.1345367431640625, 0.14572906494140625, 0.15692138671875, 0.16811370849609375, 0.1793060302734375, 0.19049835205078125, 0.201690673828125, 0.21288299560546875, 0.2240753173828125, 0.23526763916015625, 0.2464599609375, 0.25765228271484375, 0.2688446044921875, 0.28003692626953125, 0.291229248046875, 0.30242156982421875, 0.3136138916015625, 0.32480621337890625, 0.33599853515625, 0.34719085693359375, 0.3583831787109375, 0.36957550048828125, 0.380767822265625, 0.39196014404296875, 0.4031524658203125, 0.41434478759765625, 0.425537109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 4.0, 18.0, 22.0, 23.0, 39.0, 48.0, 81.0, 88.0, 158.0, 217.0, 360.0, 650.0, 1258.0, 3017.0, 8533.0, 31487.0, 142713.0, 500468.0, 277310.0, 59049.0, 14721.0, 4582.0, 1654.0, 763.0, 478.0, 250.0, 161.0, 126.0, 75.0, 61.0, 41.0, 32.0, 13.0, 13.0, 7.0, 11.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.7490234375, -1.698638916015625, -1.64825439453125, -1.597869873046875, -1.5474853515625, -1.497100830078125, -1.44671630859375, -1.396331787109375, -1.345947265625, -1.295562744140625, -1.24517822265625, -1.194793701171875, -1.1444091796875, -1.094024658203125, -1.04364013671875, -0.993255615234375, -0.94287109375, -0.892486572265625, -0.84210205078125, -0.791717529296875, -0.7413330078125, -0.690948486328125, -0.64056396484375, -0.590179443359375, -0.539794921875, -0.489410400390625, -0.43902587890625, -0.388641357421875, -0.3382568359375, -0.287872314453125, -0.23748779296875, -0.187103271484375, -0.13671875, -0.086334228515625, -0.03594970703125, 0.014434814453125, 0.0648193359375, 0.115203857421875, 0.16558837890625, 0.215972900390625, 0.266357421875, 0.316741943359375, 0.36712646484375, 0.417510986328125, 0.4678955078125, 0.518280029296875, 0.56866455078125, 0.619049072265625, 0.66943359375, 0.719818115234375, 0.77020263671875, 0.820587158203125, 0.8709716796875, 0.921356201171875, 0.97174072265625, 1.022125244140625, 1.072509765625, 1.122894287109375, 1.17327880859375, 1.223663330078125, 1.2740478515625, 1.324432373046875, 1.37481689453125, 1.425201416015625, 1.4755859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 5.0, 8.0, 9.0, 11.0, 11.0, 20.0, 20.0, 31.0, 34.0, 36.0, 48.0, 50.0, 56.0, 63.0, 76.0, 63.0, 67.0, 48.0, 66.0, 47.0, 40.0, 42.0, 25.0, 37.0, 20.0, 21.0, 17.0, 7.0, 13.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.9374847412109375, -0.903289794921875, -0.8690948486328125, -0.83489990234375, -0.8007049560546875, -0.766510009765625, -0.7323150634765625, -0.6981201171875, -0.6639251708984375, -0.629730224609375, -0.5955352783203125, -0.56134033203125, -0.5271453857421875, -0.492950439453125, -0.4587554931640625, -0.424560546875, -0.3903656005859375, -0.356170654296875, -0.3219757080078125, -0.28778076171875, -0.2535858154296875, -0.219390869140625, -0.1851959228515625, -0.1510009765625, -0.1168060302734375, -0.082611083984375, -0.0484161376953125, -0.01422119140625, 0.0199737548828125, 0.054168701171875, 0.0883636474609375, 0.12255859375, 0.1567535400390625, 0.190948486328125, 0.2251434326171875, 0.25933837890625, 0.2935333251953125, 0.327728271484375, 0.3619232177734375, 0.3961181640625, 0.4303131103515625, 0.464508056640625, 0.4987030029296875, 0.53289794921875, 0.5670928955078125, 0.601287841796875, 0.6354827880859375, 0.669677734375, 0.7038726806640625, 0.738067626953125, 0.7722625732421875, 0.80645751953125, 0.8406524658203125, 0.874847412109375, 0.9090423583984375, 0.9432373046875, 0.9774322509765625, 1.011627197265625, 1.0458221435546875, 1.08001708984375, 1.1142120361328125, 1.148406982421875, 1.1826019287109375, 1.216796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 8.0, 10.0, 17.0, 29.0, 18.0, 49.0, 53.0, 89.0, 117.0, 228.0, 457.0, 945.0, 2823.0, 12164.0, 172265.0, 815859.0, 34933.0, 5300.0, 1639.0, 720.0, 299.0, 178.0, 103.0, 71.0, 48.0, 26.0, 24.0, 15.0, 13.0, 9.0, 7.0, 3.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-1.87890625, -1.814666748046875, -1.75042724609375, -1.686187744140625, -1.6219482421875, -1.557708740234375, -1.49346923828125, -1.429229736328125, -1.364990234375, -1.300750732421875, -1.23651123046875, -1.172271728515625, -1.1080322265625, -1.043792724609375, -0.97955322265625, -0.915313720703125, -0.85107421875, -0.786834716796875, -0.72259521484375, -0.658355712890625, -0.5941162109375, -0.529876708984375, -0.46563720703125, -0.401397705078125, -0.337158203125, -0.272918701171875, -0.20867919921875, -0.144439697265625, -0.0802001953125, -0.015960693359375, 0.04827880859375, 0.112518310546875, 0.1767578125, 0.240997314453125, 0.30523681640625, 0.369476318359375, 0.4337158203125, 0.497955322265625, 0.56219482421875, 0.626434326171875, 0.690673828125, 0.754913330078125, 0.81915283203125, 0.883392333984375, 0.9476318359375, 1.011871337890625, 1.07611083984375, 1.140350341796875, 1.20458984375, 1.268829345703125, 1.33306884765625, 1.397308349609375, 1.4615478515625, 1.525787353515625, 1.59002685546875, 1.654266357421875, 1.718505859375, 1.782745361328125, 1.84698486328125, 1.911224365234375, 1.9754638671875, 2.039703369140625, 2.10394287109375, 2.168182373046875, 2.232421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 10.0, 18.0, 22.0, 37.0, 47.0, 82.0, 143.0, 198.0, 171.0, 91.0, 60.0, 37.0, 22.0, 17.0, 9.0, 8.0, 5.0, 3.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024247169494628906, -0.0002358369529247284, -0.00022920221090316772, -0.00022256746888160706, -0.0002159327268600464, -0.00020929798483848572, -0.00020266324281692505, -0.00019602850079536438, -0.0001893937587738037, -0.00018275901675224304, -0.00017612427473068237, -0.0001694895327091217, -0.00016285479068756104, -0.00015622004866600037, -0.0001495853066444397, -0.00014295056462287903, -0.00013631582260131836, -0.0001296810805797577, -0.00012304633855819702, -0.00011641159653663635, -0.00010977685451507568, -0.00010314211249351501, -9.650737047195435e-05, -8.987262845039368e-05, -8.323788642883301e-05, -7.660314440727234e-05, -6.996840238571167e-05, -6.3333660364151e-05, -5.669891834259033e-05, -5.006417632102966e-05, -4.3429434299468994e-05, -3.6794692277908325e-05, -3.0159950256347656e-05, -2.3525208234786987e-05, -1.689046621322632e-05, -1.025572419166565e-05, -3.6209821701049805e-06, 3.0137598514556885e-06, 9.648501873016357e-06, 1.6283243894577026e-05, 2.2917985916137695e-05, 2.9552727937698364e-05, 3.618746995925903e-05, 4.28222119808197e-05, 4.945695400238037e-05, 5.609169602394104e-05, 6.272643804550171e-05, 6.936118006706238e-05, 7.599592208862305e-05, 8.263066411018372e-05, 8.926540613174438e-05, 9.590014815330505e-05, 0.00010253489017486572, 0.00010916963219642639, 0.00011580437421798706, 0.00012243911623954773, 0.0001290738582611084, 0.00013570860028266907, 0.00014234334230422974, 0.0001489780843257904, 0.00015561282634735107, 0.00016224756836891174, 0.0001688823103904724, 0.00017551705241203308, 0.00018215179443359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 19.0, 30.0, 65.0, 96.0, 162.0, 320.0, 745.0, 2156.0, 7774.0, 50880.0, 844427.0, 124782.0, 12118.0, 3052.0, 1042.0, 384.0, 209.0, 100.0, 61.0, 34.0, 14.0, 19.0, 10.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.341796875, -2.2812042236328125, -2.220611572265625, -2.1600189208984375, -2.09942626953125, -2.0388336181640625, -1.978240966796875, -1.9176483154296875, -1.8570556640625, -1.7964630126953125, -1.735870361328125, -1.6752777099609375, -1.61468505859375, -1.5540924072265625, -1.493499755859375, -1.4329071044921875, -1.372314453125, -1.3117218017578125, -1.251129150390625, -1.1905364990234375, -1.12994384765625, -1.0693511962890625, -1.008758544921875, -0.9481658935546875, -0.8875732421875, -0.8269805908203125, -0.766387939453125, -0.7057952880859375, -0.64520263671875, -0.5846099853515625, -0.524017333984375, -0.4634246826171875, -0.40283203125, -0.3422393798828125, -0.281646728515625, -0.2210540771484375, -0.16046142578125, -0.0998687744140625, -0.039276123046875, 0.0213165283203125, 0.0819091796875, 0.1425018310546875, 0.203094482421875, 0.2636871337890625, 0.32427978515625, 0.3848724365234375, 0.445465087890625, 0.5060577392578125, 0.566650390625, 0.6272430419921875, 0.687835693359375, 0.7484283447265625, 0.80902099609375, 0.8696136474609375, 0.930206298828125, 0.9907989501953125, 1.0513916015625, 1.1119842529296875, 1.172576904296875, 1.2331695556640625, 1.29376220703125, 1.3543548583984375, 1.414947509765625, 1.4755401611328125, 1.5361328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 9.0, 4.0, 9.0, 15.0, 20.0, 36.0, 46.0, 47.0, 76.0, 129.0, 105.0, 121.0, 95.0, 82.0, 51.0, 40.0, 27.0, 27.0, 9.0, 10.0, 8.0, 5.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.73974609375, -0.718505859375, -0.697265625, -0.676025390625, -0.65478515625, -0.633544921875, -0.6123046875, -0.591064453125, -0.56982421875, -0.548583984375, -0.52734375, -0.506103515625, -0.48486328125, -0.463623046875, -0.4423828125, -0.421142578125, -0.39990234375, -0.378662109375, -0.357421875, -0.336181640625, -0.31494140625, -0.293701171875, -0.2724609375, -0.251220703125, -0.22998046875, -0.208740234375, -0.1875, -0.166259765625, -0.14501953125, -0.123779296875, -0.1025390625, -0.081298828125, -0.06005859375, -0.038818359375, -0.017578125, 0.003662109375, 0.02490234375, 0.046142578125, 0.0673828125, 0.088623046875, 0.10986328125, 0.131103515625, 0.15234375, 0.173583984375, 0.19482421875, 0.216064453125, 0.2373046875, 0.258544921875, 0.27978515625, 0.301025390625, 0.322265625, 0.343505859375, 0.36474609375, 0.385986328125, 0.4072265625, 0.428466796875, 0.44970703125, 0.470947265625, 0.4921875, 0.513427734375, 0.53466796875, 0.555908203125, 0.5771484375, 0.598388671875, 0.61962890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 17.0, 33.0, 63.0, 144.0, 199.0, 242.0, 146.0, 73.0, 38.0, 21.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.205010414123535, -9.782374382019043, -9.359739303588867, -8.937103271484375, -8.5144681930542, -8.091832160949707, -7.669196605682373, -7.246561050415039, -6.823925495147705, -6.401289939880371, -5.978654384613037, -5.556018829345703, -5.133382797241211, -4.710747718811035, -4.288111686706543, -3.865476131439209, -3.442840576171875, -3.020205020904541, -2.597569465637207, -2.174933671951294, -1.75229811668396, -1.329662561416626, -0.9070267677307129, -0.4843912124633789, -0.06175565719604492, 0.36087995767593384, 0.7835155725479126, 1.2061512470245361, 1.6287868022918701, 2.051422357559204, 2.474058151245117, 2.896693706512451, 3.3193283081054688, 3.7419638633728027, 4.164599418640137, 4.587235450744629, 5.009870529174805, 5.432506561279297, 5.855142116546631, 6.277777671813965, 6.700413227081299, 7.123048782348633, 7.545684337615967, 7.968319892883301, 8.390955924987793, 8.813591003417969, 9.236227035522461, 9.658863067626953, 10.081498146057129, 10.504134178161621, 10.926769256591797, 11.349405288696289, 11.772040367126465, 12.194676399230957, 12.617311477661133, 13.039947509765625, 13.462583541870117, 13.88521957397461, 14.307854652404785, 14.730490684509277, 15.153125762939453, 15.575761795043945, 15.998397827148438, 16.421031951904297, 16.84366798400879]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 11.0, 11.0, 19.0, 18.0, 31.0, 29.0, 39.0, 42.0, 41.0, 51.0, 44.0, 51.0, 61.0, 58.0, 51.0, 47.0, 59.0, 47.0, 44.0, 32.0, 39.0, 33.0, 23.0, 24.0, 21.0, 9.0, 12.0, 7.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.999790191650391, -5.7956647872924805, -5.591538906097412, -5.387413501739502, -5.183288097381592, -4.979162216186523, -4.775036811828613, -4.570911407470703, -4.366786003112793, -4.162660598754883, -3.9585349559783936, -3.7544093132019043, -3.550283908843994, -3.346158266067505, -3.1420326232910156, -2.9379072189331055, -2.733781337738037, -2.529655694961548, -2.3255302906036377, -2.1214046478271484, -1.9172791242599487, -1.713153600692749, -1.5090279579162598, -1.30490243434906, -1.1007769107818604, -0.8966513872146606, -0.6925258040428162, -0.4884002208709717, -0.284274697303772, -0.08014917373657227, 0.12397646903991699, 0.3281019926071167, 0.5322275161743164, 0.7363530397415161, 0.9404786229133606, 1.144604206085205, 1.3487297296524048, 1.5528552532196045, 1.7569808959960938, 1.9611064195632935, 2.165231943130493, 2.3693575859069824, 2.5734829902648926, 2.777608633041382, 2.981734275817871, 3.1858596801757812, 3.3899853229522705, 3.5941109657287598, 3.79823637008667, 4.00236177444458, 4.206487655639648, 4.410613059997559, 4.614738464355469, 4.818863868713379, 5.022989749908447, 5.227115154266357, 5.431241035461426, 5.635366439819336, 5.839492321014404, 6.0436177253723145, 6.247743129730225, 6.451869010925293, 6.655994415283203, 6.860119819641113, 7.064245223999023]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 9.0, 8.0, 12.0, 37.0, 47.0, 82.0, 168.0, 346.0, 969.0, 2938.0, 12042.0, 124431.0, 4002103.0, 40983.0, 6583.0, 1827.0, 662.0, 363.0, 183.0, 113.0, 97.0, 69.0, 42.0, 33.0, 35.0, 12.0, 11.0, 17.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.5234375, -4.35784912109375, -4.1922607421875, -4.02667236328125, -3.861083984375, -3.69549560546875, -3.5299072265625, -3.36431884765625, -3.19873046875, -3.03314208984375, -2.8675537109375, -2.70196533203125, -2.536376953125, -2.37078857421875, -2.2052001953125, -2.03961181640625, -1.8740234375, -1.70843505859375, -1.5428466796875, -1.37725830078125, -1.211669921875, -1.04608154296875, -0.8804931640625, -0.71490478515625, -0.54931640625, -0.38372802734375, -0.2181396484375, -0.05255126953125, 0.113037109375, 0.27862548828125, 0.4442138671875, 0.60980224609375, 0.775390625, 0.94097900390625, 1.1065673828125, 1.27215576171875, 1.437744140625, 1.60333251953125, 1.7689208984375, 1.93450927734375, 2.10009765625, 2.26568603515625, 2.4312744140625, 2.59686279296875, 2.762451171875, 2.92803955078125, 3.0936279296875, 3.25921630859375, 3.4248046875, 3.59039306640625, 3.7559814453125, 3.92156982421875, 4.087158203125, 4.25274658203125, 4.4183349609375, 4.58392333984375, 4.74951171875, 4.91510009765625, 5.0806884765625, 5.24627685546875, 5.411865234375, 5.57745361328125, 5.7430419921875, 5.90863037109375, 6.07421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 12.0, 7.0, 5.0, 26.0, 44.0, 62.0, 85.0, 113.0, 136.0, 132.0, 98.0, 91.0, 58.0, 54.0, 31.0, 20.0, 11.0, 7.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328857421875, -0.31723785400390625, -0.3056182861328125, -0.29399871826171875, -0.282379150390625, -0.27075958251953125, -0.2591400146484375, -0.24752044677734375, -0.23590087890625, -0.22428131103515625, -0.2126617431640625, -0.20104217529296875, -0.189422607421875, -0.17780303955078125, -0.1661834716796875, -0.15456390380859375, -0.1429443359375, -0.13132476806640625, -0.1197052001953125, -0.10808563232421875, -0.096466064453125, -0.08484649658203125, -0.0732269287109375, -0.06160736083984375, -0.04998779296875, -0.03836822509765625, -0.0267486572265625, -0.01512908935546875, -0.003509521484375, 0.00811004638671875, 0.0197296142578125, 0.03134918212890625, 0.04296875, 0.05458831787109375, 0.0662078857421875, 0.07782745361328125, 0.089447021484375, 0.10106658935546875, 0.1126861572265625, 0.12430572509765625, 0.13592529296875, 0.14754486083984375, 0.1591644287109375, 0.17078399658203125, 0.182403564453125, 0.19402313232421875, 0.2056427001953125, 0.21726226806640625, 0.2288818359375, 0.24050140380859375, 0.2521209716796875, 0.26374053955078125, 0.275360107421875, 0.28697967529296875, 0.2985992431640625, 0.31021881103515625, 0.32183837890625, 0.33345794677734375, 0.3450775146484375, 0.35669708251953125, 0.368316650390625, 0.37993621826171875, 0.3915557861328125, 0.40317535400390625, 0.414794921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 13.0, 22.0, 33.0, 63.0, 108.0, 227.0, 423.0, 1206.0, 4852.0, 48228.0, 4069008.0, 62549.0, 5106.0, 1167.0, 478.0, 290.0, 170.0, 115.0, 61.0, 49.0, 36.0, 19.0, 19.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.9443359375, -5.755859375, -5.5673828125, -5.37890625, -5.1904296875, -5.001953125, -4.8134765625, -4.625, -4.4365234375, -4.248046875, -4.0595703125, -3.87109375, -3.6826171875, -3.494140625, -3.3056640625, -3.1171875, -2.9287109375, -2.740234375, -2.5517578125, -2.36328125, -2.1748046875, -1.986328125, -1.7978515625, -1.609375, -1.4208984375, -1.232421875, -1.0439453125, -0.85546875, -0.6669921875, -0.478515625, -0.2900390625, -0.1015625, 0.0869140625, 0.275390625, 0.4638671875, 0.65234375, 0.8408203125, 1.029296875, 1.2177734375, 1.40625, 1.5947265625, 1.783203125, 1.9716796875, 2.16015625, 2.3486328125, 2.537109375, 2.7255859375, 2.9140625, 3.1025390625, 3.291015625, 3.4794921875, 3.66796875, 3.8564453125, 4.044921875, 4.2333984375, 4.421875, 4.6103515625, 4.798828125, 4.9873046875, 5.17578125, 5.3642578125, 5.552734375, 5.7412109375, 5.9296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 17.0, 18.0, 25.0, 33.0, 60.0, 121.0, 311.0, 1954.0, 1023.0, 232.0, 93.0, 48.0, 35.0, 31.0, 17.0, 9.0, 14.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.421142578125, -0.3999290466308594, -0.37871551513671875, -0.3575019836425781, -0.3362884521484375, -0.3150749206542969, -0.29386138916015625, -0.2726478576660156, -0.251434326171875, -0.23022079467773438, -0.20900726318359375, -0.18779373168945312, -0.1665802001953125, -0.14536666870117188, -0.12415313720703125, -0.10293960571289062, -0.08172607421875, -0.060512542724609375, -0.03929901123046875, -0.018085479736328125, 0.0031280517578125, 0.024341583251953125, 0.04555511474609375, 0.06676864624023438, 0.087982177734375, 0.10919570922851562, 0.13040924072265625, 0.15162277221679688, 0.1728363037109375, 0.19404983520507812, 0.21526336669921875, 0.23647689819335938, 0.2576904296875, 0.2789039611816406, 0.30011749267578125, 0.3213310241699219, 0.3425445556640625, 0.3637580871582031, 0.38497161865234375, 0.4061851501464844, 0.427398681640625, 0.4486122131347656, 0.46982574462890625, 0.4910392761230469, 0.5122528076171875, 0.5334663391113281, 0.5546798706054688, 0.5758934020996094, 0.59710693359375, 0.6183204650878906, 0.6395339965820312, 0.6607475280761719, 0.6819610595703125, 0.7031745910644531, 0.7243881225585938, 0.7456016540527344, 0.766815185546875, 0.7880287170410156, 0.8092422485351562, 0.8304557800292969, 0.8516693115234375, 0.8728828430175781, 0.8940963745117188, 0.9153099060058594, 0.9365234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 17.0, 35.0, 88.0, 233.0, 335.0, 180.0, 59.0, 13.0, 9.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5915632247924805, -4.385827541351318, -4.180091381072998, -3.974355697631836, -3.7686197757720947, -3.5628838539123535, -3.3571481704711914, -3.15141224861145, -2.945676326751709, -2.7399404048919678, -2.5342044830322266, -2.3284687995910645, -2.1227328777313232, -1.916996955871582, -1.7112611532211304, -1.5055253505706787, -1.2997894287109375, -1.0940535068511963, -0.8883177042007446, -0.6825818419456482, -0.47684597969055176, -0.27111005783081055, -0.06537425518035889, 0.14036154747009277, 0.346097469329834, 0.5518333315849304, 0.7575691938400269, 0.9633050560951233, 1.1690409183502197, 1.374776840209961, 1.5805126428604126, 1.7862484455108643, 1.9919843673706055, 2.1977202892303467, 2.403456211090088, 2.60919189453125, 2.814927816390991, 3.0206637382507324, 3.2263994216918945, 3.4321353435516357, 3.637871265411377, 3.843607187271118, 4.049343109130859, 4.2550787925720215, 4.460814476013184, 4.666550636291504, 4.872286319732666, 5.078022003173828, 5.283758163452148, 5.4894938468933105, 5.695230007171631, 5.900965690612793, 6.106701850891113, 6.312437534332275, 6.5181732177734375, 6.723909378051758, 6.92964506149292, 7.135380744934082, 7.341116905212402, 7.5468525886535645, 7.752588272094727, 7.958324432373047, 8.164060592651367, 8.369795799255371, 8.575531959533691]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 17.0, 20.0, 33.0, 41.0, 54.0, 59.0, 69.0, 93.0, 102.0, 106.0, 85.0, 56.0, 59.0, 45.0, 41.0, 29.0, 20.0, 15.0, 13.0, 9.0, 8.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8537631034851074, -2.7675726413726807, -2.681381940841675, -2.595191478729248, -2.5090010166168213, -2.4228103160858154, -2.3366198539733887, -2.250429153442383, -2.164238691329956, -2.0780482292175293, -1.991857647895813, -1.9056670665740967, -1.8194764852523804, -1.733285903930664, -1.6470954418182373, -1.560904860496521, -1.4747143983840942, -1.388523817062378, -1.3023333549499512, -1.2161427736282349, -1.1299521923065186, -1.0437617301940918, -0.9575711488723755, -0.8713805675506592, -0.7851900458335876, -0.6989995241165161, -0.6128089427947998, -0.5266184210777283, -0.44042786955833435, -0.35423731803894043, -0.2680467963218689, -0.1818562150001526, -0.09566569328308105, -0.00947514921426773, 0.0767153948545456, 0.16290593147277832, 0.24909648299217224, 0.33528703451156616, 0.4214775562286377, 0.507668137550354, 0.5938586592674255, 0.6800491809844971, 0.7662397623062134, 0.8524302840232849, 0.9386208057403564, 1.0248113870620728, 1.111001968383789, 1.1971924304962158, 1.2833830118179321, 1.3695735931396484, 1.4557640552520752, 1.5419546365737915, 1.6281452178955078, 1.7143356800079346, 1.8005262613296509, 1.8867168426513672, 1.972907304763794, 2.0590977668762207, 2.1452884674072266, 2.2314789295196533, 2.31766939163208, 2.403860092163086, 2.4900505542755127, 2.5762410163879395, 2.6624317169189453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 9.0, 6.0, 15.0, 13.0, 31.0, 34.0, 56.0, 82.0, 116.0, 182.0, 327.0, 615.0, 1376.0, 3610.0, 13287.0, 94959.0, 711062.0, 193081.0, 21152.0, 5044.0, 1715.0, 742.0, 394.0, 212.0, 134.0, 94.0, 56.0, 40.0, 25.0, 21.0, 12.0, 11.0, 13.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.076171875, -2.98736572265625, -2.8985595703125, -2.80975341796875, -2.720947265625, -2.63214111328125, -2.5433349609375, -2.45452880859375, -2.36572265625, -2.27691650390625, -2.1881103515625, -2.09930419921875, -2.010498046875, -1.92169189453125, -1.8328857421875, -1.74407958984375, -1.6552734375, -1.56646728515625, -1.4776611328125, -1.38885498046875, -1.300048828125, -1.21124267578125, -1.1224365234375, -1.03363037109375, -0.94482421875, -0.85601806640625, -0.7672119140625, -0.67840576171875, -0.589599609375, -0.50079345703125, -0.4119873046875, -0.32318115234375, -0.234375, -0.14556884765625, -0.0567626953125, 0.03204345703125, 0.120849609375, 0.20965576171875, 0.2984619140625, 0.38726806640625, 0.47607421875, 0.56488037109375, 0.6536865234375, 0.74249267578125, 0.831298828125, 0.92010498046875, 1.0089111328125, 1.09771728515625, 1.1865234375, 1.27532958984375, 1.3641357421875, 1.45294189453125, 1.541748046875, 1.63055419921875, 1.7193603515625, 1.80816650390625, 1.89697265625, 1.98577880859375, 2.0745849609375, 2.16339111328125, 2.252197265625, 2.34100341796875, 2.4298095703125, 2.51861572265625, 2.607421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 16.0, 23.0, 40.0, 54.0, 79.0, 108.0, 115.0, 113.0, 106.0, 103.0, 70.0, 60.0, 36.0, 21.0, 16.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.322998046875, -0.3112945556640625, -0.299591064453125, -0.2878875732421875, -0.27618408203125, -0.2644805908203125, -0.252777099609375, -0.2410736083984375, -0.2293701171875, -0.2176666259765625, -0.205963134765625, -0.1942596435546875, -0.18255615234375, -0.1708526611328125, -0.159149169921875, -0.1474456787109375, -0.1357421875, -0.1240386962890625, -0.112335205078125, -0.1006317138671875, -0.08892822265625, -0.0772247314453125, -0.065521240234375, -0.0538177490234375, -0.0421142578125, -0.0304107666015625, -0.018707275390625, -0.0070037841796875, 0.00469970703125, 0.0164031982421875, 0.028106689453125, 0.0398101806640625, 0.051513671875, 0.0632171630859375, 0.074920654296875, 0.0866241455078125, 0.09832763671875, 0.1100311279296875, 0.121734619140625, 0.1334381103515625, 0.1451416015625, 0.1568450927734375, 0.168548583984375, 0.1802520751953125, 0.19195556640625, 0.2036590576171875, 0.215362548828125, 0.2270660400390625, 0.23876953125, 0.2504730224609375, 0.262176513671875, 0.2738800048828125, 0.28558349609375, 0.2972869873046875, 0.308990478515625, 0.3206939697265625, 0.3323974609375, 0.3441009521484375, 0.355804443359375, 0.3675079345703125, 0.37921142578125, 0.3909149169921875, 0.402618408203125, 0.4143218994140625, 0.426025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 6.0, 6.0, 12.0, 12.0, 19.0, 34.0, 41.0, 58.0, 69.0, 102.0, 199.0, 241.0, 486.0, 758.0, 1419.0, 3092.0, 7192.0, 19880.0, 60874.0, 199670.0, 416620.0, 230112.0, 70265.0, 22114.0, 8270.0, 3334.0, 1582.0, 790.0, 431.0, 287.0, 171.0, 112.0, 91.0, 59.0, 32.0, 27.0, 22.0, 19.0, 13.0, 6.0, 7.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.3056640625, -1.26556396484375, -1.2254638671875, -1.18536376953125, -1.145263671875, -1.10516357421875, -1.0650634765625, -1.02496337890625, -0.98486328125, -0.94476318359375, -0.9046630859375, -0.86456298828125, -0.824462890625, -0.78436279296875, -0.7442626953125, -0.70416259765625, -0.6640625, -0.62396240234375, -0.5838623046875, -0.54376220703125, -0.503662109375, -0.46356201171875, -0.4234619140625, -0.38336181640625, -0.34326171875, -0.30316162109375, -0.2630615234375, -0.22296142578125, -0.182861328125, -0.14276123046875, -0.1026611328125, -0.06256103515625, -0.0224609375, 0.01763916015625, 0.0577392578125, 0.09783935546875, 0.137939453125, 0.17803955078125, 0.2181396484375, 0.25823974609375, 0.29833984375, 0.33843994140625, 0.3785400390625, 0.41864013671875, 0.458740234375, 0.49884033203125, 0.5389404296875, 0.57904052734375, 0.619140625, 0.65924072265625, 0.6993408203125, 0.73944091796875, 0.779541015625, 0.81964111328125, 0.8597412109375, 0.89984130859375, 0.93994140625, 0.98004150390625, 1.0201416015625, 1.06024169921875, 1.100341796875, 1.14044189453125, 1.1805419921875, 1.22064208984375, 1.2607421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 6.0, 11.0, 10.0, 8.0, 12.0, 21.0, 25.0, 16.0, 23.0, 31.0, 27.0, 31.0, 33.0, 32.0, 42.0, 48.0, 51.0, 46.0, 37.0, 46.0, 43.0, 42.0, 31.0, 44.0, 33.0, 30.0, 25.0, 39.0, 24.0, 20.0, 22.0, 16.0, 12.0, 15.0, 6.0, 11.0, 5.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8994140625, -0.8723068237304688, -0.8451995849609375, -0.8180923461914062, -0.790985107421875, -0.7638778686523438, -0.7367706298828125, -0.7096633911132812, -0.68255615234375, -0.6554489135742188, -0.6283416748046875, -0.6012344360351562, -0.574127197265625, -0.5470199584960938, -0.5199127197265625, -0.49280548095703125, -0.4656982421875, -0.43859100341796875, -0.4114837646484375, -0.38437652587890625, -0.357269287109375, -0.33016204833984375, -0.3030548095703125, -0.27594757080078125, -0.24884033203125, -0.22173309326171875, -0.1946258544921875, -0.16751861572265625, -0.140411376953125, -0.11330413818359375, -0.0861968994140625, -0.05908966064453125, -0.031982421875, -0.00487518310546875, 0.0222320556640625, 0.04933929443359375, 0.076446533203125, 0.10355377197265625, 0.1306610107421875, 0.15776824951171875, 0.18487548828125, 0.21198272705078125, 0.2390899658203125, 0.26619720458984375, 0.293304443359375, 0.32041168212890625, 0.3475189208984375, 0.37462615966796875, 0.4017333984375, 0.42884063720703125, 0.4559478759765625, 0.48305511474609375, 0.510162353515625, 0.5372695922851562, 0.5643768310546875, 0.5914840698242188, 0.61859130859375, 0.6456985473632812, 0.6728057861328125, 0.6999130249023438, 0.727020263671875, 0.7541275024414062, 0.7812347412109375, 0.8083419799804688, 0.83544921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 9.0, 22.0, 21.0, 21.0, 34.0, 44.0, 68.0, 116.0, 188.0, 394.0, 860.0, 2171.0, 6244.0, 23669.0, 172745.0, 728892.0, 89522.0, 15862.0, 4548.0, 1624.0, 691.0, 345.0, 168.0, 79.0, 50.0, 31.0, 27.0, 23.0, 21.0, 14.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9672088623046875, -0.936370849609375, -0.9055328369140625, -0.87469482421875, -0.8438568115234375, -0.813018798828125, -0.7821807861328125, -0.7513427734375, -0.7205047607421875, -0.689666748046875, -0.6588287353515625, -0.62799072265625, -0.5971527099609375, -0.566314697265625, -0.5354766845703125, -0.504638671875, -0.4738006591796875, -0.442962646484375, -0.4121246337890625, -0.38128662109375, -0.3504486083984375, -0.319610595703125, -0.2887725830078125, -0.2579345703125, -0.2270965576171875, -0.196258544921875, -0.1654205322265625, -0.13458251953125, -0.1037445068359375, -0.072906494140625, -0.0420684814453125, -0.01123046875, 0.0196075439453125, 0.050445556640625, 0.0812835693359375, 0.11212158203125, 0.1429595947265625, 0.173797607421875, 0.2046356201171875, 0.2354736328125, 0.2663116455078125, 0.297149658203125, 0.3279876708984375, 0.35882568359375, 0.3896636962890625, 0.420501708984375, 0.4513397216796875, 0.482177734375, 0.5130157470703125, 0.543853759765625, 0.5746917724609375, 0.60552978515625, 0.6363677978515625, 0.667205810546875, 0.6980438232421875, 0.7288818359375, 0.7597198486328125, 0.790557861328125, 0.8213958740234375, 0.85223388671875, 0.8830718994140625, 0.913909912109375, 0.9447479248046875, 0.9755859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 22.0, 31.0, 36.0, 62.0, 107.0, 175.0, 186.0, 141.0, 76.0, 44.0, 22.0, 23.0, 19.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020837783813476562, -0.00020262226462364197, -0.0001968666911125183, -0.00019111111760139465, -0.000185355544090271, -0.00017959997057914734, -0.00017384439706802368, -0.00016808882355690002, -0.00016233325004577637, -0.0001565776765346527, -0.00015082210302352905, -0.0001450665295124054, -0.00013931095600128174, -0.00013355538249015808, -0.00012779980897903442, -0.00012204423546791077, -0.00011628866195678711, -0.00011053308844566345, -0.0001047775149345398, -9.902194142341614e-05, -9.326636791229248e-05, -8.751079440116882e-05, -8.175522089004517e-05, -7.599964737892151e-05, -7.024407386779785e-05, -6.44885003566742e-05, -5.873292684555054e-05, -5.297735333442688e-05, -4.722177982330322e-05, -4.1466206312179565e-05, -3.571063280105591e-05, -2.995505928993225e-05, -2.4199485778808594e-05, -1.8443912267684937e-05, -1.268833875656128e-05, -6.932765245437622e-06, -1.1771917343139648e-06, 4.578381776809692e-06, 1.033395528793335e-05, 1.6089528799057007e-05, 2.1845102310180664e-05, 2.760067582130432e-05, 3.335624933242798e-05, 3.9111822843551636e-05, 4.486739635467529e-05, 5.062296986579895e-05, 5.637854337692261e-05, 6.213411688804626e-05, 6.788969039916992e-05, 7.364526391029358e-05, 7.940083742141724e-05, 8.51564109325409e-05, 9.091198444366455e-05, 9.666755795478821e-05, 0.00010242313146591187, 0.00010817870497703552, 0.00011393427848815918, 0.00011968985199928284, 0.0001254454255104065, 0.00013120099902153015, 0.0001369565725326538, 0.00014271214604377747, 0.00014846771955490112, 0.00015422329306602478, 0.00015997886657714844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 9.0, 6.0, 12.0, 17.0, 26.0, 37.0, 44.0, 89.0, 121.0, 223.0, 392.0, 829.0, 1992.0, 5598.0, 21805.0, 151649.0, 742135.0, 98770.0, 16798.0, 4795.0, 1667.0, 707.0, 330.0, 182.0, 121.0, 50.0, 50.0, 30.0, 21.0, 12.0, 10.0, 4.0, 7.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.6913223266601562, -0.6604766845703125, -0.6296310424804688, -0.598785400390625, -0.5679397583007812, -0.5370941162109375, -0.5062484741210938, -0.47540283203125, -0.44455718994140625, -0.4137115478515625, -0.38286590576171875, -0.352020263671875, -0.32117462158203125, -0.2903289794921875, -0.25948333740234375, -0.2286376953125, -0.19779205322265625, -0.1669464111328125, -0.13610076904296875, -0.105255126953125, -0.07440948486328125, -0.0435638427734375, -0.01271820068359375, 0.01812744140625, 0.04897308349609375, 0.0798187255859375, 0.11066436767578125, 0.141510009765625, 0.17235565185546875, 0.2032012939453125, 0.23404693603515625, 0.264892578125, 0.29573822021484375, 0.3265838623046875, 0.35742950439453125, 0.388275146484375, 0.41912078857421875, 0.4499664306640625, 0.48081207275390625, 0.51165771484375, 0.5425033569335938, 0.5733489990234375, 0.6041946411132812, 0.635040283203125, 0.6658859252929688, 0.6967315673828125, 0.7275772094726562, 0.7584228515625, 0.7892684936523438, 0.8201141357421875, 0.8509597778320312, 0.881805419921875, 0.9126510620117188, 0.9434967041015625, 0.9743423461914062, 1.00518798828125, 1.0360336303710938, 1.0668792724609375, 1.0977249145507812, 1.128570556640625, 1.1594161987304688, 1.1902618408203125, 1.2211074829101562, 1.251953125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 20.0, 12.0, 26.0, 31.0, 55.0, 74.0, 115.0, 122.0, 135.0, 125.0, 77.0, 47.0, 40.0, 30.0, 21.0, 12.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.64190673828125, -0.6217041015625, -0.60150146484375, -0.581298828125, -0.56109619140625, -0.5408935546875, -0.52069091796875, -0.50048828125, -0.48028564453125, -0.4600830078125, -0.43988037109375, -0.419677734375, -0.39947509765625, -0.3792724609375, -0.35906982421875, -0.3388671875, -0.31866455078125, -0.2984619140625, -0.27825927734375, -0.258056640625, -0.23785400390625, -0.2176513671875, -0.19744873046875, -0.17724609375, -0.15704345703125, -0.1368408203125, -0.11663818359375, -0.096435546875, -0.07623291015625, -0.0560302734375, -0.03582763671875, -0.015625, 0.00457763671875, 0.0247802734375, 0.04498291015625, 0.065185546875, 0.08538818359375, 0.1055908203125, 0.12579345703125, 0.14599609375, 0.16619873046875, 0.1864013671875, 0.20660400390625, 0.226806640625, 0.24700927734375, 0.2672119140625, 0.28741455078125, 0.3076171875, 0.32781982421875, 0.3480224609375, 0.36822509765625, 0.388427734375, 0.40863037109375, 0.4288330078125, 0.44903564453125, 0.46923828125, 0.48944091796875, 0.5096435546875, 0.52984619140625, 0.550048828125, 0.57025146484375, 0.5904541015625, 0.61065673828125, 0.630859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 22.0, 35.0, 87.0, 229.0, 309.0, 189.0, 71.0, 32.0, 15.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.56186294555664, -23.955339431762695, -23.34881591796875, -22.742292404174805, -22.13576889038086, -21.529247283935547, -20.9227237701416, -20.316200256347656, -19.70967674255371, -19.103153228759766, -18.49662971496582, -17.890106201171875, -17.283584594726562, -16.677061080932617, -16.070537567138672, -15.464014053344727, -14.857490539550781, -14.250967025756836, -13.64444351196289, -13.037920951843262, -12.431397438049316, -11.824873924255371, -11.218351364135742, -10.611827850341797, -10.005304336547852, -9.398780822753906, -8.792257308959961, -8.185734748840332, -7.579211235046387, -6.972687721252441, -6.366164684295654, -5.759641647338867, -5.1531171798706055, -4.54659366607666, -3.940070629119873, -3.333547353744507, -2.7270240783691406, -2.1205008029937744, -1.5139775276184082, -0.9074544906616211, -0.3009309768676758, 0.30559229850769043, 0.9121155738830566, 1.5186388492584229, 2.125162124633789, 2.7316854000091553, 3.3382086753845215, 3.9447317123413086, 4.551255226135254, 5.157778739929199, 5.764301776885986, 6.370824813842773, 6.977348327636719, 7.583871841430664, 8.19039535522461, 8.796917915344238, 9.403441429138184, 10.009964942932129, 10.616487503051758, 11.223011016845703, 11.829534530639648, 12.436058044433594, 13.042581558227539, 13.649104118347168, 14.255627632141113]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 6.0, 16.0, 15.0, 10.0, 16.0, 21.0, 32.0, 47.0, 42.0, 38.0, 44.0, 53.0, 54.0, 47.0, 63.0, 60.0, 60.0, 60.0, 53.0, 48.0, 31.0, 23.0, 36.0, 19.0, 20.0, 14.0, 18.0, 11.0, 7.0, 10.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.05985164642334, -7.851208209991455, -7.64256477355957, -7.433920860290527, -7.225277423858643, -7.016633987426758, -6.807990074157715, -6.59934663772583, -6.390703201293945, -6.1820597648620605, -5.973416328430176, -5.764772415161133, -5.556128978729248, -5.347485542297363, -5.13884162902832, -4.9301981925964355, -4.721554756164551, -4.512911319732666, -4.304267883300781, -4.095623970031738, -3.8869805335998535, -3.6783370971679688, -3.469693422317505, -3.261049747467041, -3.0524063110351562, -2.8437628746032715, -2.6351191997528076, -2.4264755249023438, -2.217832088470459, -2.009188652038574, -1.8005449771881104, -1.591901421546936, -1.3832578659057617, -1.1746143102645874, -0.9659707546234131, -0.7573271989822388, -0.5486836433410645, -0.34004008769989014, -0.13139653205871582, 0.0772470235824585, 0.2858905792236328, 0.49453413486480713, 0.7031776905059814, 0.9118212461471558, 1.12046480178833, 1.3291083574295044, 1.5377519130706787, 1.746395468711853, 1.9550390243530273, 2.163682460784912, 2.372326135635376, 2.58096981048584, 2.7896132469177246, 2.9982566833496094, 3.2069003582000732, 3.415544033050537, 3.624187469482422, 3.8328309059143066, 4.041474342346191, 4.250118255615234, 4.458761692047119, 4.667405128479004, 4.876049041748047, 5.084692478179932, 5.293335914611816]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 12.0, 15.0, 22.0, 42.0, 60.0, 73.0, 132.0, 234.0, 475.0, 1028.0, 2776.0, 9995.0, 59699.0, 4037014.0, 67162.0, 10291.0, 2792.0, 1031.0, 468.0, 297.0, 154.0, 109.0, 99.0, 49.0, 43.0, 54.0, 28.0, 22.0, 11.0, 14.0, 23.0, 8.0, 8.0, 7.0, 3.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.797760009765625, -2.66778564453125, -2.537811279296875, -2.4078369140625, -2.277862548828125, -2.14788818359375, -2.017913818359375, -1.887939453125, -1.757965087890625, -1.62799072265625, -1.498016357421875, -1.3680419921875, -1.238067626953125, -1.10809326171875, -0.978118896484375, -0.84814453125, -0.718170166015625, -0.58819580078125, -0.458221435546875, -0.3282470703125, -0.198272705078125, -0.06829833984375, 0.061676025390625, 0.191650390625, 0.321624755859375, 0.45159912109375, 0.581573486328125, 0.7115478515625, 0.841522216796875, 0.97149658203125, 1.101470947265625, 1.2314453125, 1.361419677734375, 1.49139404296875, 1.621368408203125, 1.7513427734375, 1.881317138671875, 2.01129150390625, 2.141265869140625, 2.271240234375, 2.401214599609375, 2.53118896484375, 2.661163330078125, 2.7911376953125, 2.921112060546875, 3.05108642578125, 3.181060791015625, 3.31103515625, 3.441009521484375, 3.57098388671875, 3.700958251953125, 3.8309326171875, 3.960906982421875, 4.09088134765625, 4.220855712890625, 4.350830078125, 4.480804443359375, 4.61077880859375, 4.740753173828125, 4.8707275390625, 5.000701904296875, 5.13067626953125, 5.260650634765625, 5.390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 8.0, 15.0, 25.0, 47.0, 71.0, 90.0, 93.0, 119.0, 115.0, 91.0, 92.0, 69.0, 49.0, 36.0, 23.0, 14.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31640625, -0.3047943115234375, -0.293182373046875, -0.2815704345703125, -0.26995849609375, -0.2583465576171875, -0.246734619140625, -0.2351226806640625, -0.2235107421875, -0.2118988037109375, -0.200286865234375, -0.1886749267578125, -0.17706298828125, -0.1654510498046875, -0.153839111328125, -0.1422271728515625, -0.130615234375, -0.1190032958984375, -0.107391357421875, -0.0957794189453125, -0.08416748046875, -0.0725555419921875, -0.060943603515625, -0.0493316650390625, -0.0377197265625, -0.0261077880859375, -0.014495849609375, -0.0028839111328125, 0.00872802734375, 0.0203399658203125, 0.031951904296875, 0.0435638427734375, 0.05517578125, 0.0667877197265625, 0.078399658203125, 0.0900115966796875, 0.10162353515625, 0.1132354736328125, 0.124847412109375, 0.1364593505859375, 0.1480712890625, 0.1596832275390625, 0.171295166015625, 0.1829071044921875, 0.19451904296875, 0.2061309814453125, 0.217742919921875, 0.2293548583984375, 0.240966796875, 0.2525787353515625, 0.264190673828125, 0.2758026123046875, 0.28741455078125, 0.2990264892578125, 0.310638427734375, 0.3222503662109375, 0.3338623046875, 0.3454742431640625, 0.357086181640625, 0.3686981201171875, 0.38031005859375, 0.3919219970703125, 0.403533935546875, 0.4151458740234375, 0.4267578125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 9.0, 6.0, 10.0, 13.0, 40.0, 49.0, 100.0, 149.0, 341.0, 633.0, 1595.0, 4766.0, 21390.0, 432061.0, 3691061.0, 31908.0, 6374.0, 1964.0, 805.0, 401.0, 230.0, 128.0, 89.0, 50.0, 32.0, 30.0, 18.0, 11.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.2265625, -5.099456787109375, -4.97235107421875, -4.845245361328125, -4.7181396484375, -4.591033935546875, -4.46392822265625, -4.336822509765625, -4.209716796875, -4.082611083984375, -3.95550537109375, -3.828399658203125, -3.7012939453125, -3.574188232421875, -3.44708251953125, -3.319976806640625, -3.19287109375, -3.065765380859375, -2.93865966796875, -2.811553955078125, -2.6844482421875, -2.557342529296875, -2.43023681640625, -2.303131103515625, -2.176025390625, -2.048919677734375, -1.92181396484375, -1.794708251953125, -1.6676025390625, -1.540496826171875, -1.41339111328125, -1.286285400390625, -1.1591796875, -1.032073974609375, -0.90496826171875, -0.777862548828125, -0.6507568359375, -0.523651123046875, -0.39654541015625, -0.269439697265625, -0.142333984375, -0.015228271484375, 0.11187744140625, 0.238983154296875, 0.3660888671875, 0.493194580078125, 0.62030029296875, 0.747406005859375, 0.87451171875, 1.001617431640625, 1.12872314453125, 1.255828857421875, 1.3829345703125, 1.510040283203125, 1.63714599609375, 1.764251708984375, 1.891357421875, 2.018463134765625, 2.14556884765625, 2.272674560546875, 2.3997802734375, 2.526885986328125, 2.65399169921875, 2.781097412109375, 2.908203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 11.0, 17.0, 16.0, 22.0, 38.0, 63.0, 119.0, 388.0, 2373.0, 670.0, 168.0, 71.0, 33.0, 20.0, 16.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.48667144775390625, -0.4630889892578125, -0.43950653076171875, -0.415924072265625, -0.39234161376953125, -0.3687591552734375, -0.34517669677734375, -0.32159423828125, -0.29801177978515625, -0.2744293212890625, -0.25084686279296875, -0.227264404296875, -0.20368194580078125, -0.1800994873046875, -0.15651702880859375, -0.1329345703125, -0.10935211181640625, -0.0857696533203125, -0.06218719482421875, -0.038604736328125, -0.01502227783203125, 0.0085601806640625, 0.03214263916015625, 0.05572509765625, 0.07930755615234375, 0.1028900146484375, 0.12647247314453125, 0.150054931640625, 0.17363739013671875, 0.1972198486328125, 0.22080230712890625, 0.244384765625, 0.26796722412109375, 0.2915496826171875, 0.31513214111328125, 0.338714599609375, 0.36229705810546875, 0.3858795166015625, 0.40946197509765625, 0.43304443359375, 0.45662689208984375, 0.4802093505859375, 0.5037918090820312, 0.527374267578125, 0.5509567260742188, 0.5745391845703125, 0.5981216430664062, 0.6217041015625, 0.6452865600585938, 0.6688690185546875, 0.6924514770507812, 0.716033935546875, 0.7396163940429688, 0.7631988525390625, 0.7867813110351562, 0.81036376953125, 0.8339462280273438, 0.8575286865234375, 0.8811111450195312, 0.904693603515625, 0.9282760620117188, 0.9518585205078125, 0.9754409790039062, 0.9990234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 13.0, 43.0, 96.0, 249.0, 325.0, 174.0, 62.0, 23.0, 10.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.948447227478027, -6.703046798706055, -6.457646369934082, -6.212245941162109, -5.966845512390137, -5.721445083618164, -5.476044654846191, -5.230644226074219, -4.985243797302246, -4.739843368530273, -4.494442939758301, -4.249042510986328, -4.0036420822143555, -3.758241653442383, -3.512840986251831, -3.2674405574798584, -3.0220398902893066, -2.776639461517334, -2.5312390327453613, -2.2858386039733887, -2.040438175201416, -1.7950376272201538, -1.5496370792388916, -1.304236650466919, -1.0588362216949463, -0.8134357929229736, -0.5680353045463562, -0.32263481616973877, -0.07723438739776611, 0.16816604137420654, 0.41356658935546875, 0.6589670181274414, 0.9043674468994141, 1.1497678756713867, 1.3951683044433594, 1.6405688524246216, 1.8859692811965942, 2.1313695907592773, 2.376770257949829, 2.6221706867218018, 2.8675711154937744, 3.112971544265747, 3.3583719730377197, 3.6037726402282715, 3.849173069000244, 4.094573497772217, 4.3399739265441895, 4.585374355316162, 4.830774784088135, 5.076175212860107, 5.32157564163208, 5.566976070404053, 5.812376499176025, 6.057776927947998, 6.303177833557129, 6.548578262329102, 6.793978691101074, 7.039379119873047, 7.2847795486450195, 7.530179977416992, 7.775580406188965, 8.020980834960938, 8.26638126373291, 8.511781692504883, 8.757182121276855]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 5.0, 10.0, 13.0, 16.0, 14.0, 22.0, 28.0, 24.0, 21.0, 36.0, 43.0, 48.0, 52.0, 45.0, 44.0, 45.0, 54.0, 57.0, 33.0, 39.0, 49.0, 35.0, 26.0, 32.0, 27.0, 32.0, 23.0, 22.0, 21.0, 10.0, 17.0, 6.0, 10.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4789817333221436, -1.424920916557312, -1.3708600997924805, -1.316799283027649, -1.2627384662628174, -1.2086775302886963, -1.1546168327331543, -1.1005558967590332, -1.0464950799942017, -0.9924342632293701, -0.9383734464645386, -0.884312629699707, -0.8302517533302307, -0.7761909365653992, -0.7221301198005676, -0.6680692434310913, -0.6140084862709045, -0.559947669506073, -0.5058868527412415, -0.4518260061740875, -0.3977651596069336, -0.34370434284210205, -0.2896435260772705, -0.23558267951011658, -0.18152186274528503, -0.1274610310792923, -0.07340020686388016, -0.019339382648468018, 0.03472144901752472, 0.08878228068351746, 0.142843097448349, 0.19690394401550293, 0.2509647607803345, 0.305025577545166, 0.35908642411231995, 0.4131472408771515, 0.4672080874443054, 0.521268904209137, 0.5753297209739685, 0.6293905973434448, 0.6834514141082764, 0.7375122308731079, 0.7915730476379395, 0.845633864402771, 0.8996947407722473, 0.9537555575370789, 1.0078163146972656, 1.0618772506713867, 1.1159379482269287, 1.1699987649917603, 1.2240595817565918, 1.2781203985214233, 1.3321812152862549, 1.386242151260376, 1.440302848815918, 1.494363784790039, 1.5484246015548706, 1.6024854183197021, 1.6565462350845337, 1.7106070518493652, 1.7646678686141968, 1.8187286853790283, 1.8727896213531494, 1.926850438117981, 1.9809112548828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 11.0, 13.0, 11.0, 24.0, 33.0, 43.0, 66.0, 119.0, 200.0, 366.0, 598.0, 1482.0, 3640.0, 13257.0, 81294.0, 628492.0, 276388.0, 31248.0, 6819.0, 2339.0, 975.0, 459.0, 238.0, 150.0, 81.0, 61.0, 37.0, 34.0, 19.0, 20.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3671875, -2.275299072265625, -2.18341064453125, -2.091522216796875, -1.9996337890625, -1.907745361328125, -1.81585693359375, -1.723968505859375, -1.632080078125, -1.540191650390625, -1.44830322265625, -1.356414794921875, -1.2645263671875, -1.172637939453125, -1.08074951171875, -0.988861083984375, -0.89697265625, -0.805084228515625, -0.71319580078125, -0.621307373046875, -0.5294189453125, -0.437530517578125, -0.34564208984375, -0.253753662109375, -0.161865234375, -0.069976806640625, 0.02191162109375, 0.113800048828125, 0.2056884765625, 0.297576904296875, 0.38946533203125, 0.481353759765625, 0.5732421875, 0.665130615234375, 0.75701904296875, 0.848907470703125, 0.9407958984375, 1.032684326171875, 1.12457275390625, 1.216461181640625, 1.308349609375, 1.400238037109375, 1.49212646484375, 1.584014892578125, 1.6759033203125, 1.767791748046875, 1.85968017578125, 1.951568603515625, 2.04345703125, 2.135345458984375, 2.22723388671875, 2.319122314453125, 2.4110107421875, 2.502899169921875, 2.59478759765625, 2.686676025390625, 2.778564453125, 2.870452880859375, 2.96234130859375, 3.054229736328125, 3.1461181640625, 3.238006591796875, 3.32989501953125, 3.421783447265625, 3.513671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 8.0, 7.0, 23.0, 34.0, 46.0, 73.0, 68.0, 96.0, 108.0, 111.0, 100.0, 87.0, 58.0, 59.0, 34.0, 18.0, 19.0, 10.0, 11.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3203125, -0.3080902099609375, -0.295867919921875, -0.2836456298828125, -0.27142333984375, -0.2592010498046875, -0.246978759765625, -0.2347564697265625, -0.2225341796875, -0.2103118896484375, -0.198089599609375, -0.1858673095703125, -0.17364501953125, -0.1614227294921875, -0.149200439453125, -0.1369781494140625, -0.124755859375, -0.1125335693359375, -0.100311279296875, -0.0880889892578125, -0.07586669921875, -0.0636444091796875, -0.051422119140625, -0.0391998291015625, -0.0269775390625, -0.0147552490234375, -0.002532958984375, 0.0096893310546875, 0.02191162109375, 0.0341339111328125, 0.046356201171875, 0.0585784912109375, 0.07080078125, 0.0830230712890625, 0.095245361328125, 0.1074676513671875, 0.11968994140625, 0.1319122314453125, 0.144134521484375, 0.1563568115234375, 0.1685791015625, 0.1808013916015625, 0.193023681640625, 0.2052459716796875, 0.21746826171875, 0.2296905517578125, 0.241912841796875, 0.2541351318359375, 0.266357421875, 0.2785797119140625, 0.290802001953125, 0.3030242919921875, 0.31524658203125, 0.3274688720703125, 0.339691162109375, 0.3519134521484375, 0.3641357421875, 0.3763580322265625, 0.388580322265625, 0.4008026123046875, 0.41302490234375, 0.4252471923828125, 0.437469482421875, 0.4496917724609375, 0.4619140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 21.0, 18.0, 29.0, 61.0, 109.0, 196.0, 329.0, 614.0, 1503.0, 3931.0, 15120.0, 81796.0, 490465.0, 379661.0, 57515.0, 11380.0, 3378.0, 1196.0, 579.0, 273.0, 143.0, 88.0, 44.0, 32.0, 20.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.49609375, -2.42657470703125, -2.3570556640625, -2.28753662109375, -2.218017578125, -2.14849853515625, -2.0789794921875, -2.00946044921875, -1.93994140625, -1.87042236328125, -1.8009033203125, -1.73138427734375, -1.661865234375, -1.59234619140625, -1.5228271484375, -1.45330810546875, -1.3837890625, -1.31427001953125, -1.2447509765625, -1.17523193359375, -1.105712890625, -1.03619384765625, -0.9666748046875, -0.89715576171875, -0.82763671875, -0.75811767578125, -0.6885986328125, -0.61907958984375, -0.549560546875, -0.48004150390625, -0.4105224609375, -0.34100341796875, -0.271484375, -0.20196533203125, -0.1324462890625, -0.06292724609375, 0.006591796875, 0.07611083984375, 0.1456298828125, 0.21514892578125, 0.28466796875, 0.35418701171875, 0.4237060546875, 0.49322509765625, 0.562744140625, 0.63226318359375, 0.7017822265625, 0.77130126953125, 0.8408203125, 0.91033935546875, 0.9798583984375, 1.04937744140625, 1.118896484375, 1.18841552734375, 1.2579345703125, 1.32745361328125, 1.39697265625, 1.46649169921875, 1.5360107421875, 1.60552978515625, 1.675048828125, 1.74456787109375, 1.8140869140625, 1.88360595703125, 1.953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 6.0, 4.0, 2.0, 11.0, 11.0, 21.0, 13.0, 18.0, 20.0, 29.0, 34.0, 37.0, 38.0, 44.0, 59.0, 50.0, 53.0, 47.0, 46.0, 54.0, 48.0, 37.0, 47.0, 46.0, 29.0, 29.0, 26.0, 22.0, 22.0, 26.0, 12.0, 11.0, 7.0, 10.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.8997726440429688, -0.8654632568359375, -0.8311538696289062, -0.796844482421875, -0.7625350952148438, -0.7282257080078125, -0.6939163208007812, -0.65960693359375, -0.6252975463867188, -0.5909881591796875, -0.5566787719726562, -0.522369384765625, -0.48805999755859375, -0.4537506103515625, -0.41944122314453125, -0.3851318359375, -0.35082244873046875, -0.3165130615234375, -0.28220367431640625, -0.247894287109375, -0.21358489990234375, -0.1792755126953125, -0.14496612548828125, -0.11065673828125, -0.07634735107421875, -0.0420379638671875, -0.00772857666015625, 0.026580810546875, 0.06089019775390625, 0.0951995849609375, 0.12950897216796875, 0.163818359375, 0.19812774658203125, 0.2324371337890625, 0.26674652099609375, 0.301055908203125, 0.33536529541015625, 0.3696746826171875, 0.40398406982421875, 0.43829345703125, 0.47260284423828125, 0.5069122314453125, 0.5412216186523438, 0.575531005859375, 0.6098403930664062, 0.6441497802734375, 0.6784591674804688, 0.7127685546875, 0.7470779418945312, 0.7813873291015625, 0.8156967163085938, 0.850006103515625, 0.8843154907226562, 0.9186248779296875, 0.9529342651367188, 0.98724365234375, 1.0215530395507812, 1.0558624267578125, 1.0901718139648438, 1.124481201171875, 1.1587905883789062, 1.1930999755859375, 1.2274093627929688, 1.26171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 13.0, 6.0, 15.0, 28.0, 43.0, 54.0, 130.0, 187.0, 366.0, 985.0, 2796.0, 12259.0, 105854.0, 849691.0, 63280.0, 8988.0, 2275.0, 770.0, 337.0, 186.0, 79.0, 57.0, 38.0, 34.0, 14.0, 10.0, 14.0, 10.0, 2.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.626953125, -1.576751708984375, -1.52655029296875, -1.476348876953125, -1.4261474609375, -1.375946044921875, -1.32574462890625, -1.275543212890625, -1.225341796875, -1.175140380859375, -1.12493896484375, -1.074737548828125, -1.0245361328125, -0.974334716796875, -0.92413330078125, -0.873931884765625, -0.82373046875, -0.773529052734375, -0.72332763671875, -0.673126220703125, -0.6229248046875, -0.572723388671875, -0.52252197265625, -0.472320556640625, -0.422119140625, -0.371917724609375, -0.32171630859375, -0.271514892578125, -0.2213134765625, -0.171112060546875, -0.12091064453125, -0.070709228515625, -0.0205078125, 0.029693603515625, 0.07989501953125, 0.130096435546875, 0.1802978515625, 0.230499267578125, 0.28070068359375, 0.330902099609375, 0.381103515625, 0.431304931640625, 0.48150634765625, 0.531707763671875, 0.5819091796875, 0.632110595703125, 0.68231201171875, 0.732513427734375, 0.78271484375, 0.832916259765625, 0.88311767578125, 0.933319091796875, 0.9835205078125, 1.033721923828125, 1.08392333984375, 1.134124755859375, 1.184326171875, 1.234527587890625, 1.28472900390625, 1.334930419921875, 1.3851318359375, 1.435333251953125, 1.48553466796875, 1.535736083984375, 1.5859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 5.0, 14.0, 14.0, 28.0, 39.0, 58.0, 88.0, 146.0, 148.0, 124.0, 94.0, 68.0, 32.0, 34.0, 17.0, 9.0, 10.0, 7.0, 7.0, 5.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00021529197692871094, -0.00020903348922729492, -0.0002027750015258789, -0.0001965165138244629, -0.00019025802612304688, -0.00018399953842163086, -0.00017774105072021484, -0.00017148256301879883, -0.0001652240753173828, -0.0001589655876159668, -0.00015270709991455078, -0.00014644861221313477, -0.00014019012451171875, -0.00013393163681030273, -0.00012767314910888672, -0.0001214146614074707, -0.00011515617370605469, -0.00010889768600463867, -0.00010263919830322266, -9.638071060180664e-05, -9.012222290039062e-05, -8.386373519897461e-05, -7.76052474975586e-05, -7.134675979614258e-05, -6.508827209472656e-05, -5.882978439331055e-05, -5.257129669189453e-05, -4.6312808990478516e-05, -4.00543212890625e-05, -3.3795833587646484e-05, -2.753734588623047e-05, -2.1278858184814453e-05, -1.5020370483398438e-05, -8.761882781982422e-06, -2.5033950805664062e-06, 3.7550926208496094e-06, 1.0013580322265625e-05, 1.627206802368164e-05, 2.2530555725097656e-05, 2.8789043426513672e-05, 3.504753112792969e-05, 4.13060188293457e-05, 4.756450653076172e-05, 5.3822994232177734e-05, 6.008148193359375e-05, 6.633996963500977e-05, 7.259845733642578e-05, 7.88569450378418e-05, 8.511543273925781e-05, 9.137392044067383e-05, 9.763240814208984e-05, 0.00010389089584350586, 0.00011014938354492188, 0.00011640787124633789, 0.0001226663589477539, 0.00012892484664916992, 0.00013518333435058594, 0.00014144182205200195, 0.00014770030975341797, 0.00015395879745483398, 0.00016021728515625, 0.00016647577285766602, 0.00017273426055908203, 0.00017899274826049805, 0.00018525123596191406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 6.0, 7.0, 10.0, 12.0, 18.0, 25.0, 54.0, 88.0, 156.0, 268.0, 562.0, 1268.0, 4178.0, 25605.0, 810881.0, 188945.0, 11994.0, 2566.0, 926.0, 440.0, 238.0, 124.0, 56.0, 35.0, 31.0, 22.0, 13.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8056640625, -1.7383270263671875, -1.670989990234375, -1.6036529541015625, -1.53631591796875, -1.4689788818359375, -1.401641845703125, -1.3343048095703125, -1.2669677734375, -1.1996307373046875, -1.132293701171875, -1.0649566650390625, -0.99761962890625, -0.9302825927734375, -0.862945556640625, -0.7956085205078125, -0.728271484375, -0.6609344482421875, -0.593597412109375, -0.5262603759765625, -0.45892333984375, -0.3915863037109375, -0.324249267578125, -0.2569122314453125, -0.1895751953125, -0.1222381591796875, -0.054901123046875, 0.0124359130859375, 0.07977294921875, 0.1471099853515625, 0.214447021484375, 0.2817840576171875, 0.34912109375, 0.4164581298828125, 0.483795166015625, 0.5511322021484375, 0.61846923828125, 0.6858062744140625, 0.753143310546875, 0.8204803466796875, 0.8878173828125, 0.9551544189453125, 1.022491455078125, 1.0898284912109375, 1.15716552734375, 1.2245025634765625, 1.291839599609375, 1.3591766357421875, 1.426513671875, 1.4938507080078125, 1.561187744140625, 1.6285247802734375, 1.69586181640625, 1.7631988525390625, 1.830535888671875, 1.8978729248046875, 1.9652099609375, 2.0325469970703125, 2.099884033203125, 2.1672210693359375, 2.23455810546875, 2.3018951416015625, 2.369232177734375, 2.4365692138671875, 2.50390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 12.0, 19.0, 22.0, 34.0, 54.0, 73.0, 110.0, 180.0, 169.0, 128.0, 65.0, 36.0, 31.0, 19.0, 8.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0254898071289062, -0.9953155517578125, -0.9651412963867188, -0.934967041015625, -0.9047927856445312, -0.8746185302734375, -0.8444442749023438, -0.81427001953125, -0.7840957641601562, -0.7539215087890625, -0.7237472534179688, -0.693572998046875, -0.6633987426757812, -0.6332244873046875, -0.6030502319335938, -0.5728759765625, -0.5427017211914062, -0.5125274658203125, -0.48235321044921875, -0.452178955078125, -0.42200469970703125, -0.3918304443359375, -0.36165618896484375, -0.33148193359375, -0.30130767822265625, -0.2711334228515625, -0.24095916748046875, -0.210784912109375, -0.18061065673828125, -0.1504364013671875, -0.12026214599609375, -0.090087890625, -0.05991363525390625, -0.0297393798828125, 0.00043487548828125, 0.030609130859375, 0.06078338623046875, 0.0909576416015625, 0.12113189697265625, 0.15130615234375, 0.18148040771484375, 0.2116546630859375, 0.24182891845703125, 0.272003173828125, 0.30217742919921875, 0.3323516845703125, 0.36252593994140625, 0.3927001953125, 0.42287445068359375, 0.4530487060546875, 0.48322296142578125, 0.513397216796875, 0.5435714721679688, 0.5737457275390625, 0.6039199829101562, 0.63409423828125, 0.6642684936523438, 0.6944427490234375, 0.7246170043945312, 0.754791259765625, 0.7849655151367188, 0.8151397705078125, 0.8453140258789062, 0.87548828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 11.0, 14.0, 30.0, 51.0, 115.0, 183.0, 218.0, 175.0, 100.0, 44.0, 25.0, 22.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.00187873840332, -7.482860565185547, -6.963841915130615, -6.444823265075684, -5.92580509185791, -5.406786918640137, -4.887768268585205, -4.368749618530273, -3.8497314453125, -3.3307130336761475, -2.811694622039795, -2.2926762104034424, -1.7736577987670898, -1.2546393871307373, -0.7356209754943848, -0.21660256385803223, 0.3024158477783203, 0.8214342594146729, 1.3404526710510254, 1.859471082687378, 2.3784894943237305, 2.897507905960083, 3.4165263175964355, 3.935544729232788, 4.454563140869141, 4.973581314086914, 5.492599964141846, 6.011618614196777, 6.530636787414551, 7.049654960632324, 7.568673610687256, 8.087692260742188, 8.606710433959961, 9.125728607177734, 9.644746780395508, 10.163765907287598, 10.682784080505371, 11.201802253723145, 11.720821380615234, 12.239839553833008, 12.758857727050781, 13.277875900268555, 13.796894073486328, 14.315913200378418, 14.834931373596191, 15.353949546813965, 15.872968673706055, 16.391986846923828, 16.9110050201416, 17.430023193359375, 17.94904136657715, 18.468059539794922, 18.987079620361328, 19.5060977935791, 20.025115966796875, 20.54413414001465, 21.063152313232422, 21.582170486450195, 22.10118865966797, 22.620206832885742, 23.139225006103516, 23.658245086669922, 24.177263259887695, 24.69628143310547, 25.215299606323242]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 14.0, 10.0, 14.0, 14.0, 20.0, 20.0, 25.0, 28.0, 34.0, 52.0, 50.0, 54.0, 52.0, 66.0, 48.0, 57.0, 63.0, 43.0, 55.0, 48.0, 37.0, 35.0, 27.0, 27.0, 21.0, 18.0, 14.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04636287689209, -5.812415599822998, -5.578468322753906, -5.344521522521973, -5.110574245452881, -4.876626968383789, -4.642679691314697, -4.4087324142456055, -4.174785137176514, -3.940837860107422, -3.706890821456909, -3.4729435443878174, -3.2389962673187256, -3.005049228668213, -2.771101951599121, -2.5371546745300293, -2.3032076358795166, -2.069260358810425, -1.8353132009506226, -1.6013660430908203, -1.3674187660217285, -1.1334716081619263, -0.899524450302124, -0.6655771732330322, -0.43163001537323, -0.19768281280994415, 0.036264389753341675, 0.2702115774154663, 0.5041587948799133, 0.7381060123443604, 0.9720531702041626, 1.2060004472732544, 1.4399476051330566, 1.6738947629928589, 1.9078420400619507, 2.141789197921753, 2.3757364749908447, 2.6096835136413574, 2.843630790710449, 3.077578067779541, 3.311525344848633, 3.5454726219177246, 3.7794196605682373, 4.01336669921875, 4.247313976287842, 4.481261253356934, 4.715208530426025, 4.949155807495117, 5.183102607727051, 5.417049884796143, 5.650997161865234, 5.884943962097168, 6.11889123916626, 6.352838516235352, 6.586785793304443, 6.820733070373535, 7.054680347442627, 7.288627624511719, 7.5225749015808105, 7.756522178649902, 7.990468978881836, 8.224416732788086, 8.45836353302002, 8.692310333251953, 8.926258087158203]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 19.0, 30.0, 48.0, 98.0, 186.0, 409.0, 896.0, 2451.0, 9659.0, 66338.0, 3995051.0, 101035.0, 12961.0, 2810.0, 973.0, 439.0, 276.0, 179.0, 113.0, 71.0, 68.0, 38.0, 43.0, 23.0, 16.0, 15.0, 13.0, 4.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.268463134765625, -3.11700439453125, -2.965545654296875, -2.8140869140625, -2.662628173828125, -2.51116943359375, -2.359710693359375, -2.208251953125, -2.056793212890625, -1.90533447265625, -1.753875732421875, -1.6024169921875, -1.450958251953125, -1.29949951171875, -1.148040771484375, -0.99658203125, -0.845123291015625, -0.69366455078125, -0.542205810546875, -0.3907470703125, -0.239288330078125, -0.08782958984375, 0.063629150390625, 0.215087890625, 0.366546630859375, 0.51800537109375, 0.669464111328125, 0.8209228515625, 0.972381591796875, 1.12384033203125, 1.275299072265625, 1.4267578125, 1.578216552734375, 1.72967529296875, 1.881134033203125, 2.0325927734375, 2.184051513671875, 2.33551025390625, 2.486968994140625, 2.638427734375, 2.789886474609375, 2.94134521484375, 3.092803955078125, 3.2442626953125, 3.395721435546875, 3.54718017578125, 3.698638916015625, 3.85009765625, 4.001556396484375, 4.15301513671875, 4.304473876953125, 4.4559326171875, 4.607391357421875, 4.75885009765625, 4.910308837890625, 5.061767578125, 5.213226318359375, 5.36468505859375, 5.516143798828125, 5.6676025390625, 5.819061279296875, 5.97052001953125, 6.121978759765625, 6.2734375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 4.0, 7.0, 12.0, 30.0, 42.0, 49.0, 59.0, 84.0, 95.0, 94.0, 95.0, 90.0, 78.0, 61.0, 55.0, 37.0, 18.0, 27.0, 13.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.2740287780761719, -0.26216888427734375, -0.2503089904785156, -0.2384490966796875, -0.22658920288085938, -0.21472930908203125, -0.20286941528320312, -0.191009521484375, -0.17914962768554688, -0.16728973388671875, -0.15542984008789062, -0.1435699462890625, -0.13171005249023438, -0.11985015869140625, -0.10799026489257812, -0.09613037109375, -0.08427047729492188, -0.07241058349609375, -0.060550689697265625, -0.0486907958984375, -0.036830902099609375, -0.02497100830078125, -0.013111114501953125, -0.001251220703125, 0.010608673095703125, 0.02246856689453125, 0.034328460693359375, 0.0461883544921875, 0.058048248291015625, 0.06990814208984375, 0.08176803588867188, 0.0936279296875, 0.10548782348632812, 0.11734771728515625, 0.12920761108398438, 0.1410675048828125, 0.15292739868164062, 0.16478729248046875, 0.17664718627929688, 0.188507080078125, 0.20036697387695312, 0.21222686767578125, 0.22408676147460938, 0.2359466552734375, 0.24780654907226562, 0.25966644287109375, 0.2715263366699219, 0.28338623046875, 0.2952461242675781, 0.30710601806640625, 0.3189659118652344, 0.3308258056640625, 0.3426856994628906, 0.35454559326171875, 0.3664054870605469, 0.378265380859375, 0.3901252746582031, 0.40198516845703125, 0.4138450622558594, 0.4257049560546875, 0.4375648498535156, 0.44942474365234375, 0.4612846374511719, 0.47314453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 11.0, 15.0, 14.0, 36.0, 73.0, 107.0, 153.0, 288.0, 558.0, 1192.0, 2903.0, 9605.0, 49739.0, 3809965.0, 287198.0, 22373.0, 5702.0, 2110.0, 985.0, 499.0, 274.0, 168.0, 95.0, 53.0, 49.0, 22.0, 24.0, 17.0, 5.0, 9.0, 4.0, 4.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.609375, -5.464752197265625, -5.32012939453125, -5.175506591796875, -5.0308837890625, -4.886260986328125, -4.74163818359375, -4.597015380859375, -4.452392578125, -4.307769775390625, -4.16314697265625, -4.018524169921875, -3.8739013671875, -3.729278564453125, -3.58465576171875, -3.440032958984375, -3.29541015625, -3.150787353515625, -3.00616455078125, -2.861541748046875, -2.7169189453125, -2.572296142578125, -2.42767333984375, -2.283050537109375, -2.138427734375, -1.993804931640625, -1.84918212890625, -1.704559326171875, -1.5599365234375, -1.415313720703125, -1.27069091796875, -1.126068115234375, -0.9814453125, -0.836822509765625, -0.69219970703125, -0.547576904296875, -0.4029541015625, -0.258331298828125, -0.11370849609375, 0.030914306640625, 0.175537109375, 0.320159912109375, 0.46478271484375, 0.609405517578125, 0.7540283203125, 0.898651123046875, 1.04327392578125, 1.187896728515625, 1.33251953125, 1.477142333984375, 1.62176513671875, 1.766387939453125, 1.9110107421875, 2.055633544921875, 2.20025634765625, 2.344879150390625, 2.489501953125, 2.634124755859375, 2.77874755859375, 2.923370361328125, 3.0679931640625, 3.212615966796875, 3.35723876953125, 3.501861572265625, 3.646484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 11.0, 18.0, 14.0, 24.0, 23.0, 49.0, 89.0, 180.0, 540.0, 2022.0, 665.0, 171.0, 72.0, 52.0, 34.0, 26.0, 25.0, 7.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.994140625, -0.9593353271484375, -0.924530029296875, -0.8897247314453125, -0.85491943359375, -0.8201141357421875, -0.785308837890625, -0.7505035400390625, -0.7156982421875, -0.6808929443359375, -0.646087646484375, -0.6112823486328125, -0.57647705078125, -0.5416717529296875, -0.506866455078125, -0.4720611572265625, -0.437255859375, -0.4024505615234375, -0.367645263671875, -0.3328399658203125, -0.29803466796875, -0.2632293701171875, -0.228424072265625, -0.1936187744140625, -0.1588134765625, -0.1240081787109375, -0.089202880859375, -0.0543975830078125, -0.01959228515625, 0.0152130126953125, 0.050018310546875, 0.0848236083984375, 0.11962890625, 0.1544342041015625, 0.189239501953125, 0.2240447998046875, 0.25885009765625, 0.2936553955078125, 0.328460693359375, 0.3632659912109375, 0.3980712890625, 0.4328765869140625, 0.467681884765625, 0.5024871826171875, 0.53729248046875, 0.5720977783203125, 0.606903076171875, 0.6417083740234375, 0.676513671875, 0.7113189697265625, 0.746124267578125, 0.7809295654296875, 0.81573486328125, 0.8505401611328125, 0.885345458984375, 0.9201507568359375, 0.9549560546875, 0.9897613525390625, 1.024566650390625, 1.0593719482421875, 1.09417724609375, 1.1289825439453125, 1.163787841796875, 1.1985931396484375, 1.2333984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 12.0, 18.0, 74.0, 229.0, 434.0, 180.0, 43.0, 9.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.375373363494873, -6.826822280883789, -6.278271675109863, -5.729720592498779, -5.181169509887695, -4.6326189041137695, -4.0840678215026855, -3.5355169773101807, -2.986966133117676, -2.438415288925171, -1.8898643255233765, -1.341313362121582, -0.7927625179290771, -0.24421167373657227, 0.3043394088745117, 0.8528902530670166, 1.4014410972595215, 1.9499919414520264, 2.4985427856445312, 3.0470938682556152, 3.59564471244812, 4.144195556640625, 4.692746639251709, 5.241297721862793, 5.789848327636719, 6.338399410247803, 6.8869500160217285, 7.4355010986328125, 7.984051704406738, 8.532602310180664, 9.081153869628906, 9.629704475402832, 10.17825698852539, 10.726807594299316, 11.275359153747559, 11.823909759521484, 12.37246036529541, 12.921010971069336, 13.469562530517578, 14.018113136291504, 14.56666374206543, 15.115214347839355, 15.663765907287598, 16.212316513061523, 16.760868072509766, 17.309417724609375, 17.857969284057617, 18.40652084350586, 18.95507049560547, 19.50362205505371, 20.05217170715332, 20.600723266601562, 21.149274826049805, 21.697824478149414, 22.246376037597656, 22.7949275970459, 23.34347915649414, 23.892030715942383, 24.440580368041992, 24.989131927490234, 25.537683486938477, 26.086233139038086, 26.634784698486328, 27.18333625793457, 27.73188591003418]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 11.0, 12.0, 10.0, 15.0, 48.0, 60.0, 72.0, 82.0, 106.0, 90.0, 105.0, 88.0, 76.0, 53.0, 50.0, 31.0, 40.0, 29.0, 14.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.436782360076904, -6.256065845489502, -6.0753493309021, -5.8946332931518555, -5.713916778564453, -5.533200263977051, -5.352483749389648, -5.171767234802246, -4.991050720214844, -4.810334205627441, -4.629617691040039, -4.448901176452637, -4.268185138702393, -4.08746862411499, -3.906752109527588, -3.7260355949401855, -3.5453195571899414, -3.364603042602539, -3.183886766433716, -3.0031702518463135, -2.8224539756774902, -2.641737461090088, -2.4610209465026855, -2.280304431915283, -2.09958815574646, -1.9188717603683472, -1.7381553649902344, -1.557438850402832, -1.3767224550247192, -1.1960060596466064, -1.015289545059204, -0.8345731496810913, -0.6538572311401367, -0.47314080595970154, -0.29242438077926636, -0.11170792579650879, 0.069008469581604, 0.2497248649597168, 0.43044137954711914, 0.6111577749252319, 0.7918741703033447, 0.9725905656814575, 1.1533069610595703, 1.3340234756469727, 1.5147398710250854, 1.6954562664031982, 1.8761727809906006, 2.056889057159424, 2.237605571746826, 2.4183220863342285, 2.5990383625030518, 2.779754877090454, 2.9604711532592773, 3.1411876678466797, 3.321904182434082, 3.5026206970214844, 3.6833369731903076, 3.86405348777771, 4.044769763946533, 4.2254862785339355, 4.406202793121338, 4.586918830871582, 4.767635345458984, 4.948351860046387, 5.129068374633789]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 1.0, 6.0, 13.0, 15.0, 12.0, 16.0, 27.0, 46.0, 53.0, 99.0, 124.0, 187.0, 306.0, 526.0, 1057.0, 2356.0, 6631.0, 29248.0, 271570.0, 640698.0, 76078.0, 12449.0, 3698.0, 1515.0, 735.0, 365.0, 241.0, 144.0, 117.0, 63.0, 46.0, 28.0, 24.0, 13.0, 17.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.189453125, -3.09051513671875, -2.9915771484375, -2.89263916015625, -2.793701171875, -2.69476318359375, -2.5958251953125, -2.49688720703125, -2.39794921875, -2.29901123046875, -2.2000732421875, -2.10113525390625, -2.002197265625, -1.90325927734375, -1.8043212890625, -1.70538330078125, -1.6064453125, -1.50750732421875, -1.4085693359375, -1.30963134765625, -1.210693359375, -1.11175537109375, -1.0128173828125, -0.91387939453125, -0.81494140625, -0.71600341796875, -0.6170654296875, -0.51812744140625, -0.419189453125, -0.32025146484375, -0.2213134765625, -0.12237548828125, -0.0234375, 0.07550048828125, 0.1744384765625, 0.27337646484375, 0.372314453125, 0.47125244140625, 0.5701904296875, 0.66912841796875, 0.76806640625, 0.86700439453125, 0.9659423828125, 1.06488037109375, 1.163818359375, 1.26275634765625, 1.3616943359375, 1.46063232421875, 1.5595703125, 1.65850830078125, 1.7574462890625, 1.85638427734375, 1.955322265625, 2.05426025390625, 2.1531982421875, 2.25213623046875, 2.35107421875, 2.45001220703125, 2.5489501953125, 2.64788818359375, 2.746826171875, 2.84576416015625, 2.9447021484375, 3.04364013671875, 3.142578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 14.0, 14.0, 21.0, 35.0, 47.0, 95.0, 116.0, 122.0, 122.0, 100.0, 95.0, 82.0, 36.0, 32.0, 27.0, 14.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.463623046875, -0.447265625, -0.430908203125, -0.41455078125, -0.398193359375, -0.3818359375, -0.365478515625, -0.34912109375, -0.332763671875, -0.31640625, -0.300048828125, -0.28369140625, -0.267333984375, -0.2509765625, -0.234619140625, -0.21826171875, -0.201904296875, -0.185546875, -0.169189453125, -0.15283203125, -0.136474609375, -0.1201171875, -0.103759765625, -0.08740234375, -0.071044921875, -0.0546875, -0.038330078125, -0.02197265625, -0.005615234375, 0.0107421875, 0.027099609375, 0.04345703125, 0.059814453125, 0.076171875, 0.092529296875, 0.10888671875, 0.125244140625, 0.1416015625, 0.157958984375, 0.17431640625, 0.190673828125, 0.20703125, 0.223388671875, 0.23974609375, 0.256103515625, 0.2724609375, 0.288818359375, 0.30517578125, 0.321533203125, 0.337890625, 0.354248046875, 0.37060546875, 0.386962890625, 0.4033203125, 0.419677734375, 0.43603515625, 0.452392578125, 0.46875, 0.485107421875, 0.50146484375, 0.517822265625, 0.5341796875, 0.550537109375, 0.56689453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 12.0, 19.0, 21.0, 36.0, 36.0, 74.0, 85.0, 139.0, 185.0, 292.0, 519.0, 862.0, 1605.0, 3193.0, 6824.0, 16420.0, 42460.0, 117174.0, 295449.0, 332344.0, 143017.0, 51696.0, 19660.0, 8194.0, 3741.0, 1745.0, 1041.0, 552.0, 358.0, 231.0, 162.0, 110.0, 80.0, 54.0, 40.0, 22.0, 25.0, 11.0, 11.0, 11.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0888671875, -1.0526885986328125, -1.016510009765625, -0.9803314208984375, -0.94415283203125, -0.9079742431640625, -0.871795654296875, -0.8356170654296875, -0.7994384765625, -0.7632598876953125, -0.727081298828125, -0.6909027099609375, -0.65472412109375, -0.6185455322265625, -0.582366943359375, -0.5461883544921875, -0.510009765625, -0.4738311767578125, -0.437652587890625, -0.4014739990234375, -0.36529541015625, -0.3291168212890625, -0.292938232421875, -0.2567596435546875, -0.2205810546875, -0.1844024658203125, -0.148223876953125, -0.1120452880859375, -0.07586669921875, -0.0396881103515625, -0.003509521484375, 0.0326690673828125, 0.06884765625, 0.1050262451171875, 0.141204833984375, 0.1773834228515625, 0.21356201171875, 0.2497406005859375, 0.285919189453125, 0.3220977783203125, 0.3582763671875, 0.3944549560546875, 0.430633544921875, 0.4668121337890625, 0.50299072265625, 0.5391693115234375, 0.575347900390625, 0.6115264892578125, 0.647705078125, 0.6838836669921875, 0.720062255859375, 0.7562408447265625, 0.79241943359375, 0.8285980224609375, 0.864776611328125, 0.9009552001953125, 0.9371337890625, 0.9733123779296875, 1.009490966796875, 1.0456695556640625, 1.08184814453125, 1.1180267333984375, 1.154205322265625, 1.1903839111328125, 1.2265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 7.0, 14.0, 16.0, 9.0, 22.0, 20.0, 30.0, 34.0, 29.0, 49.0, 37.0, 43.0, 39.0, 40.0, 50.0, 55.0, 61.0, 40.0, 38.0, 41.0, 45.0, 17.0, 34.0, 33.0, 28.0, 24.0, 17.0, 15.0, 22.0, 15.0, 7.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1015625, -1.0679168701171875, -1.034271240234375, -1.0006256103515625, -0.96697998046875, -0.9333343505859375, -0.899688720703125, -0.8660430908203125, -0.8323974609375, -0.7987518310546875, -0.765106201171875, -0.7314605712890625, -0.69781494140625, -0.6641693115234375, -0.630523681640625, -0.5968780517578125, -0.563232421875, -0.5295867919921875, -0.495941162109375, -0.4622955322265625, -0.42864990234375, -0.3950042724609375, -0.361358642578125, -0.3277130126953125, -0.2940673828125, -0.2604217529296875, -0.226776123046875, -0.1931304931640625, -0.15948486328125, -0.1258392333984375, -0.092193603515625, -0.0585479736328125, -0.02490234375, 0.0087432861328125, 0.042388916015625, 0.0760345458984375, 0.10968017578125, 0.1433258056640625, 0.176971435546875, 0.2106170654296875, 0.2442626953125, 0.2779083251953125, 0.311553955078125, 0.3451995849609375, 0.37884521484375, 0.4124908447265625, 0.446136474609375, 0.4797821044921875, 0.513427734375, 0.5470733642578125, 0.580718994140625, 0.6143646240234375, 0.64801025390625, 0.6816558837890625, 0.715301513671875, 0.7489471435546875, 0.7825927734375, 0.8162384033203125, 0.849884033203125, 0.8835296630859375, 0.91717529296875, 0.9508209228515625, 0.984466552734375, 1.0181121826171875, 1.0517578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 4.0, 10.0, 12.0, 14.0, 40.0, 47.0, 70.0, 119.0, 180.0, 338.0, 627.0, 1230.0, 2664.0, 6608.0, 20800.0, 102768.0, 661638.0, 203922.0, 31487.0, 9148.0, 3544.0, 1503.0, 741.0, 392.0, 239.0, 156.0, 78.0, 47.0, 27.0, 39.0, 15.0, 7.0, 11.0, 11.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.036590576171875, -1.00384521484375, -0.971099853515625, -0.9383544921875, -0.905609130859375, -0.87286376953125, -0.840118408203125, -0.807373046875, -0.774627685546875, -0.74188232421875, -0.709136962890625, -0.6763916015625, -0.643646240234375, -0.61090087890625, -0.578155517578125, -0.54541015625, -0.512664794921875, -0.47991943359375, -0.447174072265625, -0.4144287109375, -0.381683349609375, -0.34893798828125, -0.316192626953125, -0.283447265625, -0.250701904296875, -0.21795654296875, -0.185211181640625, -0.1524658203125, -0.119720458984375, -0.08697509765625, -0.054229736328125, -0.021484375, 0.011260986328125, 0.04400634765625, 0.076751708984375, 0.1094970703125, 0.142242431640625, 0.17498779296875, 0.207733154296875, 0.240478515625, 0.273223876953125, 0.30596923828125, 0.338714599609375, 0.3714599609375, 0.404205322265625, 0.43695068359375, 0.469696044921875, 0.50244140625, 0.535186767578125, 0.56793212890625, 0.600677490234375, 0.6334228515625, 0.666168212890625, 0.69891357421875, 0.731658935546875, 0.764404296875, 0.797149658203125, 0.82989501953125, 0.862640380859375, 0.8953857421875, 0.928131103515625, 0.96087646484375, 0.993621826171875, 1.0263671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 12.0, 11.0, 21.0, 21.0, 31.0, 49.0, 69.0, 77.0, 127.0, 142.0, 101.0, 80.0, 49.0, 54.0, 25.0, 25.0, 13.0, 12.0, 14.0, 10.0, 10.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001386404037475586, -0.00013392791152000427, -0.00012921541929244995, -0.00012450292706489563, -0.00011979043483734131, -0.00011507794260978699, -0.00011036545038223267, -0.00010565295815467834, -0.00010094046592712402, -9.62279736995697e-05, -9.151548147201538e-05, -8.680298924446106e-05, -8.209049701690674e-05, -7.737800478935242e-05, -7.26655125617981e-05, -6.795302033424377e-05, -6.324052810668945e-05, -5.852803587913513e-05, -5.381554365158081e-05, -4.910305142402649e-05, -4.439055919647217e-05, -3.967806696891785e-05, -3.4965574741363525e-05, -3.0253082513809204e-05, -2.5540590286254883e-05, -2.082809805870056e-05, -1.611560583114624e-05, -1.1403113603591919e-05, -6.690621376037598e-06, -1.9781291484832764e-06, 2.734363079071045e-06, 7.446855306625366e-06, 1.2159347534179688e-05, 1.687183976173401e-05, 2.158433198928833e-05, 2.629682421684265e-05, 3.100931644439697e-05, 3.5721808671951294e-05, 4.0434300899505615e-05, 4.5146793127059937e-05, 4.985928535461426e-05, 5.457177758216858e-05, 5.92842698097229e-05, 6.399676203727722e-05, 6.870925426483154e-05, 7.342174649238586e-05, 7.813423871994019e-05, 8.284673094749451e-05, 8.755922317504883e-05, 9.227171540260315e-05, 9.698420763015747e-05, 0.00010169669985771179, 0.00010640919208526611, 0.00011112168431282043, 0.00011583417654037476, 0.00012054666876792908, 0.0001252591609954834, 0.00012997165322303772, 0.00013468414545059204, 0.00013939663767814636, 0.00014410912990570068, 0.000148821622133255, 0.00015353411436080933, 0.00015824660658836365, 0.00016295909881591797]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 15.0, 8.0, 21.0, 39.0, 68.0, 126.0, 258.0, 570.0, 1640.0, 5671.0, 30867.0, 754638.0, 233066.0, 16004.0, 3560.0, 1085.0, 457.0, 192.0, 109.0, 44.0, 43.0, 23.0, 10.0, 9.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.19677734375, -2.1318359375, -2.06689453125, -2.001953125, -1.93701171875, -1.8720703125, -1.80712890625, -1.7421875, -1.67724609375, -1.6123046875, -1.54736328125, -1.482421875, -1.41748046875, -1.3525390625, -1.28759765625, -1.22265625, -1.15771484375, -1.0927734375, -1.02783203125, -0.962890625, -0.89794921875, -0.8330078125, -0.76806640625, -0.703125, -0.63818359375, -0.5732421875, -0.50830078125, -0.443359375, -0.37841796875, -0.3134765625, -0.24853515625, -0.18359375, -0.11865234375, -0.0537109375, 0.01123046875, 0.076171875, 0.14111328125, 0.2060546875, 0.27099609375, 0.3359375, 0.40087890625, 0.4658203125, 0.53076171875, 0.595703125, 0.66064453125, 0.7255859375, 0.79052734375, 0.85546875, 0.92041015625, 0.9853515625, 1.05029296875, 1.115234375, 1.18017578125, 1.2451171875, 1.31005859375, 1.375, 1.43994140625, 1.5048828125, 1.56982421875, 1.634765625, 1.69970703125, 1.7646484375, 1.82958984375, 1.89453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 12.0, 7.0, 10.0, 15.0, 14.0, 12.0, 14.0, 29.0, 55.0, 76.0, 100.0, 127.0, 143.0, 125.0, 78.0, 47.0, 40.0, 26.0, 17.0, 16.0, 6.0, 4.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91162109375, -0.8832244873046875, -0.854827880859375, -0.8264312744140625, -0.79803466796875, -0.7696380615234375, -0.741241455078125, -0.7128448486328125, -0.6844482421875, -0.6560516357421875, -0.627655029296875, -0.5992584228515625, -0.57086181640625, -0.5424652099609375, -0.514068603515625, -0.4856719970703125, -0.457275390625, -0.4288787841796875, -0.400482177734375, -0.3720855712890625, -0.34368896484375, -0.3152923583984375, -0.286895751953125, -0.2584991455078125, -0.2301025390625, -0.2017059326171875, -0.173309326171875, -0.1449127197265625, -0.11651611328125, -0.0881195068359375, -0.059722900390625, -0.0313262939453125, -0.0029296875, 0.0254669189453125, 0.053863525390625, 0.0822601318359375, 0.11065673828125, 0.1390533447265625, 0.167449951171875, 0.1958465576171875, 0.2242431640625, 0.2526397705078125, 0.281036376953125, 0.3094329833984375, 0.33782958984375, 0.3662261962890625, 0.394622802734375, 0.4230194091796875, 0.451416015625, 0.4798126220703125, 0.508209228515625, 0.5366058349609375, 0.56500244140625, 0.5933990478515625, 0.621795654296875, 0.6501922607421875, 0.6785888671875, 0.7069854736328125, 0.735382080078125, 0.7637786865234375, 0.79217529296875, 0.8205718994140625, 0.848968505859375, 0.8773651123046875, 0.90576171875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 10.0, 23.0, 32.0, 40.0, 59.0, 113.0, 111.0, 144.0, 141.0, 117.0, 79.0, 38.0, 36.0, 20.0, 7.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.018125534057617, -12.676589012145996, -12.335051536560059, -11.993515014648438, -11.651978492736816, -11.310441970825195, -10.968904495239258, -10.627367973327637, -10.285831451416016, -9.944294929504395, -9.602757453918457, -9.261220932006836, -8.919684410095215, -8.578147888183594, -8.236610412597656, -7.895073890686035, -7.553536415100098, -7.211999416351318, -6.870462894439697, -6.528925895690918, -6.187389373779297, -5.845852375030518, -5.504315376281738, -5.162778854370117, -4.821241855621338, -4.479704856872559, -4.1381683349609375, -3.796631336212158, -3.455094575881958, -3.113557815551758, -2.7720208168029785, -2.4304840564727783, -2.0889463424682617, -1.7474095821380615, -1.4058727025985718, -1.064335823059082, -0.7227990627288818, -0.38126230239868164, -0.039725303649902344, 0.30181145668029785, 0.643348217010498, 0.984885036945343, 1.326421856880188, 1.6679587364196777, 2.009495496749878, 2.351032257080078, 2.6925692558288574, 3.0341060161590576, 3.375642776489258, 3.717179536819458, 4.058716297149658, 4.4002532958984375, 4.741789817810059, 5.083326816558838, 5.424863815307617, 5.766400337219238, 6.107937335968018, 6.449474334716797, 6.791010856628418, 7.132547855377197, 7.474084854125977, 7.815621376037598, 8.157157897949219, 8.498695373535156, 8.840231895446777]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 11.0, 13.0, 12.0, 12.0, 22.0, 17.0, 28.0, 15.0, 24.0, 16.0, 23.0, 27.0, 32.0, 31.0, 31.0, 43.0, 31.0, 35.0, 46.0, 36.0, 29.0, 48.0, 34.0, 38.0, 33.0, 40.0, 27.0, 33.0, 24.0, 32.0, 21.0, 22.0, 21.0, 13.0, 8.0, 11.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.346571445465088, -5.179823875427246, -5.013076305389404, -4.8463287353515625, -4.679581165313721, -4.512833595275879, -4.346086025238037, -4.179338455200195, -4.0125908851623535, -3.8458433151245117, -3.67909574508667, -3.512348175048828, -3.3456006050109863, -3.1788530349731445, -3.0121054649353027, -2.845357894897461, -2.678610324859619, -2.5118627548217773, -2.3451151847839355, -2.1783676147460938, -2.011620044708252, -1.8448724746704102, -1.6781249046325684, -1.5113773345947266, -1.3446297645568848, -1.177882194519043, -1.0111346244812012, -0.8443870544433594, -0.6776394844055176, -0.5108919143676758, -0.344144344329834, -0.1773967742919922, -0.010649681091308594, 0.1560978889465332, 0.322845458984375, 0.4895930290222168, 0.6563405990600586, 0.8230881690979004, 0.9898357391357422, 1.156583309173584, 1.3233308792114258, 1.4900784492492676, 1.6568260192871094, 1.8235735893249512, 1.990321159362793, 2.1570687294006348, 2.3238162994384766, 2.4905638694763184, 2.65731143951416, 2.824059009552002, 2.9908065795898438, 3.1575541496276855, 3.3243017196655273, 3.491049289703369, 3.657796859741211, 3.8245444297790527, 3.9912919998168945, 4.158039569854736, 4.324787139892578, 4.49153470993042, 4.658282279968262, 4.8250298500061035, 4.991777420043945, 5.158524990081787, 5.325272560119629]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 7.0, 8.0, 6.0, 10.0, 8.0, 22.0, 22.0, 34.0, 82.0, 138.0, 338.0, 925.0, 3384.0, 19195.0, 3827233.0, 326171.0, 12301.0, 2553.0, 831.0, 365.0, 197.0, 122.0, 83.0, 61.0, 37.0, 35.0, 26.0, 22.0, 21.0, 13.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.37109375, -5.212646484375, -5.05419921875, -4.895751953125, -4.7373046875, -4.578857421875, -4.42041015625, -4.261962890625, -4.103515625, -3.945068359375, -3.78662109375, -3.628173828125, -3.4697265625, -3.311279296875, -3.15283203125, -2.994384765625, -2.8359375, -2.677490234375, -2.51904296875, -2.360595703125, -2.2021484375, -2.043701171875, -1.88525390625, -1.726806640625, -1.568359375, -1.409912109375, -1.25146484375, -1.093017578125, -0.9345703125, -0.776123046875, -0.61767578125, -0.459228515625, -0.30078125, -0.142333984375, 0.01611328125, 0.174560546875, 0.3330078125, 0.491455078125, 0.64990234375, 0.808349609375, 0.966796875, 1.125244140625, 1.28369140625, 1.442138671875, 1.6005859375, 1.759033203125, 1.91748046875, 2.075927734375, 2.234375, 2.392822265625, 2.55126953125, 2.709716796875, 2.8681640625, 3.026611328125, 3.18505859375, 3.343505859375, 3.501953125, 3.660400390625, 3.81884765625, 3.977294921875, 4.1357421875, 4.294189453125, 4.45263671875, 4.611083984375, 4.76953125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 11.0, 29.0, 33.0, 56.0, 68.0, 89.0, 103.0, 108.0, 84.0, 112.0, 76.0, 77.0, 42.0, 37.0, 23.0, 11.0, 11.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448486328125, -0.4330406188964844, -0.41759490966796875, -0.4021492004394531, -0.3867034912109375, -0.3712577819824219, -0.35581207275390625, -0.3403663635253906, -0.324920654296875, -0.3094749450683594, -0.29402923583984375, -0.2785835266113281, -0.2631378173828125, -0.24769210815429688, -0.23224639892578125, -0.21680068969726562, -0.20135498046875, -0.18590927124023438, -0.17046356201171875, -0.15501785278320312, -0.1395721435546875, -0.12412643432617188, -0.10868072509765625, -0.09323501586914062, -0.077789306640625, -0.062343597412109375, -0.04689788818359375, -0.031452178955078125, -0.0160064697265625, -0.000560760498046875, 0.01488494873046875, 0.030330657958984375, 0.0457763671875, 0.061222076416015625, 0.07666778564453125, 0.09211349487304688, 0.1075592041015625, 0.12300491333007812, 0.13845062255859375, 0.15389633178710938, 0.169342041015625, 0.18478775024414062, 0.20023345947265625, 0.21567916870117188, 0.2311248779296875, 0.24657058715820312, 0.26201629638671875, 0.2774620056152344, 0.29290771484375, 0.3083534240722656, 0.32379913330078125, 0.3392448425292969, 0.3546905517578125, 0.3701362609863281, 0.38558197021484375, 0.4010276794433594, 0.416473388671875, 0.4319190979003906, 0.44736480712890625, 0.4628105163574219, 0.4782562255859375, 0.4937019348144531, 0.5091476440429688, 0.5245933532714844, 0.5400390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 13.0, 27.0, 44.0, 59.0, 124.0, 236.0, 410.0, 772.0, 1561.0, 3212.0, 7509.0, 21593.0, 123156.0, 3807792.0, 186433.0, 25979.0, 8326.0, 3542.0, 1641.0, 801.0, 424.0, 258.0, 137.0, 71.0, 47.0, 32.0, 28.0, 7.0, 12.0, 7.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4921875, -2.42010498046875, -2.3480224609375, -2.27593994140625, -2.203857421875, -2.13177490234375, -2.0596923828125, -1.98760986328125, -1.91552734375, -1.84344482421875, -1.7713623046875, -1.69927978515625, -1.627197265625, -1.55511474609375, -1.4830322265625, -1.41094970703125, -1.3388671875, -1.26678466796875, -1.1947021484375, -1.12261962890625, -1.050537109375, -0.97845458984375, -0.9063720703125, -0.83428955078125, -0.76220703125, -0.69012451171875, -0.6180419921875, -0.54595947265625, -0.473876953125, -0.40179443359375, -0.3297119140625, -0.25762939453125, -0.185546875, -0.11346435546875, -0.0413818359375, 0.03070068359375, 0.102783203125, 0.17486572265625, 0.2469482421875, 0.31903076171875, 0.39111328125, 0.46319580078125, 0.5352783203125, 0.60736083984375, 0.679443359375, 0.75152587890625, 0.8236083984375, 0.89569091796875, 0.9677734375, 1.03985595703125, 1.1119384765625, 1.18402099609375, 1.256103515625, 1.32818603515625, 1.4002685546875, 1.47235107421875, 1.54443359375, 1.61651611328125, 1.6885986328125, 1.76068115234375, 1.832763671875, 1.90484619140625, 1.9769287109375, 2.04901123046875, 2.12109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 3.0, 5.0, 7.0, 5.0, 5.0, 12.0, 10.0, 19.0, 18.0, 24.0, 46.0, 77.0, 135.0, 290.0, 1064.0, 1585.0, 337.0, 168.0, 92.0, 47.0, 23.0, 22.0, 14.0, 8.0, 8.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.57568359375, -0.5565567016601562, -0.5374298095703125, -0.5183029174804688, -0.499176025390625, -0.48004913330078125, -0.4609222412109375, -0.44179534912109375, -0.42266845703125, -0.40354156494140625, -0.3844146728515625, -0.36528778076171875, -0.346160888671875, -0.32703399658203125, -0.3079071044921875, -0.28878021240234375, -0.2696533203125, -0.25052642822265625, -0.2313995361328125, -0.21227264404296875, -0.193145751953125, -0.17401885986328125, -0.1548919677734375, -0.13576507568359375, -0.11663818359375, -0.09751129150390625, -0.0783843994140625, -0.05925750732421875, -0.040130615234375, -0.02100372314453125, -0.0018768310546875, 0.01725006103515625, 0.036376953125, 0.05550384521484375, 0.0746307373046875, 0.09375762939453125, 0.112884521484375, 0.13201141357421875, 0.1511383056640625, 0.17026519775390625, 0.18939208984375, 0.20851898193359375, 0.2276458740234375, 0.24677276611328125, 0.265899658203125, 0.28502655029296875, 0.3041534423828125, 0.32328033447265625, 0.3424072265625, 0.36153411865234375, 0.3806610107421875, 0.39978790283203125, 0.418914794921875, 0.43804168701171875, 0.4571685791015625, 0.47629547119140625, 0.49542236328125, 0.5145492553710938, 0.5336761474609375, 0.5528030395507812, 0.571929931640625, 0.5910568237304688, 0.6101837158203125, 0.6293106079101562, 0.6484375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 7.0, 9.0, 13.0, 36.0, 50.0, 95.0, 179.0, 203.0, 186.0, 102.0, 52.0, 35.0, 12.0, 8.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484475612640381, -6.312633991241455, -6.140791893005371, -5.968950271606445, -5.7971086502075195, -5.6252665519714355, -5.45342493057251, -5.281582832336426, -5.1097412109375, -4.937899589538574, -4.76605749130249, -4.5942158699035645, -4.4223737716674805, -4.250532150268555, -4.078690528869629, -3.906848669052124, -3.735006809234619, -3.5631649494171143, -3.3913230895996094, -3.2194814682006836, -3.0476396083831787, -2.875797748565674, -2.703956127166748, -2.532114267349243, -2.3602724075317383, -2.1884305477142334, -2.0165886878967285, -1.8447470664978027, -1.6729052066802979, -1.501063346862793, -1.3292216062545776, -1.1573798656463623, -0.9855375289916992, -0.8136957287788391, -0.641853928565979, -0.4700121283531189, -0.2981703281402588, -0.12632852792739868, 0.045513272285461426, 0.21735501289367676, 0.38919687271118164, 0.5610386729240417, 0.7328804731369019, 0.904722273349762, 1.076564073562622, 1.248405933380127, 1.4202476739883423, 1.5920894145965576, 1.7639312744140625, 1.9357731342315674, 2.1076149940490723, 2.279456615447998, 2.451298475265503, 2.623140335083008, 2.7949819564819336, 2.9668238162994385, 3.1386656761169434, 3.3105075359344482, 3.482349395751953, 3.654191017150879, 3.826032876968384, 3.9978747367858887, 4.1697163581848145, 4.341558456420898, 4.513400077819824]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 10.0, 13.0, 9.0, 16.0, 20.0, 25.0, 27.0, 38.0, 33.0, 48.0, 40.0, 40.0, 51.0, 45.0, 42.0, 54.0, 56.0, 49.0, 57.0, 52.0, 53.0, 40.0, 20.0, 27.0, 20.0, 20.0, 13.0, 14.0, 14.0, 15.0, 14.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7820212841033936, -2.7063207626342773, -2.6306204795837402, -2.554919958114624, -2.479219675064087, -2.4035191535949707, -2.3278188705444336, -2.2521183490753174, -2.176417827606201, -2.100717306137085, -2.025017023086548, -1.9493165016174316, -1.873616099357605, -1.7979156970977783, -1.7222152948379517, -1.646514892578125, -1.5708144903182983, -1.4951140880584717, -1.419413685798645, -1.3437132835388184, -1.2680127620697021, -1.1923123598098755, -1.1166119575500488, -1.0409114360809326, -0.9652110934257507, -0.8895106911659241, -0.8138102293014526, -0.738109827041626, -0.6624094247817993, -0.5867089629173279, -0.5110085606575012, -0.4353080987930298, -0.3596076965332031, -0.2839072644710541, -0.20820684731006622, -0.13250643014907837, -0.05680599808692932, 0.018894433975219727, 0.09459483623504639, 0.17029529809951782, 0.24599570035934448, 0.32169613242149353, 0.3973965644836426, 0.47309696674346924, 0.5487973690032959, 0.6244978308677673, 0.700198233127594, 0.7758986949920654, 0.8515990972518921, 0.9272994995117188, 1.0029999017715454, 1.078700304031372, 1.1544008255004883, 1.230101227760315, 1.3058016300201416, 1.3815021514892578, 1.457202434539795, 1.5329028367996216, 1.6086032390594482, 1.6843037605285645, 1.7600041627883911, 1.8357045650482178, 1.9114049673080444, 1.987105369567871, 2.0628058910369873]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 18.0, 20.0, 18.0, 25.0, 43.0, 68.0, 122.0, 159.0, 283.0, 485.0, 1002.0, 2080.0, 5410.0, 18791.0, 119398.0, 629306.0, 227381.0, 31164.0, 7452.0, 2675.0, 1209.0, 552.0, 316.0, 176.0, 106.0, 89.0, 53.0, 27.0, 32.0, 15.0, 18.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.681060791015625, -2.59063720703125, -2.500213623046875, -2.4097900390625, -2.319366455078125, -2.22894287109375, -2.138519287109375, -2.048095703125, -1.957672119140625, -1.86724853515625, -1.776824951171875, -1.6864013671875, -1.595977783203125, -1.50555419921875, -1.415130615234375, -1.32470703125, -1.234283447265625, -1.14385986328125, -1.053436279296875, -0.9630126953125, -0.872589111328125, -0.78216552734375, -0.691741943359375, -0.601318359375, -0.510894775390625, -0.42047119140625, -0.330047607421875, -0.2396240234375, -0.149200439453125, -0.05877685546875, 0.031646728515625, 0.1220703125, 0.212493896484375, 0.30291748046875, 0.393341064453125, 0.4837646484375, 0.574188232421875, 0.66461181640625, 0.755035400390625, 0.845458984375, 0.935882568359375, 1.02630615234375, 1.116729736328125, 1.2071533203125, 1.297576904296875, 1.38800048828125, 1.478424072265625, 1.56884765625, 1.659271240234375, 1.74969482421875, 1.840118408203125, 1.9305419921875, 2.020965576171875, 2.11138916015625, 2.201812744140625, 2.292236328125, 2.382659912109375, 2.47308349609375, 2.563507080078125, 2.6539306640625, 2.744354248046875, 2.83477783203125, 2.925201416015625, 3.015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 15.0, 13.0, 32.0, 34.0, 53.0, 73.0, 82.0, 90.0, 101.0, 98.0, 105.0, 79.0, 67.0, 57.0, 35.0, 21.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.4423789978027344, -0.42650604248046875, -0.4106330871582031, -0.3947601318359375, -0.3788871765136719, -0.36301422119140625, -0.3471412658691406, -0.331268310546875, -0.3153953552246094, -0.29952239990234375, -0.2836494445800781, -0.2677764892578125, -0.2519035339355469, -0.23603057861328125, -0.22015762329101562, -0.20428466796875, -0.18841171264648438, -0.17253875732421875, -0.15666580200195312, -0.1407928466796875, -0.12491989135742188, -0.10904693603515625, -0.09317398071289062, -0.077301025390625, -0.061428070068359375, -0.04555511474609375, -0.029682159423828125, -0.0138092041015625, 0.002063751220703125, 0.01793670654296875, 0.033809661865234375, 0.0496826171875, 0.06555557250976562, 0.08142852783203125, 0.09730148315429688, 0.1131744384765625, 0.12904739379882812, 0.14492034912109375, 0.16079330444335938, 0.176666259765625, 0.19253921508789062, 0.20841217041015625, 0.22428512573242188, 0.2401580810546875, 0.2560310363769531, 0.27190399169921875, 0.2877769470214844, 0.30364990234375, 0.3195228576660156, 0.33539581298828125, 0.3512687683105469, 0.3671417236328125, 0.3830146789550781, 0.39888763427734375, 0.4147605895996094, 0.430633544921875, 0.4465065002441406, 0.46237945556640625, 0.4782524108886719, 0.4941253662109375, 0.5099983215332031, 0.5258712768554688, 0.5417442321777344, 0.5576171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 11.0, 17.0, 16.0, 17.0, 27.0, 42.0, 50.0, 63.0, 109.0, 161.0, 256.0, 459.0, 713.0, 1310.0, 2663.0, 5906.0, 14786.0, 40392.0, 120400.0, 317846.0, 336441.0, 133286.0, 44544.0, 16207.0, 6586.0, 2943.0, 1338.0, 739.0, 403.0, 259.0, 167.0, 97.0, 90.0, 54.0, 35.0, 36.0, 17.0, 21.0, 11.0, 6.0, 6.0, 5.0, 3.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1842193603515625, -1.144805908203125, -1.1053924560546875, -1.06597900390625, -1.0265655517578125, -0.987152099609375, -0.9477386474609375, -0.9083251953125, -0.8689117431640625, -0.829498291015625, -0.7900848388671875, -0.75067138671875, -0.7112579345703125, -0.671844482421875, -0.6324310302734375, -0.593017578125, -0.5536041259765625, -0.514190673828125, -0.4747772216796875, -0.43536376953125, -0.3959503173828125, -0.356536865234375, -0.3171234130859375, -0.2777099609375, -0.2382965087890625, -0.198883056640625, -0.1594696044921875, -0.12005615234375, -0.0806427001953125, -0.041229248046875, -0.0018157958984375, 0.03759765625, 0.0770111083984375, 0.116424560546875, 0.1558380126953125, 0.19525146484375, 0.2346649169921875, 0.274078369140625, 0.3134918212890625, 0.3529052734375, 0.3923187255859375, 0.431732177734375, 0.4711456298828125, 0.51055908203125, 0.5499725341796875, 0.589385986328125, 0.6287994384765625, 0.668212890625, 0.7076263427734375, 0.747039794921875, 0.7864532470703125, 0.82586669921875, 0.8652801513671875, 0.904693603515625, 0.9441070556640625, 0.9835205078125, 1.0229339599609375, 1.062347412109375, 1.1017608642578125, 1.14117431640625, 1.1805877685546875, 1.220001220703125, 1.2594146728515625, 1.298828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 9.0, 10.0, 8.0, 12.0, 14.0, 15.0, 20.0, 26.0, 33.0, 40.0, 37.0, 34.0, 36.0, 46.0, 48.0, 46.0, 51.0, 37.0, 52.0, 41.0, 45.0, 46.0, 44.0, 47.0, 22.0, 29.0, 30.0, 27.0, 18.0, 18.0, 8.0, 7.0, 12.0, 9.0, 6.0, 5.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.2169036865234375, -1.178924560546875, -1.1409454345703125, -1.10296630859375, -1.0649871826171875, -1.027008056640625, -0.9890289306640625, -0.9510498046875, -0.9130706787109375, -0.875091552734375, -0.8371124267578125, -0.79913330078125, -0.7611541748046875, -0.723175048828125, -0.6851959228515625, -0.647216796875, -0.6092376708984375, -0.571258544921875, -0.5332794189453125, -0.49530029296875, -0.4573211669921875, -0.419342041015625, -0.3813629150390625, -0.3433837890625, -0.3054046630859375, -0.267425537109375, -0.2294464111328125, -0.19146728515625, -0.1534881591796875, -0.115509033203125, -0.0775299072265625, -0.03955078125, -0.0015716552734375, 0.036407470703125, 0.0743865966796875, 0.11236572265625, 0.1503448486328125, 0.188323974609375, 0.2263031005859375, 0.2642822265625, 0.3022613525390625, 0.340240478515625, 0.3782196044921875, 0.41619873046875, 0.4541778564453125, 0.492156982421875, 0.5301361083984375, 0.568115234375, 0.6060943603515625, 0.644073486328125, 0.6820526123046875, 0.72003173828125, 0.7580108642578125, 0.795989990234375, 0.8339691162109375, 0.8719482421875, 0.9099273681640625, 0.947906494140625, 0.9858856201171875, 1.02386474609375, 1.0618438720703125, 1.099822998046875, 1.1378021240234375, 1.17578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 17.0, 37.0, 47.0, 88.0, 181.0, 313.0, 857.0, 3091.0, 20045.0, 341728.0, 640843.0, 34733.0, 4606.0, 1085.0, 396.0, 197.0, 101.0, 73.0, 40.0, 22.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.85546875, -1.80548095703125, -1.7554931640625, -1.70550537109375, -1.655517578125, -1.60552978515625, -1.5555419921875, -1.50555419921875, -1.45556640625, -1.40557861328125, -1.3555908203125, -1.30560302734375, -1.255615234375, -1.20562744140625, -1.1556396484375, -1.10565185546875, -1.0556640625, -1.00567626953125, -0.9556884765625, -0.90570068359375, -0.855712890625, -0.80572509765625, -0.7557373046875, -0.70574951171875, -0.65576171875, -0.60577392578125, -0.5557861328125, -0.50579833984375, -0.455810546875, -0.40582275390625, -0.3558349609375, -0.30584716796875, -0.255859375, -0.20587158203125, -0.1558837890625, -0.10589599609375, -0.055908203125, -0.00592041015625, 0.0440673828125, 0.09405517578125, 0.14404296875, 0.19403076171875, 0.2440185546875, 0.29400634765625, 0.343994140625, 0.39398193359375, 0.4439697265625, 0.49395751953125, 0.5439453125, 0.59393310546875, 0.6439208984375, 0.69390869140625, 0.743896484375, 0.79388427734375, 0.8438720703125, 0.89385986328125, 0.94384765625, 0.99383544921875, 1.0438232421875, 1.09381103515625, 1.143798828125, 1.19378662109375, 1.2437744140625, 1.29376220703125, 1.34375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 12.0, 16.0, 31.0, 47.0, 76.0, 96.0, 131.0, 160.0, 136.0, 93.0, 60.0, 41.0, 24.0, 12.0, 9.0, 7.0, 5.0, 7.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019216537475585938, -0.00018562376499176025, -0.00017908215522766113, -0.000172540545463562, -0.0001659989356994629, -0.00015945732593536377, -0.00015291571617126465, -0.00014637410640716553, -0.0001398324966430664, -0.00013329088687896729, -0.00012674927711486816, -0.00012020766735076904, -0.00011366605758666992, -0.0001071244478225708, -0.00010058283805847168, -9.404122829437256e-05, -8.749961853027344e-05, -8.095800876617432e-05, -7.44163990020752e-05, -6.787478923797607e-05, -6.133317947387695e-05, -5.479156970977783e-05, -4.824995994567871e-05, -4.170835018157959e-05, -3.516674041748047e-05, -2.8625130653381348e-05, -2.2083520889282227e-05, -1.5541911125183105e-05, -9.000301361083984e-06, -2.4586915969848633e-06, 4.082918167114258e-06, 1.0624527931213379e-05, 1.71661376953125e-05, 2.370774745941162e-05, 3.0249357223510742e-05, 3.679096698760986e-05, 4.3332576751708984e-05, 4.9874186515808105e-05, 5.6415796279907227e-05, 6.295740604400635e-05, 6.949901580810547e-05, 7.604062557220459e-05, 8.258223533630371e-05, 8.912384510040283e-05, 9.566545486450195e-05, 0.00010220706462860107, 0.0001087486743927002, 0.00011529028415679932, 0.00012183189392089844, 0.00012837350368499756, 0.00013491511344909668, 0.0001414567232131958, 0.00014799833297729492, 0.00015453994274139404, 0.00016108155250549316, 0.00016762316226959229, 0.0001741647720336914, 0.00018070638179779053, 0.00018724799156188965, 0.00019378960132598877, 0.0002003312110900879, 0.000206872820854187, 0.00021341443061828613, 0.00021995604038238525, 0.00022649765014648438]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 10.0, 9.0, 24.0, 46.0, 48.0, 98.0, 175.0, 471.0, 1610.0, 8752.0, 113499.0, 855823.0, 60008.0, 6007.0, 1202.0, 365.0, 178.0, 95.0, 46.0, 30.0, 18.0, 17.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.465728759765625, -1.40802001953125, -1.350311279296875, -1.2926025390625, -1.234893798828125, -1.17718505859375, -1.119476318359375, -1.061767578125, -1.004058837890625, -0.94635009765625, -0.888641357421875, -0.8309326171875, -0.773223876953125, -0.71551513671875, -0.657806396484375, -0.60009765625, -0.542388916015625, -0.48468017578125, -0.426971435546875, -0.3692626953125, -0.311553955078125, -0.25384521484375, -0.196136474609375, -0.138427734375, -0.080718994140625, -0.02301025390625, 0.034698486328125, 0.0924072265625, 0.150115966796875, 0.20782470703125, 0.265533447265625, 0.3232421875, 0.380950927734375, 0.43865966796875, 0.496368408203125, 0.5540771484375, 0.611785888671875, 0.66949462890625, 0.727203369140625, 0.784912109375, 0.842620849609375, 0.90032958984375, 0.958038330078125, 1.0157470703125, 1.073455810546875, 1.13116455078125, 1.188873291015625, 1.24658203125, 1.304290771484375, 1.36199951171875, 1.419708251953125, 1.4774169921875, 1.535125732421875, 1.59283447265625, 1.650543212890625, 1.708251953125, 1.765960693359375, 1.82366943359375, 1.881378173828125, 1.9390869140625, 1.996795654296875, 2.05450439453125, 2.112213134765625, 2.169921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 9.0, 12.0, 20.0, 27.0, 41.0, 51.0, 85.0, 111.0, 113.0, 140.0, 133.0, 81.0, 58.0, 39.0, 32.0, 20.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5354843139648438, -0.5060272216796875, -0.47657012939453125, -0.447113037109375, -0.41765594482421875, -0.3881988525390625, -0.35874176025390625, -0.32928466796875, -0.29982757568359375, -0.2703704833984375, -0.24091339111328125, -0.211456298828125, -0.18199920654296875, -0.1525421142578125, -0.12308502197265625, -0.0936279296875, -0.06417083740234375, -0.0347137451171875, -0.00525665283203125, 0.024200439453125, 0.05365753173828125, 0.0831146240234375, 0.11257171630859375, 0.14202880859375, 0.17148590087890625, 0.2009429931640625, 0.23040008544921875, 0.259857177734375, 0.28931427001953125, 0.3187713623046875, 0.34822845458984375, 0.377685546875, 0.40714263916015625, 0.4365997314453125, 0.46605682373046875, 0.495513916015625, 0.5249710083007812, 0.5544281005859375, 0.5838851928710938, 0.61334228515625, 0.6427993774414062, 0.6722564697265625, 0.7017135620117188, 0.731170654296875, 0.7606277465820312, 0.7900848388671875, 0.8195419311523438, 0.8489990234375, 0.8784561157226562, 0.9079132080078125, 0.9373703002929688, 0.966827392578125, 0.9962844848632812, 1.0257415771484375, 1.0551986694335938, 1.08465576171875, 1.1141128540039062, 1.1435699462890625, 1.1730270385742188, 1.202484130859375, 1.2319412231445312, 1.2613983154296875, 1.2908554077148438, 1.3203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 17.0, 40.0, 111.0, 216.0, 321.0, 174.0, 76.0, 32.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.068765640258789, -11.287035942077637, -10.505306243896484, -9.723577499389648, -8.941847801208496, -8.160118103027344, -7.37838888168335, -6.5966596603393555, -5.814929962158203, -5.033200263977051, -4.251471042633057, -3.4697415828704834, -2.68801212310791, -1.906282663345337, -1.1245532035827637, -0.34282398223876953, 0.4389057159423828, 1.220635175704956, 2.0023646354675293, 2.7840940952301025, 3.565823554992676, 4.347553253173828, 5.129282474517822, 5.911011695861816, 6.692741394042969, 7.474471092224121, 8.256200790405273, 9.03792953491211, 9.819659233093262, 10.601388931274414, 11.38311767578125, 12.164847373962402, 12.946578979492188, 13.72830867767334, 14.510038375854492, 15.291767120361328, 16.073497772216797, 16.855226516723633, 17.63695526123047, 18.418685913085938, 19.200414657592773, 19.98214340209961, 20.763874053955078, 21.545602798461914, 22.32733154296875, 23.10906219482422, 23.890790939331055, 24.67251968383789, 25.45425033569336, 26.235979080200195, 27.017709732055664, 27.7994384765625, 28.58116912841797, 29.362897872924805, 30.14462661743164, 30.92635726928711, 31.708086013793945, 32.48981475830078, 33.27154541015625, 34.05327606201172, 34.83500289916992, 35.61673355102539, 36.39846420288086, 37.18019104003906, 37.96192169189453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 6.0, 13.0, 19.0, 13.0, 17.0, 19.0, 20.0, 28.0, 20.0, 29.0, 38.0, 39.0, 30.0, 41.0, 45.0, 38.0, 51.0, 32.0, 46.0, 40.0, 39.0, 46.0, 28.0, 42.0, 32.0, 23.0, 24.0, 23.0, 27.0, 17.0, 21.0, 12.0, 11.0, 9.0, 7.0, 9.0, 2.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.174185752868652, -5.975380897521973, -5.776576519012451, -5.5777716636657715, -5.37896728515625, -5.18016242980957, -4.981357574462891, -4.782553195953369, -4.583748817443848, -4.384943962097168, -4.1861395835876465, -3.987334728240967, -3.7885303497314453, -3.5897254943847656, -3.390920877456665, -3.1921162605285645, -2.9933114051818848, -2.794506788253784, -2.5957021713256836, -2.396897315979004, -2.1980929374694824, -1.9992882013320923, -1.8004834651947021, -1.6016788482666016, -1.402874231338501, -1.2040696144104004, -1.0052649974822998, -0.8064602613449097, -0.6076556444168091, -0.4088510274887085, -0.21004629135131836, -0.011241674423217773, 0.18756341934204102, 0.386368066072464, 0.585172712802887, 0.7839773893356323, 0.9827820062637329, 1.1815866231918335, 1.3803913593292236, 1.5791959762573242, 1.7780005931854248, 1.9768052101135254, 2.175609827041626, 2.3744144439697266, 2.5732192993164062, 2.7720236778259277, 2.9708285331726074, 3.169633150100708, 3.3684377670288086, 3.567242383956909, 3.7660470008850098, 3.9648518562316895, 4.163656234741211, 4.362461090087891, 4.56126594543457, 4.760070323944092, 4.958874702453613, 5.157679557800293, 5.3564839363098145, 5.555288791656494, 5.754093170166016, 5.952898025512695, 6.151702880859375, 6.3505072593688965, 6.549312114715576]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 9.0, 11.0, 24.0, 36.0, 52.0, 80.0, 132.0, 239.0, 461.0, 1318.0, 4155.0, 18081.0, 452383.0, 3683279.0, 25534.0, 5238.0, 1654.0, 637.0, 308.0, 188.0, 113.0, 84.0, 58.0, 39.0, 30.0, 19.0, 23.0, 22.0, 9.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.69921875, -4.5614013671875, -4.423583984375, -4.2857666015625, -4.14794921875, -4.0101318359375, -3.872314453125, -3.7344970703125, -3.5966796875, -3.4588623046875, -3.321044921875, -3.1832275390625, -3.04541015625, -2.9075927734375, -2.769775390625, -2.6319580078125, -2.494140625, -2.3563232421875, -2.218505859375, -2.0806884765625, -1.94287109375, -1.8050537109375, -1.667236328125, -1.5294189453125, -1.3916015625, -1.2537841796875, -1.115966796875, -0.9781494140625, -0.84033203125, -0.7025146484375, -0.564697265625, -0.4268798828125, -0.2890625, -0.1512451171875, -0.013427734375, 0.1243896484375, 0.26220703125, 0.4000244140625, 0.537841796875, 0.6756591796875, 0.8134765625, 0.9512939453125, 1.089111328125, 1.2269287109375, 1.36474609375, 1.5025634765625, 1.640380859375, 1.7781982421875, 1.916015625, 2.0538330078125, 2.191650390625, 2.3294677734375, 2.46728515625, 2.6051025390625, 2.742919921875, 2.8807373046875, 3.0185546875, 3.1563720703125, 3.294189453125, 3.4320068359375, 3.56982421875, 3.7076416015625, 3.845458984375, 3.9832763671875, 4.12109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 15.0, 13.0, 21.0, 25.0, 40.0, 45.0, 68.0, 69.0, 87.0, 86.0, 86.0, 72.0, 85.0, 64.0, 61.0, 47.0, 34.0, 22.0, 9.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4397926330566406, -0.42475128173828125, -0.4097099304199219, -0.3946685791015625, -0.3796272277832031, -0.36458587646484375, -0.3495445251464844, -0.334503173828125, -0.3194618225097656, -0.30442047119140625, -0.2893791198730469, -0.2743377685546875, -0.2592964172363281, -0.24425506591796875, -0.22921371459960938, -0.21417236328125, -0.19913101196289062, -0.18408966064453125, -0.16904830932617188, -0.1540069580078125, -0.13896560668945312, -0.12392425537109375, -0.10888290405273438, -0.093841552734375, -0.07880020141601562, -0.06375885009765625, -0.048717498779296875, -0.0336761474609375, -0.018634796142578125, -0.00359344482421875, 0.011447906494140625, 0.0264892578125, 0.041530609130859375, 0.05657196044921875, 0.07161331176757812, 0.0866546630859375, 0.10169601440429688, 0.11673736572265625, 0.13177871704101562, 0.146820068359375, 0.16186141967773438, 0.17690277099609375, 0.19194412231445312, 0.2069854736328125, 0.22202682495117188, 0.23706817626953125, 0.2521095275878906, 0.26715087890625, 0.2821922302246094, 0.29723358154296875, 0.3122749328613281, 0.3273162841796875, 0.3423576354980469, 0.35739898681640625, 0.3724403381347656, 0.387481689453125, 0.4025230407714844, 0.41756439208984375, 0.4326057434082031, 0.4476470947265625, 0.4626884460449219, 0.47772979736328125, 0.4927711486816406, 0.5078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 11.0, 20.0, 36.0, 45.0, 72.0, 118.0, 198.0, 320.0, 545.0, 892.0, 1615.0, 3346.0, 7419.0, 19648.0, 70440.0, 1489584.0, 2484813.0, 77961.0, 21003.0, 8015.0, 3686.0, 1916.0, 1016.0, 551.0, 363.0, 199.0, 133.0, 102.0, 63.0, 41.0, 28.0, 13.0, 13.0, 10.0, 4.0, 2.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0], "bins": [-2.365234375, -2.30303955078125, -2.2408447265625, -2.17864990234375, -2.116455078125, -2.05426025390625, -1.9920654296875, -1.92987060546875, -1.86767578125, -1.80548095703125, -1.7432861328125, -1.68109130859375, -1.618896484375, -1.55670166015625, -1.4945068359375, -1.43231201171875, -1.3701171875, -1.30792236328125, -1.2457275390625, -1.18353271484375, -1.121337890625, -1.05914306640625, -0.9969482421875, -0.93475341796875, -0.87255859375, -0.81036376953125, -0.7481689453125, -0.68597412109375, -0.623779296875, -0.56158447265625, -0.4993896484375, -0.43719482421875, -0.375, -0.31280517578125, -0.2506103515625, -0.18841552734375, -0.126220703125, -0.06402587890625, -0.0018310546875, 0.06036376953125, 0.12255859375, 0.18475341796875, 0.2469482421875, 0.30914306640625, 0.371337890625, 0.43353271484375, 0.4957275390625, 0.55792236328125, 0.6201171875, 0.68231201171875, 0.7445068359375, 0.80670166015625, 0.868896484375, 0.93109130859375, 0.9932861328125, 1.05548095703125, 1.11767578125, 1.17987060546875, 1.2420654296875, 1.30426025390625, 1.366455078125, 1.42864990234375, 1.4908447265625, 1.55303955078125, 1.615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 15.0, 10.0, 21.0, 40.0, 35.0, 68.0, 183.0, 468.0, 2085.0, 686.0, 180.0, 97.0, 46.0, 35.0, 20.0, 14.0, 13.0, 9.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9089431762695312, -0.8759918212890625, -0.8430404663085938, -0.810089111328125, -0.7771377563476562, -0.7441864013671875, -0.7112350463867188, -0.67828369140625, -0.6453323364257812, -0.6123809814453125, -0.5794296264648438, -0.546478271484375, -0.5135269165039062, -0.4805755615234375, -0.44762420654296875, -0.4146728515625, -0.38172149658203125, -0.3487701416015625, -0.31581878662109375, -0.282867431640625, -0.24991607666015625, -0.2169647216796875, -0.18401336669921875, -0.15106201171875, -0.11811065673828125, -0.0851593017578125, -0.05220794677734375, -0.019256591796875, 0.01369476318359375, 0.0466461181640625, 0.07959747314453125, 0.112548828125, 0.14550018310546875, 0.1784515380859375, 0.21140289306640625, 0.244354248046875, 0.27730560302734375, 0.3102569580078125, 0.34320831298828125, 0.37615966796875, 0.40911102294921875, 0.4420623779296875, 0.47501373291015625, 0.507965087890625, 0.5409164428710938, 0.5738677978515625, 0.6068191528320312, 0.6397705078125, 0.6727218627929688, 0.7056732177734375, 0.7386245727539062, 0.771575927734375, 0.8045272827148438, 0.8374786376953125, 0.8704299926757812, 0.90338134765625, 0.9363327026367188, 0.9692840576171875, 1.0022354125976562, 1.035186767578125, 1.0681381225585938, 1.1010894775390625, 1.1340408325195312, 1.1669921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 36.0, 106.0, 288.0, 328.0, 148.0, 54.0, 23.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.847047805786133, -11.43986701965332, -11.032686233520508, -10.625505447387695, -10.2183256149292, -9.811144828796387, -9.403964042663574, -8.996783256530762, -8.589603424072266, -8.182422637939453, -7.775242328643799, -7.368061542510986, -6.960881233215332, -6.5537004470825195, -6.146519660949707, -5.7393388748168945, -5.332158088684082, -4.9249773025512695, -4.517796993255615, -4.110616207122803, -3.7034356594085693, -3.296255111694336, -2.8890743255615234, -2.48189377784729, -2.0747132301330566, -1.6675326824188232, -1.2603520154953003, -0.8531713485717773, -0.44599080085754395, -0.03881025314331055, 0.36837053298950195, 0.7755510807037354, 1.1827316284179688, 1.5899121761322021, 1.997092843055725, 2.404273509979248, 2.8114540576934814, 3.218634605407715, 3.6258153915405273, 4.03299617767334, 4.440176486968994, 4.847357273101807, 5.254537582397461, 5.661718368530273, 6.068899154663086, 6.47607946395874, 6.883260250091553, 7.290440559387207, 7.6976213455200195, 8.104802131652832, 8.511982917785645, 8.91916275024414, 9.326343536376953, 9.733524322509766, 10.140705108642578, 10.54788589477539, 10.955066680908203, 11.362247467041016, 11.769428253173828, 12.17660903930664, 12.583788871765137, 12.99096965789795, 13.398150444030762, 13.805331230163574, 14.21251106262207]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 11.0, 10.0, 17.0, 16.0, 14.0, 13.0, 17.0, 33.0, 32.0, 49.0, 33.0, 48.0, 56.0, 58.0, 57.0, 49.0, 41.0, 59.0, 54.0, 51.0, 41.0, 37.0, 43.0, 32.0, 21.0, 28.0, 22.0, 20.0, 14.0, 5.0, 8.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.402423858642578, -3.296762228012085, -3.191100597381592, -3.0854389667510986, -2.9797773361206055, -2.874115467071533, -2.76845383644104, -2.662792205810547, -2.5571305751800537, -2.4514689445495605, -2.3458073139190674, -2.240145683288574, -2.134483814239502, -2.028822422027588, -1.9231605529785156, -1.8174989223480225, -1.7118372917175293, -1.6061756610870361, -1.500514030456543, -1.3948522806167603, -1.289190649986267, -1.183529019355774, -1.0778672695159912, -0.972205638885498, -0.8665440082550049, -0.7608823776245117, -0.6552206873893738, -0.5495589971542358, -0.4438973665237427, -0.3382357358932495, -0.23257404565811157, -0.12691235542297363, -0.02125072479248047, 0.08441093564033508, 0.19007259607315063, 0.2957342565059662, 0.40139591693878174, 0.5070575475692749, 0.6127192378044128, 0.7183809280395508, 0.824042558670044, 0.9297041893005371, 1.0353658199310303, 1.141027569770813, 1.2466892004013062, 1.3523508310317993, 1.458012580871582, 1.5636742115020752, 1.6693358421325684, 1.7749974727630615, 1.8806591033935547, 1.9863208532333374, 2.091982364654541, 2.1976442337036133, 2.3033058643341064, 2.4089674949645996, 2.5146291255950928, 2.620290756225586, 2.725952386856079, 2.8316140174865723, 2.9372758865356445, 3.0429372787475586, 3.148599147796631, 3.254260778427124, 3.359922409057617]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 3.0, 15.0, 12.0, 11.0, 20.0, 56.0, 58.0, 80.0, 164.0, 288.0, 617.0, 1353.0, 3865.0, 15188.0, 117427.0, 792467.0, 97288.0, 13539.0, 3518.0, 1237.0, 575.0, 292.0, 167.0, 101.0, 56.0, 52.0, 37.0, 18.0, 9.0, 12.0, 9.0, 5.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.75390625, -3.638275146484375, -3.52264404296875, -3.407012939453125, -3.2913818359375, -3.175750732421875, -3.06011962890625, -2.944488525390625, -2.828857421875, -2.713226318359375, -2.59759521484375, -2.481964111328125, -2.3663330078125, -2.250701904296875, -2.13507080078125, -2.019439697265625, -1.90380859375, -1.788177490234375, -1.67254638671875, -1.556915283203125, -1.4412841796875, -1.325653076171875, -1.21002197265625, -1.094390869140625, -0.978759765625, -0.863128662109375, -0.74749755859375, -0.631866455078125, -0.5162353515625, -0.400604248046875, -0.28497314453125, -0.169342041015625, -0.0537109375, 0.061920166015625, 0.17755126953125, 0.293182373046875, 0.4088134765625, 0.524444580078125, 0.64007568359375, 0.755706787109375, 0.871337890625, 0.986968994140625, 1.10260009765625, 1.218231201171875, 1.3338623046875, 1.449493408203125, 1.56512451171875, 1.680755615234375, 1.79638671875, 1.912017822265625, 2.02764892578125, 2.143280029296875, 2.2589111328125, 2.374542236328125, 2.49017333984375, 2.605804443359375, 2.721435546875, 2.837066650390625, 2.95269775390625, 3.068328857421875, 3.1839599609375, 3.299591064453125, 3.41522216796875, 3.530853271484375, 3.646484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 8.0, 19.0, 17.0, 28.0, 40.0, 58.0, 70.0, 74.0, 100.0, 86.0, 92.0, 81.0, 75.0, 74.0, 50.0, 29.0, 27.0, 19.0, 16.0, 12.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44677734375, -0.43021392822265625, -0.4136505126953125, -0.39708709716796875, -0.380523681640625, -0.36396026611328125, -0.3473968505859375, -0.33083343505859375, -0.31427001953125, -0.29770660400390625, -0.2811431884765625, -0.26457977294921875, -0.248016357421875, -0.23145294189453125, -0.2148895263671875, -0.19832611083984375, -0.1817626953125, -0.16519927978515625, -0.1486358642578125, -0.13207244873046875, -0.115509033203125, -0.09894561767578125, -0.0823822021484375, -0.06581878662109375, -0.04925537109375, -0.03269195556640625, -0.0161285400390625, 0.00043487548828125, 0.016998291015625, 0.03356170654296875, 0.0501251220703125, 0.06668853759765625, 0.083251953125, 0.09981536865234375, 0.1163787841796875, 0.13294219970703125, 0.149505615234375, 0.16606903076171875, 0.1826324462890625, 0.19919586181640625, 0.21575927734375, 0.23232269287109375, 0.2488861083984375, 0.26544952392578125, 0.282012939453125, 0.29857635498046875, 0.3151397705078125, 0.33170318603515625, 0.3482666015625, 0.36483001708984375, 0.3813934326171875, 0.39795684814453125, 0.414520263671875, 0.43108367919921875, 0.4476470947265625, 0.46421051025390625, 0.48077392578125, 0.49733734130859375, 0.5139007568359375, 0.5304641723632812, 0.547027587890625, 0.5635910034179688, 0.5801544189453125, 0.5967178344726562, 0.61328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 11.0, 9.0, 8.0, 23.0, 24.0, 37.0, 65.0, 107.0, 152.0, 264.0, 549.0, 1125.0, 2496.0, 6729.0, 21732.0, 95293.0, 522385.0, 320087.0, 54820.0, 14188.0, 4674.0, 1865.0, 856.0, 440.0, 222.0, 124.0, 87.0, 51.0, 28.0, 26.0, 21.0, 10.0, 8.0, 4.0, 8.0, 1.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.73828125, -1.6800079345703125, -1.621734619140625, -1.5634613037109375, -1.50518798828125, -1.4469146728515625, -1.388641357421875, -1.3303680419921875, -1.2720947265625, -1.2138214111328125, -1.155548095703125, -1.0972747802734375, -1.03900146484375, -0.9807281494140625, -0.922454833984375, -0.8641815185546875, -0.805908203125, -0.7476348876953125, -0.689361572265625, -0.6310882568359375, -0.57281494140625, -0.5145416259765625, -0.456268310546875, -0.3979949951171875, -0.3397216796875, -0.2814483642578125, -0.223175048828125, -0.1649017333984375, -0.10662841796875, -0.0483551025390625, 0.009918212890625, 0.0681915283203125, 0.12646484375, 0.1847381591796875, 0.243011474609375, 0.3012847900390625, 0.35955810546875, 0.4178314208984375, 0.476104736328125, 0.5343780517578125, 0.5926513671875, 0.6509246826171875, 0.709197998046875, 0.7674713134765625, 0.82574462890625, 0.8840179443359375, 0.942291259765625, 1.0005645751953125, 1.058837890625, 1.1171112060546875, 1.175384521484375, 1.2336578369140625, 1.29193115234375, 1.3502044677734375, 1.408477783203125, 1.4667510986328125, 1.5250244140625, 1.5832977294921875, 1.641571044921875, 1.6998443603515625, 1.75811767578125, 1.8163909912109375, 1.874664306640625, 1.9329376220703125, 1.9912109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 4.0, 5.0, 12.0, 7.0, 9.0, 17.0, 17.0, 16.0, 17.0, 16.0, 23.0, 32.0, 36.0, 38.0, 41.0, 48.0, 49.0, 42.0, 53.0, 41.0, 40.0, 43.0, 36.0, 38.0, 44.0, 44.0, 43.0, 29.0, 31.0, 19.0, 18.0, 13.0, 15.0, 13.0, 8.0, 14.0, 5.0, 7.0, 6.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2428131103515625, -1.203399658203125, -1.1639862060546875, -1.12457275390625, -1.0851593017578125, -1.045745849609375, -1.0063323974609375, -0.9669189453125, -0.9275054931640625, -0.888092041015625, -0.8486785888671875, -0.80926513671875, -0.7698516845703125, -0.730438232421875, -0.6910247802734375, -0.651611328125, -0.6121978759765625, -0.572784423828125, -0.5333709716796875, -0.49395751953125, -0.4545440673828125, -0.415130615234375, -0.3757171630859375, -0.3363037109375, -0.2968902587890625, -0.257476806640625, -0.2180633544921875, -0.17864990234375, -0.1392364501953125, -0.099822998046875, -0.0604095458984375, -0.02099609375, 0.0184173583984375, 0.057830810546875, 0.0972442626953125, 0.13665771484375, 0.1760711669921875, 0.215484619140625, 0.2548980712890625, 0.2943115234375, 0.3337249755859375, 0.373138427734375, 0.4125518798828125, 0.45196533203125, 0.4913787841796875, 0.530792236328125, 0.5702056884765625, 0.609619140625, 0.6490325927734375, 0.688446044921875, 0.7278594970703125, 0.76727294921875, 0.8066864013671875, 0.846099853515625, 0.8855133056640625, 0.9249267578125, 0.9643402099609375, 1.003753662109375, 1.0431671142578125, 1.08258056640625, 1.1219940185546875, 1.161407470703125, 1.2008209228515625, 1.240234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 12.0, 19.0, 15.0, 33.0, 55.0, 105.0, 228.0, 479.0, 1321.0, 4566.0, 24387.0, 355895.0, 616515.0, 35929.0, 6216.0, 1642.0, 530.0, 241.0, 125.0, 69.0, 34.0, 31.0, 20.0, 17.0, 13.0, 8.0, 4.0, 8.0, 2.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.0322265625, -0.9967498779296875, -0.961273193359375, -0.9257965087890625, -0.89031982421875, -0.8548431396484375, -0.819366455078125, -0.7838897705078125, -0.7484130859375, -0.7129364013671875, -0.677459716796875, -0.6419830322265625, -0.60650634765625, -0.5710296630859375, -0.535552978515625, -0.5000762939453125, -0.464599609375, -0.4291229248046875, -0.393646240234375, -0.3581695556640625, -0.32269287109375, -0.2872161865234375, -0.251739501953125, -0.2162628173828125, -0.1807861328125, -0.1453094482421875, -0.109832763671875, -0.0743560791015625, -0.03887939453125, -0.0034027099609375, 0.032073974609375, 0.0675506591796875, 0.10302734375, 0.1385040283203125, 0.173980712890625, 0.2094573974609375, 0.24493408203125, 0.2804107666015625, 0.315887451171875, 0.3513641357421875, 0.3868408203125, 0.4223175048828125, 0.457794189453125, 0.4932708740234375, 0.52874755859375, 0.5642242431640625, 0.599700927734375, 0.6351776123046875, 0.670654296875, 0.7061309814453125, 0.741607666015625, 0.7770843505859375, 0.81256103515625, 0.8480377197265625, 0.883514404296875, 0.9189910888671875, 0.9544677734375, 0.9899444580078125, 1.025421142578125, 1.0608978271484375, 1.09637451171875, 1.1318511962890625, 1.167327880859375, 1.2028045654296875, 1.23828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 12.0, 13.0, 20.0, 21.0, 32.0, 72.0, 111.0, 209.0, 182.0, 114.0, 70.0, 46.0, 22.0, 21.0, 14.0, 11.0, 12.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015091896057128906, -0.00014552287757396698, -0.0001401267945766449, -0.00013473071157932281, -0.00012933462858200073, -0.00012393854558467865, -0.00011854246258735657, -0.00011314637959003448, -0.0001077502965927124, -0.00010235421359539032, -9.695813059806824e-05, -9.156204760074615e-05, -8.616596460342407e-05, -8.076988160610199e-05, -7.537379860877991e-05, -6.997771561145782e-05, -6.458163261413574e-05, -5.918554961681366e-05, -5.378946661949158e-05, -4.8393383622169495e-05, -4.299730062484741e-05, -3.760121762752533e-05, -3.220513463020325e-05, -2.6809051632881165e-05, -2.1412968635559082e-05, -1.6016885638237e-05, -1.0620802640914917e-05, -5.2247196435928345e-06, 1.7136335372924805e-07, 5.5674463510513306e-06, 1.0963529348373413e-05, 1.6359612345695496e-05, 2.1755695343017578e-05, 2.715177834033966e-05, 3.254786133766174e-05, 3.7943944334983826e-05, 4.334002733230591e-05, 4.873611032962799e-05, 5.413219332695007e-05, 5.9528276324272156e-05, 6.492435932159424e-05, 7.032044231891632e-05, 7.57165253162384e-05, 8.111260831356049e-05, 8.650869131088257e-05, 9.190477430820465e-05, 9.730085730552673e-05, 0.00010269694030284882, 0.0001080930233001709, 0.00011348910629749298, 0.00011888518929481506, 0.00012428127229213715, 0.00012967735528945923, 0.0001350734382867813, 0.0001404695212841034, 0.00014586560428142548, 0.00015126168727874756, 0.00015665777027606964, 0.00016205385327339172, 0.0001674499362707138, 0.0001728460192680359, 0.00017824210226535797, 0.00018363818526268005, 0.00018903426826000214, 0.00019443035125732422]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 7.0, 6.0, 10.0, 28.0, 24.0, 60.0, 73.0, 99.0, 193.0, 423.0, 929.0, 2782.0, 13661.0, 185350.0, 800559.0, 36331.0, 5241.0, 1496.0, 607.0, 259.0, 143.0, 96.0, 54.0, 53.0, 21.0, 15.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.225494384765625, -1.18048095703125, -1.135467529296875, -1.0904541015625, -1.045440673828125, -1.00042724609375, -0.955413818359375, -0.910400390625, -0.865386962890625, -0.82037353515625, -0.775360107421875, -0.7303466796875, -0.685333251953125, -0.64031982421875, -0.595306396484375, -0.55029296875, -0.505279541015625, -0.46026611328125, -0.415252685546875, -0.3702392578125, -0.325225830078125, -0.28021240234375, -0.235198974609375, -0.190185546875, -0.145172119140625, -0.10015869140625, -0.055145263671875, -0.0101318359375, 0.034881591796875, 0.07989501953125, 0.124908447265625, 0.169921875, 0.214935302734375, 0.25994873046875, 0.304962158203125, 0.3499755859375, 0.394989013671875, 0.44000244140625, 0.485015869140625, 0.530029296875, 0.575042724609375, 0.62005615234375, 0.665069580078125, 0.7100830078125, 0.755096435546875, 0.80010986328125, 0.845123291015625, 0.89013671875, 0.935150146484375, 0.98016357421875, 1.025177001953125, 1.0701904296875, 1.115203857421875, 1.16021728515625, 1.205230712890625, 1.250244140625, 1.295257568359375, 1.34027099609375, 1.385284423828125, 1.4302978515625, 1.475311279296875, 1.52032470703125, 1.565338134765625, 1.6103515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 13.0, 18.0, 22.0, 42.0, 42.0, 93.0, 151.0, 190.0, 159.0, 97.0, 40.0, 31.0, 22.0, 21.0, 19.0, 11.0, 3.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.8878860473632812, -0.8597564697265625, -0.8316268920898438, -0.803497314453125, -0.7753677368164062, -0.7472381591796875, -0.7191085815429688, -0.69097900390625, -0.6628494262695312, -0.6347198486328125, -0.6065902709960938, -0.578460693359375, -0.5503311157226562, -0.5222015380859375, -0.49407196044921875, -0.4659423828125, -0.43781280517578125, -0.4096832275390625, -0.38155364990234375, -0.353424072265625, -0.32529449462890625, -0.2971649169921875, -0.26903533935546875, -0.24090576171875, -0.21277618408203125, -0.1846466064453125, -0.15651702880859375, -0.128387451171875, -0.10025787353515625, -0.0721282958984375, -0.04399871826171875, -0.015869140625, 0.01226043701171875, 0.0403900146484375, 0.06851959228515625, 0.096649169921875, 0.12477874755859375, 0.1529083251953125, 0.18103790283203125, 0.20916748046875, 0.23729705810546875, 0.2654266357421875, 0.29355621337890625, 0.321685791015625, 0.34981536865234375, 0.3779449462890625, 0.40607452392578125, 0.4342041015625, 0.46233367919921875, 0.4904632568359375, 0.5185928344726562, 0.546722412109375, 0.5748519897460938, 0.6029815673828125, 0.6311111450195312, 0.65924072265625, 0.6873703002929688, 0.7154998779296875, 0.7436294555664062, 0.771759033203125, 0.7998886108398438, 0.8280181884765625, 0.8561477661132812, 0.88427734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 9.0, 34.0, 51.0, 89.0, 128.0, 167.0, 192.0, 143.0, 93.0, 49.0, 18.0, 13.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.13174057006836, -21.66269874572754, -21.19365692138672, -20.7246150970459, -20.255573272705078, -19.786529541015625, -19.317487716674805, -18.848445892333984, -18.379404067993164, -17.910362243652344, -17.441320419311523, -16.972278594970703, -16.503236770629883, -16.034194946289062, -15.565152168273926, -15.096109390258789, -14.627067565917969, -14.158025741577148, -13.688983917236328, -13.219941139221191, -12.750899314880371, -12.28185749053955, -11.81281566619873, -11.343772888183594, -10.87473201751709, -10.40569019317627, -9.93664836883545, -9.467605590820312, -8.998563766479492, -8.529521942138672, -8.060480117797852, -7.591437816619873, -7.1223955154418945, -6.653353691101074, -6.184311389923096, -5.715269565582275, -5.246227264404297, -4.777185440063477, -4.308143615722656, -3.8391013145446777, -3.3700592517852783, -2.901017189025879, -2.4319751262664795, -1.9629331827163696, -1.4938911199569702, -1.0248491764068604, -0.5558071136474609, -0.08676505088806152, 0.3822770118713379, 0.8513190746307373, 1.3203611373901367, 1.7894030809402466, 2.2584452629089355, 2.727487087249756, 3.1965291500091553, 3.6655712127685547, 4.134613037109375, 4.603654861450195, 5.072697162628174, 5.541738986968994, 6.010781288146973, 6.479823112487793, 6.948864936828613, 7.417907238006592, 7.88694953918457]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 12.0, 10.0, 15.0, 14.0, 13.0, 15.0, 21.0, 23.0, 27.0, 29.0, 19.0, 35.0, 30.0, 35.0, 33.0, 35.0, 45.0, 40.0, 43.0, 31.0, 35.0, 31.0, 29.0, 38.0, 46.0, 41.0, 30.0, 33.0, 32.0, 24.0, 15.0, 18.0, 11.0, 21.0, 5.0, 10.0, 11.0, 6.0, 10.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.049078941345215, -4.876288890838623, -4.703498363494873, -4.530708312988281, -4.357917785644531, -4.1851277351379395, -4.012337684631348, -3.8395471572875977, -3.666757106781006, -3.493966817855835, -3.321176528930664, -3.1483864784240723, -2.9755961894989014, -2.8028059005737305, -2.6300156116485596, -2.4572253227233887, -2.2844350337982178, -2.111644744873047, -1.9388545751571655, -1.7660642862319946, -1.5932741165161133, -1.4204838275909424, -1.2476935386657715, -1.0749033689498901, -0.9021130800247192, -0.7293228507041931, -0.556532621383667, -0.3837423324584961, -0.21095210313796997, -0.03816187381744385, 0.13462841510772705, 0.3074185848236084, 0.4802088737487793, 0.6529991030693054, 0.8257893323898315, 0.9985796213150024, 1.1713697910308838, 1.3441600799560547, 1.5169503688812256, 1.689740538597107, 1.8625308275222778, 2.035320997238159, 2.20811128616333, 2.380901575088501, 2.553691864013672, 2.7264819145202637, 2.8992724418640137, 3.0720624923706055, 3.2448527812957764, 3.4176430702209473, 3.590433359146118, 3.763223648071289, 3.936013698577881, 4.108803749084473, 4.281594276428223, 4.4543843269348145, 4.6271748542785645, 4.799964904785156, 4.972755432128906, 5.145545482635498, 5.318336009979248, 5.49112606048584, 5.66391658782959, 5.836706638336182, 6.009496688842773]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 12.0, 3.0, 9.0, 11.0, 13.0, 27.0, 30.0, 41.0, 75.0, 139.0, 256.0, 586.0, 1617.0, 5729.0, 37030.0, 4058061.0, 78360.0, 8462.0, 2237.0, 757.0, 307.0, 178.0, 96.0, 55.0, 50.0, 24.0, 27.0, 10.0, 26.0, 10.0, 9.0, 9.0, 8.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.609375, -4.463623046875, -4.31787109375, -4.172119140625, -4.0263671875, -3.880615234375, -3.73486328125, -3.589111328125, -3.443359375, -3.297607421875, -3.15185546875, -3.006103515625, -2.8603515625, -2.714599609375, -2.56884765625, -2.423095703125, -2.27734375, -2.131591796875, -1.98583984375, -1.840087890625, -1.6943359375, -1.548583984375, -1.40283203125, -1.257080078125, -1.111328125, -0.965576171875, -0.81982421875, -0.674072265625, -0.5283203125, -0.382568359375, -0.23681640625, -0.091064453125, 0.0546875, 0.200439453125, 0.34619140625, 0.491943359375, 0.6376953125, 0.783447265625, 0.92919921875, 1.074951171875, 1.220703125, 1.366455078125, 1.51220703125, 1.657958984375, 1.8037109375, 1.949462890625, 2.09521484375, 2.240966796875, 2.38671875, 2.532470703125, 2.67822265625, 2.823974609375, 2.9697265625, 3.115478515625, 3.26123046875, 3.406982421875, 3.552734375, 3.698486328125, 3.84423828125, 3.989990234375, 4.1357421875, 4.281494140625, 4.42724609375, 4.572998046875, 4.71875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 4.0, 9.0, 19.0, 15.0, 20.0, 33.0, 51.0, 67.0, 68.0, 77.0, 100.0, 82.0, 89.0, 102.0, 65.0, 56.0, 47.0, 24.0, 20.0, 15.0, 18.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447021484375, -0.4301261901855469, -0.41323089599609375, -0.3963356018066406, -0.3794403076171875, -0.3625450134277344, -0.34564971923828125, -0.3287544250488281, -0.311859130859375, -0.2949638366699219, -0.27806854248046875, -0.2611732482910156, -0.2442779541015625, -0.22738265991210938, -0.21048736572265625, -0.19359207153320312, -0.17669677734375, -0.15980148315429688, -0.14290618896484375, -0.12601089477539062, -0.1091156005859375, -0.09222030639648438, -0.07532501220703125, -0.058429718017578125, -0.041534423828125, -0.024639129638671875, -0.00774383544921875, 0.009151458740234375, 0.0260467529296875, 0.042942047119140625, 0.05983734130859375, 0.07673263549804688, 0.0936279296875, 0.11052322387695312, 0.12741851806640625, 0.14431381225585938, 0.1612091064453125, 0.17810440063476562, 0.19499969482421875, 0.21189498901367188, 0.228790283203125, 0.24568557739257812, 0.26258087158203125, 0.2794761657714844, 0.2963714599609375, 0.3132667541503906, 0.33016204833984375, 0.3470573425292969, 0.36395263671875, 0.3808479309082031, 0.39774322509765625, 0.4146385192871094, 0.4315338134765625, 0.4484291076660156, 0.46532440185546875, 0.4822196960449219, 0.499114990234375, 0.5160102844238281, 0.5329055786132812, 0.5498008728027344, 0.5666961669921875, 0.5835914611816406, 0.6004867553710938, 0.6173820495605469, 0.63427734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 13.0, 17.0, 18.0, 25.0, 55.0, 92.0, 134.0, 233.0, 383.0, 758.0, 1512.0, 3327.0, 9038.0, 39792.0, 3343764.0, 749819.0, 31198.0, 7914.0, 3072.0, 1394.0, 703.0, 382.0, 229.0, 140.0, 97.0, 60.0, 37.0, 25.0, 9.0, 12.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.5750732421875, -3.478271484375, -3.3814697265625, -3.28466796875, -3.1878662109375, -3.091064453125, -2.9942626953125, -2.8974609375, -2.8006591796875, -2.703857421875, -2.6070556640625, -2.51025390625, -2.4134521484375, -2.316650390625, -2.2198486328125, -2.123046875, -2.0262451171875, -1.929443359375, -1.8326416015625, -1.73583984375, -1.6390380859375, -1.542236328125, -1.4454345703125, -1.3486328125, -1.2518310546875, -1.155029296875, -1.0582275390625, -0.96142578125, -0.8646240234375, -0.767822265625, -0.6710205078125, -0.57421875, -0.4774169921875, -0.380615234375, -0.2838134765625, -0.18701171875, -0.0902099609375, 0.006591796875, 0.1033935546875, 0.2001953125, 0.2969970703125, 0.393798828125, 0.4906005859375, 0.58740234375, 0.6842041015625, 0.781005859375, 0.8778076171875, 0.974609375, 1.0714111328125, 1.168212890625, 1.2650146484375, 1.36181640625, 1.4586181640625, 1.555419921875, 1.6522216796875, 1.7490234375, 1.8458251953125, 1.942626953125, 2.0394287109375, 2.13623046875, 2.2330322265625, 2.329833984375, 2.4266357421875, 2.5234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 20.0, 18.0, 27.0, 56.0, 118.0, 524.0, 2745.0, 307.0, 96.0, 48.0, 30.0, 17.0, 13.0, 8.0, 8.0, 6.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1408233642578125, -1.101959228515625, -1.0630950927734375, -1.02423095703125, -0.9853668212890625, -0.946502685546875, -0.9076385498046875, -0.8687744140625, -0.8299102783203125, -0.791046142578125, -0.7521820068359375, -0.71331787109375, -0.6744537353515625, -0.635589599609375, -0.5967254638671875, -0.557861328125, -0.5189971923828125, -0.480133056640625, -0.4412689208984375, -0.40240478515625, -0.3635406494140625, -0.324676513671875, -0.2858123779296875, -0.2469482421875, -0.2080841064453125, -0.169219970703125, -0.1303558349609375, -0.09149169921875, -0.0526275634765625, -0.013763427734375, 0.0251007080078125, 0.06396484375, 0.1028289794921875, 0.141693115234375, 0.1805572509765625, 0.21942138671875, 0.2582855224609375, 0.297149658203125, 0.3360137939453125, 0.3748779296875, 0.4137420654296875, 0.452606201171875, 0.4914703369140625, 0.53033447265625, 0.5691986083984375, 0.608062744140625, 0.6469268798828125, 0.685791015625, 0.7246551513671875, 0.763519287109375, 0.8023834228515625, 0.84124755859375, 0.8801116943359375, 0.918975830078125, 0.9578399658203125, 0.9967041015625, 1.0355682373046875, 1.074432373046875, 1.1132965087890625, 1.15216064453125, 1.1910247802734375, 1.229888916015625, 1.2687530517578125, 1.3076171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 9.0, 21.0, 35.0, 74.0, 131.0, 218.0, 223.0, 121.0, 71.0, 33.0, 21.0, 14.0, 12.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.330661773681641, -5.115939140319824, -4.901216506958008, -4.686493396759033, -4.471770763397217, -4.2570481300354, -4.042325019836426, -3.8276023864746094, -3.612879753112793, -3.3981571197509766, -3.183434247970581, -2.9687113761901855, -2.753988742828369, -2.5392661094665527, -2.3245432376861572, -2.1098203659057617, -1.8950977325439453, -1.6803749799728394, -1.4656522274017334, -1.2509294748306274, -1.0362067222595215, -0.8214839696884155, -0.6067612171173096, -0.3920384645462036, -0.17731571197509766, 0.0374070405960083, 0.25212979316711426, 0.4668525457382202, 0.6815752983093262, 0.8962980508804321, 1.111020803451538, 1.325743556022644, 1.54046630859375, 1.755189061164856, 1.969911813735962, 2.1846346855163574, 2.399357318878174, 2.6140799522399902, 2.8288028240203857, 3.0435256958007812, 3.2582483291625977, 3.472970962524414, 3.6876938343048096, 3.902416706085205, 4.1171393394470215, 4.331861972808838, 4.5465850830078125, 4.761307716369629, 4.976030349731445, 5.190752983093262, 5.405475616455078, 5.620198726654053, 5.834921360015869, 6.0496439933776855, 6.26436710357666, 6.479089736938477, 6.693812370300293, 6.908535003662109, 7.123257637023926, 7.3379807472229, 7.552703380584717, 7.767426013946533, 7.982149124145508, 8.196871757507324, 8.41159439086914]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 5.0, 10.0, 7.0, 10.0, 9.0, 7.0, 15.0, 12.0, 19.0, 22.0, 44.0, 35.0, 36.0, 43.0, 31.0, 47.0, 50.0, 52.0, 53.0, 51.0, 53.0, 52.0, 42.0, 39.0, 48.0, 23.0, 32.0, 21.0, 22.0, 25.0, 11.0, 12.0, 19.0, 5.0, 8.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.448403835296631, -2.3606741428375244, -2.272944450378418, -2.1852149963378906, -2.097485303878784, -2.0097556114196777, -1.9220259189605713, -1.8342962265014648, -1.746566653251648, -1.6588369607925415, -1.5711073875427246, -1.4833776950836182, -1.3956480026245117, -1.3079184293746948, -1.2201887369155884, -1.1324591636657715, -1.044729471206665, -0.9569998383522034, -0.8692702054977417, -0.7815405130386353, -0.6938108801841736, -0.6060812473297119, -0.5183515548706055, -0.4306219220161438, -0.34289228916168213, -0.25516265630722046, -0.1674329936504364, -0.07970333099365234, 0.008026301860809326, 0.095755934715271, 0.18348562717437744, 0.2712152600288391, 0.3589451313018799, 0.44667476415634155, 0.5344043970108032, 0.6221340894699097, 0.7098637223243713, 0.797593355178833, 0.8853230476379395, 0.9730526804924011, 1.0607823133468628, 1.1485120058059692, 1.2362415790557861, 1.3239712715148926, 1.411700963973999, 1.499430537223816, 1.5871602296829224, 1.6748898029327393, 1.7626194953918457, 1.8503491878509521, 1.938078761100769, 2.025808334350586, 2.1135380268096924, 2.201267719268799, 2.2889974117279053, 2.3767271041870117, 2.464456558227539, 2.5521862506866455, 2.639915943145752, 2.7276453971862793, 2.8153750896453857, 2.903104782104492, 2.9908344745635986, 3.078564167022705, 3.1662938594818115]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 11.0, 12.0, 19.0, 19.0, 22.0, 43.0, 61.0, 85.0, 170.0, 296.0, 540.0, 1234.0, 3015.0, 9783.0, 50418.0, 548556.0, 384013.0, 37128.0, 8178.0, 2621.0, 1059.0, 527.0, 262.0, 158.0, 96.0, 54.0, 37.0, 42.0, 18.0, 20.0, 13.0, 6.0, 8.0, 4.0, 2.0, 0.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.080078125, -2.977142333984375, -2.87420654296875, -2.771270751953125, -2.6683349609375, -2.565399169921875, -2.46246337890625, -2.359527587890625, -2.256591796875, -2.153656005859375, -2.05072021484375, -1.947784423828125, -1.8448486328125, -1.741912841796875, -1.63897705078125, -1.536041259765625, -1.43310546875, -1.330169677734375, -1.22723388671875, -1.124298095703125, -1.0213623046875, -0.918426513671875, -0.81549072265625, -0.712554931640625, -0.609619140625, -0.506683349609375, -0.40374755859375, -0.300811767578125, -0.1978759765625, -0.094940185546875, 0.00799560546875, 0.110931396484375, 0.2138671875, 0.316802978515625, 0.41973876953125, 0.522674560546875, 0.6256103515625, 0.728546142578125, 0.83148193359375, 0.934417724609375, 1.037353515625, 1.140289306640625, 1.24322509765625, 1.346160888671875, 1.4490966796875, 1.552032470703125, 1.65496826171875, 1.757904052734375, 1.86083984375, 1.963775634765625, 2.06671142578125, 2.169647216796875, 2.2725830078125, 2.375518798828125, 2.47845458984375, 2.581390380859375, 2.684326171875, 2.787261962890625, 2.89019775390625, 2.993133544921875, 3.0960693359375, 3.199005126953125, 3.30194091796875, 3.404876708984375, 3.5078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 9.0, 17.0, 28.0, 39.0, 39.0, 41.0, 60.0, 79.0, 82.0, 80.0, 89.0, 88.0, 77.0, 70.0, 58.0, 42.0, 29.0, 22.0, 8.0, 14.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.48040008544921875, -0.4627532958984375, -0.44510650634765625, -0.427459716796875, -0.40981292724609375, -0.3921661376953125, -0.37451934814453125, -0.35687255859375, -0.33922576904296875, -0.3215789794921875, -0.30393218994140625, -0.286285400390625, -0.26863861083984375, -0.2509918212890625, -0.23334503173828125, -0.2156982421875, -0.19805145263671875, -0.1804046630859375, -0.16275787353515625, -0.145111083984375, -0.12746429443359375, -0.1098175048828125, -0.09217071533203125, -0.07452392578125, -0.05687713623046875, -0.0392303466796875, -0.02158355712890625, -0.003936767578125, 0.01371002197265625, 0.0313568115234375, 0.04900360107421875, 0.066650390625, 0.08429718017578125, 0.1019439697265625, 0.11959075927734375, 0.137237548828125, 0.15488433837890625, 0.1725311279296875, 0.19017791748046875, 0.20782470703125, 0.22547149658203125, 0.2431182861328125, 0.26076507568359375, 0.278411865234375, 0.29605865478515625, 0.3137054443359375, 0.33135223388671875, 0.3489990234375, 0.36664581298828125, 0.3842926025390625, 0.40193939208984375, 0.419586181640625, 0.43723297119140625, 0.4548797607421875, 0.47252655029296875, 0.49017333984375, 0.5078201293945312, 0.5254669189453125, 0.5431137084960938, 0.560760498046875, 0.5784072875976562, 0.5960540771484375, 0.6137008666992188, 0.63134765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 5.0, 2.0, 6.0, 9.0, 12.0, 17.0, 19.0, 26.0, 47.0, 69.0, 130.0, 251.0, 400.0, 880.0, 1791.0, 4183.0, 11441.0, 38003.0, 164196.0, 537513.0, 217914.0, 48738.0, 13768.0, 4958.0, 2127.0, 944.0, 481.0, 213.0, 150.0, 77.0, 42.0, 42.0, 21.0, 15.0, 6.0, 16.0, 8.0, 3.0, 8.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.69140625, -1.6378631591796875, -1.584320068359375, -1.5307769775390625, -1.47723388671875, -1.4236907958984375, -1.370147705078125, -1.3166046142578125, -1.2630615234375, -1.2095184326171875, -1.155975341796875, -1.1024322509765625, -1.04888916015625, -0.9953460693359375, -0.941802978515625, -0.8882598876953125, -0.834716796875, -0.7811737060546875, -0.727630615234375, -0.6740875244140625, -0.62054443359375, -0.5670013427734375, -0.513458251953125, -0.4599151611328125, -0.4063720703125, -0.3528289794921875, -0.299285888671875, -0.2457427978515625, -0.19219970703125, -0.1386566162109375, -0.085113525390625, -0.0315704345703125, 0.02197265625, 0.0755157470703125, 0.129058837890625, 0.1826019287109375, 0.23614501953125, 0.2896881103515625, 0.343231201171875, 0.3967742919921875, 0.4503173828125, 0.5038604736328125, 0.557403564453125, 0.6109466552734375, 0.66448974609375, 0.7180328369140625, 0.771575927734375, 0.8251190185546875, 0.878662109375, 0.9322052001953125, 0.985748291015625, 1.0392913818359375, 1.09283447265625, 1.1463775634765625, 1.199920654296875, 1.2534637451171875, 1.3070068359375, 1.3605499267578125, 1.414093017578125, 1.4676361083984375, 1.52117919921875, 1.5747222900390625, 1.628265380859375, 1.6818084716796875, 1.7353515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 16.0, 7.0, 15.0, 20.0, 17.0, 13.0, 22.0, 22.0, 31.0, 27.0, 30.0, 40.0, 43.0, 39.0, 44.0, 51.0, 45.0, 42.0, 33.0, 43.0, 32.0, 45.0, 36.0, 30.0, 31.0, 22.0, 27.0, 24.0, 15.0, 22.0, 19.0, 17.0, 9.0, 9.0, 10.0, 12.0, 4.0, 5.0, 4.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.24609375, -1.2064361572265625, -1.166778564453125, -1.1271209716796875, -1.08746337890625, -1.0478057861328125, -1.008148193359375, -0.9684906005859375, -0.9288330078125, -0.8891754150390625, -0.849517822265625, -0.8098602294921875, -0.77020263671875, -0.7305450439453125, -0.690887451171875, -0.6512298583984375, -0.611572265625, -0.5719146728515625, -0.532257080078125, -0.4925994873046875, -0.45294189453125, -0.4132843017578125, -0.373626708984375, -0.3339691162109375, -0.2943115234375, -0.2546539306640625, -0.214996337890625, -0.1753387451171875, -0.13568115234375, -0.0960235595703125, -0.056365966796875, -0.0167083740234375, 0.02294921875, 0.0626068115234375, 0.102264404296875, 0.1419219970703125, 0.18157958984375, 0.2212371826171875, 0.260894775390625, 0.3005523681640625, 0.3402099609375, 0.3798675537109375, 0.419525146484375, 0.4591827392578125, 0.49884033203125, 0.5384979248046875, 0.578155517578125, 0.6178131103515625, 0.657470703125, 0.6971282958984375, 0.736785888671875, 0.7764434814453125, 0.81610107421875, 0.8557586669921875, 0.895416259765625, 0.9350738525390625, 0.9747314453125, 1.0143890380859375, 1.054046630859375, 1.0937042236328125, 1.13336181640625, 1.1730194091796875, 1.212677001953125, 1.2523345947265625, 1.2919921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 6.0, 10.0, 21.0, 25.0, 41.0, 65.0, 116.0, 237.0, 494.0, 1063.0, 2875.0, 9265.0, 42361.0, 347531.0, 556359.0, 68435.0, 13137.0, 3902.0, 1361.0, 558.0, 292.0, 139.0, 95.0, 44.0, 36.0, 17.0, 17.0, 8.0, 7.0, 6.0, 0.0, 3.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7158203125, -0.6942138671875, -0.672607421875, -0.6510009765625, -0.62939453125, -0.6077880859375, -0.586181640625, -0.5645751953125, -0.54296875, -0.5213623046875, -0.499755859375, -0.4781494140625, -0.45654296875, -0.4349365234375, -0.413330078125, -0.3917236328125, -0.3701171875, -0.3485107421875, -0.326904296875, -0.3052978515625, -0.28369140625, -0.2620849609375, -0.240478515625, -0.2188720703125, -0.197265625, -0.1756591796875, -0.154052734375, -0.1324462890625, -0.11083984375, -0.0892333984375, -0.067626953125, -0.0460205078125, -0.0244140625, -0.0028076171875, 0.018798828125, 0.0404052734375, 0.06201171875, 0.0836181640625, 0.105224609375, 0.1268310546875, 0.1484375, 0.1700439453125, 0.191650390625, 0.2132568359375, 0.23486328125, 0.2564697265625, 0.278076171875, 0.2996826171875, 0.3212890625, 0.3428955078125, 0.364501953125, 0.3861083984375, 0.40771484375, 0.4293212890625, 0.450927734375, 0.4725341796875, 0.494140625, 0.5157470703125, 0.537353515625, 0.5589599609375, 0.58056640625, 0.6021728515625, 0.623779296875, 0.6453857421875, 0.6669921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 2.0, 7.0, 10.0, 5.0, 14.0, 27.0, 30.0, 42.0, 86.0, 128.0, 171.0, 146.0, 114.0, 73.0, 33.0, 24.0, 25.0, 9.0, 12.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001500844955444336, -0.00014537759125232697, -0.00014067068696022034, -0.0001359637826681137, -0.00013125687837600708, -0.00012654997408390045, -0.00012184306979179382, -0.0001171361654996872, -0.00011242926120758057, -0.00010772235691547394, -0.00010301545262336731, -9.830854833126068e-05, -9.360164403915405e-05, -8.889473974704742e-05, -8.41878354549408e-05, -7.948093116283417e-05, -7.477402687072754e-05, -7.006712257862091e-05, -6.536021828651428e-05, -6.0653313994407654e-05, -5.5946409702301025e-05, -5.12395054101944e-05, -4.653260111808777e-05, -4.182569682598114e-05, -3.711879253387451e-05, -3.241188824176788e-05, -2.7704983949661255e-05, -2.2998079657554626e-05, -1.8291175365447998e-05, -1.358427107334137e-05, -8.877366781234741e-06, -4.170462489128113e-06, 5.364418029785156e-07, 5.243346095085144e-06, 9.950250387191772e-06, 1.4657154679298401e-05, 1.936405897140503e-05, 2.4070963263511658e-05, 2.8777867555618286e-05, 3.3484771847724915e-05, 3.819167613983154e-05, 4.289858043193817e-05, 4.76054847240448e-05, 5.231238901615143e-05, 5.701929330825806e-05, 6.172619760036469e-05, 6.643310189247131e-05, 7.114000618457794e-05, 7.584691047668457e-05, 8.05538147687912e-05, 8.526071906089783e-05, 8.996762335300446e-05, 9.467452764511108e-05, 9.938143193721771e-05, 0.00010408833622932434, 0.00010879524052143097, 0.0001135021448135376, 0.00011820904910564423, 0.00012291595339775085, 0.00012762285768985748, 0.0001323297619819641, 0.00013703666627407074, 0.00014174357056617737, 0.000146450474858284, 0.00015115737915039062]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 10.0, 10.0, 14.0, 16.0, 30.0, 44.0, 59.0, 116.0, 205.0, 405.0, 941.0, 2590.0, 9051.0, 46025.0, 494516.0, 440027.0, 41778.0, 8391.0, 2452.0, 947.0, 404.0, 213.0, 111.0, 68.0, 37.0, 31.0, 13.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.654815673828125, -0.63140869140625, -0.608001708984375, -0.5845947265625, -0.561187744140625, -0.53778076171875, -0.514373779296875, -0.490966796875, -0.467559814453125, -0.44415283203125, -0.420745849609375, -0.3973388671875, -0.373931884765625, -0.35052490234375, -0.327117919921875, -0.3037109375, -0.280303955078125, -0.25689697265625, -0.233489990234375, -0.2100830078125, -0.186676025390625, -0.16326904296875, -0.139862060546875, -0.116455078125, -0.093048095703125, -0.06964111328125, -0.046234130859375, -0.0228271484375, 0.000579833984375, 0.02398681640625, 0.047393798828125, 0.07080078125, 0.094207763671875, 0.11761474609375, 0.141021728515625, 0.1644287109375, 0.187835693359375, 0.21124267578125, 0.234649658203125, 0.258056640625, 0.281463623046875, 0.30487060546875, 0.328277587890625, 0.3516845703125, 0.375091552734375, 0.39849853515625, 0.421905517578125, 0.4453125, 0.468719482421875, 0.49212646484375, 0.515533447265625, 0.5389404296875, 0.562347412109375, 0.58575439453125, 0.609161376953125, 0.632568359375, 0.655975341796875, 0.67938232421875, 0.702789306640625, 0.7261962890625, 0.749603271484375, 0.77301025390625, 0.796417236328125, 0.81982421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 8.0, 6.0, 6.0, 10.0, 11.0, 13.0, 8.0, 30.0, 22.0, 37.0, 68.0, 93.0, 98.0, 117.0, 82.0, 96.0, 85.0, 55.0, 36.0, 28.0, 25.0, 15.0, 8.0, 15.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487548828125, -0.47306060791015625, -0.4585723876953125, -0.44408416748046875, -0.429595947265625, -0.41510772705078125, -0.4006195068359375, -0.38613128662109375, -0.37164306640625, -0.35715484619140625, -0.3426666259765625, -0.32817840576171875, -0.313690185546875, -0.29920196533203125, -0.2847137451171875, -0.27022552490234375, -0.2557373046875, -0.24124908447265625, -0.2267608642578125, -0.21227264404296875, -0.197784423828125, -0.18329620361328125, -0.1688079833984375, -0.15431976318359375, -0.13983154296875, -0.12534332275390625, -0.1108551025390625, -0.09636688232421875, -0.081878662109375, -0.06739044189453125, -0.0529022216796875, -0.03841400146484375, -0.02392578125, -0.00943756103515625, 0.0050506591796875, 0.01953887939453125, 0.034027099609375, 0.04851531982421875, 0.0630035400390625, 0.07749176025390625, 0.09197998046875, 0.10646820068359375, 0.1209564208984375, 0.13544464111328125, 0.149932861328125, 0.16442108154296875, 0.1789093017578125, 0.19339752197265625, 0.2078857421875, 0.22237396240234375, 0.2368621826171875, 0.25135040283203125, 0.265838623046875, 0.28032684326171875, 0.2948150634765625, 0.30930328369140625, 0.32379150390625, 0.33827972412109375, 0.3527679443359375, 0.36725616455078125, 0.381744384765625, 0.39623260498046875, 0.4107208251953125, 0.42520904541015625, 0.439697265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 15.0, 16.0, 33.0, 54.0, 99.0, 140.0, 179.0, 183.0, 117.0, 70.0, 52.0, 23.0, 14.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.855772018432617, -15.42529582977295, -14.994818687438965, -14.564342498779297, -14.133865356445312, -13.703389167785645, -13.27291202545166, -12.842435836791992, -12.411958694458008, -11.98148250579834, -11.551005363464355, -11.120529174804688, -10.690052032470703, -10.259575843811035, -9.82909870147705, -9.398622512817383, -8.968145370483398, -8.53766918182373, -8.107192039489746, -7.67671537399292, -7.246238708496094, -6.815762519836426, -6.385285377502441, -5.954809188842773, -5.5243330001831055, -5.093856334686279, -4.663379669189453, -4.232903003692627, -3.802426338195801, -3.3719499111175537, -2.9414732456207275, -2.5109965801239014, -2.080519676208496, -1.65004301071167, -1.2195663452148438, -0.7890897989273071, -0.35861313343048096, 0.07186341285705566, 0.5023400783538818, 0.932816743850708, 1.3632934093475342, 1.7937700748443604, 2.2242467403411865, 2.6547231674194336, 3.0851998329162598, 3.515676498413086, 3.946153163909912, 4.376629829406738, 4.8071064949035645, 5.237583160400391, 5.668059825897217, 6.098536491394043, 6.529013156890869, 6.959489822387695, 7.389966011047363, 7.820443153381348, 8.250919342041016, 8.681395530700684, 9.111872673034668, 9.542348861694336, 9.97282600402832, 10.403302192687988, 10.833779335021973, 11.26425552368164, 11.694732666015625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 1.0, 2.0, 6.0, 4.0, 12.0, 9.0, 9.0, 15.0, 13.0, 14.0, 20.0, 23.0, 19.0, 30.0, 26.0, 34.0, 36.0, 37.0, 45.0, 44.0, 56.0, 38.0, 51.0, 40.0, 39.0, 42.0, 43.0, 41.0, 40.0, 33.0, 27.0, 20.0, 34.0, 19.0, 14.0, 14.0, 14.0, 7.0, 6.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.959950923919678, -5.761819362640381, -5.563688278198242, -5.365556716918945, -5.167425155639648, -4.969293594360352, -4.771162509918213, -4.573030948638916, -4.374899864196777, -4.1767683029174805, -3.9786369800567627, -3.780505657196045, -3.582374095916748, -3.3842427730560303, -3.1861114501953125, -2.9879798889160156, -2.7898483276367188, -2.591717004776001, -2.393585443496704, -2.1954541206359863, -1.997322678565979, -1.7991912364959717, -1.601059913635254, -1.4029284715652466, -1.2047970294952393, -1.006665587425232, -0.8085342049598694, -0.6104028224945068, -0.4122713804244995, -0.2141399383544922, -0.016008615493774414, 0.1821228265762329, 0.38025474548339844, 0.5783861875534058, 0.7765175700187683, 0.9746489524841309, 1.1727803945541382, 1.3709118366241455, 1.5690431594848633, 1.7671746015548706, 1.965306043624878, 2.1634373664855957, 2.3615689277648926, 2.5597002506256104, 2.757831573486328, 2.955963134765625, 3.1540944576263428, 3.3522257804870605, 3.5503573417663574, 3.748488664627075, 3.946620225906372, 4.14475154876709, 4.342883110046387, 4.541014671325684, 4.739145755767822, 4.937277317047119, 5.135408401489258, 5.333539962768555, 5.531671047210693, 5.72980260848999, 5.927934169769287, 6.126065254211426, 6.324196815490723, 6.5223283767700195, 6.720459938049316]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 10.0, 17.0, 19.0, 13.0, 29.0, 60.0, 77.0, 160.0, 292.0, 633.0, 1548.0, 4461.0, 16604.0, 187481.0, 3927645.0, 42074.0, 8124.0, 2648.0, 1094.0, 527.0, 287.0, 148.0, 90.0, 51.0, 40.0, 28.0, 35.0, 19.0, 11.0, 10.0, 4.0, 7.0, 4.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.375, -4.2393798828125, -4.103759765625, -3.9681396484375, -3.83251953125, -3.6968994140625, -3.561279296875, -3.4256591796875, -3.2900390625, -3.1544189453125, -3.018798828125, -2.8831787109375, -2.74755859375, -2.6119384765625, -2.476318359375, -2.3406982421875, -2.205078125, -2.0694580078125, -1.933837890625, -1.7982177734375, -1.66259765625, -1.5269775390625, -1.391357421875, -1.2557373046875, -1.1201171875, -0.9844970703125, -0.848876953125, -0.7132568359375, -0.57763671875, -0.4420166015625, -0.306396484375, -0.1707763671875, -0.03515625, 0.1004638671875, 0.236083984375, 0.3717041015625, 0.50732421875, 0.6429443359375, 0.778564453125, 0.9141845703125, 1.0498046875, 1.1854248046875, 1.321044921875, 1.4566650390625, 1.59228515625, 1.7279052734375, 1.863525390625, 1.9991455078125, 2.134765625, 2.2703857421875, 2.406005859375, 2.5416259765625, 2.67724609375, 2.8128662109375, 2.948486328125, 3.0841064453125, 3.2197265625, 3.3553466796875, 3.490966796875, 3.6265869140625, 3.76220703125, 3.8978271484375, 4.033447265625, 4.1690673828125, 4.3046875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 15.0, 32.0, 23.0, 45.0, 63.0, 65.0, 68.0, 82.0, 83.0, 74.0, 87.0, 84.0, 60.0, 58.0, 37.0, 28.0, 23.0, 16.0, 13.0, 7.0, 4.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5078125, -0.49040985107421875, -0.4730072021484375, -0.45560455322265625, -0.438201904296875, -0.42079925537109375, -0.4033966064453125, -0.38599395751953125, -0.36859130859375, -0.35118865966796875, -0.3337860107421875, -0.31638336181640625, -0.298980712890625, -0.28157806396484375, -0.2641754150390625, -0.24677276611328125, -0.2293701171875, -0.21196746826171875, -0.1945648193359375, -0.17716217041015625, -0.159759521484375, -0.14235687255859375, -0.1249542236328125, -0.10755157470703125, -0.09014892578125, -0.07274627685546875, -0.0553436279296875, -0.03794097900390625, -0.020538330078125, -0.00313568115234375, 0.0142669677734375, 0.03166961669921875, 0.049072265625, 0.06647491455078125, 0.0838775634765625, 0.10128021240234375, 0.118682861328125, 0.13608551025390625, 0.1534881591796875, 0.17089080810546875, 0.18829345703125, 0.20569610595703125, 0.2230987548828125, 0.24050140380859375, 0.257904052734375, 0.27530670166015625, 0.2927093505859375, 0.31011199951171875, 0.3275146484375, 0.34491729736328125, 0.3623199462890625, 0.37972259521484375, 0.397125244140625, 0.41452789306640625, 0.4319305419921875, 0.44933319091796875, 0.46673583984375, 0.48413848876953125, 0.5015411376953125, 0.5189437866210938, 0.536346435546875, 0.5537490844726562, 0.5711517333984375, 0.5885543823242188, 0.60595703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 9.0, 17.0, 21.0, 41.0, 64.0, 84.0, 147.0, 245.0, 403.0, 645.0, 1226.0, 2224.0, 4301.0, 9600.0, 24731.0, 98217.0, 3522723.0, 448675.0, 51024.0, 16115.0, 6707.0, 3149.0, 1653.0, 901.0, 534.0, 292.0, 191.0, 124.0, 72.0, 48.0, 31.0, 35.0, 12.0, 6.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.72265625, -2.6506195068359375, -2.578582763671875, -2.5065460205078125, -2.43450927734375, -2.3624725341796875, -2.290435791015625, -2.2183990478515625, -2.1463623046875, -2.0743255615234375, -2.002288818359375, -1.9302520751953125, -1.85821533203125, -1.7861785888671875, -1.714141845703125, -1.6421051025390625, -1.570068359375, -1.4980316162109375, -1.425994873046875, -1.3539581298828125, -1.28192138671875, -1.2098846435546875, -1.137847900390625, -1.0658111572265625, -0.9937744140625, -0.9217376708984375, -0.849700927734375, -0.7776641845703125, -0.70562744140625, -0.6335906982421875, -0.561553955078125, -0.4895172119140625, -0.41748046875, -0.3454437255859375, -0.273406982421875, -0.2013702392578125, -0.12933349609375, -0.0572967529296875, 0.014739990234375, 0.0867767333984375, 0.1588134765625, 0.2308502197265625, 0.302886962890625, 0.3749237060546875, 0.44696044921875, 0.5189971923828125, 0.591033935546875, 0.6630706787109375, 0.735107421875, 0.8071441650390625, 0.879180908203125, 0.9512176513671875, 1.02325439453125, 1.0952911376953125, 1.167327880859375, 1.2393646240234375, 1.3114013671875, 1.3834381103515625, 1.455474853515625, 1.5275115966796875, 1.59954833984375, 1.6715850830078125, 1.743621826171875, 1.8156585693359375, 1.8876953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 2.0, 6.0, 6.0, 12.0, 7.0, 19.0, 22.0, 30.0, 59.0, 62.0, 123.0, 341.0, 2366.0, 577.0, 174.0, 92.0, 44.0, 35.0, 21.0, 14.0, 10.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0146484375, -0.9853744506835938, -0.9561004638671875, -0.9268264770507812, -0.897552490234375, -0.8682785034179688, -0.8390045166015625, -0.8097305297851562, -0.78045654296875, -0.7511825561523438, -0.7219085693359375, -0.6926345825195312, -0.663360595703125, -0.6340866088867188, -0.6048126220703125, -0.5755386352539062, -0.5462646484375, -0.5169906616210938, -0.4877166748046875, -0.45844268798828125, -0.429168701171875, -0.39989471435546875, -0.3706207275390625, -0.34134674072265625, -0.31207275390625, -0.28279876708984375, -0.2535247802734375, -0.22425079345703125, -0.194976806640625, -0.16570281982421875, -0.1364288330078125, -0.10715484619140625, -0.077880859375, -0.04860687255859375, -0.0193328857421875, 0.00994110107421875, 0.039215087890625, 0.06848907470703125, 0.0977630615234375, 0.12703704833984375, 0.15631103515625, 0.18558502197265625, 0.2148590087890625, 0.24413299560546875, 0.273406982421875, 0.30268096923828125, 0.3319549560546875, 0.36122894287109375, 0.3905029296875, 0.41977691650390625, 0.4490509033203125, 0.47832489013671875, 0.507598876953125, 0.5368728637695312, 0.5661468505859375, 0.5954208374023438, 0.62469482421875, 0.6539688110351562, 0.6832427978515625, 0.7125167846679688, 0.741790771484375, 0.7710647583007812, 0.8003387451171875, 0.8296127319335938, 0.85888671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 2.0, 13.0, 20.0, 82.0, 165.0, 305.0, 260.0, 85.0, 44.0, 16.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4218854904174805, -6.096843242645264, -5.771800994873047, -5.44675874710083, -5.121716499328613, -4.7966742515563965, -4.47163200378418, -4.146589756011963, -3.821547508239746, -3.4965052604675293, -3.1714630126953125, -2.8464207649230957, -2.521378517150879, -2.196336269378662, -1.8712940216064453, -1.5462517738342285, -1.2212095260620117, -0.8961672782897949, -0.5711250305175781, -0.24608278274536133, 0.07895946502685547, 0.40400171279907227, 0.7290439605712891, 1.0540862083435059, 1.3791284561157227, 1.7041707038879395, 2.0292129516601562, 2.354255199432373, 2.67929744720459, 3.0043396949768066, 3.3293819427490234, 3.6544241905212402, 3.9794654846191406, 4.304507732391357, 4.629549980163574, 4.954592227935791, 5.279634475708008, 5.604676723480225, 5.929718971252441, 6.254761219024658, 6.579803466796875, 6.904845714569092, 7.229887962341309, 7.554930210113525, 7.879972457885742, 8.205015182495117, 8.530056953430176, 8.855098724365234, 9.18014144897461, 9.505184173583984, 9.830225944519043, 10.155267715454102, 10.480310440063477, 10.805353164672852, 11.13039493560791, 11.455436706542969, 11.780479431152344, 12.105522155761719, 12.430563926696777, 12.755605697631836, 13.080648422241211, 13.405691146850586, 13.730732917785645, 14.055774688720703, 14.380817413330078]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 8.0, 9.0, 6.0, 8.0, 19.0, 18.0, 21.0, 18.0, 25.0, 32.0, 20.0, 41.0, 25.0, 44.0, 35.0, 34.0, 39.0, 39.0, 50.0, 45.0, 46.0, 35.0, 53.0, 45.0, 31.0, 27.0, 30.0, 36.0, 17.0, 28.0, 16.0, 14.0, 11.0, 17.0, 16.0, 6.0, 10.0, 8.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.838697671890259, -2.761110782623291, -2.6835241317749023, -2.6059372425079346, -2.528350591659546, -2.450763702392578, -2.3731770515441895, -2.2955901622772217, -2.218003273010254, -2.140416383743286, -2.0628297328948975, -1.9852429628372192, -1.907656192779541, -1.8300693035125732, -1.752482533454895, -1.6748957633972168, -1.5973091125488281, -1.51972234249115, -1.4421355724334717, -1.3645488023757935, -1.2869620323181152, -1.2093751430511475, -1.1317883729934692, -1.054201602935791, -0.9766148328781128, -0.8990280628204346, -0.8214412927627563, -0.7438544631004333, -0.6662676930427551, -0.5886809229850769, -0.5110940933227539, -0.4335073232650757, -0.35592055320739746, -0.27833378314971924, -0.20074698328971863, -0.12316019833087921, -0.045573413372039795, 0.03201335668563843, 0.10960015654563904, 0.18718695640563965, 0.26477372646331787, 0.3423604965209961, 0.4199472963809967, 0.4975340962409973, 0.5751208662986755, 0.6527076363563538, 0.7302944660186768, 0.807881236076355, 0.8854680061340332, 0.9630547761917114, 1.0406415462493896, 1.1182283163070679, 1.195815086364746, 1.2734019756317139, 1.350988745689392, 1.4285755157470703, 1.5061622858047485, 1.5837490558624268, 1.661335825920105, 1.7389225959777832, 1.816509485244751, 1.8940961360931396, 1.9716830253601074, 2.049269676208496, 2.126856565475464]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 11.0, 33.0, 49.0, 44.0, 88.0, 104.0, 167.0, 263.0, 445.0, 805.0, 1630.0, 3900.0, 11052.0, 43049.0, 229758.0, 566465.0, 146725.0, 29580.0, 8113.0, 3093.0, 1405.0, 685.0, 382.0, 244.0, 148.0, 92.0, 58.0, 50.0, 32.0, 21.0, 13.0, 12.0, 4.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.844451904296875, -2.75921630859375, -2.673980712890625, -2.5887451171875, -2.503509521484375, -2.41827392578125, -2.333038330078125, -2.247802734375, -2.162567138671875, -2.07733154296875, -1.992095947265625, -1.9068603515625, -1.821624755859375, -1.73638916015625, -1.651153564453125, -1.56591796875, -1.480682373046875, -1.39544677734375, -1.310211181640625, -1.2249755859375, -1.139739990234375, -1.05450439453125, -0.969268798828125, -0.884033203125, -0.798797607421875, -0.71356201171875, -0.628326416015625, -0.5430908203125, -0.457855224609375, -0.37261962890625, -0.287384033203125, -0.2021484375, -0.116912841796875, -0.03167724609375, 0.053558349609375, 0.1387939453125, 0.224029541015625, 0.30926513671875, 0.394500732421875, 0.479736328125, 0.564971923828125, 0.65020751953125, 0.735443115234375, 0.8206787109375, 0.905914306640625, 0.99114990234375, 1.076385498046875, 1.16162109375, 1.246856689453125, 1.33209228515625, 1.417327880859375, 1.5025634765625, 1.587799072265625, 1.67303466796875, 1.758270263671875, 1.843505859375, 1.928741455078125, 2.01397705078125, 2.099212646484375, 2.1844482421875, 2.269683837890625, 2.35491943359375, 2.440155029296875, 2.525390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 12.0, 9.0, 9.0, 20.0, 28.0, 36.0, 51.0, 51.0, 64.0, 58.0, 67.0, 89.0, 79.0, 64.0, 65.0, 55.0, 57.0, 48.0, 32.0, 24.0, 19.0, 22.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5283203125, -0.51129150390625, -0.4942626953125, -0.47723388671875, -0.460205078125, -0.44317626953125, -0.4261474609375, -0.40911865234375, -0.39208984375, -0.37506103515625, -0.3580322265625, -0.34100341796875, -0.323974609375, -0.30694580078125, -0.2899169921875, -0.27288818359375, -0.255859375, -0.23883056640625, -0.2218017578125, -0.20477294921875, -0.187744140625, -0.17071533203125, -0.1536865234375, -0.13665771484375, -0.11962890625, -0.10260009765625, -0.0855712890625, -0.06854248046875, -0.051513671875, -0.03448486328125, -0.0174560546875, -0.00042724609375, 0.0166015625, 0.03363037109375, 0.0506591796875, 0.06768798828125, 0.084716796875, 0.10174560546875, 0.1187744140625, 0.13580322265625, 0.15283203125, 0.16986083984375, 0.1868896484375, 0.20391845703125, 0.220947265625, 0.23797607421875, 0.2550048828125, 0.27203369140625, 0.2890625, 0.30609130859375, 0.3231201171875, 0.34014892578125, 0.357177734375, 0.37420654296875, 0.3912353515625, 0.40826416015625, 0.42529296875, 0.44232177734375, 0.4593505859375, 0.47637939453125, 0.493408203125, 0.51043701171875, 0.5274658203125, 0.54449462890625, 0.5615234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 9.0, 20.0, 21.0, 27.0, 31.0, 48.0, 92.0, 122.0, 197.0, 238.0, 428.0, 667.0, 1175.0, 2054.0, 3973.0, 8227.0, 18135.0, 42032.0, 107004.0, 266111.0, 335961.0, 154835.0, 60106.0, 24725.0, 10814.0, 5128.0, 2685.0, 1375.0, 847.0, 490.0, 312.0, 199.0, 137.0, 78.0, 61.0, 51.0, 30.0, 22.0, 15.0, 14.0, 9.0, 11.0, 9.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1434478759765625, -1.104278564453125, -1.0651092529296875, -1.02593994140625, -0.9867706298828125, -0.947601318359375, -0.9084320068359375, -0.8692626953125, -0.8300933837890625, -0.790924072265625, -0.7517547607421875, -0.71258544921875, -0.6734161376953125, -0.634246826171875, -0.5950775146484375, -0.555908203125, -0.5167388916015625, -0.477569580078125, -0.4384002685546875, -0.39923095703125, -0.3600616455078125, -0.320892333984375, -0.2817230224609375, -0.2425537109375, -0.2033843994140625, -0.164215087890625, -0.1250457763671875, -0.08587646484375, -0.0467071533203125, -0.007537841796875, 0.0316314697265625, 0.07080078125, 0.1099700927734375, 0.149139404296875, 0.1883087158203125, 0.22747802734375, 0.2666473388671875, 0.305816650390625, 0.3449859619140625, 0.3841552734375, 0.4233245849609375, 0.462493896484375, 0.5016632080078125, 0.54083251953125, 0.5800018310546875, 0.619171142578125, 0.6583404541015625, 0.697509765625, 0.7366790771484375, 0.775848388671875, 0.8150177001953125, 0.85418701171875, 0.8933563232421875, 0.932525634765625, 0.9716949462890625, 1.0108642578125, 1.0500335693359375, 1.089202880859375, 1.1283721923828125, 1.16754150390625, 1.2067108154296875, 1.245880126953125, 1.2850494384765625, 1.32421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 11.0, 12.0, 12.0, 13.0, 18.0, 25.0, 16.0, 27.0, 30.0, 30.0, 37.0, 42.0, 37.0, 47.0, 50.0, 57.0, 38.0, 56.0, 52.0, 46.0, 44.0, 47.0, 31.0, 30.0, 26.0, 17.0, 24.0, 19.0, 20.0, 24.0, 16.0, 12.0, 6.0, 2.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6351470947265625, -1.579864501953125, -1.5245819091796875, -1.46929931640625, -1.4140167236328125, -1.358734130859375, -1.3034515380859375, -1.2481689453125, -1.1928863525390625, -1.137603759765625, -1.0823211669921875, -1.02703857421875, -0.9717559814453125, -0.916473388671875, -0.8611907958984375, -0.805908203125, -0.7506256103515625, -0.695343017578125, -0.6400604248046875, -0.58477783203125, -0.5294952392578125, -0.474212646484375, -0.4189300537109375, -0.3636474609375, -0.3083648681640625, -0.253082275390625, -0.1977996826171875, -0.14251708984375, -0.0872344970703125, -0.031951904296875, 0.0233306884765625, 0.07861328125, 0.1338958740234375, 0.189178466796875, 0.2444610595703125, 0.29974365234375, 0.3550262451171875, 0.410308837890625, 0.4655914306640625, 0.5208740234375, 0.5761566162109375, 0.631439208984375, 0.6867218017578125, 0.74200439453125, 0.7972869873046875, 0.852569580078125, 0.9078521728515625, 0.963134765625, 1.0184173583984375, 1.073699951171875, 1.1289825439453125, 1.18426513671875, 1.2395477294921875, 1.294830322265625, 1.3501129150390625, 1.4053955078125, 1.4606781005859375, 1.515960693359375, 1.5712432861328125, 1.62652587890625, 1.6818084716796875, 1.737091064453125, 1.7923736572265625, 1.84765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 7.0, 11.0, 10.0, 20.0, 35.0, 68.0, 101.0, 174.0, 265.0, 495.0, 956.0, 1999.0, 5078.0, 17794.0, 106133.0, 694279.0, 183555.0, 26045.0, 6649.0, 2360.0, 1136.0, 555.0, 337.0, 185.0, 102.0, 67.0, 45.0, 35.0, 21.0, 10.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.23828125, -1.2044677734375, -1.170654296875, -1.1368408203125, -1.10302734375, -1.0692138671875, -1.035400390625, -1.0015869140625, -0.9677734375, -0.9339599609375, -0.900146484375, -0.8663330078125, -0.83251953125, -0.7987060546875, -0.764892578125, -0.7310791015625, -0.697265625, -0.6634521484375, -0.629638671875, -0.5958251953125, -0.56201171875, -0.5281982421875, -0.494384765625, -0.4605712890625, -0.4267578125, -0.3929443359375, -0.359130859375, -0.3253173828125, -0.29150390625, -0.2576904296875, -0.223876953125, -0.1900634765625, -0.15625, -0.1224365234375, -0.088623046875, -0.0548095703125, -0.02099609375, 0.0128173828125, 0.046630859375, 0.0804443359375, 0.1142578125, 0.1480712890625, 0.181884765625, 0.2156982421875, 0.24951171875, 0.2833251953125, 0.317138671875, 0.3509521484375, 0.384765625, 0.4185791015625, 0.452392578125, 0.4862060546875, 0.52001953125, 0.5538330078125, 0.587646484375, 0.6214599609375, 0.6552734375, 0.6890869140625, 0.722900390625, 0.7567138671875, 0.79052734375, 0.8243408203125, 0.858154296875, 0.8919677734375, 0.92578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 15.0, 16.0, 31.0, 32.0, 37.0, 50.0, 79.0, 93.0, 115.0, 122.0, 83.0, 81.0, 50.0, 41.0, 32.0, 23.0, 22.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011920928955078125, -0.000115223228931427, -0.00011123716831207275, -0.0001072511076927185, -0.00010326504707336426, -9.927898645401001e-05, -9.529292583465576e-05, -9.130686521530151e-05, -8.732080459594727e-05, -8.333474397659302e-05, -7.934868335723877e-05, -7.536262273788452e-05, -7.137656211853027e-05, -6.739050149917603e-05, -6.340444087982178e-05, -5.941838026046753e-05, -5.543231964111328e-05, -5.144625902175903e-05, -4.7460198402404785e-05, -4.347413778305054e-05, -3.948807716369629e-05, -3.550201654434204e-05, -3.151595592498779e-05, -2.7529895305633545e-05, -2.3543834686279297e-05, -1.955777406692505e-05, -1.55717134475708e-05, -1.1585652828216553e-05, -7.599592208862305e-06, -3.6135315895080566e-06, 3.725290298461914e-07, 4.3585896492004395e-06, 8.344650268554688e-06, 1.2330710887908936e-05, 1.6316771507263184e-05, 2.030283212661743e-05, 2.428889274597168e-05, 2.8274953365325928e-05, 3.2261013984680176e-05, 3.6247074604034424e-05, 4.023313522338867e-05, 4.421919584274292e-05, 4.820525646209717e-05, 5.2191317081451416e-05, 5.6177377700805664e-05, 6.016343832015991e-05, 6.414949893951416e-05, 6.813555955886841e-05, 7.212162017822266e-05, 7.61076807975769e-05, 8.009374141693115e-05, 8.40798020362854e-05, 8.806586265563965e-05, 9.20519232749939e-05, 9.603798389434814e-05, 0.00010002404451370239, 0.00010401010513305664, 0.00010799616575241089, 0.00011198222637176514, 0.00011596828699111938, 0.00011995434761047363, 0.00012394040822982788, 0.00012792646884918213, 0.00013191252946853638, 0.00013589859008789062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 11.0, 20.0, 22.0, 34.0, 50.0, 82.0, 155.0, 208.0, 462.0, 1000.0, 2785.0, 10472.0, 65227.0, 735368.0, 204023.0, 20978.0, 4669.0, 1549.0, 655.0, 297.0, 166.0, 89.0, 64.0, 47.0, 32.0, 17.0, 14.0, 7.0, 5.0, 6.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.72265625, -1.6744232177734375, -1.626190185546875, -1.5779571533203125, -1.52972412109375, -1.4814910888671875, -1.433258056640625, -1.3850250244140625, -1.3367919921875, -1.2885589599609375, -1.240325927734375, -1.1920928955078125, -1.14385986328125, -1.0956268310546875, -1.047393798828125, -0.9991607666015625, -0.950927734375, -0.9026947021484375, -0.854461669921875, -0.8062286376953125, -0.75799560546875, -0.7097625732421875, -0.661529541015625, -0.6132965087890625, -0.5650634765625, -0.5168304443359375, -0.468597412109375, -0.4203643798828125, -0.37213134765625, -0.3238983154296875, -0.275665283203125, -0.2274322509765625, -0.17919921875, -0.1309661865234375, -0.082733154296875, -0.0345001220703125, 0.01373291015625, 0.0619659423828125, 0.110198974609375, 0.1584320068359375, 0.2066650390625, 0.2548980712890625, 0.303131103515625, 0.3513641357421875, 0.39959716796875, 0.4478302001953125, 0.496063232421875, 0.5442962646484375, 0.592529296875, 0.6407623291015625, 0.688995361328125, 0.7372283935546875, 0.78546142578125, 0.8336944580078125, 0.881927490234375, 0.9301605224609375, 0.9783935546875, 1.0266265869140625, 1.074859619140625, 1.1230926513671875, 1.17132568359375, 1.2195587158203125, 1.267791748046875, 1.3160247802734375, 1.3642578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 3.0, 10.0, 14.0, 12.0, 11.0, 29.0, 32.0, 64.0, 69.0, 134.0, 116.0, 138.0, 106.0, 66.0, 53.0, 40.0, 19.0, 22.0, 18.0, 10.0, 5.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.7579193115234375, -0.721893310546875, -0.6858673095703125, -0.64984130859375, -0.6138153076171875, -0.577789306640625, -0.5417633056640625, -0.5057373046875, -0.4697113037109375, -0.433685302734375, -0.3976593017578125, -0.36163330078125, -0.3256072998046875, -0.289581298828125, -0.2535552978515625, -0.217529296875, -0.1815032958984375, -0.145477294921875, -0.1094512939453125, -0.07342529296875, -0.0373992919921875, -0.001373291015625, 0.0346527099609375, 0.0706787109375, 0.1067047119140625, 0.142730712890625, 0.1787567138671875, 0.21478271484375, 0.2508087158203125, 0.286834716796875, 0.3228607177734375, 0.35888671875, 0.3949127197265625, 0.430938720703125, 0.4669647216796875, 0.50299072265625, 0.5390167236328125, 0.575042724609375, 0.6110687255859375, 0.6470947265625, 0.6831207275390625, 0.719146728515625, 0.7551727294921875, 0.79119873046875, 0.8272247314453125, 0.863250732421875, 0.8992767333984375, 0.935302734375, 0.9713287353515625, 1.007354736328125, 1.0433807373046875, 1.07940673828125, 1.1154327392578125, 1.151458740234375, 1.1874847412109375, 1.2235107421875, 1.2595367431640625, 1.295562744140625, 1.3315887451171875, 1.36761474609375, 1.4036407470703125, 1.439666748046875, 1.4756927490234375, 1.51171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 13.0, 41.0, 73.0, 171.0, 248.0, 202.0, 123.0, 67.0, 28.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.453231811523438, -12.651277542114258, -11.849323272705078, -11.047369956970215, -10.245415687561035, -9.443461418151855, -8.641508102416992, -7.8395538330078125, -7.037599563598633, -6.235645294189453, -5.433691501617432, -4.63173770904541, -3.8297834396362305, -3.027829170227051, -2.2258753776550293, -1.4239215850830078, -0.6219673156738281, 0.17998671531677246, 0.981940746307373, 1.7838947772979736, 2.585848808288574, 3.387803077697754, 4.189756870269775, 4.991710662841797, 5.793664932250977, 6.595619201660156, 7.397572994232178, 8.1995267868042, 9.001481056213379, 9.803435325622559, 10.605388641357422, 11.407342910766602, 12.209297180175781, 13.011251449584961, 13.81320571899414, 14.615159034729004, 15.417113304138184, 16.219066619873047, 17.021020889282227, 17.822975158691406, 18.624929428100586, 19.426883697509766, 20.228837966918945, 21.030792236328125, 21.832744598388672, 22.634700775146484, 23.43665313720703, 24.23860740661621, 25.04056167602539, 25.84251594543457, 26.64447021484375, 27.44642448425293, 28.24837875366211, 29.050331115722656, 29.852285385131836, 30.654239654541016, 31.456193923950195, 32.258148193359375, 33.06010055541992, 33.862056732177734, 34.66400909423828, 35.465965270996094, 36.26791763305664, 37.06986999511719, 37.871826171875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 11.0, 4.0, 4.0, 2.0, 13.0, 4.0, 12.0, 12.0, 11.0, 20.0, 22.0, 22.0, 23.0, 25.0, 24.0, 28.0, 41.0, 34.0, 38.0, 34.0, 38.0, 33.0, 33.0, 39.0, 41.0, 34.0, 39.0, 46.0, 35.0, 29.0, 29.0, 34.0, 26.0, 19.0, 20.0, 20.0, 18.0, 11.0, 12.0, 13.0, 10.0, 6.0, 6.0, 6.0, 9.0, 5.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.649946212768555, -8.391485214233398, -8.133024215698242, -7.874563694000244, -7.616103172302246, -7.35764217376709, -7.099181175231934, -6.840720176696777, -6.582259654998779, -6.323798656463623, -6.065338134765625, -5.806877136230469, -5.5484161376953125, -5.2899556159973145, -5.031494617462158, -4.77303409576416, -4.514573097229004, -4.256112098693848, -3.9976515769958496, -3.7391905784606934, -3.480729818344116, -3.222269058227539, -2.963808059692383, -2.7053472995758057, -2.4468865394592285, -2.1884257793426514, -1.9299649000167847, -1.671504020690918, -1.4130432605743408, -1.1545825004577637, -0.896121621131897, -0.6376607418060303, -0.3791999816894531, -0.1207391619682312, 0.13772165775299072, 0.39618247747421265, 0.6546432971954346, 0.9131040573120117, 1.1715649366378784, 1.4300258159637451, 1.6884865760803223, 1.9469473361968994, 2.2054080963134766, 2.463869094848633, 2.72232985496521, 2.980790615081787, 3.2392516136169434, 3.4977123737335205, 3.7561731338500977, 4.014634132385254, 4.273094654083252, 4.531555652618408, 4.790016174316406, 5.0484771728515625, 5.306938171386719, 5.565399169921875, 5.823859691619873, 6.082320690155029, 6.340781211853027, 6.599242210388184, 6.85770320892334, 7.116163730621338, 7.374624729156494, 7.633085250854492, 7.891546249389648]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 18.0, 23.0, 26.0, 40.0, 69.0, 135.0, 221.0, 466.0, 996.0, 2392.0, 6302.0, 20065.0, 126046.0, 3900478.0, 108570.0, 18398.0, 5692.0, 2255.0, 942.0, 466.0, 248.0, 110.0, 83.0, 55.0, 44.0, 32.0, 15.0, 17.0, 15.0, 10.0, 7.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.140625, -4.0205078125, -3.900390625, -3.7802734375, -3.66015625, -3.5400390625, -3.419921875, -3.2998046875, -3.1796875, -3.0595703125, -2.939453125, -2.8193359375, -2.69921875, -2.5791015625, -2.458984375, -2.3388671875, -2.21875, -2.0986328125, -1.978515625, -1.8583984375, -1.73828125, -1.6181640625, -1.498046875, -1.3779296875, -1.2578125, -1.1376953125, -1.017578125, -0.8974609375, -0.77734375, -0.6572265625, -0.537109375, -0.4169921875, -0.296875, -0.1767578125, -0.056640625, 0.0634765625, 0.18359375, 0.3037109375, 0.423828125, 0.5439453125, 0.6640625, 0.7841796875, 0.904296875, 1.0244140625, 1.14453125, 1.2646484375, 1.384765625, 1.5048828125, 1.625, 1.7451171875, 1.865234375, 1.9853515625, 2.10546875, 2.2255859375, 2.345703125, 2.4658203125, 2.5859375, 2.7060546875, 2.826171875, 2.9462890625, 3.06640625, 3.1865234375, 3.306640625, 3.4267578125, 3.546875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 9.0, 17.0, 17.0, 15.0, 17.0, 26.0, 37.0, 26.0, 51.0, 54.0, 64.0, 52.0, 69.0, 79.0, 71.0, 53.0, 50.0, 43.0, 44.0, 45.0, 41.0, 29.0, 22.0, 22.0, 11.0, 10.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.53662109375, -0.5196609497070312, -0.5027008056640625, -0.48574066162109375, -0.468780517578125, -0.45182037353515625, -0.4348602294921875, -0.41790008544921875, -0.40093994140625, -0.38397979736328125, -0.3670196533203125, -0.35005950927734375, -0.333099365234375, -0.31613922119140625, -0.2991790771484375, -0.28221893310546875, -0.2652587890625, -0.24829864501953125, -0.2313385009765625, -0.21437835693359375, -0.197418212890625, -0.18045806884765625, -0.1634979248046875, -0.14653778076171875, -0.12957763671875, -0.11261749267578125, -0.0956573486328125, -0.07869720458984375, -0.061737060546875, -0.04477691650390625, -0.0278167724609375, -0.01085662841796875, 0.006103515625, 0.02306365966796875, 0.0400238037109375, 0.05698394775390625, 0.073944091796875, 0.09090423583984375, 0.1078643798828125, 0.12482452392578125, 0.14178466796875, 0.15874481201171875, 0.1757049560546875, 0.19266510009765625, 0.209625244140625, 0.22658538818359375, 0.2435455322265625, 0.26050567626953125, 0.2774658203125, 0.29442596435546875, 0.3113861083984375, 0.32834625244140625, 0.345306396484375, 0.36226654052734375, 0.3792266845703125, 0.39618682861328125, 0.41314697265625, 0.43010711669921875, 0.4470672607421875, 0.46402740478515625, 0.480987548828125, 0.49794769287109375, 0.5149078369140625, 0.5318679809570312, 0.548828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 18.0, 20.0, 31.0, 46.0, 72.0, 134.0, 207.0, 381.0, 685.0, 1373.0, 2818.0, 6995.0, 21173.0, 96751.0, 3620301.0, 379282.0, 43344.0, 12034.0, 4462.0, 1920.0, 991.0, 540.0, 260.0, 156.0, 100.0, 60.0, 41.0, 23.0, 25.0, 9.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.474273681640625, -3.37432861328125, -3.274383544921875, -3.1744384765625, -3.074493408203125, -2.97454833984375, -2.874603271484375, -2.774658203125, -2.674713134765625, -2.57476806640625, -2.474822998046875, -2.3748779296875, -2.274932861328125, -2.17498779296875, -2.075042724609375, -1.97509765625, -1.875152587890625, -1.77520751953125, -1.675262451171875, -1.5753173828125, -1.475372314453125, -1.37542724609375, -1.275482177734375, -1.175537109375, -1.075592041015625, -0.97564697265625, -0.875701904296875, -0.7757568359375, -0.675811767578125, -0.57586669921875, -0.475921630859375, -0.3759765625, -0.276031494140625, -0.17608642578125, -0.076141357421875, 0.0238037109375, 0.123748779296875, 0.22369384765625, 0.323638916015625, 0.423583984375, 0.523529052734375, 0.62347412109375, 0.723419189453125, 0.8233642578125, 0.923309326171875, 1.02325439453125, 1.123199462890625, 1.22314453125, 1.323089599609375, 1.42303466796875, 1.522979736328125, 1.6229248046875, 1.722869873046875, 1.82281494140625, 1.922760009765625, 2.022705078125, 2.122650146484375, 2.22259521484375, 2.322540283203125, 2.4224853515625, 2.522430419921875, 2.62237548828125, 2.722320556640625, 2.822265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 5.0, 7.0, 12.0, 14.0, 17.0, 24.0, 43.0, 48.0, 97.0, 193.0, 598.0, 2221.0, 374.0, 134.0, 79.0, 49.0, 30.0, 27.0, 20.0, 16.0, 7.0, 9.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.142578125, -1.1022491455078125, -1.061920166015625, -1.0215911865234375, -0.98126220703125, -0.9409332275390625, -0.900604248046875, -0.8602752685546875, -0.8199462890625, -0.7796173095703125, -0.739288330078125, -0.6989593505859375, -0.65863037109375, -0.6183013916015625, -0.577972412109375, -0.5376434326171875, -0.497314453125, -0.4569854736328125, -0.416656494140625, -0.3763275146484375, -0.33599853515625, -0.2956695556640625, -0.255340576171875, -0.2150115966796875, -0.1746826171875, -0.1343536376953125, -0.094024658203125, -0.0536956787109375, -0.01336669921875, 0.0269622802734375, 0.067291259765625, 0.1076202392578125, 0.14794921875, 0.1882781982421875, 0.228607177734375, 0.2689361572265625, 0.30926513671875, 0.3495941162109375, 0.389923095703125, 0.4302520751953125, 0.4705810546875, 0.5109100341796875, 0.551239013671875, 0.5915679931640625, 0.63189697265625, 0.6722259521484375, 0.712554931640625, 0.7528839111328125, 0.793212890625, 0.8335418701171875, 0.873870849609375, 0.9141998291015625, 0.95452880859375, 0.9948577880859375, 1.035186767578125, 1.0755157470703125, 1.1158447265625, 1.1561737060546875, 1.196502685546875, 1.2368316650390625, 1.27716064453125, 1.3174896240234375, 1.357818603515625, 1.3981475830078125, 1.4384765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 15.0, 6.0, 33.0, 78.0, 180.0, 257.0, 222.0, 123.0, 50.0, 15.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.920326232910156, -14.491230010986328, -14.062132835388184, -13.633036613464355, -13.203940391540527, -12.774843215942383, -12.345746994018555, -11.916650772094727, -11.487554550170898, -11.05845832824707, -10.629361152648926, -10.200264930725098, -9.77116870880127, -9.342071533203125, -8.912975311279297, -8.483879089355469, -8.054781913757324, -7.625685214996338, -7.19658899307251, -6.767492294311523, -6.338396072387695, -5.909299373626709, -5.480202674865723, -5.0511064529418945, -4.622009754180908, -4.192913055419922, -3.7638168334960938, -3.3347201347351074, -2.9056236743927, -2.476527214050293, -2.0474305152893066, -1.6183340549468994, -1.1892375946044922, -0.7601410746574402, -0.3310445547103882, 0.0980520248413086, 0.5271484851837158, 0.956244945526123, 1.3853416442871094, 1.8144381046295166, 2.243534564971924, 2.672631025314331, 3.1017274856567383, 3.5308241844177246, 3.959920644760132, 4.389017105102539, 4.818113803863525, 5.247210502624512, 5.67630672454834, 6.105403423309326, 6.534499645233154, 6.963596343994141, 7.392692565917969, 7.821789264678955, 8.250885963439941, 8.67998218536377, 9.109079360961914, 9.538175582885742, 9.967272758483887, 10.396368980407715, 10.825465202331543, 11.254562377929688, 11.683658599853516, 12.112754821777344, 12.541851043701172]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 8.0, 17.0, 6.0, 12.0, 21.0, 14.0, 15.0, 18.0, 21.0, 32.0, 25.0, 43.0, 38.0, 38.0, 26.0, 41.0, 47.0, 26.0, 38.0, 44.0, 37.0, 29.0, 47.0, 29.0, 47.0, 32.0, 28.0, 27.0, 28.0, 21.0, 13.0, 14.0, 19.0, 10.0, 10.0, 15.0, 9.0, 4.0, 7.0, 5.0, 5.0, 1.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-3.4667015075683594, -3.363508939743042, -3.2603163719177246, -3.157123565673828, -3.0539309978485107, -2.9507384300231934, -2.847545862197876, -2.7443532943725586, -2.641160726547241, -2.537968158721924, -2.4347755908966064, -2.331583023071289, -2.2283902168273926, -2.125197649002075, -2.022005081176758, -1.9188125133514404, -1.8156198263168335, -1.7124272584915161, -1.6092345714569092, -1.5060420036315918, -1.4028494358062744, -1.299656867980957, -1.19646418094635, -1.0932716131210327, -0.9900789856910706, -0.8868863582611084, -0.783693790435791, -0.6805011630058289, -0.5773085355758667, -0.4741159677505493, -0.37092334032058716, -0.2677307724952698, -0.16453814506530762, -0.06134553998708725, 0.04184706509113312, 0.14503967761993408, 0.24823227524757385, 0.3514248728752136, 0.4546175003051758, 0.5578100681304932, 0.6610026955604553, 0.7641953229904175, 0.8673878908157349, 0.970580518245697, 1.0737731456756592, 1.1769657135009766, 1.280158281326294, 1.3833508491516113, 1.4865435361862183, 1.5897361040115356, 1.6929287910461426, 1.79612135887146, 1.8993139266967773, 2.0025064945220947, 2.105699062347412, 2.2088918685913086, 2.312084436416626, 2.4152770042419434, 2.5184695720672607, 2.621662139892578, 2.7248549461364746, 2.828047513961792, 2.9312400817871094, 3.0344326496124268, 3.137625217437744]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 10.0, 6.0, 18.0, 24.0, 20.0, 33.0, 71.0, 101.0, 135.0, 207.0, 343.0, 539.0, 897.0, 1849.0, 4229.0, 11004.0, 33464.0, 116797.0, 377571.0, 349159.0, 104442.0, 29820.0, 9929.0, 3844.0, 1810.0, 878.0, 449.0, 299.0, 197.0, 118.0, 88.0, 58.0, 49.0, 25.0, 22.0, 13.0, 13.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.68359375, -2.599609375, -2.515625, -2.431640625, -2.34765625, -2.263671875, -2.1796875, -2.095703125, -2.01171875, -1.927734375, -1.84375, -1.759765625, -1.67578125, -1.591796875, -1.5078125, -1.423828125, -1.33984375, -1.255859375, -1.171875, -1.087890625, -1.00390625, -0.919921875, -0.8359375, -0.751953125, -0.66796875, -0.583984375, -0.5, -0.416015625, -0.33203125, -0.248046875, -0.1640625, -0.080078125, 0.00390625, 0.087890625, 0.171875, 0.255859375, 0.33984375, 0.423828125, 0.5078125, 0.591796875, 0.67578125, 0.759765625, 0.84375, 0.927734375, 1.01171875, 1.095703125, 1.1796875, 1.263671875, 1.34765625, 1.431640625, 1.515625, 1.599609375, 1.68359375, 1.767578125, 1.8515625, 1.935546875, 2.01953125, 2.103515625, 2.1875, 2.271484375, 2.35546875, 2.439453125, 2.5234375, 2.607421875, 2.69140625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 11.0, 12.0, 26.0, 29.0, 30.0, 49.0, 36.0, 49.0, 53.0, 56.0, 60.0, 59.0, 65.0, 58.0, 48.0, 63.0, 58.0, 40.0, 34.0, 33.0, 19.0, 23.0, 23.0, 15.0, 10.0, 10.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.54345703125, -0.5260696411132812, -0.5086822509765625, -0.49129486083984375, -0.473907470703125, -0.45652008056640625, -0.4391326904296875, -0.42174530029296875, -0.40435791015625, -0.38697052001953125, -0.3695831298828125, -0.35219573974609375, -0.334808349609375, -0.31742095947265625, -0.3000335693359375, -0.28264617919921875, -0.2652587890625, -0.24787139892578125, -0.2304840087890625, -0.21309661865234375, -0.195709228515625, -0.17832183837890625, -0.1609344482421875, -0.14354705810546875, -0.12615966796875, -0.10877227783203125, -0.0913848876953125, -0.07399749755859375, -0.056610107421875, -0.03922271728515625, -0.0218353271484375, -0.00444793701171875, 0.012939453125, 0.03032684326171875, 0.0477142333984375, 0.06510162353515625, 0.082489013671875, 0.09987640380859375, 0.1172637939453125, 0.13465118408203125, 0.15203857421875, 0.16942596435546875, 0.1868133544921875, 0.20420074462890625, 0.221588134765625, 0.23897552490234375, 0.2563629150390625, 0.27375030517578125, 0.2911376953125, 0.30852508544921875, 0.3259124755859375, 0.34329986572265625, 0.360687255859375, 0.37807464599609375, 0.3954620361328125, 0.41284942626953125, 0.43023681640625, 0.44762420654296875, 0.4650115966796875, 0.48239898681640625, 0.499786376953125, 0.5171737670898438, 0.5345611572265625, 0.5519485473632812, 0.5693359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 4.0, 6.0, 23.0, 24.0, 41.0, 49.0, 88.0, 155.0, 247.0, 498.0, 956.0, 2147.0, 5759.0, 16654.0, 55956.0, 218752.0, 492267.0, 183621.0, 47905.0, 14372.0, 5103.0, 1951.0, 923.0, 445.0, 253.0, 117.0, 97.0, 48.0, 35.0, 19.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.177337646484375, -2.10076904296875, -2.024200439453125, -1.9476318359375, -1.871063232421875, -1.79449462890625, -1.717926025390625, -1.641357421875, -1.564788818359375, -1.48822021484375, -1.411651611328125, -1.3350830078125, -1.258514404296875, -1.18194580078125, -1.105377197265625, -1.02880859375, -0.952239990234375, -0.87567138671875, -0.799102783203125, -0.7225341796875, -0.645965576171875, -0.56939697265625, -0.492828369140625, -0.416259765625, -0.339691162109375, -0.26312255859375, -0.186553955078125, -0.1099853515625, -0.033416748046875, 0.04315185546875, 0.119720458984375, 0.1962890625, 0.272857666015625, 0.34942626953125, 0.425994873046875, 0.5025634765625, 0.579132080078125, 0.65570068359375, 0.732269287109375, 0.808837890625, 0.885406494140625, 0.96197509765625, 1.038543701171875, 1.1151123046875, 1.191680908203125, 1.26824951171875, 1.344818115234375, 1.42138671875, 1.497955322265625, 1.57452392578125, 1.651092529296875, 1.7276611328125, 1.804229736328125, 1.88079833984375, 1.957366943359375, 2.033935546875, 2.110504150390625, 2.18707275390625, 2.263641357421875, 2.3402099609375, 2.416778564453125, 2.49334716796875, 2.569915771484375, 2.646484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 6.0, 8.0, 12.0, 13.0, 15.0, 15.0, 13.0, 27.0, 27.0, 33.0, 31.0, 37.0, 23.0, 49.0, 47.0, 46.0, 52.0, 47.0, 53.0, 49.0, 46.0, 40.0, 45.0, 37.0, 31.0, 25.0, 19.0, 21.0, 26.0, 16.0, 22.0, 9.0, 11.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.7626953125, -1.6974334716796875, -1.632171630859375, -1.5669097900390625, -1.50164794921875, -1.4363861083984375, -1.371124267578125, -1.3058624267578125, -1.2406005859375, -1.1753387451171875, -1.110076904296875, -1.0448150634765625, -0.97955322265625, -0.9142913818359375, -0.849029541015625, -0.7837677001953125, -0.718505859375, -0.6532440185546875, -0.587982177734375, -0.5227203369140625, -0.45745849609375, -0.3921966552734375, -0.326934814453125, -0.2616729736328125, -0.1964111328125, -0.1311492919921875, -0.065887451171875, -0.0006256103515625, 0.06463623046875, 0.1298980712890625, 0.195159912109375, 0.2604217529296875, 0.32568359375, 0.3909454345703125, 0.456207275390625, 0.5214691162109375, 0.58673095703125, 0.6519927978515625, 0.717254638671875, 0.7825164794921875, 0.8477783203125, 0.9130401611328125, 0.978302001953125, 1.0435638427734375, 1.10882568359375, 1.1740875244140625, 1.239349365234375, 1.3046112060546875, 1.369873046875, 1.4351348876953125, 1.500396728515625, 1.5656585693359375, 1.63092041015625, 1.6961822509765625, 1.761444091796875, 1.8267059326171875, 1.8919677734375, 1.9572296142578125, 2.022491455078125, 2.0877532958984375, 2.15301513671875, 2.2182769775390625, 2.283538818359375, 2.3488006591796875, 2.4140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 3.0, 10.0, 21.0, 36.0, 55.0, 125.0, 232.0, 497.0, 998.0, 2678.0, 8101.0, 35122.0, 248874.0, 622199.0, 103412.0, 18013.0, 4964.0, 1719.0, 748.0, 367.0, 178.0, 80.0, 41.0, 30.0, 17.0, 7.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.5178985595703125, -1.469390869140625, -1.4208831787109375, -1.37237548828125, -1.3238677978515625, -1.275360107421875, -1.2268524169921875, -1.1783447265625, -1.1298370361328125, -1.081329345703125, -1.0328216552734375, -0.98431396484375, -0.9358062744140625, -0.887298583984375, -0.8387908935546875, -0.790283203125, -0.7417755126953125, -0.693267822265625, -0.6447601318359375, -0.59625244140625, -0.5477447509765625, -0.499237060546875, -0.4507293701171875, -0.4022216796875, -0.3537139892578125, -0.305206298828125, -0.2566986083984375, -0.20819091796875, -0.1596832275390625, -0.111175537109375, -0.0626678466796875, -0.01416015625, 0.0343475341796875, 0.082855224609375, 0.1313629150390625, 0.17987060546875, 0.2283782958984375, 0.276885986328125, 0.3253936767578125, 0.3739013671875, 0.4224090576171875, 0.470916748046875, 0.5194244384765625, 0.56793212890625, 0.6164398193359375, 0.664947509765625, 0.7134552001953125, 0.761962890625, 0.8104705810546875, 0.858978271484375, 0.9074859619140625, 0.95599365234375, 1.0045013427734375, 1.053009033203125, 1.1015167236328125, 1.1500244140625, 1.1985321044921875, 1.247039794921875, 1.2955474853515625, 1.34405517578125, 1.3925628662109375, 1.441070556640625, 1.4895782470703125, 1.5380859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 12.0, 13.0, 16.0, 30.0, 29.0, 51.0, 57.0, 88.0, 129.0, 155.0, 122.0, 88.0, 61.0, 38.0, 27.0, 24.0, 17.0, 16.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002906322479248047, -0.00028218701481819153, -0.00027374178171157837, -0.0002652965486049652, -0.00025685131549835205, -0.0002484060823917389, -0.00023996084928512573, -0.00023151561617851257, -0.00022307038307189941, -0.00021462514996528625, -0.0002061799168586731, -0.00019773468375205994, -0.00018928945064544678, -0.00018084421753883362, -0.00017239898443222046, -0.0001639537513256073, -0.00015550851821899414, -0.00014706328511238098, -0.00013861805200576782, -0.00013017281889915466, -0.0001217275857925415, -0.00011328235268592834, -0.00010483711957931519, -9.639188647270203e-05, -8.794665336608887e-05, -7.950142025947571e-05, -7.105618715286255e-05, -6.261095404624939e-05, -5.416572093963623e-05, -4.572048783302307e-05, -3.727525472640991e-05, -2.8830021619796753e-05, -2.0384788513183594e-05, -1.1939555406570435e-05, -3.4943222999572754e-06, 4.950910806655884e-06, 1.3396143913269043e-05, 2.1841377019882202e-05, 3.028661012649536e-05, 3.873184323310852e-05, 4.717707633972168e-05, 5.562230944633484e-05, 6.4067542552948e-05, 7.251277565956116e-05, 8.095800876617432e-05, 8.940324187278748e-05, 9.784847497940063e-05, 0.0001062937080860138, 0.00011473894119262695, 0.0001231841742992401, 0.00013162940740585327, 0.00014007464051246643, 0.0001485198736190796, 0.00015696510672569275, 0.0001654103398323059, 0.00017385557293891907, 0.00018230080604553223, 0.00019074603915214539, 0.00019919127225875854, 0.0002076365053653717, 0.00021608173847198486, 0.00022452697157859802, 0.00023297220468521118, 0.00024141743779182434, 0.0002498626708984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 15.0, 11.0, 26.0, 36.0, 64.0, 132.0, 192.0, 312.0, 628.0, 1597.0, 4679.0, 20202.0, 159130.0, 708228.0, 128674.0, 17655.0, 4138.0, 1448.0, 658.0, 297.0, 146.0, 95.0, 52.0, 38.0, 23.0, 21.0, 12.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.181640625, -2.124908447265625, -2.06817626953125, -2.011444091796875, -1.9547119140625, -1.897979736328125, -1.84124755859375, -1.784515380859375, -1.727783203125, -1.671051025390625, -1.61431884765625, -1.557586669921875, -1.5008544921875, -1.444122314453125, -1.38739013671875, -1.330657958984375, -1.27392578125, -1.217193603515625, -1.16046142578125, -1.103729248046875, -1.0469970703125, -0.990264892578125, -0.93353271484375, -0.876800537109375, -0.820068359375, -0.763336181640625, -0.70660400390625, -0.649871826171875, -0.5931396484375, -0.536407470703125, -0.47967529296875, -0.422943115234375, -0.3662109375, -0.309478759765625, -0.25274658203125, -0.196014404296875, -0.1392822265625, -0.082550048828125, -0.02581787109375, 0.030914306640625, 0.087646484375, 0.144378662109375, 0.20111083984375, 0.257843017578125, 0.3145751953125, 0.371307373046875, 0.42803955078125, 0.484771728515625, 0.54150390625, 0.598236083984375, 0.65496826171875, 0.711700439453125, 0.7684326171875, 0.825164794921875, 0.88189697265625, 0.938629150390625, 0.995361328125, 1.052093505859375, 1.10882568359375, 1.165557861328125, 1.2222900390625, 1.279022216796875, 1.33575439453125, 1.392486572265625, 1.44921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 6.0, 11.0, 15.0, 15.0, 25.0, 35.0, 56.0, 62.0, 86.0, 107.0, 121.0, 87.0, 87.0, 69.0, 38.0, 50.0, 30.0, 11.0, 19.0, 17.0, 11.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1088104248046875, -1.063323974609375, -1.0178375244140625, -0.97235107421875, -0.9268646240234375, -0.881378173828125, -0.8358917236328125, -0.7904052734375, -0.7449188232421875, -0.699432373046875, -0.6539459228515625, -0.60845947265625, -0.5629730224609375, -0.517486572265625, -0.4720001220703125, -0.426513671875, -0.3810272216796875, -0.335540771484375, -0.2900543212890625, -0.24456787109375, -0.1990814208984375, -0.153594970703125, -0.1081085205078125, -0.0626220703125, -0.0171356201171875, 0.028350830078125, 0.0738372802734375, 0.11932373046875, 0.1648101806640625, 0.210296630859375, 0.2557830810546875, 0.30126953125, 0.3467559814453125, 0.392242431640625, 0.4377288818359375, 0.48321533203125, 0.5287017822265625, 0.574188232421875, 0.6196746826171875, 0.6651611328125, 0.7106475830078125, 0.756134033203125, 0.8016204833984375, 0.84710693359375, 0.8925933837890625, 0.938079833984375, 0.9835662841796875, 1.029052734375, 1.0745391845703125, 1.120025634765625, 1.1655120849609375, 1.21099853515625, 1.2564849853515625, 1.301971435546875, 1.3474578857421875, 1.3929443359375, 1.4384307861328125, 1.483917236328125, 1.5294036865234375, 1.57489013671875, 1.6203765869140625, 1.665863037109375, 1.7113494873046875, 1.7568359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 21.0, 13.0, 16.0, 39.0, 62.0, 71.0, 101.0, 108.0, 111.0, 103.0, 96.0, 80.0, 54.0, 33.0, 23.0, 12.0, 13.0, 11.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.366525650024414, -12.869441032409668, -12.372356414794922, -11.87527084350586, -11.378186225891113, -10.881101608276367, -10.384016036987305, -9.886931419372559, -9.389846801757812, -8.892762184143066, -8.39567756652832, -7.898591995239258, -7.401507377624512, -6.904422760009766, -6.407337665557861, -5.910252571105957, -5.413167953491211, -4.916083335876465, -4.4189982414245605, -3.9219133853912354, -3.42482852935791, -2.927743673324585, -2.4306588172912598, -1.9335739612579346, -1.4364891052246094, -0.9394042491912842, -0.442319393157959, 0.05476546287536621, 0.5518503189086914, 1.0489351749420166, 1.5460200309753418, 2.043104887008667, 2.540189743041992, 3.0372745990753174, 3.5343594551086426, 4.031444549560547, 4.528529167175293, 5.025613784790039, 5.522698879241943, 6.019783973693848, 6.516868591308594, 7.01395320892334, 7.511038303375244, 8.008123397827148, 8.505208015441895, 9.00229263305664, 9.499378204345703, 9.99646282196045, 10.493547439575195, 10.990632057189941, 11.487716674804688, 11.98480224609375, 12.481886863708496, 12.978971481323242, 13.476057052612305, 13.97314167022705, 14.470226287841797, 14.967310905456543, 15.464395523071289, 15.961481094360352, 16.45856475830078, 16.955650329589844, 17.452735900878906, 17.949819564819336, 18.4469051361084]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 13.0, 14.0, 10.0, 17.0, 8.0, 15.0, 26.0, 27.0, 31.0, 23.0, 40.0, 42.0, 42.0, 59.0, 43.0, 50.0, 61.0, 40.0, 48.0, 51.0, 32.0, 34.0, 37.0, 42.0, 20.0, 20.0, 23.0, 20.0, 17.0, 15.0, 11.0, 16.0, 6.0, 4.0, 7.0, 9.0, 4.0, 7.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.76424789428711, -9.410740852355957, -9.057234764099121, -8.703727722167969, -8.350220680236816, -7.996714115142822, -7.643207550048828, -7.289700508117676, -6.936193943023682, -6.5826873779296875, -6.229180335998535, -5.875673770904541, -5.522167205810547, -5.1686601638793945, -4.8151535987854, -4.461647033691406, -4.108139991760254, -3.7546331882476807, -3.4011263847351074, -3.0476198196411133, -2.69411301612854, -2.340606212615967, -1.9870996475219727, -1.6335928440093994, -1.2800860404968262, -0.9265792965888977, -0.5730725526809692, -0.21956586837768555, 0.1339409351348877, 0.48744773864746094, 0.8409543037414551, 1.1944611072540283, 1.5479679107666016, 1.9014747142791748, 2.254981517791748, 2.608488082885742, 2.9619948863983154, 3.3155016899108887, 3.669008255004883, 4.022515296936035, 4.376021862030029, 4.729528427124023, 5.083035469055176, 5.43654203414917, 5.790048599243164, 6.143555641174316, 6.4970622062683105, 6.850568771362305, 7.204075813293457, 7.557582378387451, 7.9110894203186035, 8.264595985412598, 8.61810302734375, 8.971609115600586, 9.325116157531738, 9.67862319946289, 10.032129287719727, 10.385636329650879, 10.739142417907715, 11.092649459838867, 11.44615650177002, 11.799663543701172, 12.153169631958008, 12.50667667388916, 12.860183715820312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 22.0, 58.0, 93.0, 135.0, 299.0, 578.0, 1294.0, 3091.0, 10447.0, 141955.0, 4011523.0, 17491.0, 4191.0, 1595.0, 711.0, 335.0, 184.0, 95.0, 66.0, 30.0, 27.0, 18.0, 12.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.24432373046875, -5.0511474609375, -4.85797119140625, -4.664794921875, -4.47161865234375, -4.2784423828125, -4.08526611328125, -3.89208984375, -3.69891357421875, -3.5057373046875, -3.31256103515625, -3.119384765625, -2.92620849609375, -2.7330322265625, -2.53985595703125, -2.3466796875, -2.15350341796875, -1.9603271484375, -1.76715087890625, -1.573974609375, -1.38079833984375, -1.1876220703125, -0.99444580078125, -0.80126953125, -0.60809326171875, -0.4149169921875, -0.22174072265625, -0.028564453125, 0.16461181640625, 0.3577880859375, 0.55096435546875, 0.744140625, 0.93731689453125, 1.1304931640625, 1.32366943359375, 1.516845703125, 1.71002197265625, 1.9031982421875, 2.09637451171875, 2.28955078125, 2.48272705078125, 2.6759033203125, 2.86907958984375, 3.062255859375, 3.25543212890625, 3.4486083984375, 3.64178466796875, 3.8349609375, 4.02813720703125, 4.2213134765625, 4.41448974609375, 4.607666015625, 4.80084228515625, 4.9940185546875, 5.18719482421875, 5.38037109375, 5.57354736328125, 5.7667236328125, 5.95989990234375, 6.153076171875, 6.34625244140625, 6.5394287109375, 6.73260498046875, 6.92578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 11.0, 11.0, 20.0, 18.0, 32.0, 32.0, 33.0, 38.0, 53.0, 34.0, 53.0, 58.0, 47.0, 58.0, 51.0, 63.0, 53.0, 45.0, 47.0, 27.0, 32.0, 29.0, 26.0, 30.0, 18.0, 18.0, 10.0, 11.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5556640625, -0.537628173828125, -0.51959228515625, -0.501556396484375, -0.4835205078125, -0.465484619140625, -0.44744873046875, -0.429412841796875, -0.411376953125, -0.393341064453125, -0.37530517578125, -0.357269287109375, -0.3392333984375, -0.321197509765625, -0.30316162109375, -0.285125732421875, -0.26708984375, -0.249053955078125, -0.23101806640625, -0.212982177734375, -0.1949462890625, -0.176910400390625, -0.15887451171875, -0.140838623046875, -0.122802734375, -0.104766845703125, -0.08673095703125, -0.068695068359375, -0.0506591796875, -0.032623291015625, -0.01458740234375, 0.003448486328125, 0.021484375, 0.039520263671875, 0.05755615234375, 0.075592041015625, 0.0936279296875, 0.111663818359375, 0.12969970703125, 0.147735595703125, 0.165771484375, 0.183807373046875, 0.20184326171875, 0.219879150390625, 0.2379150390625, 0.255950927734375, 0.27398681640625, 0.292022705078125, 0.31005859375, 0.328094482421875, 0.34613037109375, 0.364166259765625, 0.3822021484375, 0.400238037109375, 0.41827392578125, 0.436309814453125, 0.454345703125, 0.472381591796875, 0.49041748046875, 0.508453369140625, 0.5264892578125, 0.544525146484375, 0.56256103515625, 0.580596923828125, 0.5986328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 8.0, 16.0, 23.0, 32.0, 51.0, 74.0, 102.0, 152.0, 212.0, 322.0, 474.0, 772.0, 1144.0, 1957.0, 3675.0, 7920.0, 22343.0, 132063.0, 3928085.0, 65237.0, 15395.0, 6282.0, 3067.0, 1752.0, 1030.0, 671.0, 444.0, 307.0, 199.0, 147.0, 104.0, 75.0, 44.0, 29.0, 22.0, 20.0, 10.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.91375732421875, -2.8177490234375, -2.72174072265625, -2.625732421875, -2.52972412109375, -2.4337158203125, -2.33770751953125, -2.24169921875, -2.14569091796875, -2.0496826171875, -1.95367431640625, -1.857666015625, -1.76165771484375, -1.6656494140625, -1.56964111328125, -1.4736328125, -1.37762451171875, -1.2816162109375, -1.18560791015625, -1.089599609375, -0.99359130859375, -0.8975830078125, -0.80157470703125, -0.70556640625, -0.60955810546875, -0.5135498046875, -0.41754150390625, -0.321533203125, -0.22552490234375, -0.1295166015625, -0.03350830078125, 0.0625, 0.15850830078125, 0.2545166015625, 0.35052490234375, 0.446533203125, 0.54254150390625, 0.6385498046875, 0.73455810546875, 0.83056640625, 0.92657470703125, 1.0225830078125, 1.11859130859375, 1.214599609375, 1.31060791015625, 1.4066162109375, 1.50262451171875, 1.5986328125, 1.69464111328125, 1.7906494140625, 1.88665771484375, 1.982666015625, 2.07867431640625, 2.1746826171875, 2.27069091796875, 2.36669921875, 2.46270751953125, 2.5587158203125, 2.65472412109375, 2.750732421875, 2.84674072265625, 2.9427490234375, 3.03875732421875, 3.134765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 4.0, 11.0, 15.0, 19.0, 41.0, 60.0, 146.0, 3015.0, 497.0, 99.0, 43.0, 34.0, 17.0, 12.0, 8.0, 4.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5432052612304688, -0.5243988037109375, -0.5055923461914062, -0.486785888671875, -0.46797943115234375, -0.4491729736328125, -0.43036651611328125, -0.41156005859375, -0.39275360107421875, -0.3739471435546875, -0.35514068603515625, -0.336334228515625, -0.31752777099609375, -0.2987213134765625, -0.27991485595703125, -0.2611083984375, -0.24230194091796875, -0.2234954833984375, -0.20468902587890625, -0.185882568359375, -0.16707611083984375, -0.1482696533203125, -0.12946319580078125, -0.11065673828125, -0.09185028076171875, -0.0730438232421875, -0.05423736572265625, -0.035430908203125, -0.01662445068359375, 0.0021820068359375, 0.02098846435546875, 0.039794921875, 0.05860137939453125, 0.0774078369140625, 0.09621429443359375, 0.115020751953125, 0.13382720947265625, 0.1526336669921875, 0.17144012451171875, 0.19024658203125, 0.20905303955078125, 0.2278594970703125, 0.24666595458984375, 0.265472412109375, 0.28427886962890625, 0.3030853271484375, 0.32189178466796875, 0.3406982421875, 0.35950469970703125, 0.3783111572265625, 0.39711761474609375, 0.415924072265625, 0.43473052978515625, 0.4535369873046875, 0.47234344482421875, 0.49114990234375, 0.5099563598632812, 0.5287628173828125, 0.5475692749023438, 0.566375732421875, 0.5851821899414062, 0.6039886474609375, 0.6227951049804688, 0.6416015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 10.0, 14.0, 24.0, 39.0, 72.0, 101.0, 138.0, 140.0, 122.0, 104.0, 82.0, 56.0, 34.0, 25.0, 16.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5385429859161377, -3.4232499599456787, -3.3079566955566406, -3.1926636695861816, -3.0773706436157227, -2.9620776176452637, -2.8467845916748047, -2.7314913272857666, -2.6161983013153076, -2.5009052753448486, -2.3856120109558105, -2.2703189849853516, -2.1550259590148926, -2.0397329330444336, -1.924439787864685, -1.8091466426849365, -1.6938536167144775, -1.5785605907440186, -1.46326744556427, -1.3479743003845215, -1.2326812744140625, -1.1173882484436035, -1.002095103263855, -0.8868020176887512, -0.7715089321136475, -0.6562158465385437, -0.5409227609634399, -0.4256296753883362, -0.3103365898132324, -0.19504350423812866, -0.0797504186630249, 0.03554266691207886, 0.15083599090576172, 0.2661290764808655, 0.38142216205596924, 0.496715247631073, 0.6120083332061768, 0.7273014187812805, 0.8425945043563843, 0.957887589931488, 1.0731806755065918, 1.1884737014770508, 1.3037668466567993, 1.4190599918365479, 1.5343530178070068, 1.6496460437774658, 1.7649391889572144, 1.880232334136963, 1.9955253601074219, 2.110818386077881, 2.22611141204834, 2.341404676437378, 2.456697702407837, 2.571990728378296, 2.687283992767334, 2.802577018737793, 2.917870044708252, 3.033163070678711, 3.14845609664917, 3.263749361038208, 3.379042387008667, 3.494335412979126, 3.609628677368164, 3.724921703338623, 3.840214729309082]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 10.0, 14.0, 7.0, 10.0, 20.0, 21.0, 23.0, 22.0, 16.0, 28.0, 31.0, 36.0, 41.0, 33.0, 31.0, 50.0, 33.0, 38.0, 53.0, 46.0, 39.0, 22.0, 43.0, 34.0, 42.0, 34.0, 27.0, 25.0, 26.0, 26.0, 16.0, 19.0, 15.0, 13.0, 10.0, 7.0, 9.0, 4.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.326143503189087, -1.2843542098999023, -1.2425650358200073, -1.2007757425308228, -1.1589865684509277, -1.1171972751617432, -1.0754081010818481, -1.0336188077926636, -0.9918296337127686, -0.9500404000282288, -0.908251166343689, -0.8664619326591492, -0.8246726989746094, -0.7828834652900696, -0.7410942316055298, -0.6993049383163452, -0.6575157046318054, -0.6157264709472656, -0.5739372372627258, -0.532148003578186, -0.49035876989364624, -0.44856953620910645, -0.40678027272224426, -0.36499103903770447, -0.3232018053531647, -0.2814125716686249, -0.23962333798408508, -0.1978340893983841, -0.1560448557138443, -0.1142556220293045, -0.07246637344360352, -0.03067713975906372, 0.011112093925476074, 0.05290133133530617, 0.09469056874513626, 0.13647980988025665, 0.17826904356479645, 0.22005827724933624, 0.26184752583503723, 0.303636759519577, 0.3454259932041168, 0.3872152268886566, 0.4290044605731964, 0.4707937240600586, 0.5125829577445984, 0.5543721914291382, 0.596161425113678, 0.6379506587982178, 0.6797398924827576, 0.7215291261672974, 0.7633183598518372, 0.805107593536377, 0.8468968272209167, 0.8886860609054565, 0.9304753541946411, 0.9722645282745361, 1.0140538215637207, 1.0558431148529053, 1.0976322889328003, 1.1394215822219849, 1.1812107563018799, 1.2230000495910645, 1.2647892236709595, 1.306578516960144, 1.348367691040039]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 4.0, 6.0, 3.0, 7.0, 7.0, 17.0, 24.0, 28.0, 46.0, 64.0, 97.0, 123.0, 183.0, 287.0, 494.0, 747.0, 1404.0, 2528.0, 4816.0, 9699.0, 21099.0, 47029.0, 107881.0, 215145.0, 279670.0, 191212.0, 90952.0, 39527.0, 17562.0, 8350.0, 4192.0, 2195.0, 1218.0, 705.0, 421.0, 276.0, 162.0, 107.0, 76.0, 54.0, 32.0, 33.0, 17.0, 17.0, 11.0, 12.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0], "bins": [-2.09765625, -2.0366668701171875, -1.975677490234375, -1.9146881103515625, -1.85369873046875, -1.7927093505859375, -1.731719970703125, -1.6707305908203125, -1.6097412109375, -1.5487518310546875, -1.487762451171875, -1.4267730712890625, -1.36578369140625, -1.3047943115234375, -1.243804931640625, -1.1828155517578125, -1.121826171875, -1.0608367919921875, -0.999847412109375, -0.9388580322265625, -0.87786865234375, -0.8168792724609375, -0.755889892578125, -0.6949005126953125, -0.6339111328125, -0.5729217529296875, -0.511932373046875, -0.4509429931640625, -0.38995361328125, -0.3289642333984375, -0.267974853515625, -0.2069854736328125, -0.14599609375, -0.0850067138671875, -0.024017333984375, 0.0369720458984375, 0.09796142578125, 0.1589508056640625, 0.219940185546875, 0.2809295654296875, 0.3419189453125, 0.4029083251953125, 0.463897705078125, 0.5248870849609375, 0.58587646484375, 0.6468658447265625, 0.707855224609375, 0.7688446044921875, 0.829833984375, 0.8908233642578125, 0.951812744140625, 1.0128021240234375, 1.07379150390625, 1.1347808837890625, 1.195770263671875, 1.2567596435546875, 1.3177490234375, 1.3787384033203125, 1.439727783203125, 1.5007171630859375, 1.56170654296875, 1.6226959228515625, 1.683685302734375, 1.7446746826171875, 1.8056640625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 9.0, 11.0, 8.0, 18.0, 13.0, 26.0, 21.0, 35.0, 36.0, 31.0, 32.0, 41.0, 44.0, 56.0, 35.0, 45.0, 58.0, 48.0, 44.0, 56.0, 47.0, 49.0, 32.0, 33.0, 33.0, 21.0, 19.0, 23.0, 17.0, 15.0, 8.0, 12.0, 5.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5556640625, -0.5374526977539062, -0.5192413330078125, -0.5010299682617188, -0.482818603515625, -0.46460723876953125, -0.4463958740234375, -0.42818450927734375, -0.40997314453125, -0.39176177978515625, -0.3735504150390625, -0.35533905029296875, -0.337127685546875, -0.31891632080078125, -0.3007049560546875, -0.28249359130859375, -0.2642822265625, -0.24607086181640625, -0.2278594970703125, -0.20964813232421875, -0.191436767578125, -0.17322540283203125, -0.1550140380859375, -0.13680267333984375, -0.11859130859375, -0.10037994384765625, -0.0821685791015625, -0.06395721435546875, -0.045745849609375, -0.02753448486328125, -0.0093231201171875, 0.00888824462890625, 0.027099609375, 0.04531097412109375, 0.0635223388671875, 0.08173370361328125, 0.099945068359375, 0.11815643310546875, 0.1363677978515625, 0.15457916259765625, 0.17279052734375, 0.19100189208984375, 0.2092132568359375, 0.22742462158203125, 0.245635986328125, 0.26384735107421875, 0.2820587158203125, 0.30027008056640625, 0.3184814453125, 0.33669281005859375, 0.3549041748046875, 0.37311553955078125, 0.391326904296875, 0.40953826904296875, 0.4277496337890625, 0.44596099853515625, 0.46417236328125, 0.48238372802734375, 0.5005950927734375, 0.5188064575195312, 0.537017822265625, 0.5552291870117188, 0.5734405517578125, 0.5916519165039062, 0.60986328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 4.0, 4.0, 8.0, 9.0, 17.0, 19.0, 27.0, 48.0, 74.0, 129.0, 228.0, 486.0, 1101.0, 2948.0, 8414.0, 29370.0, 124487.0, 479158.0, 305398.0, 69884.0, 17785.0, 5361.0, 1898.0, 822.0, 353.0, 189.0, 116.0, 78.0, 45.0, 27.0, 19.0, 14.0, 7.0, 6.0, 7.0, 8.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.76910400390625, -2.6729736328125, -2.57684326171875, -2.480712890625, -2.38458251953125, -2.2884521484375, -2.19232177734375, -2.09619140625, -2.00006103515625, -1.9039306640625, -1.80780029296875, -1.711669921875, -1.61553955078125, -1.5194091796875, -1.42327880859375, -1.3271484375, -1.23101806640625, -1.1348876953125, -1.03875732421875, -0.942626953125, -0.84649658203125, -0.7503662109375, -0.65423583984375, -0.55810546875, -0.46197509765625, -0.3658447265625, -0.26971435546875, -0.173583984375, -0.07745361328125, 0.0186767578125, 0.11480712890625, 0.2109375, 0.30706787109375, 0.4031982421875, 0.49932861328125, 0.595458984375, 0.69158935546875, 0.7877197265625, 0.88385009765625, 0.97998046875, 1.07611083984375, 1.1722412109375, 1.26837158203125, 1.364501953125, 1.46063232421875, 1.5567626953125, 1.65289306640625, 1.7490234375, 1.84515380859375, 1.9412841796875, 2.03741455078125, 2.133544921875, 2.22967529296875, 2.3258056640625, 2.42193603515625, 2.51806640625, 2.61419677734375, 2.7103271484375, 2.80645751953125, 2.902587890625, 2.99871826171875, 3.0948486328125, 3.19097900390625, 3.287109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 13.0, 10.0, 17.0, 21.0, 19.0, 30.0, 34.0, 40.0, 52.0, 50.0, 55.0, 70.0, 63.0, 57.0, 60.0, 64.0, 54.0, 54.0, 46.0, 36.0, 31.0, 26.0, 21.0, 15.0, 14.0, 13.0, 14.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.69140625, -4.574737548828125, -4.45806884765625, -4.341400146484375, -4.2247314453125, -4.108062744140625, -3.99139404296875, -3.874725341796875, -3.758056640625, -3.641387939453125, -3.52471923828125, -3.408050537109375, -3.2913818359375, -3.174713134765625, -3.05804443359375, -2.941375732421875, -2.82470703125, -2.708038330078125, -2.59136962890625, -2.474700927734375, -2.3580322265625, -2.241363525390625, -2.12469482421875, -2.008026123046875, -1.891357421875, -1.774688720703125, -1.65802001953125, -1.541351318359375, -1.4246826171875, -1.308013916015625, -1.19134521484375, -1.074676513671875, -0.9580078125, -0.841339111328125, -0.72467041015625, -0.608001708984375, -0.4913330078125, -0.374664306640625, -0.25799560546875, -0.141326904296875, -0.024658203125, 0.092010498046875, 0.20867919921875, 0.325347900390625, 0.4420166015625, 0.558685302734375, 0.67535400390625, 0.792022705078125, 0.90869140625, 1.025360107421875, 1.14202880859375, 1.258697509765625, 1.3753662109375, 1.492034912109375, 1.60870361328125, 1.725372314453125, 1.842041015625, 1.958709716796875, 2.07537841796875, 2.192047119140625, 2.3087158203125, 2.425384521484375, 2.54205322265625, 2.658721923828125, 2.775390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 5.0, 9.0, 23.0, 21.0, 35.0, 53.0, 83.0, 168.0, 273.0, 695.0, 1768.0, 6403.0, 37264.0, 591485.0, 374327.0, 27920.0, 5268.0, 1462.0, 628.0, 260.0, 153.0, 69.0, 46.0, 26.0, 27.0, 20.0, 10.0, 9.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.146484375, -3.053741455078125, -2.96099853515625, -2.868255615234375, -2.7755126953125, -2.682769775390625, -2.59002685546875, -2.497283935546875, -2.404541015625, -2.311798095703125, -2.21905517578125, -2.126312255859375, -2.0335693359375, -1.940826416015625, -1.84808349609375, -1.755340576171875, -1.66259765625, -1.569854736328125, -1.47711181640625, -1.384368896484375, -1.2916259765625, -1.198883056640625, -1.10614013671875, -1.013397216796875, -0.920654296875, -0.827911376953125, -0.73516845703125, -0.642425537109375, -0.5496826171875, -0.456939697265625, -0.36419677734375, -0.271453857421875, -0.1787109375, -0.085968017578125, 0.00677490234375, 0.099517822265625, 0.1922607421875, 0.285003662109375, 0.37774658203125, 0.470489501953125, 0.563232421875, 0.655975341796875, 0.74871826171875, 0.841461181640625, 0.9342041015625, 1.026947021484375, 1.11968994140625, 1.212432861328125, 1.30517578125, 1.397918701171875, 1.49066162109375, 1.583404541015625, 1.6761474609375, 1.768890380859375, 1.86163330078125, 1.954376220703125, 2.047119140625, 2.139862060546875, 2.23260498046875, 2.325347900390625, 2.4180908203125, 2.510833740234375, 2.60357666015625, 2.696319580078125, 2.7890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 15.0, 13.0, 9.0, 21.0, 22.0, 29.0, 30.0, 47.0, 58.0, 68.0, 87.0, 81.0, 93.0, 85.0, 66.0, 57.0, 44.0, 30.0, 29.0, 26.0, 18.0, 9.0, 8.0, 10.0, 7.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.00023317337036132812, -0.00022704154253005981, -0.0002209097146987915, -0.0002147778868675232, -0.00020864605903625488, -0.00020251423120498657, -0.00019638240337371826, -0.00019025057554244995, -0.00018411874771118164, -0.00017798691987991333, -0.00017185509204864502, -0.0001657232642173767, -0.0001595914363861084, -0.0001534596085548401, -0.00014732778072357178, -0.00014119595289230347, -0.00013506412506103516, -0.00012893229722976685, -0.00012280046939849854, -0.00011666864156723022, -0.00011053681373596191, -0.0001044049859046936, -9.827315807342529e-05, -9.214133024215698e-05, -8.600950241088867e-05, -7.987767457962036e-05, -7.374584674835205e-05, -6.761401891708374e-05, -6.148219108581543e-05, -5.535036325454712e-05, -4.921853542327881e-05, -4.30867075920105e-05, -3.695487976074219e-05, -3.082305192947388e-05, -2.4691224098205566e-05, -1.8559396266937256e-05, -1.2427568435668945e-05, -6.295740604400635e-06, -1.6391277313232422e-07, 5.967915058135986e-06, 1.2099742889404297e-05, 1.8231570720672607e-05, 2.4363398551940918e-05, 3.049522638320923e-05, 3.662705421447754e-05, 4.275888204574585e-05, 4.889070987701416e-05, 5.502253770828247e-05, 6.115436553955078e-05, 6.728619337081909e-05, 7.34180212020874e-05, 7.954984903335571e-05, 8.568167686462402e-05, 9.181350469589233e-05, 9.794533252716064e-05, 0.00010407716035842896, 0.00011020898818969727, 0.00011634081602096558, 0.0001224726438522339, 0.0001286044716835022, 0.0001347362995147705, 0.00014086812734603882, 0.00014699995517730713, 0.00015313178300857544, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 17.0, 21.0, 30.0, 61.0, 78.0, 161.0, 296.0, 561.0, 1535.0, 4394.0, 18272.0, 124366.0, 732299.0, 138926.0, 19771.0, 4890.0, 1493.0, 628.0, 316.0, 181.0, 96.0, 57.0, 28.0, 15.0, 16.0, 17.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.328125, -2.2542724609375, -2.180419921875, -2.1065673828125, -2.03271484375, -1.9588623046875, -1.885009765625, -1.8111572265625, -1.7373046875, -1.6634521484375, -1.589599609375, -1.5157470703125, -1.44189453125, -1.3680419921875, -1.294189453125, -1.2203369140625, -1.146484375, -1.0726318359375, -0.998779296875, -0.9249267578125, -0.85107421875, -0.7772216796875, -0.703369140625, -0.6295166015625, -0.5556640625, -0.4818115234375, -0.407958984375, -0.3341064453125, -0.26025390625, -0.1864013671875, -0.112548828125, -0.0386962890625, 0.03515625, 0.1090087890625, 0.182861328125, 0.2567138671875, 0.33056640625, 0.4044189453125, 0.478271484375, 0.5521240234375, 0.6259765625, 0.6998291015625, 0.773681640625, 0.8475341796875, 0.92138671875, 0.9952392578125, 1.069091796875, 1.1429443359375, 1.216796875, 1.2906494140625, 1.364501953125, 1.4383544921875, 1.51220703125, 1.5860595703125, 1.659912109375, 1.7337646484375, 1.8076171875, 1.8814697265625, 1.955322265625, 2.0291748046875, 2.10302734375, 2.1768798828125, 2.250732421875, 2.3245849609375, 2.3984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 7.0, 9.0, 5.0, 11.0, 13.0, 9.0, 21.0, 24.0, 31.0, 47.0, 61.0, 104.0, 139.0, 138.0, 108.0, 66.0, 67.0, 36.0, 30.0, 23.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.29827880859375, -3.2117919921875, -3.12530517578125, -3.038818359375, -2.95233154296875, -2.8658447265625, -2.77935791015625, -2.69287109375, -2.60638427734375, -2.5198974609375, -2.43341064453125, -2.346923828125, -2.26043701171875, -2.1739501953125, -2.08746337890625, -2.0009765625, -1.91448974609375, -1.8280029296875, -1.74151611328125, -1.655029296875, -1.56854248046875, -1.4820556640625, -1.39556884765625, -1.30908203125, -1.22259521484375, -1.1361083984375, -1.04962158203125, -0.963134765625, -0.87664794921875, -0.7901611328125, -0.70367431640625, -0.6171875, -0.53070068359375, -0.4442138671875, -0.35772705078125, -0.271240234375, -0.18475341796875, -0.0982666015625, -0.01177978515625, 0.07470703125, 0.16119384765625, 0.2476806640625, 0.33416748046875, 0.420654296875, 0.50714111328125, 0.5936279296875, 0.68011474609375, 0.7666015625, 0.85308837890625, 0.9395751953125, 1.02606201171875, 1.112548828125, 1.19903564453125, 1.2855224609375, 1.37200927734375, 1.45849609375, 1.54498291015625, 1.6314697265625, 1.71795654296875, 1.804443359375, 1.89093017578125, 1.9774169921875, 2.06390380859375, 2.150390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 7.0, 11.0, 18.0, 46.0, 50.0, 126.0, 160.0, 172.0, 153.0, 119.0, 66.0, 40.0, 23.0, 10.0, 4.0, 2.0, 3.0], "bins": [-68.13705444335938, -66.88511657714844, -65.63318634033203, -64.3812484741211, -63.12931442260742, -61.87738037109375, -60.62544250488281, -59.37350845336914, -58.12157440185547, -56.8696403503418, -55.617706298828125, -54.36576843261719, -53.113834381103516, -51.861900329589844, -50.609962463378906, -49.358028411865234, -48.10609436035156, -46.85416030883789, -45.60222625732422, -44.35028839111328, -43.09835433959961, -41.84642028808594, -40.594482421875, -39.34254837036133, -38.090614318847656, -36.838680267333984, -35.58674621582031, -34.334808349609375, -33.0828742980957, -31.83094024658203, -30.579004287719727, -29.327068328857422, -28.075136184692383, -26.823200225830078, -25.571266174316406, -24.319332122802734, -23.06739616394043, -21.815460205078125, -20.563526153564453, -19.31159210205078, -18.059656143188477, -16.807720184326172, -15.5557861328125, -14.303851127624512, -13.051916122436523, -11.799981117248535, -10.548046112060547, -9.296111106872559, -8.04417610168457, -6.792241096496582, -5.540306091308594, -4.2883710861206055, -3.036436080932617, -1.784501075744629, -0.5325660705566406, 0.7193689346313477, 1.971303939819336, 3.223238945007324, 4.4751739501953125, 5.727108955383301, 6.979043960571289, 8.230978965759277, 9.482913970947266, 10.734848976135254, 11.986783981323242]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 1.0, 5.0, 3.0, 3.0, 3.0, 9.0, 13.0, 12.0, 23.0, 20.0, 35.0, 34.0, 23.0, 40.0, 46.0, 38.0, 58.0, 64.0, 58.0, 64.0, 68.0, 58.0, 47.0, 45.0, 32.0, 38.0, 25.0, 22.0, 26.0, 14.0, 14.0, 14.0, 9.0, 9.0, 5.0, 13.0, 4.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.822039604187012, -15.275516510009766, -14.728992462158203, -14.182469367980957, -13.635946273803711, -13.089422225952148, -12.542899131774902, -11.996376037597656, -11.449851989746094, -10.903328895568848, -10.356804847717285, -9.810281753540039, -9.263758659362793, -8.717235565185547, -8.170711517333984, -7.624188423156738, -7.077665328979492, -6.531141757965088, -5.984618663787842, -5.4380950927734375, -4.891571998596191, -4.345048427581787, -3.798524856567383, -3.2520015239715576, -2.7054781913757324, -2.1589548587799072, -1.6124314069747925, -1.0659079551696777, -0.5193846225738525, 0.027138710021972656, 0.573662281036377, 1.1201856136322021, 1.666707992553711, 2.213231325149536, 2.7597546577453613, 3.3062782287597656, 3.852801561355591, 4.399324893951416, 4.94584846496582, 5.492371559143066, 6.038895130157471, 6.585418701171875, 7.131941795349121, 7.678465366363525, 8.22498893737793, 8.771512031555176, 9.318035125732422, 9.864559173583984, 10.41108226776123, 10.957605361938477, 11.504129409790039, 12.050652503967285, 12.597175598144531, 13.143699645996094, 13.69022274017334, 14.236745834350586, 14.783269882202148, 15.329792976379395, 15.876317024230957, 16.422840118408203, 16.969364166259766, 17.515886306762695, 18.062410354614258, 18.60893440246582, 19.15545654296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 13.0, 23.0, 39.0, 74.0, 149.0, 397.0, 956.0, 2531.0, 10113.0, 152855.0, 4003942.0, 17367.0, 3673.0, 1172.0, 504.0, 183.0, 116.0, 62.0, 40.0, 16.0, 13.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.671875, -9.43682861328125, -9.2017822265625, -8.96673583984375, -8.731689453125, -8.49664306640625, -8.2615966796875, -8.02655029296875, -7.79150390625, -7.55645751953125, -7.3214111328125, -7.08636474609375, -6.851318359375, -6.61627197265625, -6.3812255859375, -6.14617919921875, -5.9111328125, -5.67608642578125, -5.4410400390625, -5.20599365234375, -4.970947265625, -4.73590087890625, -4.5008544921875, -4.26580810546875, -4.03076171875, -3.79571533203125, -3.5606689453125, -3.32562255859375, -3.090576171875, -2.85552978515625, -2.6204833984375, -2.38543701171875, -2.150390625, -1.91534423828125, -1.6802978515625, -1.44525146484375, -1.210205078125, -0.97515869140625, -0.7401123046875, -0.50506591796875, -0.27001953125, -0.03497314453125, 0.2000732421875, 0.43511962890625, 0.670166015625, 0.90521240234375, 1.1402587890625, 1.37530517578125, 1.6103515625, 1.84539794921875, 2.0804443359375, 2.31549072265625, 2.550537109375, 2.78558349609375, 3.0206298828125, 3.25567626953125, 3.49072265625, 3.72576904296875, 3.9608154296875, 4.19586181640625, 4.430908203125, 4.66595458984375, 4.9010009765625, 5.13604736328125, 5.37109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 0.0, 1.0, 5.0, 9.0, 8.0, 7.0, 7.0, 9.0, 20.0, 23.0, 21.0, 44.0, 39.0, 53.0, 64.0, 68.0, 59.0, 72.0, 73.0, 69.0, 67.0, 45.0, 47.0, 45.0, 29.0, 34.0, 21.0, 14.0, 18.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5556640625, -0.5292205810546875, -0.502777099609375, -0.4763336181640625, -0.44989013671875, -0.4234466552734375, -0.397003173828125, -0.3705596923828125, -0.3441162109375, -0.3176727294921875, -0.291229248046875, -0.2647857666015625, -0.23834228515625, -0.2118988037109375, -0.185455322265625, -0.1590118408203125, -0.132568359375, -0.1061248779296875, -0.079681396484375, -0.0532379150390625, -0.02679443359375, -0.0003509521484375, 0.026092529296875, 0.0525360107421875, 0.0789794921875, 0.1054229736328125, 0.131866455078125, 0.1583099365234375, 0.18475341796875, 0.2111968994140625, 0.237640380859375, 0.2640838623046875, 0.29052734375, 0.3169708251953125, 0.343414306640625, 0.3698577880859375, 0.39630126953125, 0.4227447509765625, 0.449188232421875, 0.4756317138671875, 0.5020751953125, 0.5285186767578125, 0.554962158203125, 0.5814056396484375, 0.60784912109375, 0.6342926025390625, 0.660736083984375, 0.6871795654296875, 0.713623046875, 0.7400665283203125, 0.766510009765625, 0.7929534912109375, 0.81939697265625, 0.8458404541015625, 0.872283935546875, 0.8987274169921875, 0.9251708984375, 0.9516143798828125, 0.978057861328125, 1.0045013427734375, 1.03094482421875, 1.0573883056640625, 1.083831787109375, 1.1102752685546875, 1.13671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 16.0, 28.0, 30.0, 51.0, 67.0, 110.0, 163.0, 225.0, 364.0, 506.0, 859.0, 1360.0, 2054.0, 3743.0, 7524.0, 17184.0, 54924.0, 3519421.0, 509083.0, 45460.0, 15385.0, 6782.0, 3474.0, 1962.0, 1215.0, 746.0, 487.0, 326.0, 242.0, 152.0, 98.0, 74.0, 43.0, 44.0, 28.0, 11.0, 10.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.95843505859375, -2.8348388671875, -2.71124267578125, -2.587646484375, -2.46405029296875, -2.3404541015625, -2.21685791015625, -2.09326171875, -1.96966552734375, -1.8460693359375, -1.72247314453125, -1.598876953125, -1.47528076171875, -1.3516845703125, -1.22808837890625, -1.1044921875, -0.98089599609375, -0.8572998046875, -0.73370361328125, -0.610107421875, -0.48651123046875, -0.3629150390625, -0.23931884765625, -0.11572265625, 0.00787353515625, 0.1314697265625, 0.25506591796875, 0.378662109375, 0.50225830078125, 0.6258544921875, 0.74945068359375, 0.873046875, 0.99664306640625, 1.1202392578125, 1.24383544921875, 1.367431640625, 1.49102783203125, 1.6146240234375, 1.73822021484375, 1.86181640625, 1.98541259765625, 2.1090087890625, 2.23260498046875, 2.356201171875, 2.47979736328125, 2.6033935546875, 2.72698974609375, 2.8505859375, 2.97418212890625, 3.0977783203125, 3.22137451171875, 3.344970703125, 3.46856689453125, 3.5921630859375, 3.71575927734375, 3.83935546875, 3.96295166015625, 4.0865478515625, 4.21014404296875, 4.333740234375, 4.45733642578125, 4.5809326171875, 4.70452880859375, 4.828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 8.0, 7.0, 18.0, 15.0, 26.0, 37.0, 85.0, 230.0, 3097.0, 273.0, 102.0, 49.0, 21.0, 31.0, 13.0, 14.0, 5.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9961090087890625, -0.959991455078125, -0.9238739013671875, -0.88775634765625, -0.8516387939453125, -0.815521240234375, -0.7794036865234375, -0.7432861328125, -0.7071685791015625, -0.671051025390625, -0.6349334716796875, -0.59881591796875, -0.5626983642578125, -0.526580810546875, -0.4904632568359375, -0.454345703125, -0.4182281494140625, -0.382110595703125, -0.3459930419921875, -0.30987548828125, -0.2737579345703125, -0.237640380859375, -0.2015228271484375, -0.1654052734375, -0.1292877197265625, -0.093170166015625, -0.0570526123046875, -0.02093505859375, 0.0151824951171875, 0.051300048828125, 0.0874176025390625, 0.12353515625, 0.1596527099609375, 0.195770263671875, 0.2318878173828125, 0.26800537109375, 0.3041229248046875, 0.340240478515625, 0.3763580322265625, 0.4124755859375, 0.4485931396484375, 0.484710693359375, 0.5208282470703125, 0.55694580078125, 0.5930633544921875, 0.629180908203125, 0.6652984619140625, 0.701416015625, 0.7375335693359375, 0.773651123046875, 0.8097686767578125, 0.84588623046875, 0.8820037841796875, 0.918121337890625, 0.9542388916015625, 0.9903564453125, 1.0264739990234375, 1.062591552734375, 1.0987091064453125, 1.13482666015625, 1.1709442138671875, 1.207061767578125, 1.2431793212890625, 1.279296875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 7.0, 18.0, 29.0, 29.0, 56.0, 90.0, 137.0, 149.0, 137.0, 110.0, 80.0, 66.0, 24.0, 19.0, 22.0, 12.0, 3.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.178412437438965, -3.970205783843994, -3.7619991302490234, -3.5537924766540527, -3.345585823059082, -3.1373791694641113, -2.9291725158691406, -2.72096586227417, -2.512759208679199, -2.3045525550842285, -2.096345901489258, -1.888139247894287, -1.6799325942993164, -1.4717258214950562, -1.2635191679000854, -1.0553125143051147, -0.8471057415008545, -0.6388990879058838, -0.4306924045085907, -0.2224857211112976, -0.014279067516326904, 0.19392764568328857, 0.4021342992782593, 0.61034095287323, 0.8185476064682007, 1.0267542600631714, 1.234960913658142, 1.4431676864624023, 1.651374340057373, 1.8595809936523438, 2.0677876472473145, 2.275994300842285, 2.484200954437256, 2.6924076080322266, 2.9006142616271973, 3.108820915222168, 3.3170275688171387, 3.5252342224121094, 3.73344087600708, 3.941647529602051, 4.1498541831970215, 4.358060836791992, 4.566267490386963, 4.774474143981934, 4.982680797576904, 5.190887451171875, 5.399094104766846, 5.607300758361816, 5.815507888793945, 6.023714542388916, 6.231921195983887, 6.440127849578857, 6.648334503173828, 6.856541156768799, 7.0647478103637695, 7.27295446395874, 7.481161117553711, 7.689367771148682, 7.897574424743652, 8.105781555175781, 8.313987731933594, 8.522194862365723, 8.730401039123535, 8.938608169555664, 9.146814346313477]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 18.0, 16.0, 19.0, 24.0, 33.0, 31.0, 26.0, 26.0, 48.0, 36.0, 30.0, 36.0, 52.0, 43.0, 41.0, 39.0, 34.0, 39.0, 35.0, 34.0, 43.0, 31.0, 29.0, 34.0, 27.0, 31.0, 22.0, 20.0, 9.0, 10.0, 10.0, 10.0, 5.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.6049296855926514, -3.502578020095825, -3.400226354598999, -3.297874689102173, -3.1955230236053467, -3.0931713581085205, -2.9908194541931152, -2.888467788696289, -2.786116123199463, -2.6837644577026367, -2.5814127922058105, -2.4790611267089844, -2.376709461212158, -2.274357795715332, -2.172006130218506, -2.0696544647216797, -1.9673027992248535, -1.8649511337280273, -1.7625994682312012, -1.660247802734375, -1.5578961372375488, -1.4555444717407227, -1.353192687034607, -1.2508410215377808, -1.1484893560409546, -1.0461376905441284, -0.9437860250473022, -0.8414342999458313, -0.7390826344490051, -0.636730968952179, -0.534379243850708, -0.43202757835388184, -0.32967591285705566, -0.2273242324590683, -0.12497255206108093, -0.022620856761932373, 0.0797308087348938, 0.18208247423171997, 0.2844341993331909, 0.3867858648300171, 0.48913753032684326, 0.5914891958236694, 0.6938408613204956, 0.7961925864219666, 0.8985442519187927, 1.0008959770202637, 1.1032476425170898, 1.205599308013916, 1.3079509735107422, 1.4103026390075684, 1.5126543045043945, 1.6150059700012207, 1.7173576354980469, 1.819709300994873, 1.9220610857009888, 2.0244126319885254, 2.1267642974853516, 2.2291159629821777, 2.331467628479004, 2.43381929397583, 2.5361709594726562, 2.6385226249694824, 2.7408742904663086, 2.8432259559631348, 2.94557785987854]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 14.0, 13.0, 18.0, 41.0, 57.0, 67.0, 91.0, 127.0, 233.0, 332.0, 558.0, 952.0, 1720.0, 3135.0, 6007.0, 12197.0, 26250.0, 57703.0, 126920.0, 241633.0, 270604.0, 160139.0, 74361.0, 33581.0, 15563.0, 7271.0, 3905.0, 2064.0, 1159.0, 633.0, 399.0, 262.0, 173.0, 113.0, 79.0, 50.0, 32.0, 30.0, 15.0, 9.0, 4.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.9404296875, -1.8836212158203125, -1.826812744140625, -1.7700042724609375, -1.71319580078125, -1.6563873291015625, -1.599578857421875, -1.5427703857421875, -1.4859619140625, -1.4291534423828125, -1.372344970703125, -1.3155364990234375, -1.25872802734375, -1.2019195556640625, -1.145111083984375, -1.0883026123046875, -1.031494140625, -0.9746856689453125, -0.917877197265625, -0.8610687255859375, -0.80426025390625, -0.7474517822265625, -0.690643310546875, -0.6338348388671875, -0.5770263671875, -0.5202178955078125, -0.463409423828125, -0.4066009521484375, -0.34979248046875, -0.2929840087890625, -0.236175537109375, -0.1793670654296875, -0.12255859375, -0.0657501220703125, -0.008941650390625, 0.0478668212890625, 0.10467529296875, 0.1614837646484375, 0.218292236328125, 0.2751007080078125, 0.3319091796875, 0.3887176513671875, 0.445526123046875, 0.5023345947265625, 0.55914306640625, 0.6159515380859375, 0.672760009765625, 0.7295684814453125, 0.786376953125, 0.8431854248046875, 0.899993896484375, 0.9568023681640625, 1.01361083984375, 1.0704193115234375, 1.127227783203125, 1.1840362548828125, 1.2408447265625, 1.2976531982421875, 1.354461669921875, 1.4112701416015625, 1.46807861328125, 1.5248870849609375, 1.581695556640625, 1.6385040283203125, 1.6953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 8.0, 9.0, 13.0, 16.0, 21.0, 12.0, 25.0, 31.0, 43.0, 47.0, 49.0, 42.0, 62.0, 66.0, 68.0, 64.0, 67.0, 56.0, 57.0, 42.0, 38.0, 34.0, 23.0, 21.0, 22.0, 22.0, 13.0, 6.0, 6.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.758056640625, -0.72607421875, -0.694091796875, -0.662109375, -0.630126953125, -0.59814453125, -0.566162109375, -0.5341796875, -0.502197265625, -0.47021484375, -0.438232421875, -0.40625, -0.374267578125, -0.34228515625, -0.310302734375, -0.2783203125, -0.246337890625, -0.21435546875, -0.182373046875, -0.150390625, -0.118408203125, -0.08642578125, -0.054443359375, -0.0224609375, 0.009521484375, 0.04150390625, 0.073486328125, 0.10546875, 0.137451171875, 0.16943359375, 0.201416015625, 0.2333984375, 0.265380859375, 0.29736328125, 0.329345703125, 0.361328125, 0.393310546875, 0.42529296875, 0.457275390625, 0.4892578125, 0.521240234375, 0.55322265625, 0.585205078125, 0.6171875, 0.649169921875, 0.68115234375, 0.713134765625, 0.7451171875, 0.777099609375, 0.80908203125, 0.841064453125, 0.873046875, 0.905029296875, 0.93701171875, 0.968994140625, 1.0009765625, 1.032958984375, 1.06494140625, 1.096923828125, 1.12890625, 1.160888671875, 1.19287109375, 1.224853515625, 1.2568359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 16.0, 15.0, 21.0, 35.0, 71.0, 123.0, 288.0, 687.0, 2061.0, 8697.0, 58974.0, 639457.0, 303170.0, 27640.0, 5041.0, 1366.0, 448.0, 187.0, 120.0, 53.0, 40.0, 16.0, 15.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.51348876953125, -7.3199462890625, -7.12640380859375, -6.932861328125, -6.73931884765625, -6.5457763671875, -6.35223388671875, -6.15869140625, -5.96514892578125, -5.7716064453125, -5.57806396484375, -5.384521484375, -5.19097900390625, -4.9974365234375, -4.80389404296875, -4.6103515625, -4.41680908203125, -4.2232666015625, -4.02972412109375, -3.836181640625, -3.64263916015625, -3.4490966796875, -3.25555419921875, -3.06201171875, -2.86846923828125, -2.6749267578125, -2.48138427734375, -2.287841796875, -2.09429931640625, -1.9007568359375, -1.70721435546875, -1.513671875, -1.32012939453125, -1.1265869140625, -0.93304443359375, -0.739501953125, -0.54595947265625, -0.3524169921875, -0.15887451171875, 0.03466796875, 0.22821044921875, 0.4217529296875, 0.61529541015625, 0.808837890625, 1.00238037109375, 1.1959228515625, 1.38946533203125, 1.5830078125, 1.77655029296875, 1.9700927734375, 2.16363525390625, 2.357177734375, 2.55072021484375, 2.7442626953125, 2.93780517578125, 3.13134765625, 3.32489013671875, 3.5184326171875, 3.71197509765625, 3.905517578125, 4.09906005859375, 4.2926025390625, 4.48614501953125, 4.6796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 15.0, 12.0, 12.0, 24.0, 24.0, 24.0, 31.0, 44.0, 58.0, 59.0, 60.0, 61.0, 75.0, 61.0, 48.0, 61.0, 47.0, 43.0, 48.0, 38.0, 25.0, 22.0, 18.0, 15.0, 12.0, 4.0, 12.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.1280517578125, -5.955322265625, -5.7825927734375, -5.60986328125, -5.4371337890625, -5.264404296875, -5.0916748046875, -4.9189453125, -4.7462158203125, -4.573486328125, -4.4007568359375, -4.22802734375, -4.0552978515625, -3.882568359375, -3.7098388671875, -3.537109375, -3.3643798828125, -3.191650390625, -3.0189208984375, -2.84619140625, -2.6734619140625, -2.500732421875, -2.3280029296875, -2.1552734375, -1.9825439453125, -1.809814453125, -1.6370849609375, -1.46435546875, -1.2916259765625, -1.118896484375, -0.9461669921875, -0.7734375, -0.6007080078125, -0.427978515625, -0.2552490234375, -0.08251953125, 0.0902099609375, 0.262939453125, 0.4356689453125, 0.6083984375, 0.7811279296875, 0.953857421875, 1.1265869140625, 1.29931640625, 1.4720458984375, 1.644775390625, 1.8175048828125, 1.990234375, 2.1629638671875, 2.335693359375, 2.5084228515625, 2.68115234375, 2.8538818359375, 3.026611328125, 3.1993408203125, 3.3720703125, 3.5447998046875, 3.717529296875, 3.8902587890625, 4.06298828125, 4.2357177734375, 4.408447265625, 4.5811767578125, 4.75390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 8.0, 19.0, 34.0, 54.0, 121.0, 181.0, 488.0, 1262.0, 5231.0, 51124.0, 856430.0, 122118.0, 8663.0, 1749.0, 538.0, 239.0, 113.0, 75.0, 32.0, 22.0, 17.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.07403564453125, -3.9410400390625, -3.80804443359375, -3.675048828125, -3.54205322265625, -3.4090576171875, -3.27606201171875, -3.14306640625, -3.01007080078125, -2.8770751953125, -2.74407958984375, -2.611083984375, -2.47808837890625, -2.3450927734375, -2.21209716796875, -2.0791015625, -1.94610595703125, -1.8131103515625, -1.68011474609375, -1.547119140625, -1.41412353515625, -1.2811279296875, -1.14813232421875, -1.01513671875, -0.88214111328125, -0.7491455078125, -0.61614990234375, -0.483154296875, -0.35015869140625, -0.2171630859375, -0.08416748046875, 0.048828125, 0.18182373046875, 0.3148193359375, 0.44781494140625, 0.580810546875, 0.71380615234375, 0.8468017578125, 0.97979736328125, 1.11279296875, 1.24578857421875, 1.3787841796875, 1.51177978515625, 1.644775390625, 1.77777099609375, 1.9107666015625, 2.04376220703125, 2.1767578125, 2.30975341796875, 2.4427490234375, 2.57574462890625, 2.708740234375, 2.84173583984375, 2.9747314453125, 3.10772705078125, 3.24072265625, 3.37371826171875, 3.5067138671875, 3.63970947265625, 3.772705078125, 3.90570068359375, 4.0386962890625, 4.17169189453125, 4.3046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 6.0, 14.0, 9.0, 26.0, 28.0, 40.0, 51.0, 86.0, 119.0, 126.0, 125.0, 111.0, 110.0, 44.0, 38.0, 24.0, 18.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.0005655288696289062, -0.0005529113113880157, -0.0005402937531471252, -0.0005276761949062347, -0.0005150586366653442, -0.0005024410784244537, -0.0004898235201835632, -0.00047720596194267273, -0.0004645884037017822, -0.0004519708454608917, -0.0004393532872200012, -0.0004267357289791107, -0.0004141181707382202, -0.0004015006124973297, -0.0003888830542564392, -0.0003762654960155487, -0.0003636479377746582, -0.0003510303795337677, -0.0003384128212928772, -0.0003257952630519867, -0.0003131777048110962, -0.0003005601465702057, -0.0002879425883293152, -0.0002753250300884247, -0.0002627074718475342, -0.0002500899136066437, -0.00023747235536575317, -0.00022485479712486267, -0.00021223723888397217, -0.00019961968064308167, -0.00018700212240219116, -0.00017438456416130066, -0.00016176700592041016, -0.00014914944767951965, -0.00013653188943862915, -0.00012391433119773865, -0.00011129677295684814, -9.867921471595764e-05, -8.606165647506714e-05, -7.344409823417664e-05, -6.082653999328613e-05, -4.820898175239563e-05, -3.559142351150513e-05, -2.2973865270614624e-05, -1.0356307029724121e-05, 2.261251211166382e-06, 1.4878809452056885e-05, 2.7496367692947388e-05, 4.011392593383789e-05, 5.2731484174728394e-05, 6.53490424156189e-05, 7.79666006565094e-05, 9.05841588973999e-05, 0.0001032017171382904, 0.00011581927537918091, 0.0001284368336200714, 0.00014105439186096191, 0.00015367195010185242, 0.00016628950834274292, 0.00017890706658363342, 0.00019152462482452393, 0.00020414218306541443, 0.00021675974130630493, 0.00022937729954719543, 0.00024199485778808594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 14.0, 18.0, 26.0, 45.0, 92.0, 210.0, 480.0, 1962.0, 29210.0, 974053.0, 39279.0, 2181.0, 530.0, 206.0, 107.0, 49.0, 31.0, 20.0, 11.0, 8.0, 5.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.4503173828125, -8.236572265625, -8.0228271484375, -7.80908203125, -7.5953369140625, -7.381591796875, -7.1678466796875, -6.9541015625, -6.7403564453125, -6.526611328125, -6.3128662109375, -6.09912109375, -5.8853759765625, -5.671630859375, -5.4578857421875, -5.244140625, -5.0303955078125, -4.816650390625, -4.6029052734375, -4.38916015625, -4.1754150390625, -3.961669921875, -3.7479248046875, -3.5341796875, -3.3204345703125, -3.106689453125, -2.8929443359375, -2.67919921875, -2.4654541015625, -2.251708984375, -2.0379638671875, -1.82421875, -1.6104736328125, -1.396728515625, -1.1829833984375, -0.96923828125, -0.7554931640625, -0.541748046875, -0.3280029296875, -0.1142578125, 0.0994873046875, 0.313232421875, 0.5269775390625, 0.74072265625, 0.9544677734375, 1.168212890625, 1.3819580078125, 1.595703125, 1.8094482421875, 2.023193359375, 2.2369384765625, 2.45068359375, 2.6644287109375, 2.878173828125, 3.0919189453125, 3.3056640625, 3.5194091796875, 3.733154296875, 3.9468994140625, 4.16064453125, 4.3743896484375, 4.588134765625, 4.8018798828125, 5.015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 17.0, 27.0, 69.0, 173.0, 306.0, 235.0, 109.0, 32.0, 21.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.662567138671875, -10.43450927734375, -10.206451416015625, -9.9783935546875, -9.750335693359375, -9.52227783203125, -9.294219970703125, -9.066162109375, -8.838104248046875, -8.61004638671875, -8.381988525390625, -8.1539306640625, -7.925872802734375, -7.69781494140625, -7.469757080078125, -7.24169921875, -7.013641357421875, -6.78558349609375, -6.557525634765625, -6.3294677734375, -6.101409912109375, -5.87335205078125, -5.645294189453125, -5.417236328125, -5.189178466796875, -4.96112060546875, -4.733062744140625, -4.5050048828125, -4.276947021484375, -4.04888916015625, -3.820831298828125, -3.5927734375, -3.364715576171875, -3.13665771484375, -2.908599853515625, -2.6805419921875, -2.452484130859375, -2.22442626953125, -1.996368408203125, -1.768310546875, -1.540252685546875, -1.31219482421875, -1.084136962890625, -0.8560791015625, -0.628021240234375, -0.39996337890625, -0.171905517578125, 0.05615234375, 0.284210205078125, 0.51226806640625, 0.740325927734375, 0.9683837890625, 1.196441650390625, 1.42449951171875, 1.652557373046875, 1.880615234375, 2.108673095703125, 2.33673095703125, 2.564788818359375, 2.7928466796875, 3.020904541015625, 3.24896240234375, 3.477020263671875, 3.705078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 11.0, 27.0, 116.0, 362.0, 359.0, 121.0, 13.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.034568786621094, -43.15842819213867, -39.282283782958984, -35.40614318847656, -31.530000686645508, -27.653858184814453, -23.77771759033203, -19.901575088500977, -16.025432586669922, -12.149290084838867, -8.273148536682129, -4.397006988525391, -0.5208644866943359, 3.3552780151367188, 7.231418609619141, 11.107561111450195, 14.98370361328125, 18.859846115112305, 22.73598861694336, 26.61212921142578, 30.488271713256836, 34.36441421508789, 38.24055480957031, 42.11669921875, 45.99283981323242, 49.868980407714844, 53.74512481689453, 57.62126541137695, 61.497406005859375, 65.37355041503906, 69.24969482421875, 73.1258316040039, 77.00196838378906, 80.87811279296875, 84.7542495727539, 88.6303939819336, 92.50653839111328, 96.38267517089844, 100.25881958007812, 104.13496398925781, 108.0111083984375, 111.88725280761719, 115.76338958740234, 119.63953399658203, 123.51567840576172, 127.39181518554688, 131.26795959472656, 135.14410400390625, 139.02023315429688, 142.89637756347656, 146.77252197265625, 150.64865112304688, 154.52479553222656, 158.40093994140625, 162.27708435058594, 166.15322875976562, 170.0293731689453, 173.905517578125, 177.7816619873047, 181.65780639648438, 185.533935546875, 189.4100799560547, 193.28622436523438, 197.16236877441406, 201.03851318359375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 2.0, 9.0, 9.0, 17.0, 10.0, 16.0, 22.0, 19.0, 26.0, 29.0, 39.0, 36.0, 52.0, 44.0, 38.0, 60.0, 44.0, 77.0, 55.0, 52.0, 47.0, 37.0, 37.0, 34.0, 30.0, 25.0, 24.0, 21.0, 15.0, 10.0, 8.0, 17.0, 5.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.857677459716797, -22.127111434936523, -21.39654541015625, -20.665979385375977, -19.935413360595703, -19.20484733581543, -18.474281311035156, -17.743715286254883, -17.01314926147461, -16.282583236694336, -15.552017211914062, -14.821451187133789, -14.090885162353516, -13.360319137573242, -12.629753112792969, -11.899187088012695, -11.168621063232422, -10.438055038452148, -9.707489013671875, -8.976922988891602, -8.246356964111328, -7.515790939331055, -6.785224914550781, -6.054658889770508, -5.324092864990234, -4.593526840209961, -3.8629608154296875, -3.132394790649414, -2.4018287658691406, -1.6712627410888672, -0.9406967163085938, -0.2101306915283203, 0.5204334259033203, 1.2509994506835938, 1.9815654754638672, 2.7121315002441406, 3.442697525024414, 4.1732635498046875, 4.903829574584961, 5.634395599365234, 6.364961624145508, 7.095527648925781, 7.826093673706055, 8.556659698486328, 9.287225723266602, 10.017791748046875, 10.748357772827148, 11.478923797607422, 12.209489822387695, 12.940055847167969, 13.670621871948242, 14.401187896728516, 15.131753921508789, 15.862319946289062, 16.592885971069336, 17.32345199584961, 18.054018020629883, 18.784584045410156, 19.51515007019043, 20.245716094970703, 20.976282119750977, 21.70684814453125, 22.437414169311523, 23.167980194091797, 23.89854621887207]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 2.0, 5.0, 9.0, 16.0, 23.0, 30.0, 58.0, 103.0, 202.0, 397.0, 794.0, 1750.0, 5336.0, 42106.0, 4122099.0, 15591.0, 3337.0, 1195.0, 566.0, 254.0, 163.0, 85.0, 51.0, 31.0, 15.0, 12.0, 13.0, 7.0, 11.0, 2.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8046875, -8.5322265625, -8.259765625, -7.9873046875, -7.71484375, -7.4423828125, -7.169921875, -6.8974609375, -6.625, -6.3525390625, -6.080078125, -5.8076171875, -5.53515625, -5.2626953125, -4.990234375, -4.7177734375, -4.4453125, -4.1728515625, -3.900390625, -3.6279296875, -3.35546875, -3.0830078125, -2.810546875, -2.5380859375, -2.265625, -1.9931640625, -1.720703125, -1.4482421875, -1.17578125, -0.9033203125, -0.630859375, -0.3583984375, -0.0859375, 0.1865234375, 0.458984375, 0.7314453125, 1.00390625, 1.2763671875, 1.548828125, 1.8212890625, 2.09375, 2.3662109375, 2.638671875, 2.9111328125, 3.18359375, 3.4560546875, 3.728515625, 4.0009765625, 4.2734375, 4.5458984375, 4.818359375, 5.0908203125, 5.36328125, 5.6357421875, 5.908203125, 6.1806640625, 6.453125, 6.7255859375, 6.998046875, 7.2705078125, 7.54296875, 7.8154296875, 8.087890625, 8.3603515625, 8.6328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 11.0, 18.0, 30.0, 31.0, 39.0, 43.0, 58.0, 72.0, 84.0, 87.0, 87.0, 93.0, 79.0, 54.0, 56.0, 33.0, 25.0, 28.0, 16.0, 12.0, 12.0, 5.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.1131591796875, -1.065185546875, -1.0172119140625, -0.96923828125, -0.9212646484375, -0.873291015625, -0.8253173828125, -0.77734375, -0.7293701171875, -0.681396484375, -0.6334228515625, -0.58544921875, -0.5374755859375, -0.489501953125, -0.4415283203125, -0.3935546875, -0.3455810546875, -0.297607421875, -0.2496337890625, -0.20166015625, -0.1536865234375, -0.105712890625, -0.0577392578125, -0.009765625, 0.0382080078125, 0.086181640625, 0.1341552734375, 0.18212890625, 0.2301025390625, 0.278076171875, 0.3260498046875, 0.3740234375, 0.4219970703125, 0.469970703125, 0.5179443359375, 0.56591796875, 0.6138916015625, 0.661865234375, 0.7098388671875, 0.7578125, 0.8057861328125, 0.853759765625, 0.9017333984375, 0.94970703125, 0.9976806640625, 1.045654296875, 1.0936279296875, 1.1416015625, 1.1895751953125, 1.237548828125, 1.2855224609375, 1.33349609375, 1.3814697265625, 1.429443359375, 1.4774169921875, 1.525390625, 1.5733642578125, 1.621337890625, 1.6693115234375, 1.71728515625, 1.7652587890625, 1.813232421875, 1.8612060546875, 1.9091796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 16.0, 12.0, 25.0, 27.0, 27.0, 76.0, 92.0, 158.0, 273.0, 360.0, 573.0, 1011.0, 1859.0, 3846.0, 9980.0, 48790.0, 4070440.0, 39832.0, 9016.0, 3551.0, 1744.0, 994.0, 514.0, 346.0, 244.0, 141.0, 81.0, 66.0, 55.0, 40.0, 31.0, 13.0, 13.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.17669677734375, -5.9432373046875, -5.70977783203125, -5.476318359375, -5.24285888671875, -5.0093994140625, -4.77593994140625, -4.54248046875, -4.30902099609375, -4.0755615234375, -3.84210205078125, -3.608642578125, -3.37518310546875, -3.1417236328125, -2.90826416015625, -2.6748046875, -2.44134521484375, -2.2078857421875, -1.97442626953125, -1.740966796875, -1.50750732421875, -1.2740478515625, -1.04058837890625, -0.80712890625, -0.57366943359375, -0.3402099609375, -0.10675048828125, 0.126708984375, 0.36016845703125, 0.5936279296875, 0.82708740234375, 1.060546875, 1.29400634765625, 1.5274658203125, 1.76092529296875, 1.994384765625, 2.22784423828125, 2.4613037109375, 2.69476318359375, 2.92822265625, 3.16168212890625, 3.3951416015625, 3.62860107421875, 3.862060546875, 4.09552001953125, 4.3289794921875, 4.56243896484375, 4.7958984375, 5.02935791015625, 5.2628173828125, 5.49627685546875, 5.729736328125, 5.96319580078125, 6.1966552734375, 6.43011474609375, 6.66357421875, 6.89703369140625, 7.1304931640625, 7.36395263671875, 7.597412109375, 7.83087158203125, 8.0643310546875, 8.29779052734375, 8.53125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 11.0, 22.0, 37.0, 76.0, 3630.0, 167.0, 52.0, 19.0, 10.0, 6.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41796875, -1.3607177734375, -1.303466796875, -1.2462158203125, -1.18896484375, -1.1317138671875, -1.074462890625, -1.0172119140625, -0.9599609375, -0.9027099609375, -0.845458984375, -0.7882080078125, -0.73095703125, -0.6737060546875, -0.616455078125, -0.5592041015625, -0.501953125, -0.4447021484375, -0.387451171875, -0.3302001953125, -0.27294921875, -0.2156982421875, -0.158447265625, -0.1011962890625, -0.0439453125, 0.0133056640625, 0.070556640625, 0.1278076171875, 0.18505859375, 0.2423095703125, 0.299560546875, 0.3568115234375, 0.4140625, 0.4713134765625, 0.528564453125, 0.5858154296875, 0.64306640625, 0.7003173828125, 0.757568359375, 0.8148193359375, 0.8720703125, 0.9293212890625, 0.986572265625, 1.0438232421875, 1.10107421875, 1.1583251953125, 1.215576171875, 1.2728271484375, 1.330078125, 1.3873291015625, 1.444580078125, 1.5018310546875, 1.55908203125, 1.6163330078125, 1.673583984375, 1.7308349609375, 1.7880859375, 1.8453369140625, 1.902587890625, 1.9598388671875, 2.01708984375, 2.0743408203125, 2.131591796875, 2.1888427734375, 2.24609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 15.0, 28.0, 45.0, 84.0, 119.0, 137.0, 148.0, 116.0, 105.0, 55.0, 42.0, 33.0, 20.0, 10.0, 4.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.686426162719727, -6.486286640167236, -6.286147117614746, -6.086007118225098, -5.885867595672607, -5.685728073120117, -5.485588550567627, -5.285449028015137, -5.085309028625488, -4.885169506072998, -4.685029983520508, -4.484889984130859, -4.284750461578369, -4.084610939025879, -3.8844714164733887, -3.6843318939208984, -3.484192371368408, -3.284052848815918, -3.0839130878448486, -2.8837735652923584, -2.683633804321289, -2.483494281768799, -2.2833547592163086, -2.0832152366638184, -1.883075475692749, -1.6829358339309692, -1.4827961921691895, -1.2826566696166992, -1.0825170278549194, -0.8823773860931396, -0.6822378635406494, -0.48209822177886963, -0.28195905685424805, -0.08181944489479065, 0.11832016706466675, 0.31845974922180176, 0.5185993909835815, 0.7187390327453613, 0.9188785552978516, 1.1190181970596313, 1.3191578388214111, 1.519297480583191, 1.7194371223449707, 1.919576644897461, 2.119716167449951, 2.3198559284210205, 2.5199954509735107, 2.72013521194458, 2.9202747344970703, 3.1204142570495605, 3.32055401802063, 3.52069354057312, 3.7208333015441895, 3.9209728240966797, 4.12111234664917, 4.32125186920166, 4.521391868591309, 4.721531391143799, 4.921670913696289, 5.1218109130859375, 5.321950435638428, 5.522089958190918, 5.722229480743408, 5.922369003295898, 6.122508525848389]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 7.0, 6.0, 10.0, 17.0, 9.0, 7.0, 18.0, 17.0, 23.0, 20.0, 17.0, 28.0, 33.0, 40.0, 45.0, 39.0, 49.0, 46.0, 40.0, 43.0, 38.0, 40.0, 35.0, 47.0, 51.0, 24.0, 37.0, 30.0, 23.0, 27.0, 19.0, 25.0, 19.0, 19.0, 15.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822389602661133, -2.73347806930542, -2.644566297531128, -2.555654764175415, -2.466742992401123, -2.37783145904541, -2.2889199256896973, -2.2000083923339844, -2.1110966205596924, -2.0221850872039795, -1.9332733154296875, -1.8443617820739746, -1.7554501295089722, -1.6665384769439697, -1.5776269435882568, -1.4887152910232544, -1.399803638458252, -1.3108919858932495, -1.221980333328247, -1.1330687999725342, -1.0441571474075317, -0.9552454948425293, -0.8663339018821716, -0.777422308921814, -0.6885106563568115, -0.5995990037918091, -0.5106874108314514, -0.42177578806877136, -0.3328641653060913, -0.24395254254341125, -0.1550409197807312, -0.06612932682037354, 0.022782325744628906, 0.11169394850730896, 0.200605571269989, 0.28951719403266907, 0.3784288167953491, 0.4673404395580292, 0.5562520623207092, 0.6451636552810669, 0.7340753078460693, 0.8229869604110718, 0.9118985533714294, 1.000810146331787, 1.0897217988967896, 1.178633451461792, 1.2675449848175049, 1.3564566373825073, 1.4453682899475098, 1.5342799425125122, 1.6231915950775146, 1.7121031284332275, 1.80101478099823, 1.8899264335632324, 1.9788379669189453, 2.067749500274658, 2.15666127204895, 2.245572805404663, 2.334484577178955, 2.423396110534668, 2.512307643890381, 2.601219415664673, 2.6901309490203857, 2.7790427207946777, 2.8679542541503906]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 11.0, 9.0, 8.0, 16.0, 18.0, 40.0, 43.0, 61.0, 108.0, 121.0, 262.0, 409.0, 746.0, 1490.0, 3424.0, 8094.0, 21670.0, 65901.0, 210980.0, 427685.0, 207354.0, 63953.0, 21452.0, 7999.0, 3320.0, 1518.0, 756.0, 433.0, 200.0, 148.0, 93.0, 62.0, 48.0, 35.0, 26.0, 19.0, 11.0, 3.0, 5.0, 6.0, 3.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.83984375, -2.749664306640625, -2.65948486328125, -2.569305419921875, -2.4791259765625, -2.388946533203125, -2.29876708984375, -2.208587646484375, -2.118408203125, -2.028228759765625, -1.93804931640625, -1.847869873046875, -1.7576904296875, -1.667510986328125, -1.57733154296875, -1.487152099609375, -1.39697265625, -1.306793212890625, -1.21661376953125, -1.126434326171875, -1.0362548828125, -0.946075439453125, -0.85589599609375, -0.765716552734375, -0.675537109375, -0.585357666015625, -0.49517822265625, -0.404998779296875, -0.3148193359375, -0.224639892578125, -0.13446044921875, -0.044281005859375, 0.0458984375, 0.136077880859375, 0.22625732421875, 0.316436767578125, 0.4066162109375, 0.496795654296875, 0.58697509765625, 0.677154541015625, 0.767333984375, 0.857513427734375, 0.94769287109375, 1.037872314453125, 1.1280517578125, 1.218231201171875, 1.30841064453125, 1.398590087890625, 1.48876953125, 1.578948974609375, 1.66912841796875, 1.759307861328125, 1.8494873046875, 1.939666748046875, 2.02984619140625, 2.120025634765625, 2.210205078125, 2.300384521484375, 2.39056396484375, 2.480743408203125, 2.5709228515625, 2.661102294921875, 2.75128173828125, 2.841461181640625, 2.931640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 10.0, 11.0, 11.0, 18.0, 24.0, 38.0, 42.0, 49.0, 56.0, 65.0, 71.0, 51.0, 71.0, 77.0, 64.0, 52.0, 67.0, 40.0, 40.0, 38.0, 31.0, 15.0, 15.0, 14.0, 6.0, 5.0, 2.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3461456298828125, -1.300689697265625, -1.2552337646484375, -1.20977783203125, -1.1643218994140625, -1.118865966796875, -1.0734100341796875, -1.0279541015625, -0.9824981689453125, -0.937042236328125, -0.8915863037109375, -0.84613037109375, -0.8006744384765625, -0.755218505859375, -0.7097625732421875, -0.664306640625, -0.6188507080078125, -0.573394775390625, -0.5279388427734375, -0.48248291015625, -0.4370269775390625, -0.391571044921875, -0.3461151123046875, -0.3006591796875, -0.2552032470703125, -0.209747314453125, -0.1642913818359375, -0.11883544921875, -0.0733795166015625, -0.027923583984375, 0.0175323486328125, 0.06298828125, 0.1084442138671875, 0.153900146484375, 0.1993560791015625, 0.24481201171875, 0.2902679443359375, 0.335723876953125, 0.3811798095703125, 0.4266357421875, 0.4720916748046875, 0.517547607421875, 0.5630035400390625, 0.60845947265625, 0.6539154052734375, 0.699371337890625, 0.7448272705078125, 0.790283203125, 0.8357391357421875, 0.881195068359375, 0.9266510009765625, 0.97210693359375, 1.0175628662109375, 1.063018798828125, 1.1084747314453125, 1.1539306640625, 1.1993865966796875, 1.244842529296875, 1.2902984619140625, 1.33575439453125, 1.3812103271484375, 1.426666259765625, 1.4721221923828125, 1.517578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 15.0, 22.0, 42.0, 59.0, 92.0, 178.0, 355.0, 670.0, 1750.0, 6183.0, 34155.0, 306668.0, 612162.0, 70813.0, 10818.0, 2679.0, 924.0, 396.0, 215.0, 115.0, 66.0, 47.0, 27.0, 24.0, 21.0, 10.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.2078857421875, -4.040771484375, -3.8736572265625, -3.70654296875, -3.5394287109375, -3.372314453125, -3.2052001953125, -3.0380859375, -2.8709716796875, -2.703857421875, -2.5367431640625, -2.36962890625, -2.2025146484375, -2.035400390625, -1.8682861328125, -1.701171875, -1.5340576171875, -1.366943359375, -1.1998291015625, -1.03271484375, -0.8656005859375, -0.698486328125, -0.5313720703125, -0.3642578125, -0.1971435546875, -0.030029296875, 0.1370849609375, 0.30419921875, 0.4713134765625, 0.638427734375, 0.8055419921875, 0.97265625, 1.1397705078125, 1.306884765625, 1.4739990234375, 1.64111328125, 1.8082275390625, 1.975341796875, 2.1424560546875, 2.3095703125, 2.4766845703125, 2.643798828125, 2.8109130859375, 2.97802734375, 3.1451416015625, 3.312255859375, 3.4793701171875, 3.646484375, 3.8135986328125, 3.980712890625, 4.1478271484375, 4.31494140625, 4.4820556640625, 4.649169921875, 4.8162841796875, 4.9833984375, 5.1505126953125, 5.317626953125, 5.4847412109375, 5.65185546875, 5.8189697265625, 5.986083984375, 6.1531982421875, 6.3203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 12.0, 11.0, 19.0, 14.0, 20.0, 26.0, 25.0, 23.0, 38.0, 33.0, 40.0, 59.0, 50.0, 61.0, 54.0, 58.0, 51.0, 51.0, 52.0, 42.0, 45.0, 50.0, 29.0, 22.0, 20.0, 19.0, 11.0, 9.0, 14.0, 8.0, 5.0, 7.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.27874755859375, -5.0887451171875, -4.89874267578125, -4.708740234375, -4.51873779296875, -4.3287353515625, -4.13873291015625, -3.94873046875, -3.75872802734375, -3.5687255859375, -3.37872314453125, -3.188720703125, -2.99871826171875, -2.8087158203125, -2.61871337890625, -2.4287109375, -2.23870849609375, -2.0487060546875, -1.85870361328125, -1.668701171875, -1.47869873046875, -1.2886962890625, -1.09869384765625, -0.90869140625, -0.71868896484375, -0.5286865234375, -0.33868408203125, -0.148681640625, 0.04132080078125, 0.2313232421875, 0.42132568359375, 0.611328125, 0.80133056640625, 0.9913330078125, 1.18133544921875, 1.371337890625, 1.56134033203125, 1.7513427734375, 1.94134521484375, 2.13134765625, 2.32135009765625, 2.5113525390625, 2.70135498046875, 2.891357421875, 3.08135986328125, 3.2713623046875, 3.46136474609375, 3.6513671875, 3.84136962890625, 4.0313720703125, 4.22137451171875, 4.411376953125, 4.60137939453125, 4.7913818359375, 4.98138427734375, 5.17138671875, 5.36138916015625, 5.5513916015625, 5.74139404296875, 5.931396484375, 6.12139892578125, 6.3114013671875, 6.50140380859375, 6.69140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 7.0, 18.0, 22.0, 38.0, 29.0, 68.0, 95.0, 190.0, 307.0, 622.0, 1484.0, 4594.0, 23470.0, 407671.0, 571666.0, 29920.0, 5190.0, 1644.0, 633.0, 315.0, 214.0, 124.0, 70.0, 36.0, 32.0, 23.0, 15.0, 10.0, 9.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.923828125, -2.8265380859375, -2.729248046875, -2.6319580078125, -2.53466796875, -2.4373779296875, -2.340087890625, -2.2427978515625, -2.1455078125, -2.0482177734375, -1.950927734375, -1.8536376953125, -1.75634765625, -1.6590576171875, -1.561767578125, -1.4644775390625, -1.3671875, -1.2698974609375, -1.172607421875, -1.0753173828125, -0.97802734375, -0.8807373046875, -0.783447265625, -0.6861572265625, -0.5888671875, -0.4915771484375, -0.394287109375, -0.2969970703125, -0.19970703125, -0.1024169921875, -0.005126953125, 0.0921630859375, 0.189453125, 0.2867431640625, 0.384033203125, 0.4813232421875, 0.57861328125, 0.6759033203125, 0.773193359375, 0.8704833984375, 0.9677734375, 1.0650634765625, 1.162353515625, 1.2596435546875, 1.35693359375, 1.4542236328125, 1.551513671875, 1.6488037109375, 1.74609375, 1.8433837890625, 1.940673828125, 2.0379638671875, 2.13525390625, 2.2325439453125, 2.329833984375, 2.4271240234375, 2.5244140625, 2.6217041015625, 2.718994140625, 2.8162841796875, 2.91357421875, 3.0108642578125, 3.108154296875, 3.2054443359375, 3.302734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 8.0, 13.0, 25.0, 36.0, 52.0, 72.0, 76.0, 127.0, 128.0, 146.0, 115.0, 59.0, 57.0, 38.0, 20.0, 16.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00024629756808280945, -0.00023295730352401733, -0.00021961703896522522, -0.0002062767744064331, -0.000192936509847641, -0.00017959624528884888, -0.00016625598073005676, -0.00015291571617126465, -0.00013957545161247253, -0.00012623518705368042, -0.0001128949224948883, -9.955465793609619e-05, -8.621439337730408e-05, -7.287412881851196e-05, -5.953386425971985e-05, -4.6193599700927734e-05, -3.285333514213562e-05, -1.9513070583343506e-05, -6.172806024551392e-06, 7.167458534240723e-06, 2.0507723093032837e-05, 3.384798765182495e-05, 4.7188252210617065e-05, 6.052851676940918e-05, 7.38687813282013e-05, 8.720904588699341e-05, 0.00010054931044578552, 0.00011388957500457764, 0.00012722983956336975, 0.00014057010412216187, 0.00015391036868095398, 0.0001672506332397461, 0.0001805908977985382, 0.00019393116235733032, 0.00020727142691612244, 0.00022061169147491455, 0.00023395195603370667, 0.0002472922205924988, 0.0002606324851512909, 0.000273972749710083, 0.0002873130142688751, 0.00030065327882766724, 0.00031399354338645935, 0.00032733380794525146, 0.0003406740725040436, 0.0003540143370628357, 0.0003673546016216278, 0.0003806948661804199, 0.00039403513073921204, 0.00040737539529800415, 0.00042071565985679626, 0.0004340559244155884, 0.0004473961889743805, 0.0004607364535331726, 0.0004740767180919647, 0.00048741698265075684, 0.000500757247209549, 0.0005140975117683411, 0.0005274377763271332, 0.0005407780408859253, 0.0005541183054447174, 0.0005674585700035095, 0.0005807988345623016, 0.0005941390991210938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 11.0, 5.0, 10.0, 18.0, 17.0, 34.0, 56.0, 99.0, 258.0, 593.0, 1712.0, 6597.0, 59015.0, 884947.0, 84156.0, 7934.0, 1934.0, 659.0, 243.0, 109.0, 54.0, 28.0, 24.0, 12.0, 12.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.0093994140625, -3.878173828125, -3.7469482421875, -3.61572265625, -3.4844970703125, -3.353271484375, -3.2220458984375, -3.0908203125, -2.9595947265625, -2.828369140625, -2.6971435546875, -2.56591796875, -2.4346923828125, -2.303466796875, -2.1722412109375, -2.041015625, -1.9097900390625, -1.778564453125, -1.6473388671875, -1.51611328125, -1.3848876953125, -1.253662109375, -1.1224365234375, -0.9912109375, -0.8599853515625, -0.728759765625, -0.5975341796875, -0.46630859375, -0.3350830078125, -0.203857421875, -0.0726318359375, 0.05859375, 0.1898193359375, 0.321044921875, 0.4522705078125, 0.58349609375, 0.7147216796875, 0.845947265625, 0.9771728515625, 1.1083984375, 1.2396240234375, 1.370849609375, 1.5020751953125, 1.63330078125, 1.7645263671875, 1.895751953125, 2.0269775390625, 2.158203125, 2.2894287109375, 2.420654296875, 2.5518798828125, 2.68310546875, 2.8143310546875, 2.945556640625, 3.0767822265625, 3.2080078125, 3.3392333984375, 3.470458984375, 3.6016845703125, 3.73291015625, 3.8641357421875, 3.995361328125, 4.1265869140625, 4.2578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 18.0, 26.0, 34.0, 53.0, 73.0, 94.0, 116.0, 116.0, 109.0, 72.0, 80.0, 54.0, 38.0, 23.0, 13.0, 14.0, 4.0, 6.0, 5.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.275848388671875, -2.18646240234375, -2.097076416015625, -2.0076904296875, -1.918304443359375, -1.82891845703125, -1.739532470703125, -1.650146484375, -1.560760498046875, -1.47137451171875, -1.381988525390625, -1.2926025390625, -1.203216552734375, -1.11383056640625, -1.024444580078125, -0.93505859375, -0.845672607421875, -0.75628662109375, -0.666900634765625, -0.5775146484375, -0.488128662109375, -0.39874267578125, -0.309356689453125, -0.219970703125, -0.130584716796875, -0.04119873046875, 0.048187255859375, 0.1375732421875, 0.226959228515625, 0.31634521484375, 0.405731201171875, 0.4951171875, 0.584503173828125, 0.67388916015625, 0.763275146484375, 0.8526611328125, 0.942047119140625, 1.03143310546875, 1.120819091796875, 1.210205078125, 1.299591064453125, 1.38897705078125, 1.478363037109375, 1.5677490234375, 1.657135009765625, 1.74652099609375, 1.835906982421875, 1.92529296875, 2.014678955078125, 2.10406494140625, 2.193450927734375, 2.2828369140625, 2.372222900390625, 2.46160888671875, 2.550994873046875, 2.640380859375, 2.729766845703125, 2.81915283203125, 2.908538818359375, 2.9979248046875, 3.087310791015625, 3.17669677734375, 3.266082763671875, 3.35546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 11.0, 100.0, 370.0, 407.0, 93.0, 25.0, 3.0, 1.0, 1.0, 1.0], "bins": [-240.26705932617188, -236.05662536621094, -231.84619140625, -227.63575744628906, -223.42532348632812, -219.21487426757812, -215.00445556640625, -210.79400634765625, -206.5835723876953, -202.37313842773438, -198.16270446777344, -193.9522705078125, -189.74183654785156, -185.53140258789062, -181.32095336914062, -177.1105194091797, -172.90008544921875, -168.6896514892578, -164.47921752929688, -160.26878356933594, -156.058349609375, -151.847900390625, -147.63748168945312, -143.42703247070312, -139.21661376953125, -135.0061798095703, -130.79574584960938, -126.58531188964844, -122.37487030029297, -118.16443634033203, -113.9540023803711, -109.74356842041016, -105.53313446044922, -101.32270050048828, -97.11226654052734, -92.90182495117188, -88.69139099121094, -84.48095703125, -80.27052307128906, -76.06008911132812, -71.84964752197266, -67.63921356201172, -63.428775787353516, -59.21834182739258, -55.007904052734375, -50.79747009277344, -46.5870361328125, -42.37660217285156, -38.166168212890625, -33.95573425292969, -29.745296478271484, -25.534862518310547, -21.324426651000977, -17.113990783691406, -12.903556823730469, -8.693120956420898, -4.482683181762695, -0.2722477912902832, 3.938187599182129, 8.148622512817383, 12.359058380126953, 16.569494247436523, 20.77992820739746, 24.99036407470703, 29.2007999420166]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 2.0, 6.0, 7.0, 12.0, 17.0, 14.0, 24.0, 28.0, 34.0, 47.0, 54.0, 43.0, 59.0, 46.0, 89.0, 60.0, 71.0, 51.0, 51.0, 57.0, 50.0, 44.0, 26.0, 20.0, 24.0, 19.0, 13.0, 10.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.46742248535156, -37.43059539794922, -36.393768310546875, -35.35694122314453, -34.32011413574219, -33.28328323364258, -32.246456146240234, -31.20962905883789, -30.172801971435547, -29.135974884033203, -28.09914779663086, -27.062318801879883, -26.02549171447754, -24.988664627075195, -23.95183563232422, -22.915008544921875, -21.87818145751953, -20.841354370117188, -19.804527282714844, -18.767698287963867, -17.730871200561523, -16.69404411315918, -15.65721607208252, -14.62038803100586, -13.583560943603516, -12.546733856201172, -11.509905815124512, -10.473077774047852, -9.436250686645508, -8.399423599243164, -7.362595558166504, -6.325767993927002, -5.288944244384766, -4.252116680145264, -3.2152891159057617, -2.1784615516662598, -1.1416339874267578, -0.10480642318725586, 0.9320211410522461, 1.968848705291748, 3.00567626953125, 4.042503833770752, 5.079331398010254, 6.116158962249756, 7.152986526489258, 8.189813613891602, 9.226641654968262, 10.263469696044922, 11.300296783447266, 12.33712387084961, 13.37395191192627, 14.41077995300293, 15.447607040405273, 16.484434127807617, 17.521263122558594, 18.558090209960938, 19.59491729736328, 20.631744384765625, 21.66857147216797, 22.705400466918945, 23.74222755432129, 24.779054641723633, 25.81588363647461, 26.852710723876953, 27.889537811279297]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 13.0, 6.0, 18.0, 26.0, 37.0, 57.0, 86.0, 155.0, 243.0, 516.0, 1195.0, 2982.0, 9567.0, 95161.0, 4050680.0, 25130.0, 5237.0, 1707.0, 698.0, 349.0, 163.0, 89.0, 59.0, 44.0, 21.0, 10.0, 10.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.80206298828125, -4.6041259765625, -4.40618896484375, -4.208251953125, -4.01031494140625, -3.8123779296875, -3.61444091796875, -3.41650390625, -3.21856689453125, -3.0206298828125, -2.82269287109375, -2.624755859375, -2.42681884765625, -2.2288818359375, -2.03094482421875, -1.8330078125, -1.63507080078125, -1.4371337890625, -1.23919677734375, -1.041259765625, -0.84332275390625, -0.6453857421875, -0.44744873046875, -0.24951171875, -0.05157470703125, 0.1463623046875, 0.34429931640625, 0.542236328125, 0.74017333984375, 0.9381103515625, 1.13604736328125, 1.333984375, 1.53192138671875, 1.7298583984375, 1.92779541015625, 2.125732421875, 2.32366943359375, 2.5216064453125, 2.71954345703125, 2.91748046875, 3.11541748046875, 3.3133544921875, 3.51129150390625, 3.709228515625, 3.90716552734375, 4.1051025390625, 4.30303955078125, 4.5009765625, 4.69891357421875, 4.8968505859375, 5.09478759765625, 5.292724609375, 5.49066162109375, 5.6885986328125, 5.88653564453125, 6.08447265625, 6.28240966796875, 6.4803466796875, 6.67828369140625, 6.876220703125, 7.07415771484375, 7.2720947265625, 7.47003173828125, 7.66796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 9.0, 24.0, 38.0, 49.0, 61.0, 71.0, 101.0, 99.0, 121.0, 110.0, 84.0, 69.0, 48.0, 37.0, 20.0, 11.0, 11.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.416015625, -2.3471832275390625, -2.278350830078125, -2.2095184326171875, -2.14068603515625, -2.0718536376953125, -2.003021240234375, -1.9341888427734375, -1.8653564453125, -1.7965240478515625, -1.727691650390625, -1.6588592529296875, -1.59002685546875, -1.5211944580078125, -1.452362060546875, -1.3835296630859375, -1.314697265625, -1.2458648681640625, -1.177032470703125, -1.1082000732421875, -1.03936767578125, -0.9705352783203125, -0.901702880859375, -0.8328704833984375, -0.7640380859375, -0.6952056884765625, -0.626373291015625, -0.5575408935546875, -0.48870849609375, -0.4198760986328125, -0.351043701171875, -0.2822113037109375, -0.21337890625, -0.1445465087890625, -0.075714111328125, -0.0068817138671875, 0.06195068359375, 0.1307830810546875, 0.199615478515625, 0.2684478759765625, 0.3372802734375, 0.4061126708984375, 0.474945068359375, 0.5437774658203125, 0.61260986328125, 0.6814422607421875, 0.750274658203125, 0.8191070556640625, 0.887939453125, 0.9567718505859375, 1.025604248046875, 1.0944366455078125, 1.16326904296875, 1.2321014404296875, 1.300933837890625, 1.3697662353515625, 1.4385986328125, 1.5074310302734375, 1.576263427734375, 1.6450958251953125, 1.71392822265625, 1.7827606201171875, 1.851593017578125, 1.9204254150390625, 1.9892578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 16.0, 20.0, 31.0, 30.0, 50.0, 53.0, 90.0, 120.0, 197.0, 284.0, 478.0, 789.0, 1373.0, 2659.0, 6049.0, 16002.0, 63934.0, 3877381.0, 179110.0, 28108.0, 9113.0, 3822.0, 1893.0, 1012.0, 563.0, 346.0, 241.0, 167.0, 115.0, 67.0, 41.0, 40.0, 23.0, 17.0, 13.0, 12.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5, -3.36395263671875, -3.2279052734375, -3.09185791015625, -2.955810546875, -2.81976318359375, -2.6837158203125, -2.54766845703125, -2.41162109375, -2.27557373046875, -2.1395263671875, -2.00347900390625, -1.867431640625, -1.73138427734375, -1.5953369140625, -1.45928955078125, -1.3232421875, -1.18719482421875, -1.0511474609375, -0.91510009765625, -0.779052734375, -0.64300537109375, -0.5069580078125, -0.37091064453125, -0.23486328125, -0.09881591796875, 0.0372314453125, 0.17327880859375, 0.309326171875, 0.44537353515625, 0.5814208984375, 0.71746826171875, 0.853515625, 0.98956298828125, 1.1256103515625, 1.26165771484375, 1.397705078125, 1.53375244140625, 1.6697998046875, 1.80584716796875, 1.94189453125, 2.07794189453125, 2.2139892578125, 2.35003662109375, 2.486083984375, 2.62213134765625, 2.7581787109375, 2.89422607421875, 3.0302734375, 3.16632080078125, 3.3023681640625, 3.43841552734375, 3.574462890625, 3.71051025390625, 3.8465576171875, 3.98260498046875, 4.11865234375, 4.25469970703125, 4.3907470703125, 4.52679443359375, 4.662841796875, 4.79888916015625, 4.9349365234375, 5.07098388671875, 5.20703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 9.0, 10.0, 5.0, 18.0, 23.0, 35.0, 53.0, 96.0, 252.0, 3183.0, 170.0, 63.0, 41.0, 32.0, 21.0, 14.0, 8.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.779144287109375, -1.71649169921875, -1.653839111328125, -1.5911865234375, -1.528533935546875, -1.46588134765625, -1.403228759765625, -1.340576171875, -1.277923583984375, -1.21527099609375, -1.152618408203125, -1.0899658203125, -1.027313232421875, -0.96466064453125, -0.902008056640625, -0.83935546875, -0.776702880859375, -0.71405029296875, -0.651397705078125, -0.5887451171875, -0.526092529296875, -0.46343994140625, -0.400787353515625, -0.338134765625, -0.275482177734375, -0.21282958984375, -0.150177001953125, -0.0875244140625, -0.024871826171875, 0.03778076171875, 0.100433349609375, 0.1630859375, 0.225738525390625, 0.28839111328125, 0.351043701171875, 0.4136962890625, 0.476348876953125, 0.53900146484375, 0.601654052734375, 0.664306640625, 0.726959228515625, 0.78961181640625, 0.852264404296875, 0.9149169921875, 0.977569580078125, 1.04022216796875, 1.102874755859375, 1.16552734375, 1.228179931640625, 1.29083251953125, 1.353485107421875, 1.4161376953125, 1.478790283203125, 1.54144287109375, 1.604095458984375, 1.666748046875, 1.729400634765625, 1.79205322265625, 1.854705810546875, 1.9173583984375, 1.980010986328125, 2.04266357421875, 2.105316162109375, 2.16796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 4.0, 17.0, 25.0, 67.0, 126.0, 199.0, 229.0, 166.0, 94.0, 39.0, 15.0, 8.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.184077262878418, -13.732525825500488, -13.280973434448242, -12.829421997070312, -12.377870559692383, -11.926318168640137, -11.474766731262207, -11.023214340209961, -10.571662902832031, -10.120111465454102, -9.668559074401855, -9.217007637023926, -8.76545524597168, -8.31390380859375, -7.86235237121582, -7.410800457000732, -6.9592485427856445, -6.507696628570557, -6.056144714355469, -5.604593276977539, -5.153041362762451, -4.701489448547363, -4.249938011169434, -3.7983860969543457, -3.346834182739258, -2.89528226852417, -2.443730592727661, -1.9921787977218628, -1.5406270027160645, -1.0890750885009766, -0.6375234127044678, -0.18597173690795898, 0.2655811309814453, 0.7171329259872437, 1.168684720993042, 1.6202365159988403, 2.0717883110046387, 2.5233402252197266, 2.9748919010162354, 3.426443576812744, 3.877995491027832, 4.32954740524292, 4.781099319458008, 5.2326507568359375, 5.684202671051025, 6.135754585266113, 6.587306022644043, 7.038857936859131, 7.490409851074219, 7.941961765289307, 8.393513679504395, 8.845065116882324, 9.29661750793457, 9.7481689453125, 10.19972038269043, 10.65127182006836, 11.102824211120605, 11.554375648498535, 12.005928039550781, 12.457479476928711, 12.90903091430664, 13.360583305358887, 13.812134742736816, 14.263687133789062, 14.715238571166992]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 8.0, 10.0, 6.0, 15.0, 21.0, 25.0, 25.0, 26.0, 27.0, 39.0, 36.0, 37.0, 33.0, 35.0, 46.0, 55.0, 46.0, 48.0, 38.0, 34.0, 48.0, 41.0, 32.0, 46.0, 39.0, 24.0, 28.0, 22.0, 18.0, 19.0, 11.0, 14.0, 13.0, 5.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.659075736999512, -4.512619972229004, -4.366164207458496, -4.219708442687988, -4.0732526779174805, -3.9267966747283936, -3.7803406715393066, -3.633884906768799, -3.487429141998291, -3.340973377227783, -3.1945176124572754, -3.0480616092681885, -2.9016058444976807, -2.755150079727173, -2.608694076538086, -2.462238311767578, -2.3157825469970703, -2.1693267822265625, -2.0228710174560547, -1.8764150142669678, -1.72995924949646, -1.5835034847259521, -1.4370476007461548, -1.2905917167663574, -1.1441359519958496, -0.997680127620697, -0.8512243032455444, -0.7047684788703918, -0.5583126544952393, -0.41185683012008667, -0.2654010057449341, -0.11894512176513672, 0.027510643005371094, 0.17396646738052368, 0.32042229175567627, 0.46687811613082886, 0.6133339405059814, 0.759789764881134, 0.9062455892562866, 1.052701473236084, 1.1991572380065918, 1.3456130027770996, 1.492068886756897, 1.6385247707366943, 1.7849805355072021, 1.93143630027771, 2.077892303466797, 2.2243480682373047, 2.3708038330078125, 2.5172595977783203, 2.663715362548828, 2.810171365737915, 2.956627130508423, 3.1030828952789307, 3.2495388984680176, 3.3959946632385254, 3.542450428009033, 3.688906192779541, 3.835361957550049, 3.9818179607391357, 4.128273963928223, 4.2747297286987305, 4.421185493469238, 4.567641258239746, 4.714097023010254]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 9.0, 12.0, 31.0, 72.0, 120.0, 332.0, 984.0, 3573.0, 21613.0, 241951.0, 680691.0, 86226.0, 9810.0, 2085.0, 603.0, 213.0, 114.0, 47.0, 30.0, 17.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.657958984375, -7.45263671875, -7.247314453125, -7.0419921875, -6.836669921875, -6.63134765625, -6.426025390625, -6.220703125, -6.015380859375, -5.81005859375, -5.604736328125, -5.3994140625, -5.194091796875, -4.98876953125, -4.783447265625, -4.578125, -4.372802734375, -4.16748046875, -3.962158203125, -3.7568359375, -3.551513671875, -3.34619140625, -3.140869140625, -2.935546875, -2.730224609375, -2.52490234375, -2.319580078125, -2.1142578125, -1.908935546875, -1.70361328125, -1.498291015625, -1.29296875, -1.087646484375, -0.88232421875, -0.677001953125, -0.4716796875, -0.266357421875, -0.06103515625, 0.144287109375, 0.349609375, 0.554931640625, 0.76025390625, 0.965576171875, 1.1708984375, 1.376220703125, 1.58154296875, 1.786865234375, 1.9921875, 2.197509765625, 2.40283203125, 2.608154296875, 2.8134765625, 3.018798828125, 3.22412109375, 3.429443359375, 3.634765625, 3.840087890625, 4.04541015625, 4.250732421875, 4.4560546875, 4.661376953125, 4.86669921875, 5.072021484375, 5.27734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 3.0, 9.0, 15.0, 13.0, 36.0, 41.0, 56.0, 76.0, 93.0, 97.0, 110.0, 102.0, 98.0, 75.0, 56.0, 37.0, 22.0, 19.0, 19.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.62109375, -2.5492401123046875, -2.477386474609375, -2.4055328369140625, -2.33367919921875, -2.2618255615234375, -2.189971923828125, -2.1181182861328125, -2.0462646484375, -1.9744110107421875, -1.902557373046875, -1.8307037353515625, -1.75885009765625, -1.6869964599609375, -1.615142822265625, -1.5432891845703125, -1.471435546875, -1.3995819091796875, -1.327728271484375, -1.2558746337890625, -1.18402099609375, -1.1121673583984375, -1.040313720703125, -0.9684600830078125, -0.8966064453125, -0.8247528076171875, -0.752899169921875, -0.6810455322265625, -0.60919189453125, -0.5373382568359375, -0.465484619140625, -0.3936309814453125, -0.32177734375, -0.2499237060546875, -0.178070068359375, -0.1062164306640625, -0.03436279296875, 0.0374908447265625, 0.109344482421875, 0.1811981201171875, 0.2530517578125, 0.3249053955078125, 0.396759033203125, 0.4686126708984375, 0.54046630859375, 0.6123199462890625, 0.684173583984375, 0.7560272216796875, 0.827880859375, 0.8997344970703125, 0.971588134765625, 1.0434417724609375, 1.11529541015625, 1.1871490478515625, 1.259002685546875, 1.3308563232421875, 1.4027099609375, 1.4745635986328125, 1.546417236328125, 1.6182708740234375, 1.69012451171875, 1.7619781494140625, 1.833831787109375, 1.9056854248046875, 1.9775390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 8.0, 19.0, 23.0, 27.0, 48.0, 82.0, 118.0, 174.0, 335.0, 621.0, 1312.0, 3346.0, 10667.0, 49647.0, 328849.0, 538967.0, 89430.0, 16803.0, 4545.0, 1697.0, 762.0, 404.0, 240.0, 129.0, 89.0, 54.0, 48.0, 35.0, 19.0, 15.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.77056884765625, -4.6348876953125, -4.49920654296875, -4.363525390625, -4.22784423828125, -4.0921630859375, -3.95648193359375, -3.82080078125, -3.68511962890625, -3.5494384765625, -3.41375732421875, -3.278076171875, -3.14239501953125, -3.0067138671875, -2.87103271484375, -2.7353515625, -2.59967041015625, -2.4639892578125, -2.32830810546875, -2.192626953125, -2.05694580078125, -1.9212646484375, -1.78558349609375, -1.64990234375, -1.51422119140625, -1.3785400390625, -1.24285888671875, -1.107177734375, -0.97149658203125, -0.8358154296875, -0.70013427734375, -0.564453125, -0.42877197265625, -0.2930908203125, -0.15740966796875, -0.021728515625, 0.11395263671875, 0.2496337890625, 0.38531494140625, 0.52099609375, 0.65667724609375, 0.7923583984375, 0.92803955078125, 1.063720703125, 1.19940185546875, 1.3350830078125, 1.47076416015625, 1.6064453125, 1.74212646484375, 1.8778076171875, 2.01348876953125, 2.149169921875, 2.28485107421875, 2.4205322265625, 2.55621337890625, 2.69189453125, 2.82757568359375, 2.9632568359375, 3.09893798828125, 3.234619140625, 3.37030029296875, 3.5059814453125, 3.64166259765625, 3.77734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 6.0, 9.0, 11.0, 10.0, 17.0, 13.0, 27.0, 24.0, 34.0, 29.0, 39.0, 45.0, 54.0, 42.0, 56.0, 55.0, 48.0, 59.0, 46.0, 57.0, 42.0, 45.0, 34.0, 30.0, 24.0, 22.0, 16.0, 10.0, 17.0, 22.0, 11.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.4912109375, -5.326171875, -5.1611328125, -4.99609375, -4.8310546875, -4.666015625, -4.5009765625, -4.3359375, -4.1708984375, -4.005859375, -3.8408203125, -3.67578125, -3.5107421875, -3.345703125, -3.1806640625, -3.015625, -2.8505859375, -2.685546875, -2.5205078125, -2.35546875, -2.1904296875, -2.025390625, -1.8603515625, -1.6953125, -1.5302734375, -1.365234375, -1.2001953125, -1.03515625, -0.8701171875, -0.705078125, -0.5400390625, -0.375, -0.2099609375, -0.044921875, 0.1201171875, 0.28515625, 0.4501953125, 0.615234375, 0.7802734375, 0.9453125, 1.1103515625, 1.275390625, 1.4404296875, 1.60546875, 1.7705078125, 1.935546875, 2.1005859375, 2.265625, 2.4306640625, 2.595703125, 2.7607421875, 2.92578125, 3.0908203125, 3.255859375, 3.4208984375, 3.5859375, 3.7509765625, 3.916015625, 4.0810546875, 4.24609375, 4.4111328125, 4.576171875, 4.7412109375, 4.90625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 9.0, 9.0, 10.0, 22.0, 19.0, 28.0, 92.0, 175.0, 413.0, 989.0, 4112.0, 30756.0, 665431.0, 325858.0, 16437.0, 2750.0, 779.0, 325.0, 142.0, 60.0, 56.0, 28.0, 16.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.71484375, -2.6450042724609375, -2.575164794921875, -2.5053253173828125, -2.43548583984375, -2.3656463623046875, -2.295806884765625, -2.2259674072265625, -2.1561279296875, -2.0862884521484375, -2.016448974609375, -1.9466094970703125, -1.87677001953125, -1.8069305419921875, -1.737091064453125, -1.6672515869140625, -1.597412109375, -1.5275726318359375, -1.457733154296875, -1.3878936767578125, -1.31805419921875, -1.2482147216796875, -1.178375244140625, -1.1085357666015625, -1.0386962890625, -0.9688568115234375, -0.899017333984375, -0.8291778564453125, -0.75933837890625, -0.6894989013671875, -0.619659423828125, -0.5498199462890625, -0.47998046875, -0.4101409912109375, -0.340301513671875, -0.2704620361328125, -0.20062255859375, -0.1307830810546875, -0.060943603515625, 0.0088958740234375, 0.0787353515625, 0.1485748291015625, 0.218414306640625, 0.2882537841796875, 0.35809326171875, 0.4279327392578125, 0.497772216796875, 0.5676116943359375, 0.637451171875, 0.7072906494140625, 0.777130126953125, 0.8469696044921875, 0.91680908203125, 0.9866485595703125, 1.056488037109375, 1.1263275146484375, 1.1961669921875, 1.2660064697265625, 1.335845947265625, 1.4056854248046875, 1.47552490234375, 1.5453643798828125, 1.615203857421875, 1.6850433349609375, 1.7548828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 12.0, 8.0, 17.0, 24.0, 25.0, 30.0, 31.0, 37.0, 58.0, 72.0, 56.0, 74.0, 78.0, 96.0, 71.0, 77.0, 48.0, 37.0, 37.0, 24.0, 9.0, 8.0, 15.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002162456512451172, -0.00020909495651721954, -0.0002019442617893219, -0.00019479356706142426, -0.0001876428723335266, -0.00018049217760562897, -0.00017334148287773132, -0.00016619078814983368, -0.00015904009342193604, -0.0001518893986940384, -0.00014473870396614075, -0.0001375880092382431, -0.00013043731451034546, -0.00012328661978244781, -0.00011613592505455017, -0.00010898523032665253, -0.00010183453559875488, -9.468384087085724e-05, -8.75331461429596e-05, -8.038245141506195e-05, -7.32317566871643e-05, -6.608106195926666e-05, -5.893036723136902e-05, -5.1779672503471375e-05, -4.462897777557373e-05, -3.7478283047676086e-05, -3.0327588319778442e-05, -2.31768935918808e-05, -1.6026198863983154e-05, -8.87550413608551e-06, -1.7248094081878662e-06, 5.425885319709778e-06, 1.2576580047607422e-05, 1.9727274775505066e-05, 2.687796950340271e-05, 3.4028664231300354e-05, 4.1179358959198e-05, 4.833005368709564e-05, 5.5480748414993286e-05, 6.263144314289093e-05, 6.978213787078857e-05, 7.693283259868622e-05, 8.408352732658386e-05, 9.12342220544815e-05, 9.838491678237915e-05, 0.0001055356115102768, 0.00011268630623817444, 0.00011983700096607208, 0.00012698769569396973, 0.00013413839042186737, 0.00014128908514976501, 0.00014843977987766266, 0.0001555904746055603, 0.00016274116933345795, 0.0001698918640613556, 0.00017704255878925323, 0.00018419325351715088, 0.00019134394824504852, 0.00019849464297294617, 0.0002056453377008438, 0.00021279603242874146, 0.0002199467271566391, 0.00022709742188453674, 0.0002342481166124344, 0.00024139881134033203]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 12.0, 10.0, 22.0, 46.0, 55.0, 145.0, 282.0, 623.0, 1870.0, 9430.0, 177368.0, 811795.0, 40487.0, 4369.0, 1161.0, 422.0, 210.0, 95.0, 49.0, 33.0, 19.0, 24.0, 6.0, 0.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.245819091796875, -2.16351318359375, -2.081207275390625, -1.9989013671875, -1.916595458984375, -1.83428955078125, -1.751983642578125, -1.669677734375, -1.587371826171875, -1.50506591796875, -1.422760009765625, -1.3404541015625, -1.258148193359375, -1.17584228515625, -1.093536376953125, -1.01123046875, -0.928924560546875, -0.84661865234375, -0.764312744140625, -0.6820068359375, -0.599700927734375, -0.51739501953125, -0.435089111328125, -0.352783203125, -0.270477294921875, -0.18817138671875, -0.105865478515625, -0.0235595703125, 0.058746337890625, 0.14105224609375, 0.223358154296875, 0.3056640625, 0.387969970703125, 0.47027587890625, 0.552581787109375, 0.6348876953125, 0.717193603515625, 0.79949951171875, 0.881805419921875, 0.964111328125, 1.046417236328125, 1.12872314453125, 1.211029052734375, 1.2933349609375, 1.375640869140625, 1.45794677734375, 1.540252685546875, 1.62255859375, 1.704864501953125, 1.78717041015625, 1.869476318359375, 1.9517822265625, 2.034088134765625, 2.11639404296875, 2.198699951171875, 2.281005859375, 2.363311767578125, 2.44561767578125, 2.527923583984375, 2.6102294921875, 2.692535400390625, 2.77484130859375, 2.857147216796875, 2.939453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 11.0, 15.0, 19.0, 34.0, 36.0, 51.0, 67.0, 71.0, 90.0, 88.0, 101.0, 85.0, 71.0, 68.0, 49.0, 44.0, 25.0, 21.0, 16.0, 9.0, 13.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -0.9887847900390625, -0.939483642578125, -0.8901824951171875, -0.84088134765625, -0.7915802001953125, -0.742279052734375, -0.6929779052734375, -0.6436767578125, -0.5943756103515625, -0.545074462890625, -0.4957733154296875, -0.44647216796875, -0.3971710205078125, -0.347869873046875, -0.2985687255859375, -0.249267578125, -0.1999664306640625, -0.150665283203125, -0.1013641357421875, -0.05206298828125, -0.0027618408203125, 0.046539306640625, 0.0958404541015625, 0.1451416015625, 0.1944427490234375, 0.243743896484375, 0.2930450439453125, 0.34234619140625, 0.3916473388671875, 0.440948486328125, 0.4902496337890625, 0.53955078125, 0.5888519287109375, 0.638153076171875, 0.6874542236328125, 0.73675537109375, 0.7860565185546875, 0.835357666015625, 0.8846588134765625, 0.9339599609375, 0.9832611083984375, 1.032562255859375, 1.0818634033203125, 1.13116455078125, 1.1804656982421875, 1.229766845703125, 1.2790679931640625, 1.328369140625, 1.3776702880859375, 1.426971435546875, 1.4762725830078125, 1.52557373046875, 1.5748748779296875, 1.624176025390625, 1.6734771728515625, 1.7227783203125, 1.7720794677734375, 1.821380615234375, 1.8706817626953125, 1.91998291015625, 1.9692840576171875, 2.018585205078125, 2.0678863525390625, 2.1171875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 13.0, 27.0, 71.0, 132.0, 197.0, 243.0, 166.0, 77.0, 45.0, 16.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.57719802856445, -38.83559799194336, -37.09400177001953, -35.35240173339844, -33.610801696777344, -31.869205474853516, -30.127605438232422, -28.38600730895996, -26.6444091796875, -24.90281105041504, -23.161212921142578, -21.419612884521484, -19.678014755249023, -17.936416625976562, -16.19481658935547, -14.453218460083008, -12.711620330810547, -10.970022201538086, -9.228423118591309, -7.4868245124816895, -5.74522590637207, -4.003627777099609, -2.262028694152832, -0.5204296112060547, 1.2211685180664062, 2.9627671241760254, 4.7043657302856445, 6.445964336395264, 8.187562942504883, 9.929161071777344, 11.670760154724121, 13.412359237670898, 15.153953552246094, 16.895551681518555, 18.637149810791016, 20.37874984741211, 22.12034797668457, 23.86194610595703, 25.603546142578125, 27.345144271850586, 29.086742401123047, 30.828340530395508, 32.56993865966797, 34.31153869628906, 36.053138732910156, 37.794734954833984, 39.53633499145508, 41.277931213378906, 43.01953125, 44.761131286621094, 46.50272750854492, 48.244327545166016, 49.985923767089844, 51.72752380371094, 53.46912384033203, 55.210723876953125, 56.95232009887695, 58.69392013549805, 60.435516357421875, 62.17711639404297, 63.91871643066406, 65.66030883789062, 67.40190887451172, 69.14350891113281, 70.8851089477539]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 7.0, 17.0, 16.0, 20.0, 29.0, 31.0, 44.0, 41.0, 50.0, 59.0, 79.0, 69.0, 74.0, 62.0, 86.0, 46.0, 49.0, 36.0, 36.0, 27.0, 21.0, 17.0, 22.0, 13.0, 13.0, 7.0, 6.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.024574279785156, -30.084320068359375, -29.144065856933594, -28.203811645507812, -27.26355743408203, -26.32330322265625, -25.3830509185791, -24.44279670715332, -23.50254249572754, -22.562288284301758, -21.622034072875977, -20.681779861450195, -19.741527557373047, -18.801273345947266, -17.861019134521484, -16.920764923095703, -15.980510711669922, -15.04025650024414, -14.10000228881836, -13.159749031066895, -12.219494819641113, -11.279240608215332, -10.338987350463867, -9.398733139038086, -8.458478927612305, -7.518224716186523, -6.5779709815979, -5.637717247009277, -4.697463035583496, -3.757208824157715, -2.816955089569092, -1.8767013549804688, -0.9364471435546875, 0.0038068294525146484, 0.9440608024597168, 1.884314775466919, 2.824568748474121, 3.7648229598999023, 4.705076694488525, 5.645330429077148, 6.58558464050293, 7.525838851928711, 8.466093063354492, 9.406346321105957, 10.346600532531738, 11.28685474395752, 12.227108001708984, 13.167362213134766, 14.107616424560547, 15.047870635986328, 15.98812484741211, 16.92837905883789, 17.868633270263672, 18.808887481689453, 19.7491397857666, 20.689393997192383, 21.629648208618164, 22.569902420043945, 23.510156631469727, 24.450410842895508, 25.390663146972656, 26.330917358398438, 27.27117156982422, 28.21142578125, 29.15167999267578]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 13.0, 29.0, 58.0, 136.0, 223.0, 470.0, 1214.0, 3637.0, 16445.0, 136630.0, 3826631.0, 183923.0, 18504.0, 4048.0, 1276.0, 530.0, 214.0, 115.0, 62.0, 43.0, 17.0, 16.0, 14.0, 7.0, 8.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.75390625, -5.61199951171875, -5.4700927734375, -5.32818603515625, -5.186279296875, -5.04437255859375, -4.9024658203125, -4.76055908203125, -4.61865234375, -4.47674560546875, -4.3348388671875, -4.19293212890625, -4.051025390625, -3.90911865234375, -3.7672119140625, -3.62530517578125, -3.4833984375, -3.34149169921875, -3.1995849609375, -3.05767822265625, -2.915771484375, -2.77386474609375, -2.6319580078125, -2.49005126953125, -2.34814453125, -2.20623779296875, -2.0643310546875, -1.92242431640625, -1.780517578125, -1.63861083984375, -1.4967041015625, -1.35479736328125, -1.212890625, -1.07098388671875, -0.9290771484375, -0.78717041015625, -0.645263671875, -0.50335693359375, -0.3614501953125, -0.21954345703125, -0.07763671875, 0.06427001953125, 0.2061767578125, 0.34808349609375, 0.489990234375, 0.63189697265625, 0.7738037109375, 0.91571044921875, 1.0576171875, 1.19952392578125, 1.3414306640625, 1.48333740234375, 1.625244140625, 1.76715087890625, 1.9090576171875, 2.05096435546875, 2.19287109375, 2.33477783203125, 2.4766845703125, 2.61859130859375, 2.760498046875, 2.90240478515625, 3.0443115234375, 3.18621826171875, 3.328125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 12.0, 10.0, 12.0, 15.0, 18.0, 24.0, 26.0, 32.0, 29.0, 36.0, 36.0, 41.0, 58.0, 52.0, 49.0, 64.0, 58.0, 51.0, 51.0, 55.0, 53.0, 43.0, 33.0, 24.0, 23.0, 17.0, 11.0, 14.0, 18.0, 9.0, 7.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7853927612304688, -0.7519378662109375, -0.7184829711914062, -0.685028076171875, -0.6515731811523438, -0.6181182861328125, -0.5846633911132812, -0.55120849609375, -0.5177536010742188, -0.4842987060546875, -0.45084381103515625, -0.417388916015625, -0.38393402099609375, -0.3504791259765625, -0.31702423095703125, -0.2835693359375, -0.25011444091796875, -0.2166595458984375, -0.18320465087890625, -0.149749755859375, -0.11629486083984375, -0.0828399658203125, -0.04938507080078125, -0.01593017578125, 0.01752471923828125, 0.0509796142578125, 0.08443450927734375, 0.117889404296875, 0.15134429931640625, 0.1847991943359375, 0.21825408935546875, 0.251708984375, 0.28516387939453125, 0.3186187744140625, 0.35207366943359375, 0.385528564453125, 0.41898345947265625, 0.4524383544921875, 0.48589324951171875, 0.51934814453125, 0.5528030395507812, 0.5862579345703125, 0.6197128295898438, 0.653167724609375, 0.6866226196289062, 0.7200775146484375, 0.7535324096679688, 0.7869873046875, 0.8204421997070312, 0.8538970947265625, 0.8873519897460938, 0.920806884765625, 0.9542617797851562, 0.9877166748046875, 1.0211715698242188, 1.05462646484375, 1.0880813598632812, 1.1215362548828125, 1.1549911499023438, 1.188446044921875, 1.2219009399414062, 1.2553558349609375, 1.2888107299804688, 1.322265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 4.0, 4.0, 11.0, 13.0, 32.0, 53.0, 85.0, 213.0, 603.0, 1720.0, 6592.0, 37055.0, 1020777.0, 3061310.0, 53612.0, 8680.0, 2248.0, 687.0, 288.0, 142.0, 57.0, 31.0, 15.0, 17.0, 9.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.94464111328125, -5.7799072265625, -5.61517333984375, -5.450439453125, -5.28570556640625, -5.1209716796875, -4.95623779296875, -4.79150390625, -4.62677001953125, -4.4620361328125, -4.29730224609375, -4.132568359375, -3.96783447265625, -3.8031005859375, -3.63836669921875, -3.4736328125, -3.30889892578125, -3.1441650390625, -2.97943115234375, -2.814697265625, -2.64996337890625, -2.4852294921875, -2.32049560546875, -2.15576171875, -1.99102783203125, -1.8262939453125, -1.66156005859375, -1.496826171875, -1.33209228515625, -1.1673583984375, -1.00262451171875, -0.837890625, -0.67315673828125, -0.5084228515625, -0.34368896484375, -0.178955078125, -0.01422119140625, 0.1505126953125, 0.31524658203125, 0.47998046875, 0.64471435546875, 0.8094482421875, 0.97418212890625, 1.138916015625, 1.30364990234375, 1.4683837890625, 1.63311767578125, 1.7978515625, 1.96258544921875, 2.1273193359375, 2.29205322265625, 2.456787109375, 2.62152099609375, 2.7862548828125, 2.95098876953125, 3.11572265625, 3.28045654296875, 3.4451904296875, 3.60992431640625, 3.774658203125, 3.93939208984375, 4.1041259765625, 4.26885986328125, 4.43359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 13.0, 7.0, 6.0, 11.0, 16.0, 28.0, 32.0, 41.0, 79.0, 124.0, 225.0, 416.0, 861.0, 1002.0, 494.0, 256.0, 119.0, 103.0, 54.0, 47.0, 30.0, 17.0, 12.0, 15.0, 12.0, 9.0, 11.0, 8.0, 3.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-3.62890625, -3.528472900390625, -3.42803955078125, -3.327606201171875, -3.2271728515625, -3.126739501953125, -3.02630615234375, -2.925872802734375, -2.825439453125, -2.725006103515625, -2.62457275390625, -2.524139404296875, -2.4237060546875, -2.323272705078125, -2.22283935546875, -2.122406005859375, -2.02197265625, -1.921539306640625, -1.82110595703125, -1.720672607421875, -1.6202392578125, -1.519805908203125, -1.41937255859375, -1.318939208984375, -1.218505859375, -1.118072509765625, -1.01763916015625, -0.917205810546875, -0.8167724609375, -0.716339111328125, -0.61590576171875, -0.515472412109375, -0.4150390625, -0.314605712890625, -0.21417236328125, -0.113739013671875, -0.0133056640625, 0.087127685546875, 0.18756103515625, 0.287994384765625, 0.388427734375, 0.488861083984375, 0.58929443359375, 0.689727783203125, 0.7901611328125, 0.890594482421875, 0.99102783203125, 1.091461181640625, 1.19189453125, 1.292327880859375, 1.39276123046875, 1.493194580078125, 1.5936279296875, 1.694061279296875, 1.79449462890625, 1.894927978515625, 1.995361328125, 2.095794677734375, 2.19622802734375, 2.296661376953125, 2.3970947265625, 2.497528076171875, 2.59796142578125, 2.698394775390625, 2.798828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 9.0, 12.0, 23.0, 42.0, 87.0, 137.0, 183.0, 166.0, 120.0, 76.0, 44.0, 29.0, 22.0, 11.0, 4.0, 6.0, 2.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.98832893371582, -21.048076629638672, -20.107824325561523, -19.167572021484375, -18.227319717407227, -17.287067413330078, -16.346813201904297, -15.406561851501465, -14.466309547424316, -13.526057243347168, -12.58580493927002, -11.645551681518555, -10.705299377441406, -9.765047073364258, -8.82479476928711, -7.884542465209961, -6.9442901611328125, -6.004037857055664, -5.063785552978516, -4.123532772064209, -3.1832804679870605, -2.243028163909912, -1.3027753829956055, -0.36252307891845703, 0.5777292251586914, 1.5179816484451294, 2.4582340717315674, 3.398486614227295, 4.338738918304443, 5.278991222381592, 6.219244003295898, 7.159496307373047, 8.099750518798828, 9.040002822875977, 9.980255126953125, 10.920507431030273, 11.860759735107422, 12.80101203918457, 13.741265296936035, 14.681517601013184, 15.621769905090332, 16.562023162841797, 17.502275466918945, 18.442527770996094, 19.382780075073242, 20.32303237915039, 21.26328468322754, 22.203536987304688, 23.143789291381836, 24.084041595458984, 25.024293899536133, 25.96454620361328, 26.90479850769043, 27.845050811767578, 28.78530502319336, 29.725555419921875, 30.665809631347656, 31.606061935424805, 32.54631423950195, 33.486568450927734, 34.42681884765625, 35.36707305908203, 36.30732345581055, 37.24757766723633, 38.187828063964844]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 13.0, 8.0, 14.0, 19.0, 20.0, 24.0, 19.0, 41.0, 32.0, 46.0, 39.0, 47.0, 48.0, 41.0, 49.0, 51.0, 43.0, 50.0, 49.0, 40.0, 44.0, 45.0, 34.0, 28.0, 31.0, 21.0, 24.0, 19.0, 17.0, 12.0, 8.0, 6.0, 8.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75447654724121, -17.229167938232422, -16.703859329223633, -16.178550720214844, -15.653243064880371, -15.127934455871582, -14.60262680053711, -14.07731819152832, -13.552009582519531, -13.026700973510742, -12.501392364501953, -11.97608470916748, -11.450776100158691, -10.925467491149902, -10.40015983581543, -9.87485122680664, -9.349542617797852, -8.824234008789062, -8.298925399780273, -7.773617744445801, -7.248309135437012, -6.723000526428223, -6.197692394256592, -5.672384262084961, -5.147075653076172, -4.621767044067383, -4.096458911895752, -3.571150541305542, -3.045842170715332, -2.520533800125122, -1.995225429534912, -1.4699170589447021, -0.9446067810058594, -0.4192984104156494, 0.10600996017456055, 0.6313183307647705, 1.1566267013549805, 1.6819350719451904, 2.2072434425354004, 2.7325518131256104, 3.2578601837158203, 3.7831685543060303, 4.30847692489624, 4.833785057067871, 5.35909366607666, 5.884402275085449, 6.40971040725708, 6.935018539428711, 7.4603271484375, 7.985635757446289, 8.510944366455078, 9.03625202178955, 9.56156063079834, 10.086869239807129, 10.612176895141602, 11.13748550415039, 11.66279411315918, 12.188102722167969, 12.713411331176758, 13.23871898651123, 13.76402759552002, 14.289336204528809, 14.814643859863281, 15.33995246887207, 15.86526107788086]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 12.0, 11.0, 17.0, 27.0, 43.0, 63.0, 95.0, 182.0, 277.0, 488.0, 924.0, 1767.0, 3445.0, 7497.0, 17993.0, 46448.0, 131397.0, 332543.0, 312439.0, 119821.0, 42857.0, 16419.0, 6857.0, 3243.0, 1642.0, 891.0, 470.0, 263.0, 169.0, 91.0, 65.0, 40.0, 16.0, 24.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265625, -2.1873779296875, -2.109130859375, -2.0308837890625, -1.95263671875, -1.8743896484375, -1.796142578125, -1.7178955078125, -1.6396484375, -1.5614013671875, -1.483154296875, -1.4049072265625, -1.32666015625, -1.2484130859375, -1.170166015625, -1.0919189453125, -1.013671875, -0.9354248046875, -0.857177734375, -0.7789306640625, -0.70068359375, -0.6224365234375, -0.544189453125, -0.4659423828125, -0.3876953125, -0.3094482421875, -0.231201171875, -0.1529541015625, -0.07470703125, 0.0035400390625, 0.081787109375, 0.1600341796875, 0.23828125, 0.3165283203125, 0.394775390625, 0.4730224609375, 0.55126953125, 0.6295166015625, 0.707763671875, 0.7860107421875, 0.8642578125, 0.9425048828125, 1.020751953125, 1.0989990234375, 1.17724609375, 1.2554931640625, 1.333740234375, 1.4119873046875, 1.490234375, 1.5684814453125, 1.646728515625, 1.7249755859375, 1.80322265625, 1.8814697265625, 1.959716796875, 2.0379638671875, 2.1162109375, 2.1944580078125, 2.272705078125, 2.3509521484375, 2.42919921875, 2.5074462890625, 2.585693359375, 2.6639404296875, 2.7421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 7.0, 11.0, 10.0, 13.0, 21.0, 22.0, 22.0, 15.0, 39.0, 35.0, 29.0, 32.0, 44.0, 46.0, 53.0, 46.0, 56.0, 60.0, 47.0, 45.0, 43.0, 41.0, 30.0, 31.0, 27.0, 21.0, 23.0, 24.0, 18.0, 15.0, 16.0, 8.0, 9.0, 2.0, 0.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.75054931640625, -0.7198486328125, -0.68914794921875, -0.658447265625, -0.62774658203125, -0.5970458984375, -0.56634521484375, -0.53564453125, -0.50494384765625, -0.4742431640625, -0.44354248046875, -0.412841796875, -0.38214111328125, -0.3514404296875, -0.32073974609375, -0.2900390625, -0.25933837890625, -0.2286376953125, -0.19793701171875, -0.167236328125, -0.13653564453125, -0.1058349609375, -0.07513427734375, -0.04443359375, -0.01373291015625, 0.0169677734375, 0.04766845703125, 0.078369140625, 0.10906982421875, 0.1397705078125, 0.17047119140625, 0.201171875, 0.23187255859375, 0.2625732421875, 0.29327392578125, 0.323974609375, 0.35467529296875, 0.3853759765625, 0.41607666015625, 0.44677734375, 0.47747802734375, 0.5081787109375, 0.53887939453125, 0.569580078125, 0.60028076171875, 0.6309814453125, 0.66168212890625, 0.6923828125, 0.72308349609375, 0.7537841796875, 0.78448486328125, 0.815185546875, 0.84588623046875, 0.8765869140625, 0.90728759765625, 0.93798828125, 0.96868896484375, 0.9993896484375, 1.03009033203125, 1.060791015625, 1.09149169921875, 1.1221923828125, 1.15289306640625, 1.18359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 5.0, 9.0, 16.0, 13.0, 21.0, 29.0, 36.0, 52.0, 67.0, 102.0, 159.0, 245.0, 429.0, 639.0, 1159.0, 2183.0, 4659.0, 13489.0, 54155.0, 292327.0, 542365.0, 100901.0, 22124.0, 6851.0, 2867.0, 1453.0, 830.0, 487.0, 284.0, 193.0, 120.0, 77.0, 60.0, 37.0, 34.0, 15.0, 14.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.13446044921875, -3.0306396484375, -2.92681884765625, -2.822998046875, -2.71917724609375, -2.6153564453125, -2.51153564453125, -2.40771484375, -2.30389404296875, -2.2000732421875, -2.09625244140625, -1.992431640625, -1.88861083984375, -1.7847900390625, -1.68096923828125, -1.5771484375, -1.47332763671875, -1.3695068359375, -1.26568603515625, -1.161865234375, -1.05804443359375, -0.9542236328125, -0.85040283203125, -0.74658203125, -0.64276123046875, -0.5389404296875, -0.43511962890625, -0.331298828125, -0.22747802734375, -0.1236572265625, -0.01983642578125, 0.083984375, 0.18780517578125, 0.2916259765625, 0.39544677734375, 0.499267578125, 0.60308837890625, 0.7069091796875, 0.81072998046875, 0.91455078125, 1.01837158203125, 1.1221923828125, 1.22601318359375, 1.329833984375, 1.43365478515625, 1.5374755859375, 1.64129638671875, 1.7451171875, 1.84893798828125, 1.9527587890625, 2.05657958984375, 2.160400390625, 2.26422119140625, 2.3680419921875, 2.47186279296875, 2.57568359375, 2.67950439453125, 2.7833251953125, 2.88714599609375, 2.990966796875, 3.09478759765625, 3.1986083984375, 3.30242919921875, 3.40625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 7.0, 9.0, 9.0, 14.0, 19.0, 17.0, 30.0, 29.0, 29.0, 44.0, 44.0, 40.0, 49.0, 54.0, 41.0, 50.0, 49.0, 51.0, 62.0, 63.0, 54.0, 44.0, 33.0, 32.0, 21.0, 29.0, 13.0, 13.0, 12.0, 4.0, 12.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.63079833984375, -5.4725341796875, -5.31427001953125, -5.156005859375, -4.99774169921875, -4.8394775390625, -4.68121337890625, -4.52294921875, -4.36468505859375, -4.2064208984375, -4.04815673828125, -3.889892578125, -3.73162841796875, -3.5733642578125, -3.41510009765625, -3.2568359375, -3.09857177734375, -2.9403076171875, -2.78204345703125, -2.623779296875, -2.46551513671875, -2.3072509765625, -2.14898681640625, -1.99072265625, -1.83245849609375, -1.6741943359375, -1.51593017578125, -1.357666015625, -1.19940185546875, -1.0411376953125, -0.88287353515625, -0.724609375, -0.56634521484375, -0.4080810546875, -0.24981689453125, -0.091552734375, 0.06671142578125, 0.2249755859375, 0.38323974609375, 0.54150390625, 0.69976806640625, 0.8580322265625, 1.01629638671875, 1.174560546875, 1.33282470703125, 1.4910888671875, 1.64935302734375, 1.8076171875, 1.96588134765625, 2.1241455078125, 2.28240966796875, 2.440673828125, 2.59893798828125, 2.7572021484375, 2.91546630859375, 3.07373046875, 3.23199462890625, 3.3902587890625, 3.54852294921875, 3.706787109375, 3.86505126953125, 4.0233154296875, 4.18157958984375, 4.33984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 10.0, 12.0, 11.0, 21.0, 26.0, 38.0, 77.0, 110.0, 185.0, 386.0, 854.0, 2508.0, 11663.0, 136747.0, 823484.0, 61907.0, 7191.0, 1853.0, 683.0, 305.0, 159.0, 96.0, 75.0, 41.0, 26.0, 24.0, 14.0, 15.0, 4.0, 3.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.59283447265625, -1.5274658203125, -1.46209716796875, -1.396728515625, -1.33135986328125, -1.2659912109375, -1.20062255859375, -1.13525390625, -1.06988525390625, -1.0045166015625, -0.93914794921875, -0.873779296875, -0.80841064453125, -0.7430419921875, -0.67767333984375, -0.6123046875, -0.54693603515625, -0.4815673828125, -0.41619873046875, -0.350830078125, -0.28546142578125, -0.2200927734375, -0.15472412109375, -0.08935546875, -0.02398681640625, 0.0413818359375, 0.10675048828125, 0.172119140625, 0.23748779296875, 0.3028564453125, 0.36822509765625, 0.43359375, 0.49896240234375, 0.5643310546875, 0.62969970703125, 0.695068359375, 0.76043701171875, 0.8258056640625, 0.89117431640625, 0.95654296875, 1.02191162109375, 1.0872802734375, 1.15264892578125, 1.218017578125, 1.28338623046875, 1.3487548828125, 1.41412353515625, 1.4794921875, 1.54486083984375, 1.6102294921875, 1.67559814453125, 1.740966796875, 1.80633544921875, 1.8717041015625, 1.93707275390625, 2.00244140625, 2.06781005859375, 2.1331787109375, 2.19854736328125, 2.263916015625, 2.32928466796875, 2.3946533203125, 2.46002197265625, 2.525390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 15.0, 14.0, 27.0, 22.0, 40.0, 39.0, 58.0, 78.0, 72.0, 118.0, 109.0, 91.0, 57.0, 55.0, 41.0, 39.0, 25.0, 19.0, 22.0, 9.0, 11.0, 5.0, 3.0, 2.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00032973289489746094, -0.00032123737037181854, -0.00031274184584617615, -0.00030424632132053375, -0.00029575079679489136, -0.00028725527226924896, -0.00027875974774360657, -0.00027026422321796417, -0.0002617686986923218, -0.0002532731741666794, -0.000244777649641037, -0.0002362821251153946, -0.0002277866005897522, -0.0002192910760641098, -0.0002107955515384674, -0.000202300027012825, -0.00019380450248718262, -0.00018530897796154022, -0.00017681345343589783, -0.00016831792891025543, -0.00015982240438461304, -0.00015132687985897064, -0.00014283135533332825, -0.00013433583080768585, -0.00012584030628204346, -0.00011734478175640106, -0.00010884925723075867, -0.00010035373270511627, -9.185820817947388e-05, -8.336268365383148e-05, -7.486715912818909e-05, -6.637163460254669e-05, -5.78761100769043e-05, -4.93805855512619e-05, -4.088506102561951e-05, -3.238953649997711e-05, -2.3894011974334717e-05, -1.5398487448692322e-05, -6.902962923049927e-06, 1.5925616025924683e-06, 1.0088086128234863e-05, 1.8583610653877258e-05, 2.7079135179519653e-05, 3.557465970516205e-05, 4.407018423080444e-05, 5.256570875644684e-05, 6.106123328208923e-05, 6.955675780773163e-05, 7.805228233337402e-05, 8.654780685901642e-05, 9.504333138465881e-05, 0.00010353885591030121, 0.0001120343804359436, 0.000120529904961586, 0.0001290254294872284, 0.0001375209540128708, 0.00014601647853851318, 0.00015451200306415558, 0.00016300752758979797, 0.00017150305211544037, 0.00017999857664108276, 0.00018849410116672516, 0.00019698962569236755, 0.00020548515021800995, 0.00021398067474365234]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 11.0, 4.0, 9.0, 9.0, 16.0, 26.0, 29.0, 42.0, 49.0, 72.0, 115.0, 219.0, 346.0, 693.0, 1547.0, 4079.0, 15089.0, 104815.0, 733908.0, 159110.0, 19838.0, 4876.0, 1885.0, 718.0, 389.0, 221.0, 149.0, 81.0, 56.0, 44.0, 25.0, 24.0, 22.0, 12.0, 6.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7620086669921875, -1.712493896484375, -1.6629791259765625, -1.61346435546875, -1.5639495849609375, -1.514434814453125, -1.4649200439453125, -1.4154052734375, -1.3658905029296875, -1.316375732421875, -1.2668609619140625, -1.21734619140625, -1.1678314208984375, -1.118316650390625, -1.0688018798828125, -1.019287109375, -0.9697723388671875, -0.920257568359375, -0.8707427978515625, -0.82122802734375, -0.7717132568359375, -0.722198486328125, -0.6726837158203125, -0.6231689453125, -0.5736541748046875, -0.524139404296875, -0.4746246337890625, -0.42510986328125, -0.3755950927734375, -0.326080322265625, -0.2765655517578125, -0.22705078125, -0.1775360107421875, -0.128021240234375, -0.0785064697265625, -0.02899169921875, 0.0205230712890625, 0.070037841796875, 0.1195526123046875, 0.1690673828125, 0.2185821533203125, 0.268096923828125, 0.3176116943359375, 0.36712646484375, 0.4166412353515625, 0.466156005859375, 0.5156707763671875, 0.565185546875, 0.6147003173828125, 0.664215087890625, 0.7137298583984375, 0.76324462890625, 0.8127593994140625, 0.862274169921875, 0.9117889404296875, 0.9613037109375, 1.0108184814453125, 1.060333251953125, 1.1098480224609375, 1.15936279296875, 1.2088775634765625, 1.258392333984375, 1.3079071044921875, 1.357421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 12.0, 24.0, 23.0, 21.0, 34.0, 39.0, 56.0, 63.0, 81.0, 84.0, 83.0, 76.0, 75.0, 70.0, 59.0, 41.0, 33.0, 32.0, 21.0, 13.0, 7.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5927734375, -1.545074462890625, -1.49737548828125, -1.449676513671875, -1.4019775390625, -1.354278564453125, -1.30657958984375, -1.258880615234375, -1.211181640625, -1.163482666015625, -1.11578369140625, -1.068084716796875, -1.0203857421875, -0.972686767578125, -0.92498779296875, -0.877288818359375, -0.82958984375, -0.781890869140625, -0.73419189453125, -0.686492919921875, -0.6387939453125, -0.591094970703125, -0.54339599609375, -0.495697021484375, -0.447998046875, -0.400299072265625, -0.35260009765625, -0.304901123046875, -0.2572021484375, -0.209503173828125, -0.16180419921875, -0.114105224609375, -0.06640625, -0.018707275390625, 0.02899169921875, 0.076690673828125, 0.1243896484375, 0.172088623046875, 0.21978759765625, 0.267486572265625, 0.315185546875, 0.362884521484375, 0.41058349609375, 0.458282470703125, 0.5059814453125, 0.553680419921875, 0.60137939453125, 0.649078369140625, 0.69677734375, 0.744476318359375, 0.79217529296875, 0.839874267578125, 0.8875732421875, 0.935272216796875, 0.98297119140625, 1.030670166015625, 1.078369140625, 1.126068115234375, 1.17376708984375, 1.221466064453125, 1.2691650390625, 1.316864013671875, 1.36456298828125, 1.412261962890625, 1.4599609375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 6.0, 16.0, 29.0, 56.0, 87.0, 139.0, 177.0, 198.0, 119.0, 70.0, 36.0, 20.0, 18.0, 12.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.88990020751953, -36.91172790527344, -35.93355941772461, -34.955387115478516, -33.97721481323242, -32.999046325683594, -32.0208740234375, -31.04270362854004, -30.064533233642578, -29.086362838745117, -28.108190536499023, -27.130020141601562, -26.1518497467041, -25.17367935180664, -24.195507049560547, -23.217336654663086, -22.239164352416992, -21.26099395751953, -20.282821655273438, -19.304651260375977, -18.326480865478516, -17.348308563232422, -16.37013816833496, -15.3919677734375, -14.413796424865723, -13.435625076293945, -12.457454681396484, -11.479283332824707, -10.50111198425293, -9.522941589355469, -8.544770240783691, -7.566599369049072, -6.588428497314453, -5.610257625579834, -4.632086753845215, -3.6539154052734375, -2.6757445335388184, -1.6975736618041992, -0.7194023132324219, 0.25876855850219727, 1.2369394302368164, 2.2151103019714355, 3.193281412124634, 4.171452522277832, 5.149623394012451, 6.12779426574707, 7.105965614318848, 8.084136962890625, 9.062307357788086, 10.040478706359863, 11.018649101257324, 11.996820449829102, 12.974990844726562, 13.95316219329834, 14.931333541870117, 15.909503936767578, 16.887676239013672, 17.865846633911133, 18.844018936157227, 19.822189331054688, 20.80035972595215, 21.77853012084961, 22.756702423095703, 23.734872817993164, 24.713043212890625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 9.0, 4.0, 7.0, 11.0, 13.0, 13.0, 17.0, 16.0, 21.0, 24.0, 35.0, 29.0, 27.0, 30.0, 35.0, 42.0, 43.0, 58.0, 45.0, 55.0, 44.0, 54.0, 39.0, 42.0, 31.0, 26.0, 27.0, 34.0, 18.0, 23.0, 18.0, 17.0, 17.0, 14.0, 9.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-17.36117935180664, -16.849042892456055, -16.33690643310547, -15.824769973754883, -15.312633514404297, -14.800497055053711, -14.288360595703125, -13.776224136352539, -13.264087677001953, -12.751951217651367, -12.239814758300781, -11.727678298950195, -11.21554183959961, -10.703405380249023, -10.191268920898438, -9.679132461547852, -9.166996002197266, -8.65485954284668, -8.142723083496094, -7.630586624145508, -7.118450164794922, -6.606313705444336, -6.09417724609375, -5.582040786743164, -5.069904327392578, -4.557767868041992, -4.045631408691406, -3.5334949493408203, -3.0213584899902344, -2.5092220306396484, -1.9970855712890625, -1.4849491119384766, -0.9728145599365234, -0.4606781005859375, 0.05145835876464844, 0.5635948181152344, 1.0757312774658203, 1.5878677368164062, 2.100004196166992, 2.612140655517578, 3.124277114868164, 3.63641357421875, 4.148550033569336, 4.660686492919922, 5.172822952270508, 5.684959411621094, 6.19709587097168, 6.709232330322266, 7.221368789672852, 7.7335052490234375, 8.245641708374023, 8.75777816772461, 9.269914627075195, 9.782051086425781, 10.294187545776367, 10.806324005126953, 11.318460464477539, 11.830596923828125, 12.342733383178711, 12.854869842529297, 13.367006301879883, 13.879142761230469, 14.391279220581055, 14.90341567993164, 15.415552139282227]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 24.0, 31.0, 35.0, 96.0, 182.0, 444.0, 1672.0, 13722.0, 3916003.0, 254689.0, 5755.0, 1017.0, 284.0, 135.0, 68.0, 35.0, 20.0, 15.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.70367431640625, -8.4464111328125, -8.18914794921875, -7.931884765625, -7.67462158203125, -7.4173583984375, -7.16009521484375, -6.90283203125, -6.64556884765625, -6.3883056640625, -6.13104248046875, -5.873779296875, -5.61651611328125, -5.3592529296875, -5.10198974609375, -4.8447265625, -4.58746337890625, -4.3302001953125, -4.07293701171875, -3.815673828125, -3.55841064453125, -3.3011474609375, -3.04388427734375, -2.78662109375, -2.52935791015625, -2.2720947265625, -2.01483154296875, -1.757568359375, -1.50030517578125, -1.2430419921875, -0.98577880859375, -0.728515625, -0.47125244140625, -0.2139892578125, 0.04327392578125, 0.300537109375, 0.55780029296875, 0.8150634765625, 1.07232666015625, 1.32958984375, 1.58685302734375, 1.8441162109375, 2.10137939453125, 2.358642578125, 2.61590576171875, 2.8731689453125, 3.13043212890625, 3.3876953125, 3.64495849609375, 3.9022216796875, 4.15948486328125, 4.416748046875, 4.67401123046875, 4.9312744140625, 5.18853759765625, 5.44580078125, 5.70306396484375, 5.9603271484375, 6.21759033203125, 6.474853515625, 6.73211669921875, 6.9893798828125, 7.24664306640625, 7.50390625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 15.0, 20.0, 21.0, 31.0, 35.0, 45.0, 59.0, 64.0, 76.0, 68.0, 88.0, 75.0, 82.0, 68.0, 50.0, 44.0, 36.0, 28.0, 35.0, 14.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.5057525634765625, -1.457794189453125, -1.4098358154296875, -1.36187744140625, -1.3139190673828125, -1.265960693359375, -1.2180023193359375, -1.1700439453125, -1.1220855712890625, -1.074127197265625, -1.0261688232421875, -0.97821044921875, -0.9302520751953125, -0.882293701171875, -0.8343353271484375, -0.786376953125, -0.7384185791015625, -0.690460205078125, -0.6425018310546875, -0.59454345703125, -0.5465850830078125, -0.498626708984375, -0.4506683349609375, -0.4027099609375, -0.3547515869140625, -0.306793212890625, -0.2588348388671875, -0.21087646484375, -0.1629180908203125, -0.114959716796875, -0.0670013427734375, -0.01904296875, 0.0289154052734375, 0.076873779296875, 0.1248321533203125, 0.17279052734375, 0.2207489013671875, 0.268707275390625, 0.3166656494140625, 0.3646240234375, 0.4125823974609375, 0.460540771484375, 0.5084991455078125, 0.55645751953125, 0.6044158935546875, 0.652374267578125, 0.7003326416015625, 0.748291015625, 0.7962493896484375, 0.844207763671875, 0.8921661376953125, 0.94012451171875, 0.9880828857421875, 1.036041259765625, 1.0839996337890625, 1.1319580078125, 1.1799163818359375, 1.227874755859375, 1.2758331298828125, 1.32379150390625, 1.3717498779296875, 1.419708251953125, 1.4676666259765625, 1.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 22.0, 42.0, 48.0, 77.0, 116.0, 191.0, 320.0, 510.0, 869.0, 1517.0, 2981.0, 6069.0, 15004.0, 47028.0, 309536.0, 3457861.0, 280138.0, 44739.0, 14621.0, 6167.0, 2765.0, 1587.0, 842.0, 461.0, 290.0, 171.0, 94.0, 62.0, 41.0, 26.0, 19.0, 9.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.94140625, -2.86077880859375, -2.7801513671875, -2.69952392578125, -2.618896484375, -2.53826904296875, -2.4576416015625, -2.37701416015625, -2.29638671875, -2.21575927734375, -2.1351318359375, -2.05450439453125, -1.973876953125, -1.89324951171875, -1.8126220703125, -1.73199462890625, -1.6513671875, -1.57073974609375, -1.4901123046875, -1.40948486328125, -1.328857421875, -1.24822998046875, -1.1676025390625, -1.08697509765625, -1.00634765625, -0.92572021484375, -0.8450927734375, -0.76446533203125, -0.683837890625, -0.60321044921875, -0.5225830078125, -0.44195556640625, -0.361328125, -0.28070068359375, -0.2000732421875, -0.11944580078125, -0.038818359375, 0.04180908203125, 0.1224365234375, 0.20306396484375, 0.28369140625, 0.36431884765625, 0.4449462890625, 0.52557373046875, 0.606201171875, 0.68682861328125, 0.7674560546875, 0.84808349609375, 0.9287109375, 1.00933837890625, 1.0899658203125, 1.17059326171875, 1.251220703125, 1.33184814453125, 1.4124755859375, 1.49310302734375, 1.57373046875, 1.65435791015625, 1.7349853515625, 1.81561279296875, 1.896240234375, 1.97686767578125, 2.0574951171875, 2.13812255859375, 2.21875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 8.0, 13.0, 13.0, 27.0, 24.0, 54.0, 91.0, 174.0, 374.0, 1095.0, 1256.0, 484.0, 204.0, 90.0, 43.0, 33.0, 16.0, 15.0, 10.0, 7.0, 5.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.14453125, -4.03265380859375, -3.9207763671875, -3.80889892578125, -3.697021484375, -3.58514404296875, -3.4732666015625, -3.36138916015625, -3.24951171875, -3.13763427734375, -3.0257568359375, -2.91387939453125, -2.802001953125, -2.69012451171875, -2.5782470703125, -2.46636962890625, -2.3544921875, -2.24261474609375, -2.1307373046875, -2.01885986328125, -1.906982421875, -1.79510498046875, -1.6832275390625, -1.57135009765625, -1.45947265625, -1.34759521484375, -1.2357177734375, -1.12384033203125, -1.011962890625, -0.90008544921875, -0.7882080078125, -0.67633056640625, -0.564453125, -0.45257568359375, -0.3406982421875, -0.22882080078125, -0.116943359375, -0.00506591796875, 0.1068115234375, 0.21868896484375, 0.33056640625, 0.44244384765625, 0.5543212890625, 0.66619873046875, 0.778076171875, 0.88995361328125, 1.0018310546875, 1.11370849609375, 1.2255859375, 1.33746337890625, 1.4493408203125, 1.56121826171875, 1.673095703125, 1.78497314453125, 1.8968505859375, 2.00872802734375, 2.12060546875, 2.23248291015625, 2.3443603515625, 2.45623779296875, 2.568115234375, 2.67999267578125, 2.7918701171875, 2.90374755859375, 3.015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 20.0, 46.0, 133.0, 301.0, 301.0, 116.0, 34.0, 17.0, 6.0, 2.0, 6.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.278968811035156, -52.9849739074707, -51.690975189208984, -50.39698028564453, -49.10298156738281, -47.80898666381836, -46.514991760253906, -45.22099304199219, -43.926998138427734, -42.63300323486328, -41.33900451660156, -40.04500961303711, -38.751014709472656, -37.45701599121094, -36.163021087646484, -34.86902618408203, -33.57502746582031, -32.28103256225586, -30.98703384399414, -29.693038940429688, -28.3990421295166, -27.105045318603516, -25.811050415039062, -24.517053604125977, -23.22305679321289, -21.929059982299805, -20.63506317138672, -19.341068267822266, -18.04707145690918, -16.753074645996094, -15.459078788757324, -14.165082931518555, -12.871086120605469, -11.577089309692383, -10.283093452453613, -8.989097595214844, -7.695100784301758, -6.40110445022583, -5.107108116149902, -3.813112258911133, -2.519115447998047, -1.2251191139221191, 0.0688772201538086, 1.3628735542297363, 2.656869888305664, 3.950866222381592, 5.2448625564575195, 6.538858413696289, 7.832855224609375, 9.126852035522461, 10.42084789276123, 11.71484375, 13.008840560913086, 14.302837371826172, 15.596833229064941, 16.89082908630371, 18.184825897216797, 19.478822708129883, 20.77281951904297, 22.066814422607422, 23.360811233520508, 24.654808044433594, 25.948802947998047, 27.242799758911133, 28.53679656982422]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 9.0, 6.0, 10.0, 12.0, 11.0, 15.0, 22.0, 30.0, 27.0, 29.0, 34.0, 43.0, 50.0, 47.0, 51.0, 57.0, 50.0, 53.0, 58.0, 36.0, 43.0, 51.0, 45.0, 36.0, 35.0, 25.0, 31.0, 14.0, 15.0, 17.0, 7.0, 6.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.61648941040039, -13.207945823669434, -12.799402236938477, -12.390857696533203, -11.982314109802246, -11.573770523071289, -11.165226936340332, -10.756683349609375, -10.348138809204102, -9.939595222473145, -9.531051635742188, -9.122507095336914, -8.713963508605957, -8.305419921875, -7.896876335144043, -7.488332271575928, -7.079788684844971, -6.671245098114014, -6.262701034545898, -5.854157447814941, -5.445613384246826, -5.037069797515869, -4.628525733947754, -4.219982147216797, -3.8114383220672607, -3.4028944969177246, -2.9943506717681885, -2.5858068466186523, -2.1772632598876953, -1.7687194347381592, -1.360175609588623, -0.9516317844390869, -0.5430879592895508, -0.13454416394233704, 0.2739996314048767, 0.6825433969497681, 1.0910872220993042, 1.4996309280395508, 1.908174753189087, 2.316718578338623, 2.725262403488159, 3.1338062286376953, 3.5423500537872314, 3.9508938789367676, 4.359437465667725, 4.76798152923584, 5.176525115966797, 5.585068702697754, 5.993612766265869, 6.402156352996826, 6.810700416564941, 7.219244003295898, 7.627788066864014, 8.036331176757812, 8.444875717163086, 8.853419303894043, 9.261962890625, 9.670506477355957, 10.079050064086914, 10.487594604492188, 10.896138191223145, 11.304681777954102, 11.713225364685059, 12.121768951416016, 12.530313491821289]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 13.0, 12.0, 20.0, 28.0, 40.0, 64.0, 109.0, 149.0, 257.0, 480.0, 833.0, 1505.0, 3100.0, 6720.0, 15431.0, 39453.0, 108448.0, 309147.0, 354240.0, 129062.0, 46449.0, 18021.0, 7418.0, 3594.0, 1789.0, 899.0, 518.0, 287.0, 184.0, 92.0, 58.0, 44.0, 23.0, 18.0, 16.0, 14.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.113372802734375, -2.03533935546875, -1.957305908203125, -1.8792724609375, -1.801239013671875, -1.72320556640625, -1.645172119140625, -1.567138671875, -1.489105224609375, -1.41107177734375, -1.333038330078125, -1.2550048828125, -1.176971435546875, -1.09893798828125, -1.020904541015625, -0.94287109375, -0.864837646484375, -0.78680419921875, -0.708770751953125, -0.6307373046875, -0.552703857421875, -0.47467041015625, -0.396636962890625, -0.318603515625, -0.240570068359375, -0.16253662109375, -0.084503173828125, -0.0064697265625, 0.071563720703125, 0.14959716796875, 0.227630615234375, 0.3056640625, 0.383697509765625, 0.46173095703125, 0.539764404296875, 0.6177978515625, 0.695831298828125, 0.77386474609375, 0.851898193359375, 0.929931640625, 1.007965087890625, 1.08599853515625, 1.164031982421875, 1.2420654296875, 1.320098876953125, 1.39813232421875, 1.476165771484375, 1.55419921875, 1.632232666015625, 1.71026611328125, 1.788299560546875, 1.8663330078125, 1.944366455078125, 2.02239990234375, 2.100433349609375, 2.178466796875, 2.256500244140625, 2.33453369140625, 2.412567138671875, 2.4906005859375, 2.568634033203125, 2.64666748046875, 2.724700927734375, 2.802734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 9.0, 14.0, 13.0, 15.0, 27.0, 27.0, 20.0, 32.0, 42.0, 41.0, 44.0, 56.0, 49.0, 45.0, 66.0, 50.0, 61.0, 59.0, 48.0, 48.0, 44.0, 32.0, 26.0, 21.0, 22.0, 21.0, 17.0, 11.0, 13.0, 6.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4892578125, -1.4535446166992188, -1.4178314208984375, -1.3821182250976562, -1.346405029296875, -1.3106918334960938, -1.2749786376953125, -1.2392654418945312, -1.20355224609375, -1.1678390502929688, -1.1321258544921875, -1.0964126586914062, -1.060699462890625, -1.0249862670898438, -0.9892730712890625, -0.9535598754882812, -0.9178466796875, -0.8821334838867188, -0.8464202880859375, -0.8107070922851562, -0.774993896484375, -0.7392807006835938, -0.7035675048828125, -0.6678543090820312, -0.63214111328125, -0.5964279174804688, -0.5607147216796875, -0.5250015258789062, -0.489288330078125, -0.45357513427734375, -0.4178619384765625, -0.38214874267578125, -0.346435546875, -0.31072235107421875, -0.2750091552734375, -0.23929595947265625, -0.203582763671875, -0.16786956787109375, -0.1321563720703125, -0.09644317626953125, -0.06072998046875, -0.02501678466796875, 0.0106964111328125, 0.04640960693359375, 0.082122802734375, 0.11783599853515625, 0.1535491943359375, 0.18926239013671875, 0.2249755859375, 0.26068878173828125, 0.2964019775390625, 0.33211517333984375, 0.367828369140625, 0.40354156494140625, 0.4392547607421875, 0.47496795654296875, 0.51068115234375, 0.5463943481445312, 0.5821075439453125, 0.6178207397460938, 0.653533935546875, 0.6892471313476562, 0.7249603271484375, 0.7606735229492188, 0.79638671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 8.0, 10.0, 12.0, 32.0, 34.0, 37.0, 71.0, 116.0, 145.0, 242.0, 440.0, 849.0, 1995.0, 6117.0, 25868.0, 151380.0, 669992.0, 154587.0, 26290.0, 6241.0, 2074.0, 874.0, 409.0, 236.0, 148.0, 108.0, 67.0, 43.0, 26.0, 24.0, 16.0, 12.0, 10.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.1912841796875, -3.066162109375, -2.9410400390625, -2.81591796875, -2.6907958984375, -2.565673828125, -2.4405517578125, -2.3154296875, -2.1903076171875, -2.065185546875, -1.9400634765625, -1.81494140625, -1.6898193359375, -1.564697265625, -1.4395751953125, -1.314453125, -1.1893310546875, -1.064208984375, -0.9390869140625, -0.81396484375, -0.6888427734375, -0.563720703125, -0.4385986328125, -0.3134765625, -0.1883544921875, -0.063232421875, 0.0618896484375, 0.18701171875, 0.3121337890625, 0.437255859375, 0.5623779296875, 0.6875, 0.8126220703125, 0.937744140625, 1.0628662109375, 1.18798828125, 1.3131103515625, 1.438232421875, 1.5633544921875, 1.6884765625, 1.8135986328125, 1.938720703125, 2.0638427734375, 2.18896484375, 2.3140869140625, 2.439208984375, 2.5643310546875, 2.689453125, 2.8145751953125, 2.939697265625, 3.0648193359375, 3.18994140625, 3.3150634765625, 3.440185546875, 3.5653076171875, 3.6904296875, 3.8155517578125, 3.940673828125, 4.0657958984375, 4.19091796875, 4.3160400390625, 4.441162109375, 4.5662841796875, 4.69140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 14.0, 6.0, 12.0, 19.0, 18.0, 22.0, 26.0, 25.0, 32.0, 38.0, 34.0, 36.0, 34.0, 42.0, 38.0, 60.0, 42.0, 43.0, 46.0, 36.0, 39.0, 38.0, 41.0, 41.0, 25.0, 26.0, 26.0, 16.0, 22.0, 15.0, 17.0, 4.0, 15.0, 10.0, 11.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.3251953125, -3.21484375, -3.1044921875, -2.994140625, -2.8837890625, -2.7734375, -2.6630859375, -2.552734375, -2.4423828125, -2.33203125, -2.2216796875, -2.111328125, -2.0009765625, -1.890625, -1.7802734375, -1.669921875, -1.5595703125, -1.44921875, -1.3388671875, -1.228515625, -1.1181640625, -1.0078125, -0.8974609375, -0.787109375, -0.6767578125, -0.56640625, -0.4560546875, -0.345703125, -0.2353515625, -0.125, -0.0146484375, 0.095703125, 0.2060546875, 0.31640625, 0.4267578125, 0.537109375, 0.6474609375, 0.7578125, 0.8681640625, 0.978515625, 1.0888671875, 1.19921875, 1.3095703125, 1.419921875, 1.5302734375, 1.640625, 1.7509765625, 1.861328125, 1.9716796875, 2.08203125, 2.1923828125, 2.302734375, 2.4130859375, 2.5234375, 2.6337890625, 2.744140625, 2.8544921875, 2.96484375, 3.0751953125, 3.185546875, 3.2958984375, 3.40625, 3.5166015625, 3.626953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 6.0, 9.0, 16.0, 21.0, 32.0, 36.0, 55.0, 83.0, 102.0, 228.0, 416.0, 778.0, 2047.0, 6587.0, 33757.0, 419538.0, 536545.0, 37231.0, 7044.0, 2123.0, 856.0, 384.0, 230.0, 113.0, 79.0, 52.0, 43.0, 31.0, 21.0, 21.0, 15.0, 5.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0], "bins": [-2.09375, -2.0322113037109375, -1.970672607421875, -1.9091339111328125, -1.84759521484375, -1.7860565185546875, -1.724517822265625, -1.6629791259765625, -1.6014404296875, -1.5399017333984375, -1.478363037109375, -1.4168243408203125, -1.35528564453125, -1.2937469482421875, -1.232208251953125, -1.1706695556640625, -1.109130859375, -1.0475921630859375, -0.986053466796875, -0.9245147705078125, -0.86297607421875, -0.8014373779296875, -0.739898681640625, -0.6783599853515625, -0.6168212890625, -0.5552825927734375, -0.493743896484375, -0.4322052001953125, -0.37066650390625, -0.3091278076171875, -0.247589111328125, -0.1860504150390625, -0.12451171875, -0.0629730224609375, -0.001434326171875, 0.0601043701171875, 0.12164306640625, 0.1831817626953125, 0.244720458984375, 0.3062591552734375, 0.3677978515625, 0.4293365478515625, 0.490875244140625, 0.5524139404296875, 0.61395263671875, 0.6754913330078125, 0.737030029296875, 0.7985687255859375, 0.860107421875, 0.9216461181640625, 0.983184814453125, 1.0447235107421875, 1.10626220703125, 1.1678009033203125, 1.229339599609375, 1.2908782958984375, 1.3524169921875, 1.4139556884765625, 1.475494384765625, 1.5370330810546875, 1.59857177734375, 1.6601104736328125, 1.721649169921875, 1.7831878662109375, 1.8447265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 22.0, 53.0, 84.0, 185.0, 241.0, 164.0, 108.0, 51.0, 22.0, 26.0, 7.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010929107666015625, -0.001069914549589157, -0.0010469183325767517, -0.0010239221155643463, -0.001000925898551941, -0.0009779296815395355, -0.0009549334645271301, -0.0009319372475147247, -0.0009089410305023193, -0.0008859448134899139, -0.0008629485964775085, -0.0008399523794651031, -0.0008169561624526978, -0.0007939599454402924, -0.000770963728427887, -0.0007479675114154816, -0.0007249712944030762, -0.0007019750773906708, -0.0006789788603782654, -0.00065598264336586, -0.0006329864263534546, -0.0006099902093410492, -0.0005869939923286438, -0.0005639977753162384, -0.000541001558303833, -0.0005180053412914276, -0.0004950091242790222, -0.0004720129072666168, -0.0004490166902542114, -0.00042602047324180603, -0.00040302425622940063, -0.00038002803921699524, -0.00035703182220458984, -0.00033403560519218445, -0.00031103938817977905, -0.00028804317116737366, -0.00026504695415496826, -0.00024205073714256287, -0.00021905452013015747, -0.00019605830311775208, -0.00017306208610534668, -0.00015006586909294128, -0.0001270696520805359, -0.00010407343506813049, -8.10772180557251e-05, -5.80810010433197e-05, -3.508478403091431e-05, -1.2088567018508911e-05, 1.0907649993896484e-05, 3.390386700630188e-05, 5.6900084018707275e-05, 7.989630103111267e-05, 0.00010289251804351807, 0.00012588873505592346, 0.00014888495206832886, 0.00017188116908073425, 0.00019487738609313965, 0.00021787360310554504, 0.00024086982011795044, 0.00026386603713035583, 0.00028686225414276123, 0.0003098584711551666, 0.000332854688167572, 0.0003558509051799774, 0.0003788471221923828]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 17.0, 19.0, 27.0, 36.0, 53.0, 100.0, 169.0, 351.0, 790.0, 2121.0, 8610.0, 66158.0, 792662.0, 157376.0, 14823.0, 3199.0, 1045.0, 447.0, 225.0, 119.0, 64.0, 42.0, 28.0, 15.0, 8.0, 6.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.0919189453125, -2.023681640625, -1.9554443359375, -1.88720703125, -1.8189697265625, -1.750732421875, -1.6824951171875, -1.6142578125, -1.5460205078125, -1.477783203125, -1.4095458984375, -1.34130859375, -1.2730712890625, -1.204833984375, -1.1365966796875, -1.068359375, -1.0001220703125, -0.931884765625, -0.8636474609375, -0.79541015625, -0.7271728515625, -0.658935546875, -0.5906982421875, -0.5224609375, -0.4542236328125, -0.385986328125, -0.3177490234375, -0.24951171875, -0.1812744140625, -0.113037109375, -0.0447998046875, 0.0234375, 0.0916748046875, 0.159912109375, 0.2281494140625, 0.29638671875, 0.3646240234375, 0.432861328125, 0.5010986328125, 0.5693359375, 0.6375732421875, 0.705810546875, 0.7740478515625, 0.84228515625, 0.9105224609375, 0.978759765625, 1.0469970703125, 1.115234375, 1.1834716796875, 1.251708984375, 1.3199462890625, 1.38818359375, 1.4564208984375, 1.524658203125, 1.5928955078125, 1.6611328125, 1.7293701171875, 1.797607421875, 1.8658447265625, 1.93408203125, 2.0023193359375, 2.070556640625, 2.1387939453125, 2.20703125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 10.0, 13.0, 13.0, 16.0, 19.0, 21.0, 28.0, 27.0, 45.0, 45.0, 57.0, 73.0, 74.0, 67.0, 67.0, 74.0, 67.0, 53.0, 26.0, 41.0, 29.0, 24.0, 14.0, 23.0, 10.0, 7.0, 14.0, 8.0, 5.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7265625, -1.6815948486328125, -1.636627197265625, -1.5916595458984375, -1.54669189453125, -1.5017242431640625, -1.456756591796875, -1.4117889404296875, -1.3668212890625, -1.3218536376953125, -1.276885986328125, -1.2319183349609375, -1.18695068359375, -1.1419830322265625, -1.097015380859375, -1.0520477294921875, -1.007080078125, -0.9621124267578125, -0.917144775390625, -0.8721771240234375, -0.82720947265625, -0.7822418212890625, -0.737274169921875, -0.6923065185546875, -0.6473388671875, -0.6023712158203125, -0.557403564453125, -0.5124359130859375, -0.46746826171875, -0.4225006103515625, -0.377532958984375, -0.3325653076171875, -0.28759765625, -0.2426300048828125, -0.197662353515625, -0.1526947021484375, -0.10772705078125, -0.0627593994140625, -0.017791748046875, 0.0271759033203125, 0.0721435546875, 0.1171112060546875, 0.162078857421875, 0.2070465087890625, 0.25201416015625, 0.2969818115234375, 0.341949462890625, 0.3869171142578125, 0.431884765625, 0.4768524169921875, 0.521820068359375, 0.5667877197265625, 0.61175537109375, 0.6567230224609375, 0.701690673828125, 0.7466583251953125, 0.7916259765625, 0.8365936279296875, 0.881561279296875, 0.9265289306640625, 0.97149658203125, 1.0164642333984375, 1.061431884765625, 1.1063995361328125, 1.1513671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 27.0, 62.0, 138.0, 188.0, 260.0, 159.0, 78.0, 48.0, 14.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-63.306217193603516, -62.02650833129883, -60.746795654296875, -59.46708679199219, -58.1873779296875, -56.90766525268555, -55.62795639038086, -54.348243713378906, -53.06853485107422, -51.78882598876953, -50.50911331176758, -49.22940444946289, -47.9496955871582, -46.66998291015625, -45.39027404785156, -44.110565185546875, -42.83085632324219, -41.5511474609375, -40.27143478393555, -38.99172592163086, -37.71201705932617, -36.43230438232422, -35.15259552001953, -33.872886657714844, -32.59317398071289, -31.31346321105957, -30.033754348754883, -28.754043579101562, -27.474332809448242, -26.194622039794922, -24.914913177490234, -23.635202407836914, -22.355491638183594, -21.075780868530273, -19.796072006225586, -18.516361236572266, -17.236650466918945, -15.956940650939941, -14.677230834960938, -13.397520065307617, -12.117810249328613, -10.83810043334961, -9.558389663696289, -8.278679847717285, -6.998969554901123, -5.719259262084961, -4.439549446105957, -3.1598386764526367, -1.8801288604736328, -0.6004186868667603, 0.6792914867401123, 1.9590015411376953, 3.2387118339538574, 4.5184221267700195, 5.798131942749023, 7.077842712402344, 8.357552528381348, 9.637262344360352, 10.916973114013672, 12.196682929992676, 13.47639274597168, 14.756103515625, 16.035812377929688, 17.31552505493164, 18.595233917236328]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 10.0, 17.0, 24.0, 21.0, 19.0, 39.0, 33.0, 24.0, 43.0, 44.0, 51.0, 62.0, 82.0, 67.0, 60.0, 51.0, 47.0, 40.0, 51.0, 28.0, 25.0, 34.0, 24.0, 16.0, 20.0, 13.0, 13.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.01881217956543, -21.38681411743164, -20.754817962646484, -20.122821807861328, -19.49082374572754, -18.85882568359375, -18.226829528808594, -17.594833374023438, -16.96283531188965, -16.33083724975586, -15.698841094970703, -15.06684398651123, -14.434846878051758, -13.802849769592285, -13.170852661132812, -12.53885555267334, -11.906858444213867, -11.274861335754395, -10.642864227294922, -10.01086711883545, -9.378870010375977, -8.746872901916504, -8.114875793457031, -7.482878684997559, -6.850881576538086, -6.218884468078613, -5.586887359619141, -4.954890251159668, -4.322893142700195, -3.6908960342407227, -3.05889892578125, -2.4269018173217773, -1.7949066162109375, -1.1629095077514648, -0.5309123992919922, 0.10108470916748047, 0.7330818176269531, 1.3650789260864258, 1.9970760345458984, 2.629073143005371, 3.2610702514648438, 3.8930673599243164, 4.525064468383789, 5.157061576843262, 5.789058685302734, 6.421055793762207, 7.05305290222168, 7.685050010681152, 8.317047119140625, 8.949044227600098, 9.58104133605957, 10.213038444519043, 10.845035552978516, 11.477032661437988, 12.109029769897461, 12.741026878356934, 13.373023986816406, 14.005021095275879, 14.637018203735352, 15.269015312194824, 15.901012420654297, 16.533008575439453, 17.165006637573242, 17.79700469970703, 18.429000854492188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 19.0, 29.0, 48.0, 72.0, 148.0, 273.0, 556.0, 1035.0, 2658.0, 7449.0, 27200.0, 205931.0, 3347835.0, 540802.0, 43622.0, 10152.0, 3437.0, 1451.0, 709.0, 329.0, 174.0, 83.0, 68.0, 51.0, 26.0, 21.0, 24.0, 9.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.427215576171875, -2.35052490234375, -2.273834228515625, -2.1971435546875, -2.120452880859375, -2.04376220703125, -1.967071533203125, -1.890380859375, -1.813690185546875, -1.73699951171875, -1.660308837890625, -1.5836181640625, -1.506927490234375, -1.43023681640625, -1.353546142578125, -1.27685546875, -1.200164794921875, -1.12347412109375, -1.046783447265625, -0.9700927734375, -0.893402099609375, -0.81671142578125, -0.740020751953125, -0.663330078125, -0.586639404296875, -0.50994873046875, -0.433258056640625, -0.3565673828125, -0.279876708984375, -0.20318603515625, -0.126495361328125, -0.0498046875, 0.026885986328125, 0.10357666015625, 0.180267333984375, 0.2569580078125, 0.333648681640625, 0.41033935546875, 0.487030029296875, 0.563720703125, 0.640411376953125, 0.71710205078125, 0.793792724609375, 0.8704833984375, 0.947174072265625, 1.02386474609375, 1.100555419921875, 1.17724609375, 1.253936767578125, 1.33062744140625, 1.407318115234375, 1.4840087890625, 1.560699462890625, 1.63739013671875, 1.714080810546875, 1.790771484375, 1.867462158203125, 1.94415283203125, 2.020843505859375, 2.0975341796875, 2.174224853515625, 2.25091552734375, 2.327606201171875, 2.404296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 1.0, 8.0, 7.0, 6.0, 5.0, 8.0, 12.0, 14.0, 16.0, 26.0, 34.0, 33.0, 27.0, 33.0, 41.0, 32.0, 49.0, 36.0, 49.0, 44.0, 43.0, 59.0, 47.0, 52.0, 43.0, 41.0, 44.0, 28.0, 25.0, 23.0, 17.0, 21.0, 12.0, 9.0, 11.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.751953125, -0.7252273559570312, -0.6985015869140625, -0.6717758178710938, -0.645050048828125, -0.6183242797851562, -0.5915985107421875, -0.5648727416992188, -0.53814697265625, -0.5114212036132812, -0.4846954345703125, -0.45796966552734375, -0.431243896484375, -0.40451812744140625, -0.3777923583984375, -0.35106658935546875, -0.3243408203125, -0.29761505126953125, -0.2708892822265625, -0.24416351318359375, -0.217437744140625, -0.19071197509765625, -0.1639862060546875, -0.13726043701171875, -0.11053466796875, -0.08380889892578125, -0.0570831298828125, -0.03035736083984375, -0.003631591796875, 0.02309417724609375, 0.0498199462890625, 0.07654571533203125, 0.103271484375, 0.12999725341796875, 0.1567230224609375, 0.18344879150390625, 0.210174560546875, 0.23690032958984375, 0.2636260986328125, 0.29035186767578125, 0.31707763671875, 0.34380340576171875, 0.3705291748046875, 0.39725494384765625, 0.423980712890625, 0.45070648193359375, 0.4774322509765625, 0.5041580200195312, 0.5308837890625, 0.5576095581054688, 0.5843353271484375, 0.6110610961914062, 0.637786865234375, 0.6645126342773438, 0.6912384033203125, 0.7179641723632812, 0.74468994140625, 0.7714157104492188, 0.7981414794921875, 0.8248672485351562, 0.851593017578125, 0.8783187866210938, 0.9050445556640625, 0.9317703247070312, 0.95849609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 16.0, 36.0, 56.0, 96.0, 153.0, 336.0, 907.0, 2474.0, 9311.0, 52051.0, 1291483.0, 2743678.0, 75479.0, 12515.0, 3386.0, 1187.0, 508.0, 260.0, 130.0, 59.0, 47.0, 42.0, 12.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.931640625, -2.814727783203125, -2.69781494140625, -2.580902099609375, -2.4639892578125, -2.347076416015625, -2.23016357421875, -2.113250732421875, -1.996337890625, -1.879425048828125, -1.76251220703125, -1.645599365234375, -1.5286865234375, -1.411773681640625, -1.29486083984375, -1.177947998046875, -1.06103515625, -0.944122314453125, -0.82720947265625, -0.710296630859375, -0.5933837890625, -0.476470947265625, -0.35955810546875, -0.242645263671875, -0.125732421875, -0.008819580078125, 0.10809326171875, 0.225006103515625, 0.3419189453125, 0.458831787109375, 0.57574462890625, 0.692657470703125, 0.8095703125, 0.926483154296875, 1.04339599609375, 1.160308837890625, 1.2772216796875, 1.394134521484375, 1.51104736328125, 1.627960205078125, 1.744873046875, 1.861785888671875, 1.97869873046875, 2.095611572265625, 2.2125244140625, 2.329437255859375, 2.44635009765625, 2.563262939453125, 2.68017578125, 2.797088623046875, 2.91400146484375, 3.030914306640625, 3.1478271484375, 3.264739990234375, 3.38165283203125, 3.498565673828125, 3.615478515625, 3.732391357421875, 3.84930419921875, 3.966217041015625, 4.0831298828125, 4.200042724609375, 4.31695556640625, 4.433868408203125, 4.55078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 9.0, 14.0, 19.0, 25.0, 39.0, 58.0, 89.0, 154.0, 315.0, 581.0, 1119.0, 748.0, 392.0, 169.0, 94.0, 56.0, 47.0, 33.0, 26.0, 25.0, 18.0, 6.0, 4.0, 4.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.57464599609375, -2.4656982421875, -2.35675048828125, -2.247802734375, -2.13885498046875, -2.0299072265625, -1.92095947265625, -1.81201171875, -1.70306396484375, -1.5941162109375, -1.48516845703125, -1.376220703125, -1.26727294921875, -1.1583251953125, -1.04937744140625, -0.9404296875, -0.83148193359375, -0.7225341796875, -0.61358642578125, -0.504638671875, -0.39569091796875, -0.2867431640625, -0.17779541015625, -0.06884765625, 0.04010009765625, 0.1490478515625, 0.25799560546875, 0.366943359375, 0.47589111328125, 0.5848388671875, 0.69378662109375, 0.802734375, 0.91168212890625, 1.0206298828125, 1.12957763671875, 1.238525390625, 1.34747314453125, 1.4564208984375, 1.56536865234375, 1.67431640625, 1.78326416015625, 1.8922119140625, 2.00115966796875, 2.110107421875, 2.21905517578125, 2.3280029296875, 2.43695068359375, 2.5458984375, 2.65484619140625, 2.7637939453125, 2.87274169921875, 2.981689453125, 3.09063720703125, 3.1995849609375, 3.30853271484375, 3.41748046875, 3.52642822265625, 3.6353759765625, 3.74432373046875, 3.853271484375, 3.96221923828125, 4.0711669921875, 4.18011474609375, 4.2890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 35.0, 72.0, 101.0, 144.0, 190.0, 159.0, 111.0, 65.0, 25.0, 18.0, 14.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.693740844726562, -15.918699264526367, -15.143657684326172, -14.368616104125977, -13.593574523925781, -12.818532943725586, -12.04349136352539, -11.268449783325195, -10.493408203125, -9.718366622924805, -8.94332504272461, -8.168283462524414, -7.393241882324219, -6.618200302124023, -5.84315824508667, -5.068116664886475, -4.293074607849121, -3.518033027648926, -2.7429914474487305, -1.967949628829956, -1.1929080486297607, -0.41786646842956543, 0.357175350189209, 1.1322169303894043, 1.9072585105895996, 2.682300090789795, 3.4573416709899902, 4.232383728027344, 5.007425308227539, 5.782466888427734, 6.55750846862793, 7.332550048828125, 8.10759162902832, 8.882633209228516, 9.657674789428711, 10.432716369628906, 11.207757949829102, 11.982799530029297, 12.757841110229492, 13.532882690429688, 14.307924270629883, 15.082965850830078, 15.858007431030273, 16.63304901123047, 17.408090591430664, 18.18313217163086, 18.958173751831055, 19.73321533203125, 20.508258819580078, 21.283300399780273, 22.05834197998047, 22.833383560180664, 23.60842514038086, 24.383466720581055, 25.15850830078125, 25.933549880981445, 26.70859146118164, 27.483633041381836, 28.25867462158203, 29.033716201782227, 29.808757781982422, 30.583799362182617, 31.358840942382812, 32.13388442993164, 32.9089241027832]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 12.0, 13.0, 16.0, 4.0, 20.0, 25.0, 22.0, 21.0, 31.0, 33.0, 23.0, 41.0, 44.0, 46.0, 29.0, 42.0, 32.0, 58.0, 47.0, 40.0, 33.0, 38.0, 38.0, 34.0, 23.0, 27.0, 25.0, 27.0, 22.0, 17.0, 17.0, 15.0, 12.0, 14.0, 6.0, 4.0, 2.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.627767562866211, -12.270913124084473, -11.914058685302734, -11.557204246520996, -11.200349807739258, -10.84349536895752, -10.486640930175781, -10.12978744506836, -9.772932052612305, -9.416077613830566, -9.059223175048828, -8.70236873626709, -8.345514297485352, -7.988659858703613, -7.631805896759033, -7.274951457977295, -6.918097496032715, -6.561243057250977, -6.204388618469238, -5.8475341796875, -5.490679740905762, -5.133825302124023, -4.776971340179443, -4.420116901397705, -4.063262462615967, -3.7064080238342285, -3.3495535850524902, -2.992699384689331, -2.6358449459075928, -2.2789905071258545, -1.9221363067626953, -1.565281867980957, -1.2084274291992188, -0.8515730500221252, -0.49471867084503174, -0.137864351272583, 0.21899008750915527, 0.5758445262908936, 0.9326987266540527, 1.289553165435791, 1.6464076042175293, 2.0032620429992676, 2.360116481781006, 2.716970682144165, 3.0738251209259033, 3.4306795597076416, 3.787533760070801, 4.144388198852539, 4.501242637634277, 4.858097076416016, 5.214951515197754, 5.571805953979492, 5.9286603927612305, 6.285514831542969, 6.642368793487549, 6.999223232269287, 7.356077671051025, 7.712932109832764, 8.069786071777344, 8.426640510559082, 8.78349494934082, 9.140349388122559, 9.497203826904297, 9.854058265686035, 10.210912704467773]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 12.0, 12.0, 20.0, 21.0, 21.0, 49.0, 82.0, 110.0, 207.0, 311.0, 517.0, 908.0, 1468.0, 2894.0, 5469.0, 11133.0, 24019.0, 52738.0, 116123.0, 236343.0, 286601.0, 166245.0, 76529.0, 34615.0, 15637.0, 7682.0, 3813.0, 2000.0, 1167.0, 673.0, 409.0, 238.0, 139.0, 88.0, 65.0, 58.0, 25.0, 27.0, 20.0, 16.0, 2.0, 9.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6767578125, -1.6247406005859375, -1.572723388671875, -1.5207061767578125, -1.46868896484375, -1.4166717529296875, -1.364654541015625, -1.3126373291015625, -1.2606201171875, -1.2086029052734375, -1.156585693359375, -1.1045684814453125, -1.05255126953125, -1.0005340576171875, -0.948516845703125, -0.8964996337890625, -0.844482421875, -0.7924652099609375, -0.740447998046875, -0.6884307861328125, -0.63641357421875, -0.5843963623046875, -0.532379150390625, -0.4803619384765625, -0.4283447265625, -0.3763275146484375, -0.324310302734375, -0.2722930908203125, -0.22027587890625, -0.1682586669921875, -0.116241455078125, -0.0642242431640625, -0.01220703125, 0.0398101806640625, 0.091827392578125, 0.1438446044921875, 0.19586181640625, 0.2478790283203125, 0.299896240234375, 0.3519134521484375, 0.4039306640625, 0.4559478759765625, 0.507965087890625, 0.5599822998046875, 0.61199951171875, 0.6640167236328125, 0.716033935546875, 0.7680511474609375, 0.820068359375, 0.8720855712890625, 0.924102783203125, 0.9761199951171875, 1.02813720703125, 1.0801544189453125, 1.132171630859375, 1.1841888427734375, 1.2362060546875, 1.2882232666015625, 1.340240478515625, 1.3922576904296875, 1.44427490234375, 1.4962921142578125, 1.548309326171875, 1.6003265380859375, 1.65234375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 1.0, 8.0, 2.0, 14.0, 11.0, 13.0, 11.0, 19.0, 18.0, 17.0, 20.0, 27.0, 29.0, 30.0, 28.0, 39.0, 37.0, 39.0, 34.0, 47.0, 39.0, 38.0, 57.0, 33.0, 51.0, 30.0, 34.0, 35.0, 36.0, 26.0, 26.0, 20.0, 21.0, 23.0, 15.0, 19.0, 7.0, 8.0, 14.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.71240234375, -0.6879043579101562, -0.6634063720703125, -0.6389083862304688, -0.614410400390625, -0.5899124145507812, -0.5654144287109375, -0.5409164428710938, -0.51641845703125, -0.49192047119140625, -0.4674224853515625, -0.44292449951171875, -0.418426513671875, -0.39392852783203125, -0.3694305419921875, -0.34493255615234375, -0.3204345703125, -0.29593658447265625, -0.2714385986328125, -0.24694061279296875, -0.222442626953125, -0.19794464111328125, -0.1734466552734375, -0.14894866943359375, -0.12445068359375, -0.09995269775390625, -0.0754547119140625, -0.05095672607421875, -0.026458740234375, -0.00196075439453125, 0.0225372314453125, 0.04703521728515625, 0.071533203125, 0.09603118896484375, 0.1205291748046875, 0.14502716064453125, 0.169525146484375, 0.19402313232421875, 0.2185211181640625, 0.24301910400390625, 0.26751708984375, 0.29201507568359375, 0.3165130615234375, 0.34101104736328125, 0.365509033203125, 0.39000701904296875, 0.4145050048828125, 0.43900299072265625, 0.4635009765625, 0.48799896240234375, 0.5124969482421875, 0.5369949340820312, 0.561492919921875, 0.5859909057617188, 0.6104888916015625, 0.6349868774414062, 0.65948486328125, 0.6839828491210938, 0.7084808349609375, 0.7329788208007812, 0.757476806640625, 0.7819747924804688, 0.8064727783203125, 0.8309707641601562, 0.85546875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 9.0, 7.0, 16.0, 27.0, 26.0, 38.0, 53.0, 77.0, 120.0, 189.0, 290.0, 406.0, 662.0, 1152.0, 1982.0, 5218.0, 19397.0, 128252.0, 694499.0, 161507.0, 23405.0, 5797.0, 2322.0, 1125.0, 674.0, 434.0, 257.0, 204.0, 116.0, 79.0, 52.0, 57.0, 29.0, 12.0, 20.0, 7.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.353515625, -3.24005126953125, -3.1265869140625, -3.01312255859375, -2.899658203125, -2.78619384765625, -2.6727294921875, -2.55926513671875, -2.44580078125, -2.33233642578125, -2.2188720703125, -2.10540771484375, -1.991943359375, -1.87847900390625, -1.7650146484375, -1.65155029296875, -1.5380859375, -1.42462158203125, -1.3111572265625, -1.19769287109375, -1.084228515625, -0.97076416015625, -0.8572998046875, -0.74383544921875, -0.63037109375, -0.51690673828125, -0.4034423828125, -0.28997802734375, -0.176513671875, -0.06304931640625, 0.0504150390625, 0.16387939453125, 0.27734375, 0.39080810546875, 0.5042724609375, 0.61773681640625, 0.731201171875, 0.84466552734375, 0.9581298828125, 1.07159423828125, 1.18505859375, 1.29852294921875, 1.4119873046875, 1.52545166015625, 1.638916015625, 1.75238037109375, 1.8658447265625, 1.97930908203125, 2.0927734375, 2.20623779296875, 2.3197021484375, 2.43316650390625, 2.546630859375, 2.66009521484375, 2.7735595703125, 2.88702392578125, 3.00048828125, 3.11395263671875, 3.2274169921875, 3.34088134765625, 3.454345703125, 3.56781005859375, 3.6812744140625, 3.79473876953125, 3.908203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 5.0, 9.0, 14.0, 14.0, 19.0, 19.0, 29.0, 34.0, 22.0, 33.0, 56.0, 39.0, 39.0, 49.0, 43.0, 50.0, 44.0, 50.0, 42.0, 56.0, 48.0, 40.0, 29.0, 32.0, 39.0, 29.0, 22.0, 17.0, 15.0, 11.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.84490966796875, -3.7249755859375, -3.60504150390625, -3.485107421875, -3.36517333984375, -3.2452392578125, -3.12530517578125, -3.00537109375, -2.88543701171875, -2.7655029296875, -2.64556884765625, -2.525634765625, -2.40570068359375, -2.2857666015625, -2.16583251953125, -2.0458984375, -1.92596435546875, -1.8060302734375, -1.68609619140625, -1.566162109375, -1.44622802734375, -1.3262939453125, -1.20635986328125, -1.08642578125, -0.96649169921875, -0.8465576171875, -0.72662353515625, -0.606689453125, -0.48675537109375, -0.3668212890625, -0.24688720703125, -0.126953125, -0.00701904296875, 0.1129150390625, 0.23284912109375, 0.352783203125, 0.47271728515625, 0.5926513671875, 0.71258544921875, 0.83251953125, 0.95245361328125, 1.0723876953125, 1.19232177734375, 1.312255859375, 1.43218994140625, 1.5521240234375, 1.67205810546875, 1.7919921875, 1.91192626953125, 2.0318603515625, 2.15179443359375, 2.271728515625, 2.39166259765625, 2.5115966796875, 2.63153076171875, 2.75146484375, 2.87139892578125, 2.9913330078125, 3.11126708984375, 3.231201171875, 3.35113525390625, 3.4710693359375, 3.59100341796875, 3.7109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 13.0, 10.0, 14.0, 17.0, 27.0, 35.0, 67.0, 105.0, 159.0, 231.0, 439.0, 927.0, 2297.0, 7670.0, 46329.0, 696454.0, 261447.0, 23988.0, 5026.0, 1614.0, 721.0, 345.0, 205.0, 132.0, 75.0, 41.0, 43.0, 28.0, 21.0, 15.0, 11.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.38671875, -1.3417510986328125, -1.296783447265625, -1.2518157958984375, -1.20684814453125, -1.1618804931640625, -1.116912841796875, -1.0719451904296875, -1.0269775390625, -0.9820098876953125, -0.937042236328125, -0.8920745849609375, -0.84710693359375, -0.8021392822265625, -0.757171630859375, -0.7122039794921875, -0.667236328125, -0.6222686767578125, -0.577301025390625, -0.5323333740234375, -0.48736572265625, -0.4423980712890625, -0.397430419921875, -0.3524627685546875, -0.3074951171875, -0.2625274658203125, -0.217559814453125, -0.1725921630859375, -0.12762451171875, -0.0826568603515625, -0.037689208984375, 0.0072784423828125, 0.05224609375, 0.0972137451171875, 0.142181396484375, 0.1871490478515625, 0.23211669921875, 0.2770843505859375, 0.322052001953125, 0.3670196533203125, 0.4119873046875, 0.4569549560546875, 0.501922607421875, 0.5468902587890625, 0.59185791015625, 0.6368255615234375, 0.681793212890625, 0.7267608642578125, 0.771728515625, 0.8166961669921875, 0.861663818359375, 0.9066314697265625, 0.95159912109375, 0.9965667724609375, 1.041534423828125, 1.0865020751953125, 1.1314697265625, 1.1764373779296875, 1.221405029296875, 1.2663726806640625, 1.31134033203125, 1.3563079833984375, 1.401275634765625, 1.4462432861328125, 1.4912109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 2.0, 7.0, 6.0, 7.0, 17.0, 20.0, 32.0, 40.0, 41.0, 60.0, 83.0, 106.0, 117.0, 105.0, 61.0, 52.0, 49.0, 33.0, 36.0, 21.0, 17.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002772808074951172, -0.0002675391733646393, -0.0002577975392341614, -0.00024805590510368347, -0.00023831427097320557, -0.00022857263684272766, -0.00021883100271224976, -0.00020908936858177185, -0.00019934773445129395, -0.00018960610032081604, -0.00017986446619033813, -0.00017012283205986023, -0.00016038119792938232, -0.00015063956379890442, -0.00014089792966842651, -0.0001311562955379486, -0.0001214146614074707, -0.0001116730272769928, -0.00010193139314651489, -9.218975901603699e-05, -8.244812488555908e-05, -7.270649075508118e-05, -6.296485662460327e-05, -5.3223222494125366e-05, -4.348158836364746e-05, -3.3739954233169556e-05, -2.399832010269165e-05, -1.4256685972213745e-05, -4.51505184173584e-06, 5.2265822887420654e-06, 1.496821641921997e-05, 2.4709850549697876e-05, 3.445148468017578e-05, 4.4193118810653687e-05, 5.393475294113159e-05, 6.36763870716095e-05, 7.34180212020874e-05, 8.315965533256531e-05, 9.290128946304321e-05, 0.00010264292359352112, 0.00011238455772399902, 0.00012212619185447693, 0.00013186782598495483, 0.00014160946011543274, 0.00015135109424591064, 0.00016109272837638855, 0.00017083436250686646, 0.00018057599663734436, 0.00019031763076782227, 0.00020005926489830017, 0.00020980089902877808, 0.00021954253315925598, 0.0002292841672897339, 0.0002390258014202118, 0.0002487674355506897, 0.0002585090696811676, 0.0002682507038116455, 0.0002779923379421234, 0.0002877339720726013, 0.0002974756062030792, 0.00030721724033355713, 0.00031695887446403503, 0.00032670050859451294, 0.00033644214272499084, 0.00034618377685546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 1.0, 11.0, 15.0, 11.0, 22.0, 35.0, 59.0, 101.0, 143.0, 279.0, 567.0, 1213.0, 3177.0, 11756.0, 75860.0, 794797.0, 136183.0, 17095.0, 4326.0, 1437.0, 663.0, 312.0, 161.0, 103.0, 57.0, 41.0, 45.0, 22.0, 11.0, 14.0, 9.0, 4.0, 2.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5009765625, -1.4549560546875, -1.408935546875, -1.3629150390625, -1.31689453125, -1.2708740234375, -1.224853515625, -1.1788330078125, -1.1328125, -1.0867919921875, -1.040771484375, -0.9947509765625, -0.94873046875, -0.9027099609375, -0.856689453125, -0.8106689453125, -0.7646484375, -0.7186279296875, -0.672607421875, -0.6265869140625, -0.58056640625, -0.5345458984375, -0.488525390625, -0.4425048828125, -0.396484375, -0.3504638671875, -0.304443359375, -0.2584228515625, -0.21240234375, -0.1663818359375, -0.120361328125, -0.0743408203125, -0.0283203125, 0.0177001953125, 0.063720703125, 0.1097412109375, 0.15576171875, 0.2017822265625, 0.247802734375, 0.2938232421875, 0.33984375, 0.3858642578125, 0.431884765625, 0.4779052734375, 0.52392578125, 0.5699462890625, 0.615966796875, 0.6619873046875, 0.7080078125, 0.7540283203125, 0.800048828125, 0.8460693359375, 0.89208984375, 0.9381103515625, 0.984130859375, 1.0301513671875, 1.076171875, 1.1221923828125, 1.168212890625, 1.2142333984375, 1.26025390625, 1.3062744140625, 1.352294921875, 1.3983154296875, 1.4443359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 11.0, 9.0, 6.0, 13.0, 19.0, 27.0, 19.0, 37.0, 48.0, 64.0, 74.0, 83.0, 85.0, 82.0, 70.0, 64.0, 69.0, 43.0, 36.0, 30.0, 22.0, 18.0, 13.0, 11.0, 5.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0528717041015625, -1.014923095703125, -0.9769744873046875, -0.93902587890625, -0.9010772705078125, -0.863128662109375, -0.8251800537109375, -0.7872314453125, -0.7492828369140625, -0.711334228515625, -0.6733856201171875, -0.63543701171875, -0.5974884033203125, -0.559539794921875, -0.5215911865234375, -0.483642578125, -0.4456939697265625, -0.407745361328125, -0.3697967529296875, -0.33184814453125, -0.2938995361328125, -0.255950927734375, -0.2180023193359375, -0.1800537109375, -0.1421051025390625, -0.104156494140625, -0.0662078857421875, -0.02825927734375, 0.0096893310546875, 0.047637939453125, 0.0855865478515625, 0.12353515625, 0.1614837646484375, 0.199432373046875, 0.2373809814453125, 0.27532958984375, 0.3132781982421875, 0.351226806640625, 0.3891754150390625, 0.4271240234375, 0.4650726318359375, 0.503021240234375, 0.5409698486328125, 0.57891845703125, 0.6168670654296875, 0.654815673828125, 0.6927642822265625, 0.730712890625, 0.7686614990234375, 0.806610107421875, 0.8445587158203125, 0.88250732421875, 0.9204559326171875, 0.958404541015625, 0.9963531494140625, 1.0343017578125, 1.0722503662109375, 1.110198974609375, 1.1481475830078125, 1.18609619140625, 1.2240447998046875, 1.261993408203125, 1.2999420166015625, 1.337890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 13.0, 14.0, 20.0, 48.0, 104.0, 144.0, 289.0, 174.0, 103.0, 41.0, 22.0, 7.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.962188720703125, -45.99844741821289, -45.034706115722656, -44.07096481323242, -43.10722351074219, -42.14348220825195, -41.17974090576172, -40.215999603271484, -39.25225830078125, -38.288516998291016, -37.32477569580078, -36.36103439331055, -35.39729309082031, -34.43355178833008, -33.469810485839844, -32.50606918334961, -31.542325973510742, -30.578584671020508, -29.614843368530273, -28.65110206604004, -27.687360763549805, -26.72361946105957, -25.759876251220703, -24.79613494873047, -23.832393646240234, -22.86865234375, -21.904911041259766, -20.94116973876953, -19.977428436279297, -19.013687133789062, -18.049945831298828, -17.086204528808594, -16.12246322631836, -15.158721923828125, -14.19498062133789, -13.231239318847656, -12.267498016357422, -11.303756713867188, -10.340014457702637, -9.376273155212402, -8.412530899047852, -7.448789596557617, -6.485048294067383, -5.52130651473999, -4.557565212249756, -3.5938239097595215, -2.630082130432129, -1.6663408279418945, -0.7025995254516602, 0.26114189624786377, 1.2248833179473877, 2.188624858856201, 3.1523661613464355, 4.11610746383667, 5.0798492431640625, 6.043590545654297, 7.007331848144531, 7.971073150634766, 8.934814453125, 9.898555755615234, 10.862297058105469, 11.826038360595703, 12.789780616760254, 13.753521919250488, 14.717263221740723]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 14.0, 7.0, 11.0, 9.0, 16.0, 11.0, 16.0, 19.0, 20.0, 35.0, 33.0, 27.0, 25.0, 30.0, 29.0, 36.0, 59.0, 61.0, 56.0, 61.0, 44.0, 44.0, 36.0, 35.0, 20.0, 26.0, 17.0, 15.0, 27.0, 24.0, 18.0, 19.0, 13.0, 8.0, 15.0, 13.0, 8.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.562311172485352, -12.178360939025879, -11.794410705566406, -11.410460472106934, -11.026510238647461, -10.642560005187988, -10.258609771728516, -9.874659538269043, -9.49070930480957, -9.106759071350098, -8.722808837890625, -8.338858604431152, -7.95490837097168, -7.570958137512207, -7.187007904052734, -6.803057670593262, -6.419106960296631, -6.035156726837158, -5.6512064933776855, -5.267256259918213, -4.88330602645874, -4.499355792999268, -4.115405082702637, -3.731455087661743, -3.3475048542022705, -2.963554620742798, -2.579604387283325, -2.1956539154052734, -1.8117038011550903, -1.4277535676956177, -1.0438032150268555, -0.6598529815673828, -0.27590274810791016, 0.10804751515388489, 0.49199777841567993, 0.8759480714797974, 1.25989830493927, 1.6438485383987427, 2.027798891067505, 2.4117491245269775, 2.79569935798645, 3.179649591445923, 3.5635998249053955, 3.9475502967834473, 4.33150053024292, 4.715450763702393, 5.099400997161865, 5.483351230621338, 5.8673014640808105, 6.251251697540283, 6.635201930999756, 7.0191521644592285, 7.403102397918701, 7.787052631378174, 8.171003341674805, 8.554953575134277, 8.93890380859375, 9.322854042053223, 9.706804275512695, 10.090754508972168, 10.47470474243164, 10.858654975891113, 11.242605209350586, 11.626555442810059, 12.010505676269531]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 15.0, 14.0, 28.0, 41.0, 81.0, 153.0, 329.0, 851.0, 2652.0, 10321.0, 74766.0, 2342433.0, 1694089.0, 56230.0, 8657.0, 2180.0, 752.0, 295.0, 172.0, 83.0, 39.0, 32.0, 17.0, 11.0, 9.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.37109375, -2.29913330078125, -2.2271728515625, -2.15521240234375, -2.083251953125, -2.01129150390625, -1.9393310546875, -1.86737060546875, -1.79541015625, -1.72344970703125, -1.6514892578125, -1.57952880859375, -1.507568359375, -1.43560791015625, -1.3636474609375, -1.29168701171875, -1.2197265625, -1.14776611328125, -1.0758056640625, -1.00384521484375, -0.931884765625, -0.85992431640625, -0.7879638671875, -0.71600341796875, -0.64404296875, -0.57208251953125, -0.5001220703125, -0.42816162109375, -0.356201171875, -0.28424072265625, -0.2122802734375, -0.14031982421875, -0.068359375, 0.00360107421875, 0.0755615234375, 0.14752197265625, 0.219482421875, 0.29144287109375, 0.3634033203125, 0.43536376953125, 0.50732421875, 0.57928466796875, 0.6512451171875, 0.72320556640625, 0.795166015625, 0.86712646484375, 0.9390869140625, 1.01104736328125, 1.0830078125, 1.15496826171875, 1.2269287109375, 1.29888916015625, 1.370849609375, 1.44281005859375, 1.5147705078125, 1.58673095703125, 1.65869140625, 1.73065185546875, 1.8026123046875, 1.87457275390625, 1.946533203125, 2.01849365234375, 2.0904541015625, 2.16241455078125, 2.234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 6.0, 11.0, 7.0, 17.0, 22.0, 12.0, 22.0, 24.0, 23.0, 34.0, 24.0, 22.0, 44.0, 37.0, 43.0, 42.0, 50.0, 47.0, 45.0, 54.0, 46.0, 47.0, 44.0, 43.0, 34.0, 30.0, 26.0, 24.0, 23.0, 14.0, 18.0, 13.0, 3.0, 12.0, 8.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6340484619140625, -0.608428955078125, -0.5828094482421875, -0.55718994140625, -0.5315704345703125, -0.505950927734375, -0.4803314208984375, -0.4547119140625, -0.4290924072265625, -0.403472900390625, -0.3778533935546875, -0.35223388671875, -0.3266143798828125, -0.300994873046875, -0.2753753662109375, -0.249755859375, -0.2241363525390625, -0.198516845703125, -0.1728973388671875, -0.14727783203125, -0.1216583251953125, -0.096038818359375, -0.0704193115234375, -0.0447998046875, -0.0191802978515625, 0.006439208984375, 0.0320587158203125, 0.05767822265625, 0.0832977294921875, 0.108917236328125, 0.1345367431640625, 0.16015625, 0.1857757568359375, 0.211395263671875, 0.2370147705078125, 0.26263427734375, 0.2882537841796875, 0.313873291015625, 0.3394927978515625, 0.3651123046875, 0.3907318115234375, 0.416351318359375, 0.4419708251953125, 0.46759033203125, 0.4932098388671875, 0.518829345703125, 0.5444488525390625, 0.570068359375, 0.5956878662109375, 0.621307373046875, 0.6469268798828125, 0.67254638671875, 0.6981658935546875, 0.723785400390625, 0.7494049072265625, 0.7750244140625, 0.8006439208984375, 0.826263427734375, 0.8518829345703125, 0.87750244140625, 0.9031219482421875, 0.928741455078125, 0.9543609619140625, 0.97998046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 6.0, 7.0, 8.0, 12.0, 15.0, 17.0, 37.0, 41.0, 83.0, 113.0, 159.0, 264.0, 481.0, 866.0, 1867.0, 4564.0, 13227.0, 47800.0, 304618.0, 3287082.0, 446566.0, 60656.0, 15962.0, 5310.0, 2187.0, 978.0, 483.0, 280.0, 163.0, 106.0, 76.0, 58.0, 42.0, 43.0, 22.0, 27.0, 16.0, 13.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8056640625, -1.7465972900390625, -1.687530517578125, -1.6284637451171875, -1.56939697265625, -1.5103302001953125, -1.451263427734375, -1.3921966552734375, -1.3331298828125, -1.2740631103515625, -1.214996337890625, -1.1559295654296875, -1.09686279296875, -1.0377960205078125, -0.978729248046875, -0.9196624755859375, -0.860595703125, -0.8015289306640625, -0.742462158203125, -0.6833953857421875, -0.62432861328125, -0.5652618408203125, -0.506195068359375, -0.4471282958984375, -0.3880615234375, -0.3289947509765625, -0.269927978515625, -0.2108612060546875, -0.15179443359375, -0.0927276611328125, -0.033660888671875, 0.0254058837890625, 0.08447265625, 0.1435394287109375, 0.202606201171875, 0.2616729736328125, 0.32073974609375, 0.3798065185546875, 0.438873291015625, 0.4979400634765625, 0.5570068359375, 0.6160736083984375, 0.675140380859375, 0.7342071533203125, 0.79327392578125, 0.8523406982421875, 0.911407470703125, 0.9704742431640625, 1.029541015625, 1.0886077880859375, 1.147674560546875, 1.2067413330078125, 1.26580810546875, 1.3248748779296875, 1.383941650390625, 1.4430084228515625, 1.5020751953125, 1.5611419677734375, 1.620208740234375, 1.6792755126953125, 1.73834228515625, 1.7974090576171875, 1.856475830078125, 1.9155426025390625, 1.974609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 6.0, 7.0, 8.0, 16.0, 13.0, 9.0, 21.0, 33.0, 29.0, 48.0, 77.0, 76.0, 140.0, 225.0, 357.0, 570.0, 686.0, 568.0, 371.0, 249.0, 146.0, 102.0, 78.0, 40.0, 31.0, 37.0, 23.0, 23.0, 14.0, 14.0, 10.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.9130859375, -1.8578033447265625, -1.802520751953125, -1.7472381591796875, -1.69195556640625, -1.6366729736328125, -1.581390380859375, -1.5261077880859375, -1.4708251953125, -1.4155426025390625, -1.360260009765625, -1.3049774169921875, -1.24969482421875, -1.1944122314453125, -1.139129638671875, -1.0838470458984375, -1.028564453125, -0.9732818603515625, -0.917999267578125, -0.8627166748046875, -0.80743408203125, -0.7521514892578125, -0.696868896484375, -0.6415863037109375, -0.5863037109375, -0.5310211181640625, -0.475738525390625, -0.4204559326171875, -0.36517333984375, -0.3098907470703125, -0.254608154296875, -0.1993255615234375, -0.14404296875, -0.0887603759765625, -0.033477783203125, 0.0218048095703125, 0.07708740234375, 0.1323699951171875, 0.187652587890625, 0.2429351806640625, 0.2982177734375, 0.3535003662109375, 0.408782958984375, 0.4640655517578125, 0.51934814453125, 0.5746307373046875, 0.629913330078125, 0.6851959228515625, 0.740478515625, 0.7957611083984375, 0.851043701171875, 0.9063262939453125, 0.96160888671875, 1.0168914794921875, 1.072174072265625, 1.1274566650390625, 1.1827392578125, 1.2380218505859375, 1.293304443359375, 1.3485870361328125, 1.40386962890625, 1.4591522216796875, 1.514434814453125, 1.5697174072265625, 1.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 12.0, 40.0, 95.0, 236.0, 318.0, 186.0, 64.0, 25.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.70520782470703, -16.62074089050293, -15.536274909973145, -14.45180892944336, -13.367341995239258, -12.282876014709473, -11.198410034179688, -10.113943099975586, -9.0294771194458, -7.945010662078857, -6.860544204711914, -5.776078224182129, -4.6916117668151855, -3.607145309448242, -2.522679328918457, -1.4382128715515137, -0.3537464141845703, 0.7307199239730835, 1.8151862621307373, 2.8996524810791016, 3.984118938446045, 5.068585395812988, 6.153051376342773, 7.237517833709717, 8.32198429107666, 9.406450271606445, 10.490917205810547, 11.575383186340332, 12.659849166870117, 13.744316101074219, 14.828782081604004, 15.913248062133789, 16.99771499633789, 18.082181930541992, 19.16664695739746, 20.251113891601562, 21.335580825805664, 22.420047760009766, 23.504512786865234, 24.588979721069336, 25.673446655273438, 26.75791358947754, 27.842378616333008, 28.92684555053711, 30.01131248474121, 31.095779418945312, 32.18024444580078, 33.26470947265625, 34.34917449951172, 35.43363952636719, 36.51810836791992, 37.60257339477539, 38.68703842163086, 39.771507263183594, 40.85597229003906, 41.94043731689453, 43.024906158447266, 44.109371185302734, 45.19384002685547, 46.27830505371094, 47.362770080566406, 48.44723892211914, 49.53170394897461, 50.61616897583008, 51.70063781738281]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 12.0, 12.0, 9.0, 5.0, 11.0, 18.0, 20.0, 20.0, 28.0, 32.0, 33.0, 45.0, 40.0, 44.0, 37.0, 51.0, 65.0, 63.0, 47.0, 50.0, 46.0, 50.0, 36.0, 40.0, 27.0, 37.0, 24.0, 15.0, 12.0, 12.0, 13.0, 15.0, 14.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.922636032104492, -11.611213684082031, -11.299790382385254, -10.988368034362793, -10.676944732666016, -10.365522384643555, -10.054099082946777, -9.742676734924316, -9.431253433227539, -9.119831085205078, -8.8084077835083, -8.49698543548584, -8.185562133789062, -7.874139785766602, -7.562716960906982, -7.251294136047363, -6.939871788024902, -6.628448963165283, -6.317026138305664, -6.005603313446045, -5.694180488586426, -5.382758140563965, -5.071335315704346, -4.759912490844727, -4.448489665985107, -4.137066841125488, -3.825644016265869, -3.514221429824829, -3.20279860496521, -2.891375780105591, -2.579953193664551, -2.2685303688049316, -1.9571075439453125, -1.6456847190856934, -1.3342620134353638, -1.0228393077850342, -0.711416482925415, -0.3999936580657959, -0.08857095241546631, 0.22285175323486328, 0.5342745780944824, 0.8456973433494568, 1.1571201086044312, 1.4685428142547607, 1.7799656391143799, 2.091388463973999, 2.402811050415039, 2.714233875274658, 3.0256567001342773, 3.3370795249938965, 3.6485023498535156, 3.9599249362945557, 4.271347999572754, 4.582770347595215, 4.894193172454834, 5.205615997314453, 5.517038822174072, 5.828461647033691, 6.1398844718933105, 6.45130729675293, 6.762729644775391, 7.074152946472168, 7.385575294494629, 7.696998119354248, 8.008420944213867]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 12.0, 30.0, 26.0, 46.0, 81.0, 150.0, 190.0, 330.0, 497.0, 997.0, 1807.0, 3472.0, 7143.0, 15250.0, 34097.0, 80273.0, 192433.0, 333833.0, 216301.0, 90162.0, 38189.0, 17015.0, 7787.0, 3809.0, 1974.0, 1061.0, 599.0, 356.0, 203.0, 148.0, 85.0, 55.0, 28.0, 35.0, 23.0, 14.0, 9.0, 2.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.3495941162109375, -1.298797607421875, -1.2480010986328125, -1.19720458984375, -1.1464080810546875, -1.095611572265625, -1.0448150634765625, -0.9940185546875, -0.9432220458984375, -0.892425537109375, -0.8416290283203125, -0.79083251953125, -0.7400360107421875, -0.689239501953125, -0.6384429931640625, -0.587646484375, -0.5368499755859375, -0.486053466796875, -0.4352569580078125, -0.38446044921875, -0.3336639404296875, -0.282867431640625, -0.2320709228515625, -0.1812744140625, -0.1304779052734375, -0.079681396484375, -0.0288848876953125, 0.02191162109375, 0.0727081298828125, 0.123504638671875, 0.1743011474609375, 0.22509765625, 0.2758941650390625, 0.326690673828125, 0.3774871826171875, 0.42828369140625, 0.4790802001953125, 0.529876708984375, 0.5806732177734375, 0.6314697265625, 0.6822662353515625, 0.733062744140625, 0.7838592529296875, 0.83465576171875, 0.8854522705078125, 0.936248779296875, 0.9870452880859375, 1.037841796875, 1.0886383056640625, 1.139434814453125, 1.1902313232421875, 1.24102783203125, 1.2918243408203125, 1.342620849609375, 1.3934173583984375, 1.4442138671875, 1.4950103759765625, 1.545806884765625, 1.5966033935546875, 1.64739990234375, 1.6981964111328125, 1.748992919921875, 1.7997894287109375, 1.8505859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 0.0, 7.0, 5.0, 6.0, 13.0, 8.0, 14.0, 12.0, 10.0, 21.0, 18.0, 21.0, 22.0, 27.0, 25.0, 27.0, 36.0, 36.0, 43.0, 36.0, 26.0, 43.0, 35.0, 38.0, 46.0, 41.0, 56.0, 33.0, 36.0, 27.0, 22.0, 22.0, 28.0, 27.0, 31.0, 15.0, 17.0, 11.0, 8.0, 10.0, 11.0, 3.0, 4.0, 5.0, 4.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.6923828125, -0.6698760986328125, -0.647369384765625, -0.6248626708984375, -0.60235595703125, -0.5798492431640625, -0.557342529296875, -0.5348358154296875, -0.5123291015625, -0.4898223876953125, -0.467315673828125, -0.4448089599609375, -0.42230224609375, -0.3997955322265625, -0.377288818359375, -0.3547821044921875, -0.332275390625, -0.3097686767578125, -0.287261962890625, -0.2647552490234375, -0.24224853515625, -0.2197418212890625, -0.197235107421875, -0.1747283935546875, -0.1522216796875, -0.1297149658203125, -0.107208251953125, -0.0847015380859375, -0.06219482421875, -0.0396881103515625, -0.017181396484375, 0.0053253173828125, 0.02783203125, 0.0503387451171875, 0.072845458984375, 0.0953521728515625, 0.11785888671875, 0.1403656005859375, 0.162872314453125, 0.1853790283203125, 0.2078857421875, 0.2303924560546875, 0.252899169921875, 0.2754058837890625, 0.29791259765625, 0.3204193115234375, 0.342926025390625, 0.3654327392578125, 0.387939453125, 0.4104461669921875, 0.432952880859375, 0.4554595947265625, 0.47796630859375, 0.5004730224609375, 0.522979736328125, 0.5454864501953125, 0.5679931640625, 0.5904998779296875, 0.613006591796875, 0.6355133056640625, 0.65802001953125, 0.6805267333984375, 0.703033447265625, 0.7255401611328125, 0.748046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 22.0, 24.0, 37.0, 58.0, 79.0, 108.0, 151.0, 251.0, 412.0, 661.0, 1196.0, 2426.0, 6943.0, 32041.0, 217883.0, 668347.0, 93325.0, 15976.0, 4368.0, 1755.0, 928.0, 529.0, 331.0, 223.0, 134.0, 94.0, 86.0, 44.0, 31.0, 20.0, 10.0, 9.0, 12.0, 10.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.157806396484375, -3.04998779296875, -2.942169189453125, -2.8343505859375, -2.726531982421875, -2.61871337890625, -2.510894775390625, -2.403076171875, -2.295257568359375, -2.18743896484375, -2.079620361328125, -1.9718017578125, -1.863983154296875, -1.75616455078125, -1.648345947265625, -1.54052734375, -1.432708740234375, -1.32489013671875, -1.217071533203125, -1.1092529296875, -1.001434326171875, -0.89361572265625, -0.785797119140625, -0.677978515625, -0.570159912109375, -0.46234130859375, -0.354522705078125, -0.2467041015625, -0.138885498046875, -0.03106689453125, 0.076751708984375, 0.1845703125, 0.292388916015625, 0.40020751953125, 0.508026123046875, 0.6158447265625, 0.723663330078125, 0.83148193359375, 0.939300537109375, 1.047119140625, 1.154937744140625, 1.26275634765625, 1.370574951171875, 1.4783935546875, 1.586212158203125, 1.69403076171875, 1.801849365234375, 1.90966796875, 2.017486572265625, 2.12530517578125, 2.233123779296875, 2.3409423828125, 2.448760986328125, 2.55657958984375, 2.664398193359375, 2.772216796875, 2.880035400390625, 2.98785400390625, 3.095672607421875, 3.2034912109375, 3.311309814453125, 3.41912841796875, 3.526947021484375, 3.634765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 6.0, 17.0, 12.0, 14.0, 24.0, 30.0, 36.0, 34.0, 41.0, 42.0, 57.0, 60.0, 55.0, 69.0, 56.0, 57.0, 54.0, 40.0, 47.0, 44.0, 34.0, 33.0, 23.0, 24.0, 25.0, 18.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.3321533203125, -4.207275390625, -4.0823974609375, -3.95751953125, -3.8326416015625, -3.707763671875, -3.5828857421875, -3.4580078125, -3.3331298828125, -3.208251953125, -3.0833740234375, -2.95849609375, -2.8336181640625, -2.708740234375, -2.5838623046875, -2.458984375, -2.3341064453125, -2.209228515625, -2.0843505859375, -1.95947265625, -1.8345947265625, -1.709716796875, -1.5848388671875, -1.4599609375, -1.3350830078125, -1.210205078125, -1.0853271484375, -0.96044921875, -0.8355712890625, -0.710693359375, -0.5858154296875, -0.4609375, -0.3360595703125, -0.211181640625, -0.0863037109375, 0.03857421875, 0.1634521484375, 0.288330078125, 0.4132080078125, 0.5380859375, 0.6629638671875, 0.787841796875, 0.9127197265625, 1.03759765625, 1.1624755859375, 1.287353515625, 1.4122314453125, 1.537109375, 1.6619873046875, 1.786865234375, 1.9117431640625, 2.03662109375, 2.1614990234375, 2.286376953125, 2.4112548828125, 2.5361328125, 2.6610107421875, 2.785888671875, 2.9107666015625, 3.03564453125, 3.1605224609375, 3.285400390625, 3.4102783203125, 3.53515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 10.0, 8.0, 18.0, 16.0, 26.0, 52.0, 74.0, 108.0, 197.0, 399.0, 812.0, 2015.0, 6748.0, 36921.0, 304424.0, 619747.0, 62173.0, 10102.0, 2632.0, 1036.0, 413.0, 255.0, 129.0, 70.0, 44.0, 40.0, 26.0, 11.0, 17.0, 3.0, 6.0, 4.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.2177734375, -1.1881637573242188, -1.1585540771484375, -1.1289443969726562, -1.099334716796875, -1.0697250366210938, -1.0401153564453125, -1.0105056762695312, -0.98089599609375, -0.9512863159179688, -0.9216766357421875, -0.8920669555664062, -0.862457275390625, -0.8328475952148438, -0.8032379150390625, -0.7736282348632812, -0.7440185546875, -0.7144088745117188, -0.6847991943359375, -0.6551895141601562, -0.625579833984375, -0.5959701538085938, -0.5663604736328125, -0.5367507934570312, -0.50714111328125, -0.47753143310546875, -0.4479217529296875, -0.41831207275390625, -0.388702392578125, -0.35909271240234375, -0.3294830322265625, -0.29987335205078125, -0.270263671875, -0.24065399169921875, -0.2110443115234375, -0.18143463134765625, -0.151824951171875, -0.12221527099609375, -0.0926055908203125, -0.06299591064453125, -0.03338623046875, -0.00377655029296875, 0.0258331298828125, 0.05544281005859375, 0.085052490234375, 0.11466217041015625, 0.1442718505859375, 0.17388153076171875, 0.2034912109375, 0.23310089111328125, 0.2627105712890625, 0.29232025146484375, 0.321929931640625, 0.35153961181640625, 0.3811492919921875, 0.41075897216796875, 0.44036865234375, 0.46997833251953125, 0.4995880126953125, 0.5291976928710938, 0.558807373046875, 0.5884170532226562, 0.6180267333984375, 0.6476364135742188, 0.67724609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 9.0, 25.0, 40.0, 46.0, 61.0, 79.0, 89.0, 120.0, 111.0, 109.0, 71.0, 51.0, 35.0, 27.0, 19.0, 13.0, 14.0, 14.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003390312194824219, -0.00033006444573402405, -0.0003210976719856262, -0.0003121308982372284, -0.00030316412448883057, -0.00029419735074043274, -0.0002852305769920349, -0.0002762638032436371, -0.00026729702949523926, -0.00025833025574684143, -0.0002493634819984436, -0.00024039670825004578, -0.00023142993450164795, -0.00022246316075325012, -0.0002134963870048523, -0.00020452961325645447, -0.00019556283950805664, -0.0001865960657596588, -0.00017762929201126099, -0.00016866251826286316, -0.00015969574451446533, -0.0001507289707660675, -0.00014176219701766968, -0.00013279542326927185, -0.00012382864952087402, -0.0001148618757724762, -0.00010589510202407837, -9.692832827568054e-05, -8.796155452728271e-05, -7.899478077888489e-05, -7.002800703048706e-05, -6.106123328208923e-05, -5.2094459533691406e-05, -4.312768578529358e-05, -3.416091203689575e-05, -2.5194138288497925e-05, -1.6227364540100098e-05, -7.2605907917022705e-06, 1.7061829566955566e-06, 1.0672956705093384e-05, 1.963973045349121e-05, 2.8606504201889038e-05, 3.7573277950286865e-05, 4.654005169868469e-05, 5.550682544708252e-05, 6.447359919548035e-05, 7.344037294387817e-05, 8.2407146692276e-05, 9.137392044067383e-05, 0.00010034069418907166, 0.00010930746793746948, 0.00011827424168586731, 0.00012724101543426514, 0.00013620778918266296, 0.0001451745629310608, 0.00015414133667945862, 0.00016310811042785645, 0.00017207488417625427, 0.0001810416579246521, 0.00019000843167304993, 0.00019897520542144775, 0.00020794197916984558, 0.0002169087529182434, 0.00022587552666664124, 0.00023484230041503906]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 9.0, 13.0, 31.0, 34.0, 41.0, 60.0, 100.0, 128.0, 198.0, 326.0, 556.0, 1105.0, 2069.0, 5036.0, 15565.0, 75298.0, 547263.0, 322525.0, 57049.0, 12753.0, 4214.0, 1897.0, 930.0, 489.0, 311.0, 170.0, 103.0, 95.0, 55.0, 30.0, 21.0, 9.0, 10.0, 15.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.7587890625, -0.735015869140625, -0.71124267578125, -0.687469482421875, -0.6636962890625, -0.639923095703125, -0.61614990234375, -0.592376708984375, -0.568603515625, -0.544830322265625, -0.52105712890625, -0.497283935546875, -0.4735107421875, -0.449737548828125, -0.42596435546875, -0.402191162109375, -0.37841796875, -0.354644775390625, -0.33087158203125, -0.307098388671875, -0.2833251953125, -0.259552001953125, -0.23577880859375, -0.212005615234375, -0.188232421875, -0.164459228515625, -0.14068603515625, -0.116912841796875, -0.0931396484375, -0.069366455078125, -0.04559326171875, -0.021820068359375, 0.001953125, 0.025726318359375, 0.04949951171875, 0.073272705078125, 0.0970458984375, 0.120819091796875, 0.14459228515625, 0.168365478515625, 0.192138671875, 0.215911865234375, 0.23968505859375, 0.263458251953125, 0.2872314453125, 0.311004638671875, 0.33477783203125, 0.358551025390625, 0.38232421875, 0.406097412109375, 0.42987060546875, 0.453643798828125, 0.4774169921875, 0.501190185546875, 0.52496337890625, 0.548736572265625, 0.572509765625, 0.596282958984375, 0.62005615234375, 0.643829345703125, 0.6676025390625, 0.691375732421875, 0.71514892578125, 0.738922119140625, 0.7626953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 7.0, 14.0, 15.0, 19.0, 20.0, 29.0, 30.0, 27.0, 39.0, 46.0, 44.0, 45.0, 51.0, 60.0, 63.0, 71.0, 59.0, 51.0, 62.0, 37.0, 27.0, 28.0, 17.0, 18.0, 17.0, 20.0, 15.0, 18.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5965042114257812, -0.5753326416015625, -0.5541610717773438, -0.532989501953125, -0.5118179321289062, -0.4906463623046875, -0.46947479248046875, -0.44830322265625, -0.42713165283203125, -0.4059600830078125, -0.38478851318359375, -0.363616943359375, -0.34244537353515625, -0.3212738037109375, -0.30010223388671875, -0.2789306640625, -0.25775909423828125, -0.2365875244140625, -0.21541595458984375, -0.194244384765625, -0.17307281494140625, -0.1519012451171875, -0.13072967529296875, -0.10955810546875, -0.08838653564453125, -0.0672149658203125, -0.04604339599609375, -0.024871826171875, -0.00370025634765625, 0.0174713134765625, 0.03864288330078125, 0.059814453125, 0.08098602294921875, 0.1021575927734375, 0.12332916259765625, 0.144500732421875, 0.16567230224609375, 0.1868438720703125, 0.20801544189453125, 0.22918701171875, 0.25035858154296875, 0.2715301513671875, 0.29270172119140625, 0.313873291015625, 0.33504486083984375, 0.3562164306640625, 0.37738800048828125, 0.3985595703125, 0.41973114013671875, 0.4409027099609375, 0.46207427978515625, 0.483245849609375, 0.5044174194335938, 0.5255889892578125, 0.5467605590820312, 0.56793212890625, 0.5891036987304688, 0.6102752685546875, 0.6314468383789062, 0.652618408203125, 0.6737899780273438, 0.6949615478515625, 0.7161331176757812, 0.7373046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 11.0, 18.0, 24.0, 58.0, 106.0, 185.0, 282.0, 162.0, 79.0, 38.0, 13.0, 7.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.03028869628906, -41.14311218261719, -40.25593948364258, -39.36876678466797, -38.481590270996094, -37.59441375732422, -36.70724105834961, -35.820068359375, -34.932891845703125, -34.04571533203125, -33.15854263305664, -32.27136993408203, -31.384193420410156, -30.497018814086914, -29.609844207763672, -28.72266960144043, -27.835494995117188, -26.948320388793945, -26.061145782470703, -25.17397117614746, -24.28679656982422, -23.399621963500977, -22.512447357177734, -21.625272750854492, -20.73809814453125, -19.850923538208008, -18.963748931884766, -18.076574325561523, -17.18939971923828, -16.30222511291504, -15.415050506591797, -14.527875900268555, -13.64069938659668, -12.753524780273438, -11.866350173950195, -10.979175567626953, -10.092000961303711, -9.204826354980469, -8.317651748657227, -7.430477142333984, -6.543302536010742, -5.6561279296875, -4.768953323364258, -3.8817787170410156, -2.9946041107177734, -2.1074295043945312, -1.220254898071289, -0.3330802917480469, 0.5540943145751953, 1.4412689208984375, 2.3284435272216797, 3.215618133544922, 4.102792739868164, 4.989967346191406, 5.877141952514648, 6.764316558837891, 7.651491165161133, 8.538665771484375, 9.425840377807617, 10.31301498413086, 11.200189590454102, 12.087364196777344, 12.974538803100586, 13.861713409423828, 14.74888801574707]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 3.0, 9.0, 7.0, 12.0, 13.0, 12.0, 13.0, 23.0, 19.0, 20.0, 28.0, 27.0, 23.0, 29.0, 32.0, 47.0, 47.0, 62.0, 61.0, 66.0, 46.0, 45.0, 34.0, 39.0, 38.0, 25.0, 35.0, 15.0, 26.0, 21.0, 13.0, 12.0, 15.0, 10.0, 12.0, 7.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.115571975708008, -11.708925247192383, -11.302278518676758, -10.895631790161133, -10.488985061645508, -10.082338333129883, -9.675691604614258, -9.269044876098633, -8.862398147583008, -8.455751419067383, -8.049104690551758, -7.642457962036133, -7.235811233520508, -6.829164505004883, -6.422517776489258, -6.015871047973633, -5.609224319458008, -5.202577590942383, -4.795930862426758, -4.389284133911133, -3.982637405395508, -3.575990676879883, -3.169343948364258, -2.762697219848633, -2.356050491333008, -1.9494037628173828, -1.5427570343017578, -1.1361103057861328, -0.7294635772705078, -0.3228168487548828, 0.08382987976074219, 0.4904766082763672, 0.8971233367919922, 1.3037700653076172, 1.7104167938232422, 2.117063522338867, 2.523710250854492, 2.930356979370117, 3.337003707885742, 3.743650436401367, 4.150297164916992, 4.556943893432617, 4.963590621948242, 5.370237350463867, 5.776884078979492, 6.183530807495117, 6.590177536010742, 6.996824264526367, 7.403470993041992, 7.810117721557617, 8.216764450073242, 8.623411178588867, 9.030057907104492, 9.436704635620117, 9.843351364135742, 10.249998092651367, 10.656644821166992, 11.063291549682617, 11.469938278198242, 11.876585006713867, 12.283231735229492, 12.689878463745117, 13.096525192260742, 13.503171920776367, 13.909818649291992]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 9.0, 24.0, 21.0, 42.0, 66.0, 110.0, 205.0, 351.0, 832.0, 2163.0, 7041.0, 34913.0, 492003.0, 3325531.0, 295979.0, 25935.0, 5634.0, 1807.0, 753.0, 360.0, 173.0, 105.0, 69.0, 49.0, 27.0, 22.0, 13.0, 12.0, 3.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.880859375, -1.822845458984375, -1.76483154296875, -1.706817626953125, -1.6488037109375, -1.590789794921875, -1.53277587890625, -1.474761962890625, -1.416748046875, -1.358734130859375, -1.30072021484375, -1.242706298828125, -1.1846923828125, -1.126678466796875, -1.06866455078125, -1.010650634765625, -0.95263671875, -0.894622802734375, -0.83660888671875, -0.778594970703125, -0.7205810546875, -0.662567138671875, -0.60455322265625, -0.546539306640625, -0.488525390625, -0.430511474609375, -0.37249755859375, -0.314483642578125, -0.2564697265625, -0.198455810546875, -0.14044189453125, -0.082427978515625, -0.0244140625, 0.033599853515625, 0.09161376953125, 0.149627685546875, 0.2076416015625, 0.265655517578125, 0.32366943359375, 0.381683349609375, 0.439697265625, 0.497711181640625, 0.55572509765625, 0.613739013671875, 0.6717529296875, 0.729766845703125, 0.78778076171875, 0.845794677734375, 0.90380859375, 0.961822509765625, 1.01983642578125, 1.077850341796875, 1.1358642578125, 1.193878173828125, 1.25189208984375, 1.309906005859375, 1.367919921875, 1.425933837890625, 1.48394775390625, 1.541961669921875, 1.5999755859375, 1.657989501953125, 1.71600341796875, 1.774017333984375, 1.83203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 13.0, 11.0, 11.0, 12.0, 18.0, 27.0, 20.0, 26.0, 31.0, 27.0, 27.0, 28.0, 39.0, 49.0, 40.0, 41.0, 50.0, 59.0, 45.0, 47.0, 38.0, 30.0, 42.0, 53.0, 28.0, 34.0, 24.0, 30.0, 18.0, 19.0, 10.0, 11.0, 10.0, 8.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7461166381835938, -0.7212371826171875, -0.6963577270507812, -0.671478271484375, -0.6465988159179688, -0.6217193603515625, -0.5968399047851562, -0.57196044921875, -0.5470809936523438, -0.5222015380859375, -0.49732208251953125, -0.472442626953125, -0.44756317138671875, -0.4226837158203125, -0.39780426025390625, -0.3729248046875, -0.34804534912109375, -0.3231658935546875, -0.29828643798828125, -0.273406982421875, -0.24852752685546875, -0.2236480712890625, -0.19876861572265625, -0.17388916015625, -0.14900970458984375, -0.1241302490234375, -0.09925079345703125, -0.074371337890625, -0.04949188232421875, -0.0246124267578125, 0.00026702880859375, 0.025146484375, 0.05002593994140625, 0.0749053955078125, 0.09978485107421875, 0.124664306640625, 0.14954376220703125, 0.1744232177734375, 0.19930267333984375, 0.22418212890625, 0.24906158447265625, 0.2739410400390625, 0.29882049560546875, 0.323699951171875, 0.34857940673828125, 0.3734588623046875, 0.39833831787109375, 0.4232177734375, 0.44809722900390625, 0.4729766845703125, 0.49785614013671875, 0.522735595703125, 0.5476150512695312, 0.5724945068359375, 0.5973739624023438, 0.62225341796875, 0.6471328735351562, 0.6720123291015625, 0.6968917846679688, 0.721771240234375, 0.7466506958007812, 0.7715301513671875, 0.7964096069335938, 0.8212890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 14.0, 8.0, 12.0, 24.0, 30.0, 58.0, 95.0, 105.0, 237.0, 553.0, 1477.0, 5696.0, 36087.0, 884042.0, 3180725.0, 71869.0, 9300.0, 2213.0, 824.0, 352.0, 206.0, 118.0, 84.0, 46.0, 27.0, 22.0, 22.0, 5.0, 10.0, 7.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.13671875, -3.0474853515625, -2.958251953125, -2.8690185546875, -2.77978515625, -2.6905517578125, -2.601318359375, -2.5120849609375, -2.4228515625, -2.3336181640625, -2.244384765625, -2.1551513671875, -2.06591796875, -1.9766845703125, -1.887451171875, -1.7982177734375, -1.708984375, -1.6197509765625, -1.530517578125, -1.4412841796875, -1.35205078125, -1.2628173828125, -1.173583984375, -1.0843505859375, -0.9951171875, -0.9058837890625, -0.816650390625, -0.7274169921875, -0.63818359375, -0.5489501953125, -0.459716796875, -0.3704833984375, -0.28125, -0.1920166015625, -0.102783203125, -0.0135498046875, 0.07568359375, 0.1649169921875, 0.254150390625, 0.3433837890625, 0.4326171875, 0.5218505859375, 0.611083984375, 0.7003173828125, 0.78955078125, 0.8787841796875, 0.968017578125, 1.0572509765625, 1.146484375, 1.2357177734375, 1.324951171875, 1.4141845703125, 1.50341796875, 1.5926513671875, 1.681884765625, 1.7711181640625, 1.8603515625, 1.9495849609375, 2.038818359375, 2.1280517578125, 2.21728515625, 2.3065185546875, 2.395751953125, 2.4849853515625, 2.57421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 11.0, 10.0, 11.0, 21.0, 26.0, 22.0, 34.0, 45.0, 98.0, 128.0, 185.0, 377.0, 627.0, 751.0, 660.0, 422.0, 226.0, 138.0, 79.0, 51.0, 35.0, 33.0, 24.0, 15.0, 11.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.571380615234375, -1.50994873046875, -1.448516845703125, -1.3870849609375, -1.325653076171875, -1.26422119140625, -1.202789306640625, -1.141357421875, -1.079925537109375, -1.01849365234375, -0.957061767578125, -0.8956298828125, -0.834197998046875, -0.77276611328125, -0.711334228515625, -0.64990234375, -0.588470458984375, -0.52703857421875, -0.465606689453125, -0.4041748046875, -0.342742919921875, -0.28131103515625, -0.219879150390625, -0.158447265625, -0.097015380859375, -0.03558349609375, 0.025848388671875, 0.0872802734375, 0.148712158203125, 0.21014404296875, 0.271575927734375, 0.3330078125, 0.394439697265625, 0.45587158203125, 0.517303466796875, 0.5787353515625, 0.640167236328125, 0.70159912109375, 0.763031005859375, 0.824462890625, 0.885894775390625, 0.94732666015625, 1.008758544921875, 1.0701904296875, 1.131622314453125, 1.19305419921875, 1.254486083984375, 1.31591796875, 1.377349853515625, 1.43878173828125, 1.500213623046875, 1.5616455078125, 1.623077392578125, 1.68450927734375, 1.745941162109375, 1.807373046875, 1.868804931640625, 1.93023681640625, 1.991668701171875, 2.0531005859375, 2.114532470703125, 2.17596435546875, 2.237396240234375, 2.298828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 10.0, 10.0, 24.0, 66.0, 125.0, 213.0, 239.0, 154.0, 75.0, 34.0, 11.0, 12.0, 10.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.545472145080566, -12.797033309936523, -12.048593521118164, -11.300153732299805, -10.551714897155762, -9.803276062011719, -9.05483627319336, -8.306396484375, -7.557957649230957, -6.809518337249756, -6.061079025268555, -5.3126397132873535, -4.564200401306152, -3.815761089324951, -3.06732177734375, -2.318882465362549, -1.5704431533813477, -0.8220038414001465, -0.07356452941894531, 0.6748747825622559, 1.423314094543457, 2.171753406524658, 2.9201927185058594, 3.6686320304870605, 4.417071342468262, 5.165510654449463, 5.913949966430664, 6.662389278411865, 7.410828590393066, 8.15926742553711, 8.907707214355469, 9.656147003173828, 10.404586791992188, 11.153026580810547, 11.90146541595459, 12.649904251098633, 13.398344039916992, 14.146783828735352, 14.895222663879395, 15.643661499023438, 16.392101287841797, 17.140541076660156, 17.888980865478516, 18.637418746948242, 19.3858585357666, 20.13429832458496, 20.882736206054688, 21.631175994873047, 22.379615783691406, 23.128055572509766, 23.876495361328125, 24.62493324279785, 25.37337303161621, 26.12181282043457, 26.870250701904297, 27.618690490722656, 28.367130279541016, 29.115570068359375, 29.864009857177734, 30.61244773864746, 31.36088752746582, 32.10932540893555, 32.857765197753906, 33.606204986572266, 34.354644775390625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 6.0, 9.0, 13.0, 23.0, 21.0, 20.0, 28.0, 34.0, 37.0, 40.0, 47.0, 55.0, 52.0, 51.0, 49.0, 50.0, 53.0, 51.0, 43.0, 46.0, 35.0, 29.0, 46.0, 24.0, 27.0, 16.0, 13.0, 19.0, 17.0, 7.0, 10.0, 6.0, 8.0, 5.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258282661437988, -5.999912261962891, -5.741541862487793, -5.483171463012695, -5.224801063537598, -4.9664306640625, -4.7080607414245605, -4.449690341949463, -4.191319942474365, -3.9329495429992676, -3.67457914352417, -3.4162089824676514, -3.1578385829925537, -2.899468183517456, -2.6410980224609375, -2.38272762298584, -2.124357223510742, -1.8659868240356445, -1.6076165437698364, -1.3492462635040283, -1.0908758640289307, -0.832505464553833, -0.5741351842880249, -0.3157649040222168, -0.05739450454711914, 0.20097583532333374, 0.4593461751937866, 0.7177165150642395, 0.9760868549346924, 1.23445725440979, 1.4928275346755981, 1.7511978149414062, 2.0095672607421875, 2.267937660217285, 2.526308059692383, 2.7846782207489014, 3.043048620223999, 3.3014190196990967, 3.5597891807556152, 3.818159580230713, 4.0765299797058105, 4.334900379180908, 4.593270778656006, 4.8516411781311035, 5.110011100769043, 5.368381500244141, 5.626751899719238, 5.885122299194336, 6.143492698669434, 6.401863098144531, 6.660233497619629, 6.918603897094727, 7.176974296569824, 7.435344696044922, 7.693714618682861, 7.952085018157959, 8.210454940795898, 8.468825340270996, 8.727195739746094, 8.985566139221191, 9.243936538696289, 9.502306938171387, 9.760677337646484, 10.019046783447266, 10.27741813659668]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 7.0, 6.0, 10.0, 6.0, 8.0, 27.0, 24.0, 33.0, 62.0, 88.0, 128.0, 192.0, 347.0, 569.0, 956.0, 1644.0, 3022.0, 5800.0, 11887.0, 26329.0, 59870.0, 136719.0, 255048.0, 268942.0, 152363.0, 67537.0, 29392.0, 13451.0, 6427.0, 3288.0, 1856.0, 956.0, 583.0, 343.0, 211.0, 131.0, 86.0, 56.0, 34.0, 34.0, 29.0, 18.0, 9.0, 7.0, 3.0, 6.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3251953125, -1.28387451171875, -1.2425537109375, -1.20123291015625, -1.159912109375, -1.11859130859375, -1.0772705078125, -1.03594970703125, -0.99462890625, -0.95330810546875, -0.9119873046875, -0.87066650390625, -0.829345703125, -0.78802490234375, -0.7467041015625, -0.70538330078125, -0.6640625, -0.62274169921875, -0.5814208984375, -0.54010009765625, -0.498779296875, -0.45745849609375, -0.4161376953125, -0.37481689453125, -0.33349609375, -0.29217529296875, -0.2508544921875, -0.20953369140625, -0.168212890625, -0.12689208984375, -0.0855712890625, -0.04425048828125, -0.0029296875, 0.03839111328125, 0.0797119140625, 0.12103271484375, 0.162353515625, 0.20367431640625, 0.2449951171875, 0.28631591796875, 0.32763671875, 0.36895751953125, 0.4102783203125, 0.45159912109375, 0.492919921875, 0.53424072265625, 0.5755615234375, 0.61688232421875, 0.658203125, 0.69952392578125, 0.7408447265625, 0.78216552734375, 0.823486328125, 0.86480712890625, 0.9061279296875, 0.94744873046875, 0.98876953125, 1.03009033203125, 1.0714111328125, 1.11273193359375, 1.154052734375, 1.19537353515625, 1.2366943359375, 1.27801513671875, 1.3193359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 14.0, 9.0, 15.0, 17.0, 21.0, 19.0, 26.0, 37.0, 23.0, 34.0, 29.0, 30.0, 41.0, 44.0, 45.0, 53.0, 36.0, 45.0, 52.0, 44.0, 35.0, 48.0, 29.0, 30.0, 32.0, 29.0, 21.0, 20.0, 21.0, 19.0, 10.0, 13.0, 7.0, 5.0, 10.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.86328125, -0.8387222290039062, -0.8141632080078125, -0.7896041870117188, -0.765045166015625, -0.7404861450195312, -0.7159271240234375, -0.6913681030273438, -0.66680908203125, -0.6422500610351562, -0.6176910400390625, -0.5931320190429688, -0.568572998046875, -0.5440139770507812, -0.5194549560546875, -0.49489593505859375, -0.4703369140625, -0.44577789306640625, -0.4212188720703125, -0.39665985107421875, -0.372100830078125, -0.34754180908203125, -0.3229827880859375, -0.29842376708984375, -0.27386474609375, -0.24930572509765625, -0.2247467041015625, -0.20018768310546875, -0.175628662109375, -0.15106964111328125, -0.1265106201171875, -0.10195159912109375, -0.077392578125, -0.05283355712890625, -0.0282745361328125, -0.00371551513671875, 0.020843505859375, 0.04540252685546875, 0.0699615478515625, 0.09452056884765625, 0.11907958984375, 0.14363861083984375, 0.1681976318359375, 0.19275665283203125, 0.217315673828125, 0.24187469482421875, 0.2664337158203125, 0.29099273681640625, 0.3155517578125, 0.34011077880859375, 0.3646697998046875, 0.38922882080078125, 0.413787841796875, 0.43834686279296875, 0.4629058837890625, 0.48746490478515625, 0.51202392578125, 0.5365829467773438, 0.5611419677734375, 0.5857009887695312, 0.610260009765625, 0.6348190307617188, 0.6593780517578125, 0.6839370727539062, 0.70849609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 9.0, 10.0, 11.0, 11.0, 17.0, 34.0, 36.0, 62.0, 97.0, 142.0, 237.0, 439.0, 665.0, 1510.0, 3723.0, 10195.0, 36750.0, 156043.0, 580076.0, 192791.0, 45424.0, 12426.0, 4206.0, 1704.0, 789.0, 418.0, 240.0, 140.0, 84.0, 75.0, 51.0, 31.0, 25.0, 17.0, 12.0, 6.0, 12.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.14306640625, -2.0751953125, -2.00732421875, -1.939453125, -1.87158203125, -1.8037109375, -1.73583984375, -1.66796875, -1.60009765625, -1.5322265625, -1.46435546875, -1.396484375, -1.32861328125, -1.2607421875, -1.19287109375, -1.125, -1.05712890625, -0.9892578125, -0.92138671875, -0.853515625, -0.78564453125, -0.7177734375, -0.64990234375, -0.58203125, -0.51416015625, -0.4462890625, -0.37841796875, -0.310546875, -0.24267578125, -0.1748046875, -0.10693359375, -0.0390625, 0.02880859375, 0.0966796875, 0.16455078125, 0.232421875, 0.30029296875, 0.3681640625, 0.43603515625, 0.50390625, 0.57177734375, 0.6396484375, 0.70751953125, 0.775390625, 0.84326171875, 0.9111328125, 0.97900390625, 1.046875, 1.11474609375, 1.1826171875, 1.25048828125, 1.318359375, 1.38623046875, 1.4541015625, 1.52197265625, 1.58984375, 1.65771484375, 1.7255859375, 1.79345703125, 1.861328125, 1.92919921875, 1.9970703125, 2.06494140625, 2.1328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 11.0, 17.0, 18.0, 13.0, 25.0, 43.0, 32.0, 47.0, 45.0, 53.0, 68.0, 55.0, 66.0, 58.0, 42.0, 59.0, 56.0, 55.0, 36.0, 26.0, 34.0, 22.0, 18.0, 16.0, 23.0, 14.0, 9.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.662109375, -3.557403564453125, -3.45269775390625, -3.347991943359375, -3.2432861328125, -3.138580322265625, -3.03387451171875, -2.929168701171875, -2.824462890625, -2.719757080078125, -2.61505126953125, -2.510345458984375, -2.4056396484375, -2.300933837890625, -2.19622802734375, -2.091522216796875, -1.98681640625, -1.882110595703125, -1.77740478515625, -1.672698974609375, -1.5679931640625, -1.463287353515625, -1.35858154296875, -1.253875732421875, -1.149169921875, -1.044464111328125, -0.93975830078125, -0.835052490234375, -0.7303466796875, -0.625640869140625, -0.52093505859375, -0.416229248046875, -0.3115234375, -0.206817626953125, -0.10211181640625, 0.002593994140625, 0.1072998046875, 0.212005615234375, 0.31671142578125, 0.421417236328125, 0.526123046875, 0.630828857421875, 0.73553466796875, 0.840240478515625, 0.9449462890625, 1.049652099609375, 1.15435791015625, 1.259063720703125, 1.36376953125, 1.468475341796875, 1.57318115234375, 1.677886962890625, 1.7825927734375, 1.887298583984375, 1.99200439453125, 2.096710205078125, 2.201416015625, 2.306121826171875, 2.41082763671875, 2.515533447265625, 2.6202392578125, 2.724945068359375, 2.82965087890625, 2.934356689453125, 3.0390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 11.0, 17.0, 25.0, 36.0, 78.0, 180.0, 384.0, 953.0, 3400.0, 19205.0, 203813.0, 742946.0, 66477.0, 8064.0, 1838.0, 595.0, 259.0, 121.0, 61.0, 31.0, 31.0, 9.0, 7.0, 1.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1162109375, -1.075286865234375, -1.03436279296875, -0.993438720703125, -0.9525146484375, -0.911590576171875, -0.87066650390625, -0.829742431640625, -0.788818359375, -0.747894287109375, -0.70697021484375, -0.666046142578125, -0.6251220703125, -0.584197998046875, -0.54327392578125, -0.502349853515625, -0.46142578125, -0.420501708984375, -0.37957763671875, -0.338653564453125, -0.2977294921875, -0.256805419921875, -0.21588134765625, -0.174957275390625, -0.134033203125, -0.093109130859375, -0.05218505859375, -0.011260986328125, 0.0296630859375, 0.070587158203125, 0.11151123046875, 0.152435302734375, 0.193359375, 0.234283447265625, 0.27520751953125, 0.316131591796875, 0.3570556640625, 0.397979736328125, 0.43890380859375, 0.479827880859375, 0.520751953125, 0.561676025390625, 0.60260009765625, 0.643524169921875, 0.6844482421875, 0.725372314453125, 0.76629638671875, 0.807220458984375, 0.84814453125, 0.889068603515625, 0.92999267578125, 0.970916748046875, 1.0118408203125, 1.052764892578125, 1.09368896484375, 1.134613037109375, 1.175537109375, 1.216461181640625, 1.25738525390625, 1.298309326171875, 1.3392333984375, 1.380157470703125, 1.42108154296875, 1.462005615234375, 1.5029296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 4.0, 14.0, 14.0, 18.0, 18.0, 34.0, 39.0, 39.0, 56.0, 68.0, 92.0, 93.0, 92.0, 99.0, 56.0, 48.0, 48.0, 32.0, 23.0, 17.0, 26.0, 15.0, 10.0, 4.0, 3.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002880096435546875, -0.0002794116735458374, -0.0002708137035369873, -0.0002622157335281372, -0.0002536177635192871, -0.000245019793510437, -0.00023642182350158691, -0.00022782385349273682, -0.00021922588348388672, -0.00021062791347503662, -0.00020202994346618652, -0.00019343197345733643, -0.00018483400344848633, -0.00017623603343963623, -0.00016763806343078613, -0.00015904009342193604, -0.00015044212341308594, -0.00014184415340423584, -0.00013324618339538574, -0.00012464821338653564, -0.00011605024337768555, -0.00010745227336883545, -9.885430335998535e-05, -9.025633335113525e-05, -8.165836334228516e-05, -7.306039333343506e-05, -6.446242332458496e-05, -5.586445331573486e-05, -4.7266483306884766e-05, -3.866851329803467e-05, -3.007054328918457e-05, -2.1472573280334473e-05, -1.2874603271484375e-05, -4.276633262634277e-06, 4.32133674621582e-06, 1.2919306755065918e-05, 2.1517276763916016e-05, 3.0115246772766113e-05, 3.871321678161621e-05, 4.731118679046631e-05, 5.5909156799316406e-05, 6.45071268081665e-05, 7.31050968170166e-05, 8.17030668258667e-05, 9.03010368347168e-05, 9.88990068435669e-05, 0.00010749697685241699, 0.00011609494686126709, 0.0001246929168701172, 0.00013329088687896729, 0.00014188885688781738, 0.00015048682689666748, 0.00015908479690551758, 0.00016768276691436768, 0.00017628073692321777, 0.00018487870693206787, 0.00019347667694091797, 0.00020207464694976807, 0.00021067261695861816, 0.00021927058696746826, 0.00022786855697631836, 0.00023646652698516846, 0.00024506449699401855, 0.00025366246700286865, 0.00026226043701171875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 16.0, 28.0, 45.0, 80.0, 164.0, 353.0, 965.0, 3287.0, 17210.0, 157894.0, 755436.0, 97445.0, 11702.0, 2442.0, 800.0, 329.0, 156.0, 72.0, 41.0, 20.0, 17.0, 11.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86865234375, -0.8298721313476562, -0.7910919189453125, -0.7523117065429688, -0.713531494140625, -0.6747512817382812, -0.6359710693359375, -0.5971908569335938, -0.55841064453125, -0.5196304321289062, -0.4808502197265625, -0.44207000732421875, -0.403289794921875, -0.36450958251953125, -0.3257293701171875, -0.28694915771484375, -0.2481689453125, -0.20938873291015625, -0.1706085205078125, -0.13182830810546875, -0.093048095703125, -0.05426788330078125, -0.0154876708984375, 0.02329254150390625, 0.06207275390625, 0.10085296630859375, 0.1396331787109375, 0.17841339111328125, 0.217193603515625, 0.25597381591796875, 0.2947540283203125, 0.33353424072265625, 0.372314453125, 0.41109466552734375, 0.4498748779296875, 0.48865509033203125, 0.527435302734375, 0.5662155151367188, 0.6049957275390625, 0.6437759399414062, 0.68255615234375, 0.7213363647460938, 0.7601165771484375, 0.7988967895507812, 0.837677001953125, 0.8764572143554688, 0.9152374267578125, 0.9540176391601562, 0.9927978515625, 1.0315780639648438, 1.0703582763671875, 1.1091384887695312, 1.147918701171875, 1.1866989135742188, 1.2254791259765625, 1.2642593383789062, 1.30303955078125, 1.3418197631835938, 1.3805999755859375, 1.4193801879882812, 1.458160400390625, 1.4969406127929688, 1.5357208251953125, 1.5745010375976562, 1.61328125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 7.0, 7.0, 9.0, 11.0, 14.0, 16.0, 20.0, 21.0, 26.0, 25.0, 33.0, 32.0, 49.0, 40.0, 62.0, 59.0, 47.0, 68.0, 62.0, 62.0, 46.0, 41.0, 57.0, 32.0, 35.0, 24.0, 18.0, 13.0, 14.0, 11.0, 8.0, 3.0, 4.0, 7.0, 8.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8349609375, -0.81304931640625, -0.7911376953125, -0.76922607421875, -0.747314453125, -0.72540283203125, -0.7034912109375, -0.68157958984375, -0.65966796875, -0.63775634765625, -0.6158447265625, -0.59393310546875, -0.572021484375, -0.55010986328125, -0.5281982421875, -0.50628662109375, -0.484375, -0.46246337890625, -0.4405517578125, -0.41864013671875, -0.396728515625, -0.37481689453125, -0.3529052734375, -0.33099365234375, -0.30908203125, -0.28717041015625, -0.2652587890625, -0.24334716796875, -0.221435546875, -0.19952392578125, -0.1776123046875, -0.15570068359375, -0.1337890625, -0.11187744140625, -0.0899658203125, -0.06805419921875, -0.046142578125, -0.02423095703125, -0.0023193359375, 0.01959228515625, 0.04150390625, 0.06341552734375, 0.0853271484375, 0.10723876953125, 0.129150390625, 0.15106201171875, 0.1729736328125, 0.19488525390625, 0.216796875, 0.23870849609375, 0.2606201171875, 0.28253173828125, 0.304443359375, 0.32635498046875, 0.3482666015625, 0.37017822265625, 0.39208984375, 0.41400146484375, 0.4359130859375, 0.45782470703125, 0.479736328125, 0.50164794921875, 0.5235595703125, 0.54547119140625, 0.5673828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 5.0, 14.0, 30.0, 72.0, 155.0, 314.0, 203.0, 102.0, 56.0, 18.0, 10.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671852111816406, -21.85114860534668, -21.03044319152832, -20.209739685058594, -19.389036178588867, -18.56833267211914, -17.74762725830078, -16.926923751831055, -16.106220245361328, -15.285515785217285, -14.464812278747559, -13.644107818603516, -12.823404312133789, -12.002699851989746, -11.181995391845703, -10.361291885375977, -9.540587425231934, -8.71988296508789, -7.899179458618164, -7.078474998474121, -6.2577714920043945, -5.437067031860352, -4.616363048553467, -3.795659065246582, -2.9749550819396973, -2.1542510986328125, -1.3335469961166382, -0.5128428936004639, 0.3078610897064209, 1.1285653114318848, 1.9492692947387695, 2.7699732780456543, 3.590677261352539, 4.411381244659424, 5.232085227966309, 6.052789688110352, 6.873493194580078, 7.694197654724121, 8.514902114868164, 9.33560562133789, 10.156309127807617, 10.97701358795166, 11.797717094421387, 12.61842155456543, 13.439125061035156, 14.2598295211792, 15.080533981323242, 15.901237487792969, 16.721942901611328, 17.542646408081055, 18.363351821899414, 19.18405532836914, 20.004758834838867, 20.825462341308594, 21.646167755126953, 22.46687126159668, 23.287574768066406, 24.108278274536133, 24.928983688354492, 25.74968719482422, 26.570390701293945, 27.391094207763672, 28.21179962158203, 29.032503128051758, 29.853206634521484]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 5.0, 7.0, 14.0, 12.0, 15.0, 14.0, 18.0, 17.0, 22.0, 23.0, 28.0, 19.0, 34.0, 29.0, 33.0, 48.0, 59.0, 71.0, 64.0, 81.0, 46.0, 45.0, 27.0, 36.0, 27.0, 23.0, 22.0, 16.0, 19.0, 13.0, 20.0, 21.0, 9.0, 10.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.576784133911133, -9.259346008300781, -8.941906929016113, -8.624468803405762, -8.30703067779541, -7.9895920753479, -7.672153472900391, -7.354715347290039, -7.037276744842529, -6.7198381423950195, -6.402400016784668, -6.084961414337158, -5.767522811889648, -5.450084686279297, -5.132646083831787, -4.815207481384277, -4.497769355773926, -4.180330753326416, -3.8628926277160645, -3.5454540252685547, -3.228015661239624, -2.9105772972106934, -2.5931386947631836, -2.275700330734253, -1.9582619667053223, -1.6408236026763916, -1.3233851194381714, -1.0059466361999512, -0.6885082721710205, -0.37106990814208984, -0.05363142490386963, 0.2638070583343506, 0.5812463760375977, 0.8986847996711731, 1.2161232233047485, 1.5335617065429688, 1.8510000705718994, 2.16843843460083, 2.48587703704834, 2.8033154010772705, 3.120753765106201, 3.438192129135132, 3.7556304931640625, 4.073069095611572, 4.390507698059082, 4.707945823669434, 5.025384426116943, 5.342823028564453, 5.660261154174805, 5.9776997566223145, 6.295137882232666, 6.612576484680176, 6.930014610290527, 7.247453212738037, 7.564891815185547, 7.882329940795898, 8.19976806640625, 8.517206192016602, 8.83464527130127, 9.152083396911621, 9.469521522521973, 9.78696060180664, 10.104398727416992, 10.421836853027344, 10.739275932312012]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 15.0, 26.0, 36.0, 51.0, 100.0, 147.0, 230.0, 500.0, 1091.0, 2932.0, 10086.0, 55258.0, 851831.0, 2989630.0, 248372.0, 24684.0, 5518.0, 1931.0, 836.0, 395.0, 214.0, 133.0, 85.0, 53.0, 27.0, 23.0, 19.0, 9.0, 10.0, 5.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6103515625, -1.56048583984375, -1.5106201171875, -1.46075439453125, -1.410888671875, -1.36102294921875, -1.3111572265625, -1.26129150390625, -1.21142578125, -1.16156005859375, -1.1116943359375, -1.06182861328125, -1.011962890625, -0.96209716796875, -0.9122314453125, -0.86236572265625, -0.8125, -0.76263427734375, -0.7127685546875, -0.66290283203125, -0.613037109375, -0.56317138671875, -0.5133056640625, -0.46343994140625, -0.41357421875, -0.36370849609375, -0.3138427734375, -0.26397705078125, -0.214111328125, -0.16424560546875, -0.1143798828125, -0.06451416015625, -0.0146484375, 0.03521728515625, 0.0850830078125, 0.13494873046875, 0.184814453125, 0.23468017578125, 0.2845458984375, 0.33441162109375, 0.38427734375, 0.43414306640625, 0.4840087890625, 0.53387451171875, 0.583740234375, 0.63360595703125, 0.6834716796875, 0.73333740234375, 0.783203125, 0.83306884765625, 0.8829345703125, 0.93280029296875, 0.982666015625, 1.03253173828125, 1.0823974609375, 1.13226318359375, 1.18212890625, 1.23199462890625, 1.2818603515625, 1.33172607421875, 1.381591796875, 1.43145751953125, 1.4813232421875, 1.53118896484375, 1.5810546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 6.0, 14.0, 9.0, 17.0, 17.0, 23.0, 23.0, 27.0, 34.0, 33.0, 27.0, 39.0, 37.0, 48.0, 53.0, 55.0, 45.0, 55.0, 36.0, 39.0, 42.0, 42.0, 36.0, 27.0, 33.0, 30.0, 24.0, 19.0, 22.0, 17.0, 14.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.8623046875, -0.837982177734375, -0.81365966796875, -0.789337158203125, -0.7650146484375, -0.740692138671875, -0.71636962890625, -0.692047119140625, -0.667724609375, -0.643402099609375, -0.61907958984375, -0.594757080078125, -0.5704345703125, -0.546112060546875, -0.52178955078125, -0.497467041015625, -0.47314453125, -0.448822021484375, -0.42449951171875, -0.400177001953125, -0.3758544921875, -0.351531982421875, -0.32720947265625, -0.302886962890625, -0.278564453125, -0.254241943359375, -0.22991943359375, -0.205596923828125, -0.1812744140625, -0.156951904296875, -0.13262939453125, -0.108306884765625, -0.083984375, -0.059661865234375, -0.03533935546875, -0.011016845703125, 0.0133056640625, 0.037628173828125, 0.06195068359375, 0.086273193359375, 0.110595703125, 0.134918212890625, 0.15924072265625, 0.183563232421875, 0.2078857421875, 0.232208251953125, 0.25653076171875, 0.280853271484375, 0.30517578125, 0.329498291015625, 0.35382080078125, 0.378143310546875, 0.4024658203125, 0.426788330078125, 0.45111083984375, 0.475433349609375, 0.499755859375, 0.524078369140625, 0.54840087890625, 0.572723388671875, 0.5970458984375, 0.621368408203125, 0.64569091796875, 0.670013427734375, 0.6943359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 19.0, 19.0, 37.0, 70.0, 129.0, 276.0, 646.0, 2090.0, 10933.0, 170057.0, 3872837.0, 124064.0, 9783.0, 1998.0, 656.0, 342.0, 132.0, 67.0, 41.0, 22.0, 14.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.85546875, -3.755218505859375, -3.65496826171875, -3.554718017578125, -3.4544677734375, -3.354217529296875, -3.25396728515625, -3.153717041015625, -3.053466796875, -2.953216552734375, -2.85296630859375, -2.752716064453125, -2.6524658203125, -2.552215576171875, -2.45196533203125, -2.351715087890625, -2.25146484375, -2.151214599609375, -2.05096435546875, -1.950714111328125, -1.8504638671875, -1.750213623046875, -1.64996337890625, -1.549713134765625, -1.449462890625, -1.349212646484375, -1.24896240234375, -1.148712158203125, -1.0484619140625, -0.948211669921875, -0.84796142578125, -0.747711181640625, -0.6474609375, -0.547210693359375, -0.44696044921875, -0.346710205078125, -0.2464599609375, -0.146209716796875, -0.04595947265625, 0.054290771484375, 0.154541015625, 0.254791259765625, 0.35504150390625, 0.455291748046875, 0.5555419921875, 0.655792236328125, 0.75604248046875, 0.856292724609375, 0.95654296875, 1.056793212890625, 1.15704345703125, 1.257293701171875, 1.3575439453125, 1.457794189453125, 1.55804443359375, 1.658294677734375, 1.758544921875, 1.858795166015625, 1.95904541015625, 2.059295654296875, 2.1595458984375, 2.259796142578125, 2.36004638671875, 2.460296630859375, 2.560546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 11.0, 9.0, 11.0, 19.0, 28.0, 46.0, 48.0, 82.0, 142.0, 226.0, 439.0, 743.0, 803.0, 576.0, 321.0, 198.0, 126.0, 71.0, 46.0, 27.0, 25.0, 19.0, 10.0, 11.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8160858154296875, -1.754241943359375, -1.6923980712890625, -1.63055419921875, -1.5687103271484375, -1.506866455078125, -1.4450225830078125, -1.3831787109375, -1.3213348388671875, -1.259490966796875, -1.1976470947265625, -1.13580322265625, -1.0739593505859375, -1.012115478515625, -0.9502716064453125, -0.888427734375, -0.8265838623046875, -0.764739990234375, -0.7028961181640625, -0.64105224609375, -0.5792083740234375, -0.517364501953125, -0.4555206298828125, -0.3936767578125, -0.3318328857421875, -0.269989013671875, -0.2081451416015625, -0.14630126953125, -0.0844573974609375, -0.022613525390625, 0.0392303466796875, 0.10107421875, 0.1629180908203125, 0.224761962890625, 0.2866058349609375, 0.34844970703125, 0.4102935791015625, 0.472137451171875, 0.5339813232421875, 0.5958251953125, 0.6576690673828125, 0.719512939453125, 0.7813568115234375, 0.84320068359375, 0.9050445556640625, 0.966888427734375, 1.0287322998046875, 1.090576171875, 1.1524200439453125, 1.214263916015625, 1.2761077880859375, 1.33795166015625, 1.3997955322265625, 1.461639404296875, 1.5234832763671875, 1.5853271484375, 1.6471710205078125, 1.709014892578125, 1.7708587646484375, 1.83270263671875, 1.8945465087890625, 1.956390380859375, 2.0182342529296875, 2.080078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 18.0, 36.0, 53.0, 129.0, 177.0, 205.0, 169.0, 98.0, 50.0, 29.0, 15.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.004962921142578, -8.413089752197266, -7.821216583251953, -7.229342937469482, -6.63746976852417, -6.045596599578857, -5.453722953796387, -4.861849784851074, -4.269976615905762, -3.678103446960449, -3.0862300395965576, -2.494356632232666, -1.9024834632873535, -1.310610294342041, -0.7187368869781494, -0.1268634796142578, 0.4650096893310547, 1.0568829774856567, 1.6487562656402588, 2.2406296730041504, 2.832502841949463, 3.4243760108947754, 4.016249656677246, 4.608122825622559, 5.199995994567871, 5.791869163513184, 6.383742332458496, 6.975615978240967, 7.567489147186279, 8.15936279296875, 8.751235961914062, 9.343109130859375, 9.934982299804688, 10.52685546875, 11.118728637695312, 11.710601806640625, 12.302474975585938, 12.89434814453125, 13.486222267150879, 14.078095436096191, 14.669968605041504, 15.261841773986816, 15.853714942932129, 16.445589065551758, 17.03746223449707, 17.629335403442383, 18.221208572387695, 18.813081741333008, 19.40495491027832, 19.996828079223633, 20.588701248168945, 21.180574417114258, 21.77244758605957, 22.364320755004883, 22.956193923950195, 23.54806900024414, 24.139942169189453, 24.731815338134766, 25.323688507080078, 25.91556167602539, 26.507434844970703, 27.099308013916016, 27.691181182861328, 28.28305435180664, 28.874927520751953]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 10.0, 19.0, 9.0, 17.0, 17.0, 20.0, 32.0, 29.0, 40.0, 38.0, 41.0, 46.0, 50.0, 45.0, 46.0, 68.0, 57.0, 51.0, 33.0, 52.0, 42.0, 27.0, 22.0, 38.0, 25.0, 25.0, 14.0, 14.0, 18.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.077053070068359, -6.8152337074279785, -6.553414344787598, -6.291594982147217, -6.029775619506836, -5.767956733703613, -5.506137371063232, -5.244318008422852, -4.982498645782471, -4.72067928314209, -4.458859920501709, -4.197040557861328, -3.9352214336395264, -3.6734020709991455, -3.4115829467773438, -3.149763584136963, -2.887944221496582, -2.626124858856201, -2.3643054962158203, -2.1024863719940186, -1.8406670093536377, -1.5788476467132568, -1.3170284032821655, -1.0552091598510742, -0.7933897972106934, -0.5315704941749573, -0.2697511911392212, -0.007931888103485107, 0.253887414932251, 0.5157067775726318, 0.7775260210037231, 1.0393452644348145, 1.3011655807495117, 1.5629849433898926, 1.8248041868209839, 2.086623430252075, 2.348442792892456, 2.610262155532837, 2.8720812797546387, 3.1339006423950195, 3.3957200050354004, 3.6575393676757812, 3.919358730316162, 4.181178092956543, 4.442996978759766, 4.704816818237305, 4.966635704040527, 5.228455066680908, 5.490274429321289, 5.75209379196167, 6.013913154602051, 6.275732517242432, 6.5375518798828125, 6.799370765686035, 7.061190128326416, 7.323009490966797, 7.584828853607178, 7.846648216247559, 8.108467102050781, 8.37028694152832, 8.632105827331543, 8.893925666809082, 9.155744552612305, 9.417564392089844, 9.679383277893066]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 6.0, 16.0, 18.0, 29.0, 33.0, 46.0, 80.0, 118.0, 146.0, 277.0, 464.0, 769.0, 1386.0, 2673.0, 5388.0, 10952.0, 24057.0, 53030.0, 121259.0, 255098.0, 291717.0, 154855.0, 68322.0, 29882.0, 13953.0, 6653.0, 3218.0, 1699.0, 917.0, 555.0, 333.0, 210.0, 104.0, 87.0, 51.0, 38.0, 23.0, 21.0, 16.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.2568359375, -1.217742919921875, -1.17864990234375, -1.139556884765625, -1.1004638671875, -1.061370849609375, -1.02227783203125, -0.983184814453125, -0.944091796875, -0.904998779296875, -0.86590576171875, -0.826812744140625, -0.7877197265625, -0.748626708984375, -0.70953369140625, -0.670440673828125, -0.63134765625, -0.592254638671875, -0.55316162109375, -0.514068603515625, -0.4749755859375, -0.435882568359375, -0.39678955078125, -0.357696533203125, -0.318603515625, -0.279510498046875, -0.24041748046875, -0.201324462890625, -0.1622314453125, -0.123138427734375, -0.08404541015625, -0.044952392578125, -0.005859375, 0.033233642578125, 0.07232666015625, 0.111419677734375, 0.1505126953125, 0.189605712890625, 0.22869873046875, 0.267791748046875, 0.306884765625, 0.345977783203125, 0.38507080078125, 0.424163818359375, 0.4632568359375, 0.502349853515625, 0.54144287109375, 0.580535888671875, 0.61962890625, 0.658721923828125, 0.69781494140625, 0.736907958984375, 0.7760009765625, 0.815093994140625, 0.85418701171875, 0.893280029296875, 0.932373046875, 0.971466064453125, 1.01055908203125, 1.049652099609375, 1.0887451171875, 1.127838134765625, 1.16693115234375, 1.206024169921875, 1.2451171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 1.0, 9.0, 2.0, 16.0, 10.0, 9.0, 13.0, 13.0, 17.0, 22.0, 33.0, 32.0, 38.0, 43.0, 36.0, 32.0, 46.0, 57.0, 47.0, 50.0, 43.0, 39.0, 44.0, 43.0, 31.0, 35.0, 41.0, 35.0, 22.0, 20.0, 23.0, 14.0, 10.0, 13.0, 13.0, 9.0, 6.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7297592163085938, -0.7041473388671875, -0.6785354614257812, -0.652923583984375, -0.6273117065429688, -0.6016998291015625, -0.5760879516601562, -0.55047607421875, -0.5248641967773438, -0.4992523193359375, -0.47364044189453125, -0.448028564453125, -0.42241668701171875, -0.3968048095703125, -0.37119293212890625, -0.3455810546875, -0.31996917724609375, -0.2943572998046875, -0.26874542236328125, -0.243133544921875, -0.21752166748046875, -0.1919097900390625, -0.16629791259765625, -0.14068603515625, -0.11507415771484375, -0.0894622802734375, -0.06385040283203125, -0.038238525390625, -0.01262664794921875, 0.0129852294921875, 0.03859710693359375, 0.064208984375, 0.08982086181640625, 0.1154327392578125, 0.14104461669921875, 0.166656494140625, 0.19226837158203125, 0.2178802490234375, 0.24349212646484375, 0.26910400390625, 0.29471588134765625, 0.3203277587890625, 0.34593963623046875, 0.371551513671875, 0.39716339111328125, 0.4227752685546875, 0.44838714599609375, 0.4739990234375, 0.49961090087890625, 0.5252227783203125, 0.5508346557617188, 0.576446533203125, 0.6020584106445312, 0.6276702880859375, 0.6532821655273438, 0.67889404296875, 0.7045059204101562, 0.7301177978515625, 0.7557296752929688, 0.781341552734375, 0.8069534301757812, 0.8325653076171875, 0.8581771850585938, 0.8837890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 5.0, 9.0, 10.0, 30.0, 32.0, 45.0, 64.0, 83.0, 143.0, 187.0, 318.0, 461.0, 726.0, 1406.0, 2921.0, 8107.0, 27973.0, 124150.0, 624447.0, 195922.0, 42300.0, 11263.0, 3818.0, 1724.0, 906.0, 521.0, 302.0, 193.0, 141.0, 88.0, 60.0, 51.0, 33.0, 23.0, 20.0, 11.0, 16.0, 8.0, 9.0, 1.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.03515625, -1.96875, -1.90234375, -1.8359375, -1.76953125, -1.703125, -1.63671875, -1.5703125, -1.50390625, -1.4375, -1.37109375, -1.3046875, -1.23828125, -1.171875, -1.10546875, -1.0390625, -0.97265625, -0.90625, -0.83984375, -0.7734375, -0.70703125, -0.640625, -0.57421875, -0.5078125, -0.44140625, -0.375, -0.30859375, -0.2421875, -0.17578125, -0.109375, -0.04296875, 0.0234375, 0.08984375, 0.15625, 0.22265625, 0.2890625, 0.35546875, 0.421875, 0.48828125, 0.5546875, 0.62109375, 0.6875, 0.75390625, 0.8203125, 0.88671875, 0.953125, 1.01953125, 1.0859375, 1.15234375, 1.21875, 1.28515625, 1.3515625, 1.41796875, 1.484375, 1.55078125, 1.6171875, 1.68359375, 1.75, 1.81640625, 1.8828125, 1.94921875, 2.015625, 2.08203125, 2.1484375, 2.21484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 5.0, 9.0, 11.0, 16.0, 25.0, 14.0, 26.0, 29.0, 36.0, 55.0, 51.0, 47.0, 57.0, 59.0, 78.0, 60.0, 55.0, 52.0, 50.0, 55.0, 38.0, 40.0, 35.0, 32.0, 16.0, 9.0, 13.0, 8.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.76470947265625, -3.6387939453125, -3.51287841796875, -3.386962890625, -3.26104736328125, -3.1351318359375, -3.00921630859375, -2.88330078125, -2.75738525390625, -2.6314697265625, -2.50555419921875, -2.379638671875, -2.25372314453125, -2.1278076171875, -2.00189208984375, -1.8759765625, -1.75006103515625, -1.6241455078125, -1.49822998046875, -1.372314453125, -1.24639892578125, -1.1204833984375, -0.99456787109375, -0.86865234375, -0.74273681640625, -0.6168212890625, -0.49090576171875, -0.364990234375, -0.23907470703125, -0.1131591796875, 0.01275634765625, 0.138671875, 0.26458740234375, 0.3905029296875, 0.51641845703125, 0.642333984375, 0.76824951171875, 0.8941650390625, 1.02008056640625, 1.14599609375, 1.27191162109375, 1.3978271484375, 1.52374267578125, 1.649658203125, 1.77557373046875, 1.9014892578125, 2.02740478515625, 2.1533203125, 2.27923583984375, 2.4051513671875, 2.53106689453125, 2.656982421875, 2.78289794921875, 2.9088134765625, 3.03472900390625, 3.16064453125, 3.28656005859375, 3.4124755859375, 3.53839111328125, 3.664306640625, 3.79022216796875, 3.9161376953125, 4.04205322265625, 4.16796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 7.0, 9.0, 13.0, 22.0, 18.0, 29.0, 36.0, 67.0, 88.0, 125.0, 212.0, 273.0, 564.0, 1096.0, 2267.0, 5530.0, 14879.0, 46587.0, 193096.0, 638455.0, 100095.0, 27995.0, 9650.0, 3714.0, 1680.0, 815.0, 425.0, 261.0, 159.0, 111.0, 75.0, 72.0, 30.0, 21.0, 14.0, 21.0, 12.0, 6.0, 10.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7607421875, -0.7403411865234375, -0.719940185546875, -0.6995391845703125, -0.67913818359375, -0.6587371826171875, -0.638336181640625, -0.6179351806640625, -0.5975341796875, -0.5771331787109375, -0.556732177734375, -0.5363311767578125, -0.51593017578125, -0.4955291748046875, -0.475128173828125, -0.4547271728515625, -0.434326171875, -0.4139251708984375, -0.393524169921875, -0.3731231689453125, -0.35272216796875, -0.3323211669921875, -0.311920166015625, -0.2915191650390625, -0.2711181640625, -0.2507171630859375, -0.230316162109375, -0.2099151611328125, -0.18951416015625, -0.1691131591796875, -0.148712158203125, -0.1283111572265625, -0.10791015625, -0.0875091552734375, -0.067108154296875, -0.0467071533203125, -0.02630615234375, -0.0059051513671875, 0.014495849609375, 0.0348968505859375, 0.0552978515625, 0.0756988525390625, 0.096099853515625, 0.1165008544921875, 0.13690185546875, 0.1573028564453125, 0.177703857421875, 0.1981048583984375, 0.218505859375, 0.2389068603515625, 0.259307861328125, 0.2797088623046875, 0.30010986328125, 0.3205108642578125, 0.340911865234375, 0.3613128662109375, 0.3817138671875, 0.4021148681640625, 0.422515869140625, 0.4429168701171875, 0.46331787109375, 0.4837188720703125, 0.504119873046875, 0.5245208740234375, 0.544921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 14.0, 13.0, 14.0, 18.0, 20.0, 23.0, 29.0, 44.0, 54.0, 61.0, 78.0, 92.0, 93.0, 64.0, 89.0, 49.0, 45.0, 33.0, 26.0, 30.0, 12.0, 11.0, 10.0, 14.0, 6.0, 4.0, 5.0, 4.0, 1.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001958608627319336, -0.00019012577831745148, -0.00018439069390296936, -0.00017865560948848724, -0.00017292052507400513, -0.000167185440659523, -0.0001614503562450409, -0.00015571527183055878, -0.00014998018741607666, -0.00014424510300159454, -0.00013851001858711243, -0.0001327749341726303, -0.0001270398497581482, -0.00012130476534366608, -0.00011556968092918396, -0.00010983459651470184, -0.00010409951210021973, -9.836442768573761e-05, -9.262934327125549e-05, -8.689425885677338e-05, -8.115917444229126e-05, -7.542409002780914e-05, -6.968900561332703e-05, -6.395392119884491e-05, -5.821883678436279e-05, -5.2483752369880676e-05, -4.674866795539856e-05, -4.101358354091644e-05, -3.5278499126434326e-05, -2.954341471195221e-05, -2.3808330297470093e-05, -1.8073245882987976e-05, -1.233816146850586e-05, -6.603077054023743e-06, -8.67992639541626e-07, 4.867091774940491e-06, 1.0602176189422607e-05, 1.6337260603904724e-05, 2.207234501838684e-05, 2.7807429432868958e-05, 3.3542513847351074e-05, 3.927759826183319e-05, 4.501268267631531e-05, 5.0747767090797424e-05, 5.648285150527954e-05, 6.221793591976166e-05, 6.795302033424377e-05, 7.368810474872589e-05, 7.942318916320801e-05, 8.515827357769012e-05, 9.089335799217224e-05, 9.662844240665436e-05, 0.00010236352682113647, 0.00010809861123561859, 0.00011383369565010071, 0.00011956878006458282, 0.00012530386447906494, 0.00013103894889354706, 0.00013677403330802917, 0.0001425091177225113, 0.0001482442021369934, 0.00015397928655147552, 0.00015971437096595764, 0.00016544945538043976, 0.00017118453979492188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 13.0, 14.0, 19.0, 35.0, 41.0, 83.0, 94.0, 180.0, 285.0, 459.0, 917.0, 1976.0, 4778.0, 13973.0, 49610.0, 246174.0, 614926.0, 81917.0, 20983.0, 6751.0, 2591.0, 1229.0, 628.0, 292.0, 210.0, 129.0, 83.0, 46.0, 27.0, 19.0, 29.0, 7.0, 7.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68408203125, -0.6628189086914062, -0.6415557861328125, -0.6202926635742188, -0.599029541015625, -0.5777664184570312, -0.5565032958984375, -0.5352401733398438, -0.51397705078125, -0.49271392822265625, -0.4714508056640625, -0.45018768310546875, -0.428924560546875, -0.40766143798828125, -0.3863983154296875, -0.36513519287109375, -0.3438720703125, -0.32260894775390625, -0.3013458251953125, -0.28008270263671875, -0.258819580078125, -0.23755645751953125, -0.2162933349609375, -0.19503021240234375, -0.17376708984375, -0.15250396728515625, -0.1312408447265625, -0.10997772216796875, -0.088714599609375, -0.06745147705078125, -0.0461883544921875, -0.02492523193359375, -0.003662109375, 0.01760101318359375, 0.0388641357421875, 0.06012725830078125, 0.081390380859375, 0.10265350341796875, 0.1239166259765625, 0.14517974853515625, 0.16644287109375, 0.18770599365234375, 0.2089691162109375, 0.23023223876953125, 0.251495361328125, 0.27275848388671875, 0.2940216064453125, 0.31528472900390625, 0.3365478515625, 0.35781097412109375, 0.3790740966796875, 0.40033721923828125, 0.421600341796875, 0.44286346435546875, 0.4641265869140625, 0.48538970947265625, 0.50665283203125, 0.5279159545898438, 0.5491790771484375, 0.5704421997070312, 0.591705322265625, 0.6129684448242188, 0.6342315673828125, 0.6554946899414062, 0.6767578125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 8.0, 11.0, 9.0, 12.0, 15.0, 16.0, 31.0, 41.0, 40.0, 71.0, 73.0, 88.0, 85.0, 104.0, 81.0, 69.0, 71.0, 41.0, 27.0, 31.0, 13.0, 13.0, 12.0, 4.0, 8.0, 4.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83154296875, -0.8071060180664062, -0.7826690673828125, -0.7582321166992188, -0.733795166015625, -0.7093582153320312, -0.6849212646484375, -0.6604843139648438, -0.63604736328125, -0.6116104125976562, -0.5871734619140625, -0.5627365112304688, -0.538299560546875, -0.5138626098632812, -0.4894256591796875, -0.46498870849609375, -0.4405517578125, -0.41611480712890625, -0.3916778564453125, -0.36724090576171875, -0.342803955078125, -0.31836700439453125, -0.2939300537109375, -0.26949310302734375, -0.24505615234375, -0.22061920166015625, -0.1961822509765625, -0.17174530029296875, -0.147308349609375, -0.12287139892578125, -0.0984344482421875, -0.07399749755859375, -0.049560546875, -0.02512359619140625, -0.0006866455078125, 0.02375030517578125, 0.048187255859375, 0.07262420654296875, 0.0970611572265625, 0.12149810791015625, 0.14593505859375, 0.17037200927734375, 0.1948089599609375, 0.21924591064453125, 0.243682861328125, 0.26811981201171875, 0.2925567626953125, 0.31699371337890625, 0.3414306640625, 0.36586761474609375, 0.3903045654296875, 0.41474151611328125, 0.439178466796875, 0.46361541748046875, 0.4880523681640625, 0.5124893188476562, 0.53692626953125, 0.5613632202148438, 0.5858001708984375, 0.6102371215820312, 0.634674072265625, 0.6591110229492188, 0.6835479736328125, 0.7079849243164062, 0.732421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 20.0, 42.0, 91.0, 158.0, 387.0, 153.0, 72.0, 40.0, 14.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.47957420349121, -15.631742477416992, -14.783909797668457, -13.936078071594238, -13.088245391845703, -12.240413665771484, -11.392581939697266, -10.544750213623047, -9.696917533874512, -8.849085807800293, -8.001253128051758, -7.153421401977539, -6.305589199066162, -5.457756996154785, -4.609925270080566, -3.7620930671691895, -2.9142608642578125, -2.0664286613464355, -1.2185966968536377, -0.37076473236083984, 0.4770674705505371, 1.324899673461914, 2.172731399536133, 3.0205636024475098, 3.8683958053588867, 4.716228008270264, 5.564060211181641, 6.411891937255859, 7.259724140167236, 8.107556343078613, 8.955388069152832, 9.803220748901367, 10.651054382324219, 11.498886108398438, 12.346718788146973, 13.194550514221191, 14.042383193969727, 14.890214920043945, 15.738046646118164, 16.585878372192383, 17.433712005615234, 18.281543731689453, 19.129375457763672, 19.97720718383789, 20.825040817260742, 21.67287254333496, 22.52070426940918, 23.3685359954834, 24.216367721557617, 25.064199447631836, 25.912031173706055, 26.759864807128906, 27.607696533203125, 28.455528259277344, 29.303359985351562, 30.15119171142578, 30.9990234375, 31.84685516357422, 32.69468688964844, 33.542518615722656, 34.390350341796875, 35.238182067871094, 36.08601379394531, 36.9338493347168, 37.781681060791016]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 5.0, 6.0, 12.0, 10.0, 14.0, 24.0, 18.0, 27.0, 23.0, 34.0, 33.0, 25.0, 27.0, 46.0, 56.0, 91.0, 96.0, 72.0, 57.0, 43.0, 43.0, 35.0, 30.0, 31.0, 23.0, 20.0, 21.0, 17.0, 10.0, 8.0, 3.0, 7.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.414369583129883, -12.051536560058594, -11.688702583312988, -11.3258695602417, -10.963035583496094, -10.600202560424805, -10.237369537353516, -9.87453556060791, -9.511701583862305, -9.148868560791016, -8.78603458404541, -8.423201560974121, -8.060367584228516, -7.697534561157227, -7.334701061248779, -6.971867561340332, -6.609034538269043, -6.246201038360596, -5.883367538452148, -5.520534515380859, -5.157700538635254, -4.794867515563965, -4.432034015655518, -4.06920051574707, -3.706367015838623, -3.343533515930176, -2.9807000160217285, -2.6178667545318604, -2.255033254623413, -1.8921997547149658, -1.5293664932250977, -1.1665329933166504, -0.8036994934082031, -0.44086605310440063, -0.07803261280059814, 0.28480076789855957, 0.6476342678070068, 1.010467767715454, 1.3733010292053223, 1.7361345291137695, 2.098968029022217, 2.461801528930664, 2.8246350288391113, 3.1874682903289795, 3.5503017902374268, 3.913135290145874, 4.275968551635742, 4.6388020515441895, 5.001635551452637, 5.364469051361084, 5.727302551269531, 6.09013557434082, 6.452969551086426, 6.815802574157715, 7.178636074066162, 7.541469573974609, 7.904303073883057, 8.267136573791504, 8.629969596862793, 8.992803573608398, 9.355636596679688, 9.718470573425293, 10.081303596496582, 10.444137573242188, 10.806970596313477]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 14.0, 28.0, 27.0, 40.0, 56.0, 94.0, 159.0, 312.0, 609.0, 1287.0, 3261.0, 10315.0, 47231.0, 416061.0, 2712647.0, 896600.0, 83283.0, 14597.0, 4264.0, 1553.0, 803.0, 409.0, 182.0, 134.0, 81.0, 42.0, 40.0, 31.0, 24.0, 21.0, 12.0, 11.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4270782470703125, -1.380523681640625, -1.3339691162109375, -1.28741455078125, -1.2408599853515625, -1.194305419921875, -1.1477508544921875, -1.1011962890625, -1.0546417236328125, -1.008087158203125, -0.9615325927734375, -0.91497802734375, -0.8684234619140625, -0.821868896484375, -0.7753143310546875, -0.728759765625, -0.6822052001953125, -0.635650634765625, -0.5890960693359375, -0.54254150390625, -0.4959869384765625, -0.449432373046875, -0.4028778076171875, -0.3563232421875, -0.3097686767578125, -0.263214111328125, -0.2166595458984375, -0.17010498046875, -0.1235504150390625, -0.076995849609375, -0.0304412841796875, 0.01611328125, 0.0626678466796875, 0.109222412109375, 0.1557769775390625, 0.20233154296875, 0.2488861083984375, 0.295440673828125, 0.3419952392578125, 0.3885498046875, 0.4351043701171875, 0.481658935546875, 0.5282135009765625, 0.57476806640625, 0.6213226318359375, 0.667877197265625, 0.7144317626953125, 0.760986328125, 0.8075408935546875, 0.854095458984375, 0.9006500244140625, 0.94720458984375, 0.9937591552734375, 1.040313720703125, 1.0868682861328125, 1.1334228515625, 1.1799774169921875, 1.226531982421875, 1.2730865478515625, 1.31964111328125, 1.3661956787109375, 1.412750244140625, 1.4593048095703125, 1.505859375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 15.0, 11.0, 9.0, 17.0, 14.0, 20.0, 21.0, 34.0, 29.0, 39.0, 38.0, 28.0, 22.0, 42.0, 72.0, 47.0, 47.0, 52.0, 42.0, 50.0, 36.0, 53.0, 29.0, 40.0, 32.0, 21.0, 24.0, 19.0, 11.0, 15.0, 11.0, 4.0, 10.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7490234375, -0.723480224609375, -0.69793701171875, -0.672393798828125, -0.6468505859375, -0.621307373046875, -0.59576416015625, -0.570220947265625, -0.544677734375, -0.519134521484375, -0.49359130859375, -0.468048095703125, -0.4425048828125, -0.416961669921875, -0.39141845703125, -0.365875244140625, -0.34033203125, -0.314788818359375, -0.28924560546875, -0.263702392578125, -0.2381591796875, -0.212615966796875, -0.18707275390625, -0.161529541015625, -0.135986328125, -0.110443115234375, -0.08489990234375, -0.059356689453125, -0.0338134765625, -0.008270263671875, 0.01727294921875, 0.042816162109375, 0.068359375, 0.093902587890625, 0.11944580078125, 0.144989013671875, 0.1705322265625, 0.196075439453125, 0.22161865234375, 0.247161865234375, 0.272705078125, 0.298248291015625, 0.32379150390625, 0.349334716796875, 0.3748779296875, 0.400421142578125, 0.42596435546875, 0.451507568359375, 0.47705078125, 0.502593994140625, 0.52813720703125, 0.553680419921875, 0.5792236328125, 0.604766845703125, 0.63031005859375, 0.655853271484375, 0.681396484375, 0.706939697265625, 0.73248291015625, 0.758026123046875, 0.7835693359375, 0.809112548828125, 0.83465576171875, 0.860198974609375, 0.8857421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 10.0, 5.0, 15.0, 22.0, 39.0, 64.0, 122.0, 196.0, 410.0, 986.0, 3867.0, 47146.0, 3791599.0, 336237.0, 10488.0, 1827.0, 612.0, 281.0, 123.0, 90.0, 48.0, 40.0, 23.0, 16.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2337646484375, -4.100341796875, -3.9669189453125, -3.83349609375, -3.7000732421875, -3.566650390625, -3.4332275390625, -3.2998046875, -3.1663818359375, -3.032958984375, -2.8995361328125, -2.76611328125, -2.6326904296875, -2.499267578125, -2.3658447265625, -2.232421875, -2.0989990234375, -1.965576171875, -1.8321533203125, -1.69873046875, -1.5653076171875, -1.431884765625, -1.2984619140625, -1.1650390625, -1.0316162109375, -0.898193359375, -0.7647705078125, -0.63134765625, -0.4979248046875, -0.364501953125, -0.2310791015625, -0.09765625, 0.0357666015625, 0.169189453125, 0.3026123046875, 0.43603515625, 0.5694580078125, 0.702880859375, 0.8363037109375, 0.9697265625, 1.1031494140625, 1.236572265625, 1.3699951171875, 1.50341796875, 1.6368408203125, 1.770263671875, 1.9036865234375, 2.037109375, 2.1705322265625, 2.303955078125, 2.4373779296875, 2.57080078125, 2.7042236328125, 2.837646484375, 2.9710693359375, 3.1044921875, 3.2379150390625, 3.371337890625, 3.5047607421875, 3.63818359375, 3.7716064453125, 3.905029296875, 4.0384521484375, 4.171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 10.0, 9.0, 30.0, 39.0, 50.0, 109.0, 201.0, 412.0, 729.0, 1025.0, 698.0, 321.0, 145.0, 101.0, 59.0, 37.0, 34.0, 19.0, 15.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.489471435546875, -3.39105224609375, -3.292633056640625, -3.1942138671875, -3.095794677734375, -2.99737548828125, -2.898956298828125, -2.800537109375, -2.702117919921875, -2.60369873046875, -2.505279541015625, -2.4068603515625, -2.308441162109375, -2.21002197265625, -2.111602783203125, -2.01318359375, -1.914764404296875, -1.81634521484375, -1.717926025390625, -1.6195068359375, -1.521087646484375, -1.42266845703125, -1.324249267578125, -1.225830078125, -1.127410888671875, -1.02899169921875, -0.930572509765625, -0.8321533203125, -0.733734130859375, -0.63531494140625, -0.536895751953125, -0.4384765625, -0.340057373046875, -0.24163818359375, -0.143218994140625, -0.0447998046875, 0.053619384765625, 0.15203857421875, 0.250457763671875, 0.348876953125, 0.447296142578125, 0.54571533203125, 0.644134521484375, 0.7425537109375, 0.840972900390625, 0.93939208984375, 1.037811279296875, 1.13623046875, 1.234649658203125, 1.33306884765625, 1.431488037109375, 1.5299072265625, 1.628326416015625, 1.72674560546875, 1.825164794921875, 1.923583984375, 2.022003173828125, 2.12042236328125, 2.218841552734375, 2.3172607421875, 2.415679931640625, 2.51409912109375, 2.612518310546875, 2.7109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 10.0, 10.0, 63.0, 165.0, 328.0, 260.0, 98.0, 38.0, 23.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.391866683959961, -7.300963878631592, -6.210061073303223, -5.119158744812012, -4.028255939483643, -2.9373531341552734, -1.8464508056640625, -0.7555480003356934, 0.3353548049926758, 1.4262574911117554, 2.517160177230835, 3.608062744140625, 4.698965549468994, 5.789868354797363, 6.880770683288574, 7.971673488616943, 9.062576293945312, 10.153478622436523, 11.24438190460205, 12.335284233093262, 13.426187515258789, 14.51708984375, 15.607992172241211, 16.698894500732422, 17.789798736572266, 18.880701065063477, 19.971603393554688, 21.06250762939453, 22.153409957885742, 23.244312286376953, 24.335214614868164, 25.426116943359375, 26.517017364501953, 27.607919692993164, 28.698822021484375, 29.78972625732422, 30.88062858581543, 31.97153091430664, 33.06243133544922, 34.15333557128906, 35.244239807128906, 36.33514404296875, 37.42604446411133, 38.51694869995117, 39.60784912109375, 40.698753356933594, 41.78965759277344, 42.880558013916016, 43.971458435058594, 45.06236267089844, 46.153263092041016, 47.24416732788086, 48.33506774902344, 49.42597198486328, 50.516876220703125, 51.6077766418457, 52.69868087768555, 53.78958511352539, 54.88048553466797, 55.97138977050781, 57.06229019165039, 58.153194427490234, 59.24409484863281, 60.334999084472656, 61.4259033203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 9.0, 10.0, 16.0, 22.0, 19.0, 27.0, 39.0, 34.0, 30.0, 38.0, 43.0, 49.0, 66.0, 60.0, 71.0, 48.0, 52.0, 48.0, 27.0, 31.0, 44.0, 32.0, 21.0, 19.0, 15.0, 22.0, 20.0, 6.0, 11.0, 8.0, 11.0, 6.0, 7.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.874604225158691, -8.557976722717285, -8.241349220275879, -7.924721717834473, -7.608094215393066, -7.29146671295166, -6.974839210510254, -6.658211708068848, -6.341584205627441, -6.024956703186035, -5.708329200744629, -5.391701698303223, -5.075074195861816, -4.75844669342041, -4.441819190979004, -4.125191688537598, -3.808563709259033, -3.491936206817627, -3.1753087043762207, -2.8586812019348145, -2.542053699493408, -2.225426197052002, -1.9087984561920166, -1.5921709537506104, -1.275543451309204, -0.9589159488677979, -0.6422883868217468, -0.3256608247756958, -0.00903332233428955, 0.3075941801071167, 0.6242218017578125, 0.9408493041992188, 1.257476806640625, 1.5741043090820312, 1.8907318115234375, 2.2073593139648438, 2.52398681640625, 2.8406143188476562, 3.1572420597076416, 3.473869562149048, 3.790497064590454, 4.1071248054504395, 4.423752307891846, 4.740379810333252, 5.057007312774658, 5.3736348152160645, 5.690262317657471, 6.006889820098877, 6.323517322540283, 6.6401448249816895, 6.956772327423096, 7.273399829864502, 7.590027332305908, 7.9066548347473145, 8.223282814025879, 8.539910316467285, 8.856537818908691, 9.173165321350098, 9.489792823791504, 9.80642032623291, 10.123047828674316, 10.439675331115723, 10.756302833557129, 11.072930335998535, 11.389557838439941]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 8.0, 13.0, 17.0, 16.0, 42.0, 58.0, 83.0, 109.0, 190.0, 303.0, 471.0, 834.0, 1569.0, 2864.0, 5573.0, 11376.0, 24068.0, 56065.0, 136507.0, 301432.0, 285810.0, 125160.0, 51384.0, 22589.0, 10510.0, 5279.0, 2669.0, 1408.0, 853.0, 483.0, 264.0, 175.0, 115.0, 72.0, 42.0, 33.0, 20.0, 24.0, 20.0, 12.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4873046875, -1.442169189453125, -1.39703369140625, -1.351898193359375, -1.3067626953125, -1.261627197265625, -1.21649169921875, -1.171356201171875, -1.126220703125, -1.081085205078125, -1.03594970703125, -0.990814208984375, -0.9456787109375, -0.900543212890625, -0.85540771484375, -0.810272216796875, -0.76513671875, -0.720001220703125, -0.67486572265625, -0.629730224609375, -0.5845947265625, -0.539459228515625, -0.49432373046875, -0.449188232421875, -0.404052734375, -0.358917236328125, -0.31378173828125, -0.268646240234375, -0.2235107421875, -0.178375244140625, -0.13323974609375, -0.088104248046875, -0.04296875, 0.002166748046875, 0.04730224609375, 0.092437744140625, 0.1375732421875, 0.182708740234375, 0.22784423828125, 0.272979736328125, 0.318115234375, 0.363250732421875, 0.40838623046875, 0.453521728515625, 0.4986572265625, 0.543792724609375, 0.58892822265625, 0.634063720703125, 0.67919921875, 0.724334716796875, 0.76947021484375, 0.814605712890625, 0.8597412109375, 0.904876708984375, 0.95001220703125, 0.995147705078125, 1.040283203125, 1.085418701171875, 1.13055419921875, 1.175689697265625, 1.2208251953125, 1.265960693359375, 1.31109619140625, 1.356231689453125, 1.4013671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 15.0, 10.0, 12.0, 21.0, 18.0, 27.0, 34.0, 40.0, 40.0, 39.0, 46.0, 59.0, 58.0, 53.0, 69.0, 56.0, 57.0, 44.0, 48.0, 36.0, 29.0, 30.0, 25.0, 21.0, 24.0, 22.0, 14.0, 13.0, 5.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9149322509765625, -0.882598876953125, -0.8502655029296875, -0.81793212890625, -0.7855987548828125, -0.753265380859375, -0.7209320068359375, -0.6885986328125, -0.6562652587890625, -0.623931884765625, -0.5915985107421875, -0.55926513671875, -0.5269317626953125, -0.494598388671875, -0.4622650146484375, -0.429931640625, -0.3975982666015625, -0.365264892578125, -0.3329315185546875, -0.30059814453125, -0.2682647705078125, -0.235931396484375, -0.2035980224609375, -0.1712646484375, -0.1389312744140625, -0.106597900390625, -0.0742645263671875, -0.04193115234375, -0.0095977783203125, 0.022735595703125, 0.0550689697265625, 0.08740234375, 0.1197357177734375, 0.152069091796875, 0.1844024658203125, 0.21673583984375, 0.2490692138671875, 0.281402587890625, 0.3137359619140625, 0.3460693359375, 0.3784027099609375, 0.410736083984375, 0.4430694580078125, 0.47540283203125, 0.5077362060546875, 0.540069580078125, 0.5724029541015625, 0.604736328125, 0.6370697021484375, 0.669403076171875, 0.7017364501953125, 0.73406982421875, 0.7664031982421875, 0.798736572265625, 0.8310699462890625, 0.8634033203125, 0.8957366943359375, 0.928070068359375, 0.9604034423828125, 0.99273681640625, 1.0250701904296875, 1.057403564453125, 1.0897369384765625, 1.1220703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 17.0, 18.0, 19.0, 20.0, 45.0, 52.0, 75.0, 90.0, 148.0, 192.0, 275.0, 391.0, 623.0, 996.0, 1964.0, 4341.0, 12916.0, 52197.0, 315146.0, 576936.0, 58262.0, 13878.0, 4670.0, 2081.0, 1078.0, 653.0, 404.0, 311.0, 206.0, 126.0, 106.0, 74.0, 61.0, 50.0, 24.0, 31.0, 19.0, 15.0, 6.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.537109375, -2.457916259765625, -2.37872314453125, -2.299530029296875, -2.2203369140625, -2.141143798828125, -2.06195068359375, -1.982757568359375, -1.903564453125, -1.824371337890625, -1.74517822265625, -1.665985107421875, -1.5867919921875, -1.507598876953125, -1.42840576171875, -1.349212646484375, -1.27001953125, -1.190826416015625, -1.11163330078125, -1.032440185546875, -0.9532470703125, -0.874053955078125, -0.79486083984375, -0.715667724609375, -0.636474609375, -0.557281494140625, -0.47808837890625, -0.398895263671875, -0.3197021484375, -0.240509033203125, -0.16131591796875, -0.082122802734375, -0.0029296875, 0.076263427734375, 0.15545654296875, 0.234649658203125, 0.3138427734375, 0.393035888671875, 0.47222900390625, 0.551422119140625, 0.630615234375, 0.709808349609375, 0.78900146484375, 0.868194580078125, 0.9473876953125, 1.026580810546875, 1.10577392578125, 1.184967041015625, 1.26416015625, 1.343353271484375, 1.42254638671875, 1.501739501953125, 1.5809326171875, 1.660125732421875, 1.73931884765625, 1.818511962890625, 1.897705078125, 1.976898193359375, 2.05609130859375, 2.135284423828125, 2.2144775390625, 2.293670654296875, 2.37286376953125, 2.452056884765625, 2.53125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 8.0, 6.0, 12.0, 11.0, 11.0, 16.0, 19.0, 21.0, 25.0, 23.0, 35.0, 34.0, 49.0, 44.0, 57.0, 49.0, 55.0, 65.0, 55.0, 57.0, 51.0, 35.0, 44.0, 25.0, 28.0, 26.0, 29.0, 14.0, 18.0, 15.0, 7.0, 8.0, 13.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.17578125, -3.07257080078125, -2.9693603515625, -2.86614990234375, -2.762939453125, -2.65972900390625, -2.5565185546875, -2.45330810546875, -2.35009765625, -2.24688720703125, -2.1436767578125, -2.04046630859375, -1.937255859375, -1.83404541015625, -1.7308349609375, -1.62762451171875, -1.5244140625, -1.42120361328125, -1.3179931640625, -1.21478271484375, -1.111572265625, -1.00836181640625, -0.9051513671875, -0.80194091796875, -0.69873046875, -0.59552001953125, -0.4923095703125, -0.38909912109375, -0.285888671875, -0.18267822265625, -0.0794677734375, 0.02374267578125, 0.126953125, 0.23016357421875, 0.3333740234375, 0.43658447265625, 0.539794921875, 0.64300537109375, 0.7462158203125, 0.84942626953125, 0.95263671875, 1.05584716796875, 1.1590576171875, 1.26226806640625, 1.365478515625, 1.46868896484375, 1.5718994140625, 1.67510986328125, 1.7783203125, 1.88153076171875, 1.9847412109375, 2.08795166015625, 2.191162109375, 2.29437255859375, 2.3975830078125, 2.50079345703125, 2.60400390625, 2.70721435546875, 2.8104248046875, 2.91363525390625, 3.016845703125, 3.12005615234375, 3.2232666015625, 3.32647705078125, 3.4296875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 6.0, 14.0, 23.0, 35.0, 47.0, 55.0, 102.0, 153.0, 338.0, 716.0, 1724.0, 6063.0, 33057.0, 325285.0, 633021.0, 37557.0, 6938.0, 1908.0, 709.0, 326.0, 177.0, 94.0, 48.0, 60.0, 28.0, 25.0, 13.0, 10.0, 5.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0245819091796875, -0.994476318359375, -0.9643707275390625, -0.93426513671875, -0.9041595458984375, -0.874053955078125, -0.8439483642578125, -0.8138427734375, -0.7837371826171875, -0.753631591796875, -0.7235260009765625, -0.69342041015625, -0.6633148193359375, -0.633209228515625, -0.6031036376953125, -0.572998046875, -0.5428924560546875, -0.512786865234375, -0.4826812744140625, -0.45257568359375, -0.4224700927734375, -0.392364501953125, -0.3622589111328125, -0.3321533203125, -0.3020477294921875, -0.271942138671875, -0.2418365478515625, -0.21173095703125, -0.1816253662109375, -0.151519775390625, -0.1214141845703125, -0.09130859375, -0.0612030029296875, -0.031097412109375, -0.0009918212890625, 0.02911376953125, 0.0592193603515625, 0.089324951171875, 0.1194305419921875, 0.1495361328125, 0.1796417236328125, 0.209747314453125, 0.2398529052734375, 0.26995849609375, 0.3000640869140625, 0.330169677734375, 0.3602752685546875, 0.390380859375, 0.4204864501953125, 0.450592041015625, 0.4806976318359375, 0.51080322265625, 0.5409088134765625, 0.571014404296875, 0.6011199951171875, 0.6312255859375, 0.6613311767578125, 0.691436767578125, 0.7215423583984375, 0.75164794921875, 0.7817535400390625, 0.811859130859375, 0.8419647216796875, 0.8720703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 8.0, 4.0, 12.0, 23.0, 34.0, 36.0, 30.0, 33.0, 67.0, 59.0, 93.0, 115.0, 94.0, 82.0, 70.0, 51.0, 41.0, 27.0, 25.0, 17.0, 14.0, 13.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002989768981933594, -0.00029057078063488007, -0.00028216466307640076, -0.00027375854551792145, -0.00026535242795944214, -0.00025694631040096283, -0.0002485401928424835, -0.0002401340752840042, -0.0002317279577255249, -0.0002233218401670456, -0.00021491572260856628, -0.00020650960505008698, -0.00019810348749160767, -0.00018969736993312836, -0.00018129125237464905, -0.00017288513481616974, -0.00016447901725769043, -0.00015607289969921112, -0.0001476667821407318, -0.0001392606645822525, -0.0001308545470237732, -0.00012244842946529388, -0.00011404231190681458, -0.00010563619434833527, -9.723007678985596e-05, -8.882395923137665e-05, -8.041784167289734e-05, -7.201172411441803e-05, -6.360560655593872e-05, -5.519948899745941e-05, -4.67933714389801e-05, -3.8387253880500793e-05, -2.9981136322021484e-05, -2.1575018763542175e-05, -1.3168901205062866e-05, -4.762783646583557e-06, 3.643333911895752e-06, 1.2049451470375061e-05, 2.045556902885437e-05, 2.886168658733368e-05, 3.726780414581299e-05, 4.56739217042923e-05, 5.4080039262771606e-05, 6.248615682125092e-05, 7.089227437973022e-05, 7.929839193820953e-05, 8.770450949668884e-05, 9.611062705516815e-05, 0.00010451674461364746, 0.00011292286217212677, 0.00012132897973060608, 0.0001297350972890854, 0.0001381412148475647, 0.000146547332406044, 0.00015495344996452332, 0.00016335956752300262, 0.00017176568508148193, 0.00018017180263996124, 0.00018857792019844055, 0.00019698403775691986, 0.00020539015531539917, 0.00021379627287387848, 0.0002222023904323578, 0.0002306085079908371, 0.0002390146255493164]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 11.0, 11.0, 14.0, 9.0, 26.0, 41.0, 50.0, 65.0, 104.0, 144.0, 232.0, 344.0, 629.0, 994.0, 1962.0, 4409.0, 12340.0, 46250.0, 215397.0, 643347.0, 88117.0, 21110.0, 6815.0, 2791.0, 1347.0, 752.0, 429.0, 262.0, 167.0, 125.0, 83.0, 44.0, 30.0, 26.0, 24.0, 11.0, 15.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.599609375, -0.5820846557617188, -0.5645599365234375, -0.5470352172851562, -0.529510498046875, -0.5119857788085938, -0.4944610595703125, -0.47693634033203125, -0.45941162109375, -0.44188690185546875, -0.4243621826171875, -0.40683746337890625, -0.389312744140625, -0.37178802490234375, -0.3542633056640625, -0.33673858642578125, -0.3192138671875, -0.30168914794921875, -0.2841644287109375, -0.26663970947265625, -0.249114990234375, -0.23159027099609375, -0.2140655517578125, -0.19654083251953125, -0.17901611328125, -0.16149139404296875, -0.1439666748046875, -0.12644195556640625, -0.108917236328125, -0.09139251708984375, -0.0738677978515625, -0.05634307861328125, -0.038818359375, -0.02129364013671875, -0.0037689208984375, 0.01375579833984375, 0.031280517578125, 0.04880523681640625, 0.0663299560546875, 0.08385467529296875, 0.10137939453125, 0.11890411376953125, 0.1364288330078125, 0.15395355224609375, 0.171478271484375, 0.18900299072265625, 0.2065277099609375, 0.22405242919921875, 0.2415771484375, 0.25910186767578125, 0.2766265869140625, 0.29415130615234375, 0.311676025390625, 0.32920074462890625, 0.3467254638671875, 0.36425018310546875, 0.38177490234375, 0.39929962158203125, 0.4168243408203125, 0.43434906005859375, 0.451873779296875, 0.46939849853515625, 0.4869232177734375, 0.5044479370117188, 0.52197265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 15.0, 10.0, 18.0, 21.0, 27.0, 22.0, 31.0, 34.0, 40.0, 42.0, 42.0, 55.0, 88.0, 57.0, 67.0, 62.0, 61.0, 37.0, 52.0, 31.0, 23.0, 23.0, 26.0, 15.0, 13.0, 8.0, 10.0, 11.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.6171875, -0.5996856689453125, -0.582183837890625, -0.5646820068359375, -0.54718017578125, -0.5296783447265625, -0.512176513671875, -0.4946746826171875, -0.4771728515625, -0.4596710205078125, -0.442169189453125, -0.4246673583984375, -0.40716552734375, -0.3896636962890625, -0.372161865234375, -0.3546600341796875, -0.337158203125, -0.3196563720703125, -0.302154541015625, -0.2846527099609375, -0.26715087890625, -0.2496490478515625, -0.232147216796875, -0.2146453857421875, -0.1971435546875, -0.1796417236328125, -0.162139892578125, -0.1446380615234375, -0.12713623046875, -0.1096343994140625, -0.092132568359375, -0.0746307373046875, -0.05712890625, -0.0396270751953125, -0.022125244140625, -0.0046234130859375, 0.01287841796875, 0.0303802490234375, 0.047882080078125, 0.0653839111328125, 0.0828857421875, 0.1003875732421875, 0.117889404296875, 0.1353912353515625, 0.15289306640625, 0.1703948974609375, 0.187896728515625, 0.2053985595703125, 0.222900390625, 0.2404022216796875, 0.257904052734375, 0.2754058837890625, 0.29290771484375, 0.3104095458984375, 0.327911376953125, 0.3454132080078125, 0.3629150390625, 0.3804168701171875, 0.397918701171875, 0.4154205322265625, 0.43292236328125, 0.4504241943359375, 0.467926025390625, 0.4854278564453125, 0.5029296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 6.0, 26.0, 23.0, 67.0, 158.0, 388.0, 162.0, 90.0, 39.0, 19.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.272552490234375, -31.393699645996094, -30.514846801757812, -29.63599395751953, -28.757139205932617, -27.878286361694336, -26.999433517456055, -26.120580673217773, -25.24172592163086, -24.362873077392578, -23.484020233154297, -22.605167388916016, -21.7263126373291, -20.84745979309082, -19.96860694885254, -19.089754104614258, -18.210901260375977, -17.332048416137695, -16.453195571899414, -15.574341773986816, -14.695487976074219, -13.816635131835938, -12.937782287597656, -12.058929443359375, -11.180075645446777, -10.301222801208496, -9.422369003295898, -8.543516159057617, -7.664662837982178, -6.785809516906738, -5.906956672668457, -5.028103351593018, -4.149250030517578, -3.2703967094421387, -2.3915436267852783, -1.512690544128418, -0.6338372230529785, 0.24501609802246094, 1.1238689422607422, 2.0027222633361816, 2.881575584411621, 3.7604289054870605, 4.6392822265625, 5.518135070800781, 6.396988391876221, 7.27584171295166, 8.154694557189941, 9.033548355102539, 9.91240119934082, 10.791254043579102, 11.6701078414917, 12.54896068572998, 13.427814483642578, 14.30666732788086, 15.18552017211914, 16.064373016357422, 16.943225860595703, 17.822078704833984, 18.700931549072266, 19.579784393310547, 20.45863914489746, 21.337491989135742, 22.216344833374023, 23.095197677612305, 23.97405242919922]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 11.0, 13.0, 13.0, 14.0, 24.0, 27.0, 37.0, 26.0, 32.0, 29.0, 49.0, 78.0, 175.0, 137.0, 46.0, 39.0, 39.0, 31.0, 31.0, 17.0, 25.0, 16.0, 17.0, 17.0, 11.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.693618774414062, -13.216774940490723, -12.739931106567383, -12.26308822631836, -11.78624439239502, -11.30940055847168, -10.83255672454834, -10.355712890625, -9.878870010375977, -9.402026176452637, -8.925182342529297, -8.448339462280273, -7.971495628356934, -7.494651794433594, -7.017807960510254, -6.540964603424072, -6.064120769500732, -5.587276935577393, -5.110433578491211, -4.633589744567871, -4.1567463874816895, -3.6799025535583496, -3.203058958053589, -2.726215362548828, -2.2493717670440674, -1.7725281715393066, -1.295684576034546, -0.8188408613204956, -0.34199726581573486, 0.13484644889831543, 0.6116900444030762, 1.088533639907837, 1.5653772354125977, 2.0422208309173584, 2.519064426422119, 2.995908260345459, 3.4727516174316406, 3.9495954513549805, 4.42643928527832, 4.903282642364502, 5.380125999450684, 5.856969833374023, 6.333813190460205, 6.810657024383545, 7.287500381469727, 7.764344215393066, 8.241188049316406, 8.71803092956543, 9.194875717163086, 9.671719551086426, 10.148563385009766, 10.625406265258789, 11.102250099182129, 11.579093933105469, 12.055937767028809, 12.532781600952148, 13.009624481201172, 13.486468315124512, 13.963312149047852, 14.440155029296875, 14.916998863220215, 15.393842697143555, 15.870686531066895, 16.347530364990234, 16.824373245239258]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 12.0, 10.0, 16.0, 12.0, 22.0, 32.0, 52.0, 82.0, 133.0, 225.0, 320.0, 495.0, 932.0, 1581.0, 3039.0, 6469.0, 16811.0, 51803.0, 197820.0, 818904.0, 1835094.0, 945474.0, 227536.0, 55396.0, 17473.0, 6934.0, 3294.0, 1640.0, 968.0, 559.0, 382.0, 258.0, 142.0, 117.0, 74.0, 41.0, 23.0, 20.0, 18.0, 14.0, 5.0, 11.0, 12.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.267578125, -1.2274017333984375, -1.187225341796875, -1.1470489501953125, -1.10687255859375, -1.0666961669921875, -1.026519775390625, -0.9863433837890625, -0.9461669921875, -0.9059906005859375, -0.865814208984375, -0.8256378173828125, -0.78546142578125, -0.7452850341796875, -0.705108642578125, -0.6649322509765625, -0.624755859375, -0.5845794677734375, -0.544403076171875, -0.5042266845703125, -0.46405029296875, -0.4238739013671875, -0.383697509765625, -0.3435211181640625, -0.3033447265625, -0.2631683349609375, -0.222991943359375, -0.1828155517578125, -0.14263916015625, -0.1024627685546875, -0.062286376953125, -0.0221099853515625, 0.01806640625, 0.0582427978515625, 0.098419189453125, 0.1385955810546875, 0.17877197265625, 0.2189483642578125, 0.259124755859375, 0.2993011474609375, 0.3394775390625, 0.3796539306640625, 0.419830322265625, 0.4600067138671875, 0.50018310546875, 0.5403594970703125, 0.580535888671875, 0.6207122802734375, 0.660888671875, 0.7010650634765625, 0.741241455078125, 0.7814178466796875, 0.82159423828125, 0.8617706298828125, 0.901947021484375, 0.9421234130859375, 0.9822998046875, 1.0224761962890625, 1.062652587890625, 1.1028289794921875, 1.14300537109375, 1.1831817626953125, 1.223358154296875, 1.2635345458984375, 1.3037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 11.0, 18.0, 20.0, 27.0, 25.0, 23.0, 29.0, 46.0, 41.0, 51.0, 53.0, 60.0, 50.0, 65.0, 52.0, 49.0, 44.0, 48.0, 41.0, 34.0, 40.0, 31.0, 28.0, 14.0, 15.0, 12.0, 14.0, 11.0, 9.0, 8.0, 2.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6739730834960938, -0.6453094482421875, -0.6166458129882812, -0.587982177734375, -0.5593185424804688, -0.5306549072265625, -0.5019912719726562, -0.47332763671875, -0.44466400146484375, -0.4160003662109375, -0.38733673095703125, -0.358673095703125, -0.33000946044921875, -0.3013458251953125, -0.27268218994140625, -0.2440185546875, -0.21535491943359375, -0.1866912841796875, -0.15802764892578125, -0.129364013671875, -0.10070037841796875, -0.0720367431640625, -0.04337310791015625, -0.01470947265625, 0.01395416259765625, 0.0426177978515625, 0.07128143310546875, 0.099945068359375, 0.12860870361328125, 0.1572723388671875, 0.18593597412109375, 0.214599609375, 0.24326324462890625, 0.2719268798828125, 0.30059051513671875, 0.329254150390625, 0.35791778564453125, 0.3865814208984375, 0.41524505615234375, 0.44390869140625, 0.47257232666015625, 0.5012359619140625, 0.5298995971679688, 0.558563232421875, 0.5872268676757812, 0.6158905029296875, 0.6445541381835938, 0.6732177734375, 0.7018814086914062, 0.7305450439453125, 0.7592086791992188, 0.787872314453125, 0.8165359497070312, 0.8451995849609375, 0.8738632202148438, 0.90252685546875, 0.9311904907226562, 0.9598541259765625, 0.9885177612304688, 1.017181396484375, 1.0458450317382812, 1.0745086669921875, 1.1031723022460938, 1.1318359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 11.0, 10.0, 20.0, 43.0, 68.0, 153.0, 251.0, 628.0, 1675.0, 6606.0, 123414.0, 4012209.0, 42145.0, 4498.0, 1388.0, 561.0, 244.0, 138.0, 68.0, 44.0, 26.0, 20.0, 13.0, 7.0, 5.0, 4.0, 6.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.23724365234375, -6.0174560546875, -5.79766845703125, -5.577880859375, -5.35809326171875, -5.1383056640625, -4.91851806640625, -4.69873046875, -4.47894287109375, -4.2591552734375, -4.03936767578125, -3.819580078125, -3.59979248046875, -3.3800048828125, -3.16021728515625, -2.9404296875, -2.72064208984375, -2.5008544921875, -2.28106689453125, -2.061279296875, -1.84149169921875, -1.6217041015625, -1.40191650390625, -1.18212890625, -0.96234130859375, -0.7425537109375, -0.52276611328125, -0.302978515625, -0.08319091796875, 0.1365966796875, 0.35638427734375, 0.576171875, 0.79595947265625, 1.0157470703125, 1.23553466796875, 1.455322265625, 1.67510986328125, 1.8948974609375, 2.11468505859375, 2.33447265625, 2.55426025390625, 2.7740478515625, 2.99383544921875, 3.213623046875, 3.43341064453125, 3.6531982421875, 3.87298583984375, 4.0927734375, 4.31256103515625, 4.5323486328125, 4.75213623046875, 4.971923828125, 5.19171142578125, 5.4114990234375, 5.63128662109375, 5.85107421875, 6.07086181640625, 6.2906494140625, 6.51043701171875, 6.730224609375, 6.95001220703125, 7.1697998046875, 7.38958740234375, 7.609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 9.0, 13.0, 14.0, 24.0, 34.0, 37.0, 68.0, 92.0, 154.0, 194.0, 322.0, 444.0, 616.0, 615.0, 463.0, 317.0, 221.0, 138.0, 79.0, 77.0, 34.0, 22.0, 34.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -1.978363037109375, -1.86883544921875, -1.759307861328125, -1.6497802734375, -1.540252685546875, -1.43072509765625, -1.321197509765625, -1.211669921875, -1.102142333984375, -0.99261474609375, -0.883087158203125, -0.7735595703125, -0.664031982421875, -0.55450439453125, -0.444976806640625, -0.33544921875, -0.225921630859375, -0.11639404296875, -0.006866455078125, 0.1026611328125, 0.212188720703125, 0.32171630859375, 0.431243896484375, 0.540771484375, 0.650299072265625, 0.75982666015625, 0.869354248046875, 0.9788818359375, 1.088409423828125, 1.19793701171875, 1.307464599609375, 1.4169921875, 1.526519775390625, 1.63604736328125, 1.745574951171875, 1.8551025390625, 1.964630126953125, 2.07415771484375, 2.183685302734375, 2.293212890625, 2.402740478515625, 2.51226806640625, 2.621795654296875, 2.7313232421875, 2.840850830078125, 2.95037841796875, 3.059906005859375, 3.16943359375, 3.278961181640625, 3.38848876953125, 3.498016357421875, 3.6075439453125, 3.717071533203125, 3.82659912109375, 3.936126708984375, 4.045654296875, 4.155181884765625, 4.26470947265625, 4.374237060546875, 4.4837646484375, 4.593292236328125, 4.70281982421875, 4.812347412109375, 4.921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 8.0, 6.0, 17.0, 43.0, 89.0, 212.0, 333.0, 173.0, 66.0, 33.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6939582824707, -32.69845199584961, -30.70294761657715, -28.707443237304688, -26.711936950683594, -24.716432571411133, -22.720928192138672, -20.725421905517578, -18.729917526245117, -16.734413146972656, -14.738906860351562, -12.743402481079102, -10.747897148132324, -8.752391815185547, -6.756887435913086, -4.761382102966309, -2.7658767700195312, -0.770371675491333, 1.2251334190368652, 3.2206382751464844, 5.216143608093262, 7.211648941040039, 9.2071533203125, 11.202658653259277, 13.198163986206055, 15.193669319152832, 17.18917465209961, 19.18467903137207, 21.18018341064453, 23.175689697265625, 25.171194076538086, 27.166698455810547, 29.162208557128906, 31.157712936401367, 33.15321731567383, 35.14872360229492, 37.144229888916016, 39.139732360839844, 41.13523864746094, 43.13074493408203, 45.126251220703125, 47.12175750732422, 49.11725997924805, 51.11276626586914, 53.108272552490234, 55.10377502441406, 57.099281311035156, 59.09478759765625, 61.09029006958008, 63.08579635620117, 65.081298828125, 67.0768051147461, 69.07231140136719, 71.06781768798828, 73.06332397460938, 75.05882263183594, 77.05432891845703, 79.04983520507812, 81.04534149169922, 83.04084777832031, 85.03634643554688, 87.03185272216797, 89.02735900878906, 91.02286529541016, 93.01837158203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 11.0, 13.0, 16.0, 13.0, 21.0, 18.0, 20.0, 19.0, 34.0, 38.0, 36.0, 36.0, 36.0, 58.0, 76.0, 69.0, 69.0, 47.0, 51.0, 39.0, 37.0, 43.0, 19.0, 25.0, 21.0, 20.0, 19.0, 15.0, 10.0, 13.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.473234176635742, -19.86264419555664, -19.25205421447754, -18.641464233398438, -18.030874252319336, -17.420284271240234, -16.809694290161133, -16.19910430908203, -15.588515281677246, -14.977925300598145, -14.367335319519043, -13.756745338439941, -13.146156311035156, -12.535566329956055, -11.924976348876953, -11.314386367797852, -10.70379638671875, -10.093206405639648, -9.482616424560547, -8.872026443481445, -8.261436462402344, -7.6508469581604, -7.040257453918457, -6.4296674728393555, -5.819077491760254, -5.208487510681152, -4.597897529602051, -3.9873080253601074, -3.376718044281006, -2.7661280632019043, -2.155538320541382, -1.5449485778808594, -0.934356689453125, -0.323766827583313, 0.286823034286499, 0.897412896156311, 1.508002758026123, 2.1185927391052246, 2.729182481765747, 3.3397722244262695, 3.950362205505371, 4.560952186584473, 5.171542167663574, 5.782131671905518, 6.392721652984619, 7.003311634063721, 7.613901138305664, 8.224491119384766, 8.835081100463867, 9.445671081542969, 10.05626106262207, 10.666851043701172, 11.277441024780273, 11.888031005859375, 12.49862003326416, 13.109210014343262, 13.719799995422363, 14.330389976501465, 14.940979957580566, 15.551569938659668, 16.162158966064453, 16.772748947143555, 17.383338928222656, 17.993928909301758, 18.60451889038086]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 8.0, 9.0, 15.0, 16.0, 30.0, 37.0, 54.0, 101.0, 171.0, 376.0, 809.0, 2093.0, 5788.0, 19708.0, 92192.0, 635707.0, 234704.0, 40599.0, 10328.0, 3371.0, 1298.0, 532.0, 249.0, 138.0, 89.0, 45.0, 29.0, 18.0, 13.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.828125, -2.739044189453125, -2.64996337890625, -2.560882568359375, -2.4718017578125, -2.382720947265625, -2.29364013671875, -2.204559326171875, -2.115478515625, -2.026397705078125, -1.93731689453125, -1.848236083984375, -1.7591552734375, -1.670074462890625, -1.58099365234375, -1.491912841796875, -1.40283203125, -1.313751220703125, -1.22467041015625, -1.135589599609375, -1.0465087890625, -0.957427978515625, -0.86834716796875, -0.779266357421875, -0.690185546875, -0.601104736328125, -0.51202392578125, -0.422943115234375, -0.3338623046875, -0.244781494140625, -0.15570068359375, -0.066619873046875, 0.0224609375, 0.111541748046875, 0.20062255859375, 0.289703369140625, 0.3787841796875, 0.467864990234375, 0.55694580078125, 0.646026611328125, 0.735107421875, 0.824188232421875, 0.91326904296875, 1.002349853515625, 1.0914306640625, 1.180511474609375, 1.26959228515625, 1.358673095703125, 1.44775390625, 1.536834716796875, 1.62591552734375, 1.714996337890625, 1.8040771484375, 1.893157958984375, 1.98223876953125, 2.071319580078125, 2.160400390625, 2.249481201171875, 2.33856201171875, 2.427642822265625, 2.5167236328125, 2.605804443359375, 2.69488525390625, 2.783966064453125, 2.873046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 7.0, 13.0, 22.0, 24.0, 34.0, 35.0, 44.0, 55.0, 71.0, 82.0, 71.0, 81.0, 66.0, 67.0, 58.0, 56.0, 47.0, 34.0, 30.0, 25.0, 18.0, 17.0, 11.0, 10.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.4566497802734375, -1.405487060546875, -1.3543243408203125, -1.30316162109375, -1.2519989013671875, -1.200836181640625, -1.1496734619140625, -1.0985107421875, -1.0473480224609375, -0.996185302734375, -0.9450225830078125, -0.89385986328125, -0.8426971435546875, -0.791534423828125, -0.7403717041015625, -0.689208984375, -0.6380462646484375, -0.586883544921875, -0.5357208251953125, -0.48455810546875, -0.4333953857421875, -0.382232666015625, -0.3310699462890625, -0.2799072265625, -0.2287445068359375, -0.177581787109375, -0.1264190673828125, -0.07525634765625, -0.0240936279296875, 0.027069091796875, 0.0782318115234375, 0.12939453125, 0.1805572509765625, 0.231719970703125, 0.2828826904296875, 0.33404541015625, 0.3852081298828125, 0.436370849609375, 0.4875335693359375, 0.5386962890625, 0.5898590087890625, 0.641021728515625, 0.6921844482421875, 0.74334716796875, 0.7945098876953125, 0.845672607421875, 0.8968353271484375, 0.947998046875, 0.9991607666015625, 1.050323486328125, 1.1014862060546875, 1.15264892578125, 1.2038116455078125, 1.254974365234375, 1.3061370849609375, 1.3572998046875, 1.4084625244140625, 1.459625244140625, 1.5107879638671875, 1.56195068359375, 1.6131134033203125, 1.664276123046875, 1.7154388427734375, 1.7666015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 7.0, 8.0, 5.0, 8.0, 13.0, 14.0, 29.0, 34.0, 60.0, 83.0, 112.0, 213.0, 286.0, 515.0, 1015.0, 2383.0, 7031.0, 31743.0, 700090.0, 266509.0, 27463.0, 6460.0, 2163.0, 967.0, 505.0, 279.0, 191.0, 111.0, 88.0, 51.0, 32.0, 25.0, 16.0, 9.0, 8.0, 5.0, 5.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1015625, -3.01531982421875, -2.9290771484375, -2.84283447265625, -2.756591796875, -2.67034912109375, -2.5841064453125, -2.49786376953125, -2.41162109375, -2.32537841796875, -2.2391357421875, -2.15289306640625, -2.066650390625, -1.98040771484375, -1.8941650390625, -1.80792236328125, -1.7216796875, -1.63543701171875, -1.5491943359375, -1.46295166015625, -1.376708984375, -1.29046630859375, -1.2042236328125, -1.11798095703125, -1.03173828125, -0.94549560546875, -0.8592529296875, -0.77301025390625, -0.686767578125, -0.60052490234375, -0.5142822265625, -0.42803955078125, -0.341796875, -0.25555419921875, -0.1693115234375, -0.08306884765625, 0.003173828125, 0.08941650390625, 0.1756591796875, 0.26190185546875, 0.34814453125, 0.43438720703125, 0.5206298828125, 0.60687255859375, 0.693115234375, 0.77935791015625, 0.8656005859375, 0.95184326171875, 1.0380859375, 1.12432861328125, 1.2105712890625, 1.29681396484375, 1.383056640625, 1.46929931640625, 1.5555419921875, 1.64178466796875, 1.72802734375, 1.81427001953125, 1.9005126953125, 1.98675537109375, 2.072998046875, 2.15924072265625, 2.2454833984375, 2.33172607421875, 2.41796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 6.0, 12.0, 11.0, 14.0, 11.0, 11.0, 20.0, 18.0, 14.0, 19.0, 28.0, 29.0, 28.0, 56.0, 58.0, 62.0, 76.0, 78.0, 59.0, 56.0, 48.0, 42.0, 35.0, 21.0, 16.0, 18.0, 20.0, 15.0, 18.0, 12.0, 16.0, 12.0, 13.0, 7.0, 7.0, 2.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-4.78515625, -4.65924072265625, -4.5333251953125, -4.40740966796875, -4.281494140625, -4.15557861328125, -4.0296630859375, -3.90374755859375, -3.77783203125, -3.65191650390625, -3.5260009765625, -3.40008544921875, -3.274169921875, -3.14825439453125, -3.0223388671875, -2.89642333984375, -2.7705078125, -2.64459228515625, -2.5186767578125, -2.39276123046875, -2.266845703125, -2.14093017578125, -2.0150146484375, -1.88909912109375, -1.76318359375, -1.63726806640625, -1.5113525390625, -1.38543701171875, -1.259521484375, -1.13360595703125, -1.0076904296875, -0.88177490234375, -0.755859375, -0.62994384765625, -0.5040283203125, -0.37811279296875, -0.252197265625, -0.12628173828125, -0.0003662109375, 0.12554931640625, 0.25146484375, 0.37738037109375, 0.5032958984375, 0.62921142578125, 0.755126953125, 0.88104248046875, 1.0069580078125, 1.13287353515625, 1.2587890625, 1.38470458984375, 1.5106201171875, 1.63653564453125, 1.762451171875, 1.88836669921875, 2.0142822265625, 2.14019775390625, 2.26611328125, 2.39202880859375, 2.5179443359375, 2.64385986328125, 2.769775390625, 2.89569091796875, 3.0216064453125, 3.14752197265625, 3.2734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 15.0, 16.0, 16.0, 26.0, 34.0, 36.0, 60.0, 89.0, 135.0, 253.0, 520.0, 1129.0, 3118.0, 10839.0, 54129.0, 886679.0, 72276.0, 12830.0, 3697.0, 1282.0, 597.0, 286.0, 156.0, 86.0, 74.0, 39.0, 29.0, 24.0, 7.0, 15.0, 13.0, 10.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.6442337036132812, -0.6190338134765625, -0.5938339233398438, -0.568634033203125, -0.5434341430664062, -0.5182342529296875, -0.49303436279296875, -0.46783447265625, -0.44263458251953125, -0.4174346923828125, -0.39223480224609375, -0.367034912109375, -0.34183502197265625, -0.3166351318359375, -0.29143524169921875, -0.2662353515625, -0.24103546142578125, -0.2158355712890625, -0.19063568115234375, -0.165435791015625, -0.14023590087890625, -0.1150360107421875, -0.08983612060546875, -0.06463623046875, -0.03943634033203125, -0.0142364501953125, 0.01096343994140625, 0.036163330078125, 0.06136322021484375, 0.0865631103515625, 0.11176300048828125, 0.136962890625, 0.16216278076171875, 0.1873626708984375, 0.21256256103515625, 0.237762451171875, 0.26296234130859375, 0.2881622314453125, 0.31336212158203125, 0.33856201171875, 0.36376190185546875, 0.3889617919921875, 0.41416168212890625, 0.439361572265625, 0.46456146240234375, 0.4897613525390625, 0.5149612426757812, 0.5401611328125, 0.5653610229492188, 0.5905609130859375, 0.6157608032226562, 0.640960693359375, 0.6661605834960938, 0.6913604736328125, 0.7165603637695312, 0.74176025390625, 0.7669601440429688, 0.7921600341796875, 0.8173599243164062, 0.842559814453125, 0.8677597045898438, 0.8929595947265625, 0.9181594848632812, 0.943359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 2.0, 8.0, 4.0, 20.0, 15.0, 30.0, 33.0, 58.0, 74.0, 103.0, 146.0, 143.0, 95.0, 60.0, 54.0, 26.0, 27.0, 20.0, 17.0, 6.0, 11.0, 12.0, 3.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003075599670410156, -0.00029921717941761017, -0.0002908743917942047, -0.00028253160417079926, -0.0002741888165473938, -0.00026584602892398834, -0.0002575032413005829, -0.00024916045367717743, -0.00024081766605377197, -0.00023247487843036652, -0.00022413209080696106, -0.0002157893031835556, -0.00020744651556015015, -0.0001991037279367447, -0.00019076094031333923, -0.00018241815268993378, -0.00017407536506652832, -0.00016573257744312286, -0.0001573897898197174, -0.00014904700219631195, -0.0001407042145729065, -0.00013236142694950104, -0.00012401863932609558, -0.00011567585170269012, -0.00010733306407928467, -9.899027645587921e-05, -9.064748883247375e-05, -8.23047012090683e-05, -7.396191358566284e-05, -6.561912596225739e-05, -5.727633833885193e-05, -4.893355071544647e-05, -4.0590763092041016e-05, -3.224797546863556e-05, -2.3905187845230103e-05, -1.5562400221824646e-05, -7.2196125984191895e-06, 1.123175024986267e-06, 9.465962648391724e-06, 1.780875027179718e-05, 2.6151537895202637e-05, 3.449432551860809e-05, 4.283711314201355e-05, 5.1179900765419006e-05, 5.952268838882446e-05, 6.786547601222992e-05, 7.620826363563538e-05, 8.455105125904083e-05, 9.289383888244629e-05, 0.00010123662650585175, 0.0001095794141292572, 0.00011792220175266266, 0.00012626498937606812, 0.00013460777699947357, 0.00014295056462287903, 0.00015129335224628448, 0.00015963613986968994, 0.0001679789274930954, 0.00017632171511650085, 0.0001846645027399063, 0.00019300729036331177, 0.00020135007798671722, 0.00020969286561012268, 0.00021803565323352814, 0.0002263784408569336]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 11.0, 14.0, 25.0, 50.0, 90.0, 198.0, 452.0, 1354.0, 4828.0, 27074.0, 890518.0, 108929.0, 10966.0, 2560.0, 822.0, 311.0, 155.0, 73.0, 37.0, 23.0, 18.0, 4.0, 4.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8313751220703125, -0.804351806640625, -0.7773284912109375, -0.75030517578125, -0.7232818603515625, -0.696258544921875, -0.6692352294921875, -0.6422119140625, -0.6151885986328125, -0.588165283203125, -0.5611419677734375, -0.53411865234375, -0.5070953369140625, -0.480072021484375, -0.4530487060546875, -0.426025390625, -0.3990020751953125, -0.371978759765625, -0.3449554443359375, -0.31793212890625, -0.2909088134765625, -0.263885498046875, -0.2368621826171875, -0.2098388671875, -0.1828155517578125, -0.155792236328125, -0.1287689208984375, -0.10174560546875, -0.0747222900390625, -0.047698974609375, -0.0206756591796875, 0.00634765625, 0.0333709716796875, 0.060394287109375, 0.0874176025390625, 0.11444091796875, 0.1414642333984375, 0.168487548828125, 0.1955108642578125, 0.2225341796875, 0.2495574951171875, 0.276580810546875, 0.3036041259765625, 0.33062744140625, 0.3576507568359375, 0.384674072265625, 0.4116973876953125, 0.438720703125, 0.4657440185546875, 0.492767333984375, 0.5197906494140625, 0.54681396484375, 0.5738372802734375, 0.600860595703125, 0.6278839111328125, 0.6549072265625, 0.6819305419921875, 0.708953857421875, 0.7359771728515625, 0.76300048828125, 0.7900238037109375, 0.817047119140625, 0.8440704345703125, 0.87109375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 11.0, 9.0, 24.0, 26.0, 42.0, 71.0, 122.0, 212.0, 167.0, 101.0, 62.0, 44.0, 25.0, 19.0, 11.0, 11.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7747116088867188, -0.7422943115234375, -0.7098770141601562, -0.677459716796875, -0.6450424194335938, -0.6126251220703125, -0.5802078247070312, -0.54779052734375, -0.5153732299804688, -0.4829559326171875, -0.45053863525390625, -0.418121337890625, -0.38570404052734375, -0.3532867431640625, -0.32086944580078125, -0.2884521484375, -0.25603485107421875, -0.2236175537109375, -0.19120025634765625, -0.158782958984375, -0.12636566162109375, -0.0939483642578125, -0.06153106689453125, -0.02911376953125, 0.00330352783203125, 0.0357208251953125, 0.06813812255859375, 0.100555419921875, 0.13297271728515625, 0.1653900146484375, 0.19780731201171875, 0.230224609375, 0.26264190673828125, 0.2950592041015625, 0.32747650146484375, 0.359893798828125, 0.39231109619140625, 0.4247283935546875, 0.45714569091796875, 0.48956298828125, 0.5219802856445312, 0.5543975830078125, 0.5868148803710938, 0.619232177734375, 0.6516494750976562, 0.6840667724609375, 0.7164840698242188, 0.7489013671875, 0.7813186645507812, 0.8137359619140625, 0.8461532592773438, 0.878570556640625, 0.9109878540039062, 0.9434051513671875, 0.9758224487304688, 1.00823974609375, 1.0406570434570312, 1.0730743408203125, 1.1054916381835938, 1.137908935546875, 1.1703262329101562, 1.2027435302734375, 1.2351608276367188, 1.267578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 9.0, 14.0, 47.0, 111.0, 365.0, 327.0, 72.0, 27.0, 16.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-60.41972351074219, -59.30076217651367, -58.18180465698242, -57.062843322753906, -55.943885803222656, -54.82492446899414, -53.705963134765625, -52.587005615234375, -51.46804428100586, -50.349082946777344, -49.230125427246094, -48.11116409301758, -46.99220275878906, -45.87324523925781, -44.7542839050293, -43.63532638549805, -42.51636505126953, -41.397403717041016, -40.278446197509766, -39.15948486328125, -38.04052734375, -36.921566009521484, -35.80260467529297, -34.68364715576172, -33.5646858215332, -32.44572448730469, -31.326766967773438, -30.207805633544922, -29.08884620666504, -27.969886779785156, -26.85092544555664, -25.731966018676758, -24.61301040649414, -23.494050979614258, -22.375091552734375, -21.25613021850586, -20.137170791625977, -19.018211364746094, -17.899250030517578, -16.780290603637695, -15.661331176757812, -14.54237174987793, -13.42341136932373, -12.304450988769531, -11.185491561889648, -10.066532135009766, -8.947571754455566, -7.828611850738525, -6.709651947021484, -5.590692043304443, -4.471732139587402, -3.3527722358703613, -2.2338123321533203, -1.1148524284362793, 0.004107475280761719, 1.1230673789978027, 2.2420272827148438, 3.3609871864318848, 4.479947090148926, 5.598906993865967, 6.717866897583008, 7.836826801300049, 8.95578670501709, 10.074747085571289, 11.193706512451172]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 6.0, 13.0, 13.0, 12.0, 15.0, 9.0, 23.0, 18.0, 36.0, 24.0, 19.0, 22.0, 44.0, 190.0, 248.0, 53.0, 28.0, 26.0, 25.0, 21.0, 28.0, 18.0, 16.0, 12.0, 7.0, 12.0, 5.0, 8.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.198326110839844, -11.779027938842773, -11.35973072052002, -10.94043254852295, -10.521134376525879, -10.101837158203125, -9.682538986206055, -9.263240814208984, -8.843942642211914, -8.424644470214844, -8.00534725189209, -7.5860490798950195, -7.166750907897949, -6.747453212738037, -6.328155517578125, -5.908857345581055, -5.489559650421143, -5.0702619552612305, -4.65096378326416, -4.231666088104248, -3.8123679161071777, -3.3930702209472656, -2.9737722873687744, -2.554474353790283, -2.135176420211792, -1.7158784866333008, -1.2965805530548096, -0.8772827386856079, -0.4579848051071167, -0.03868699073791504, 0.38061094284057617, 0.7999088764190674, 1.2192068099975586, 1.6385047435760498, 2.057802677154541, 2.477100372314453, 2.8963985443115234, 3.3156962394714355, 3.7349941730499268, 4.154292106628418, 4.573590278625488, 4.9928879737854, 5.412186145782471, 5.831483840942383, 6.250782012939453, 6.670079708099365, 7.089377403259277, 7.508675575256348, 7.92797327041626, 8.347270965576172, 8.766569137573242, 9.185867309570312, 9.605164527893066, 10.024462699890137, 10.443760871887207, 10.863058090209961, 11.282356262207031, 11.701654434204102, 12.120951652526855, 12.540249824523926, 12.959547996520996, 13.37884521484375, 13.79814338684082, 14.21744155883789, 14.636739730834961]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 10.0, 7.0, 15.0, 14.0, 13.0, 15.0, 17.0, 28.0, 22.0, 38.0, 29.0, 52.0, 67.0, 224.0, 119.0, 51.0, 37.0, 37.0, 32.0, 20.0, 16.0, 15.0, 22.0, 17.0, 11.0, 11.0, 13.0, 9.0, 3.0, 6.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7628860473632812, -0.7293853759765625, -0.6958847045898438, -0.662384033203125, -0.6288833618164062, -0.5953826904296875, -0.5618820190429688, -0.52838134765625, -0.49488067626953125, -0.4613800048828125, -0.42787933349609375, -0.394378662109375, -0.36087799072265625, -0.3273773193359375, -0.29387664794921875, -0.2603759765625, -0.22687530517578125, -0.1933746337890625, -0.15987396240234375, -0.126373291015625, -0.09287261962890625, -0.0593719482421875, -0.02587127685546875, 0.00762939453125, 0.04113006591796875, 0.0746307373046875, 0.10813140869140625, 0.141632080078125, 0.17513275146484375, 0.2086334228515625, 0.24213409423828125, 0.275634765625, 0.30913543701171875, 0.3426361083984375, 0.37613677978515625, 0.409637451171875, 0.44313812255859375, 0.4766387939453125, 0.5101394653320312, 0.54364013671875, 0.5771408081054688, 0.6106414794921875, 0.6441421508789062, 0.677642822265625, 0.7111434936523438, 0.7446441650390625, 0.7781448364257812, 0.8116455078125, 0.8451461791992188, 0.8786468505859375, 0.9121475219726562, 0.945648193359375, 0.9791488647460938, 1.0126495361328125, 1.0461502075195312, 1.07965087890625, 1.1131515502929688, 1.1466522216796875, 1.1801528930664062, 1.213653564453125, 1.2471542358398438, 1.2806549072265625, 1.3141555786132812, 1.34765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 14.0, 14.0, 14.0, 15.0, 8.0, 18.0, 36.0, 60.0, 132.0, 238.0, 492.0, 1477.0, 5672.0, 196711.0, 8174326.0, 6720.0, 1600.0, 539.0, 207.0, 120.0, 68.0, 26.0, 25.0, 18.0, 10.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.052157402038574, -12.690153121948242, -12.328149795532227, -11.966145515441895, -11.604141235351562, -11.24213695526123, -10.880132675170898, -10.518129348754883, -10.15612506866455, -9.794120788574219, -9.432117462158203, -9.070113182067871, -8.708108901977539, -8.346104621887207, -7.984100818634033, -7.622097015380859, -7.260092735290527, -6.898088455200195, -6.5360846519470215, -6.174080848693848, -5.812076568603516, -5.450072288513184, -5.08806848526001, -4.726064682006836, -4.364060401916504, -4.002056121826172, -3.640052318572998, -3.278048276901245, -2.916044235229492, -2.5540401935577393, -2.1920361518859863, -1.8300321102142334, -1.4680290222167969, -1.106024980545044, -0.744020938873291, -0.3820168972015381, -0.020012855529785156, 0.3419911861419678, 0.7039952278137207, 1.0659992694854736, 1.4280033111572266, 1.7900073528289795, 2.1520113945007324, 2.5140154361724854, 2.8760194778442383, 3.238023519515991, 3.600027561187744, 3.962031602859497, 4.32403564453125, 4.686039924621582, 5.048043727874756, 5.41004753112793, 5.772051811218262, 6.134056091308594, 6.496059894561768, 6.858063697814941, 7.220067977905273, 7.5820722579956055, 7.944076061248779, 8.306079864501953, 8.668084144592285, 9.030088424682617, 9.392091751098633, 9.754096031188965, 10.116100311279297]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 1.0, 4.0, 6.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 2.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.049534797668457, -10.772295951843262, -10.495057106018066, -10.217818260192871, -9.940579414367676, -9.66334056854248, -9.386101722717285, -9.108863830566406, -8.831624984741211, -8.554386138916016, -8.27714729309082, -7.999908447265625, -7.72266960144043, -7.445430755615234, -7.168192386627197, -6.890953540802002, -6.613714218139648, -6.336475372314453, -6.059236526489258, -5.7819976806640625, -5.504758834838867, -5.227519989013672, -4.950281620025635, -4.6730427742004395, -4.395803928375244, -4.118565082550049, -3.8413262367248535, -3.5640876293182373, -3.286848783493042, -3.0096099376678467, -2.7323713302612305, -2.455132484436035, -2.177894115447998, -1.9006552696228027, -1.623416543006897, -1.3461778163909912, -1.068938970565796, -0.7917001247406006, -0.5144613981246948, -0.23722267150878906, 0.04001617431640625, 0.3172549605369568, 0.5944937467575073, 0.8717325329780579, 1.1489713191986084, 1.4262101650238037, 1.7034488916397095, 1.9806876182556152, 2.2579264640808105, 2.535165309906006, 2.812404155731201, 3.0896427631378174, 3.3668816089630127, 3.644120454788208, 3.921359062194824, 4.1985979080200195, 4.475836753845215, 4.75307559967041, 5.0303144454956055, 5.307553291320801, 5.584792137145996, 5.862030982971191, 6.1392693519592285, 6.416508197784424, 6.693747043609619]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 7.0, 10.0, 14.0, 32.0, 38.0, 68.0, 105.0, 212.0, 637.0, 2515.0, 15599.0, 145855.0, 313839.0, 38476.0, 5139.0, 1059.0, 343.0, 129.0, 73.0, 40.0, 22.0, 18.0, 6.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.09375, -13.51171875, -12.9296875, -12.34765625, -11.765625, -11.18359375, -10.6015625, -10.01953125, -9.4375, -8.85546875, -8.2734375, -7.69140625, -7.109375, -6.52734375, -5.9453125, -5.36328125, -4.78125, -4.19921875, -3.6171875, -3.03515625, -2.453125, -1.87109375, -1.2890625, -0.70703125, -0.125, 0.45703125, 1.0390625, 1.62109375, 2.203125, 2.78515625, 3.3671875, 3.94921875, 4.53125, 5.11328125, 5.6953125, 6.27734375, 6.859375, 7.44140625, 8.0234375, 8.60546875, 9.1875, 9.76953125, 10.3515625, 10.93359375, 11.515625, 12.09765625, 12.6796875, 13.26171875, 13.84375, 14.42578125, 15.0078125, 15.58984375, 16.171875, 16.75390625, 17.3359375, 17.91796875, 18.5, 19.08203125, 19.6640625, 20.24609375, 20.828125, 21.41015625, 21.9921875, 22.57421875, 23.15625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 18.0, 20.0, 17.0, 29.0, 39.0, 44.0, 54.0, 68.0, 75.0, 84.0, 88.0, 68.0, 78.0, 65.0, 51.0, 36.0, 56.0, 29.0, 18.0, 5.0, 13.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.705078125, -1.655426025390625, -1.60577392578125, -1.556121826171875, -1.5064697265625, -1.456817626953125, -1.40716552734375, -1.357513427734375, -1.307861328125, -1.258209228515625, -1.20855712890625, -1.158905029296875, -1.1092529296875, -1.059600830078125, -1.00994873046875, -0.960296630859375, -0.91064453125, -0.860992431640625, -0.81134033203125, -0.761688232421875, -0.7120361328125, -0.662384033203125, -0.61273193359375, -0.563079833984375, -0.513427734375, -0.463775634765625, -0.41412353515625, -0.364471435546875, -0.3148193359375, -0.265167236328125, -0.21551513671875, -0.165863037109375, -0.1162109375, -0.066558837890625, -0.01690673828125, 0.032745361328125, 0.0823974609375, 0.132049560546875, 0.18170166015625, 0.231353759765625, 0.281005859375, 0.330657958984375, 0.38031005859375, 0.429962158203125, 0.4796142578125, 0.529266357421875, 0.57891845703125, 0.628570556640625, 0.67822265625, 0.727874755859375, 0.77752685546875, 0.827178955078125, 0.8768310546875, 0.926483154296875, 0.97613525390625, 1.025787353515625, 1.075439453125, 1.125091552734375, 1.17474365234375, 1.224395751953125, 1.2740478515625, 1.323699951171875, 1.37335205078125, 1.423004150390625, 1.47265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 11.0, 9.0, 13.0, 69.0, 135.0, 163.0, 50.0, 16.0, 9.0, 7.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.818909645080566, -8.232321739196777, -7.6457343101501465, -7.059146881103516, -6.472558975219727, -5.885971546173096, -5.299384117126465, -4.712796211242676, -4.126208782196045, -3.539621114730835, -2.953033447265625, -2.366446018218994, -1.7798583507537842, -1.1932706832885742, -0.6066832542419434, -0.020095348358154297, 0.5664920806884766, 1.1530797481536865, 1.739667296409607, 2.3262548446655273, 2.9128425121307373, 3.4994301795959473, 4.086017608642578, 4.672605514526367, 5.259192943572998, 5.845780372619629, 6.432368278503418, 7.018955707550049, 7.60554313659668, 8.192131042480469, 8.778718948364258, 9.365306854248047, 9.951892852783203, 10.538480758666992, 11.125067710876465, 11.711655616760254, 12.298243522644043, 12.884830474853516, 13.471418380737305, 14.058006286621094, 14.644594192504883, 15.231182098388672, 15.817769050598145, 16.40435791015625, 16.990943908691406, 17.577531814575195, 18.164119720458984, 18.750707626342773, 19.337295532226562, 19.92388343811035, 20.51047134399414, 21.097057342529297, 21.683645248413086, 22.270233154296875, 22.856821060180664, 23.443408966064453, 24.02999496459961, 24.6165828704834, 25.203170776367188, 25.789756774902344, 26.376344680786133, 26.962932586669922, 27.54952049255371, 28.1361083984375, 28.72269630432129]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 10.0, 6.0, 6.0, 8.0, 39.0, 82.0, 121.0, 99.0, 46.0, 11.0, 12.0, 8.0, 7.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.361876487731934, -8.096219062805176, -7.830562114715576, -7.564904689788818, -7.299247741699219, -7.033590316772461, -6.767932891845703, -6.502275466918945, -6.236618518829346, -5.970961093902588, -5.705304145812988, -5.4396467208862305, -5.173989295959473, -4.908332347869873, -4.642674922943115, -4.377017974853516, -4.111360549926758, -3.845703363418579, -3.5800461769104004, -3.3143887519836426, -3.048731565475464, -2.783074378967285, -2.5174169540405273, -2.2517597675323486, -1.98610258102417, -1.7204453945159912, -1.454788088798523, -1.1891307830810547, -0.923473596572876, -0.6578164100646973, -0.392159104347229, -0.12650179862976074, 0.13915634155273438, 0.40481358766555786, 0.6704708337783813, 0.9361280798912048, 1.2017853260040283, 1.467442512512207, 1.7330998182296753, 1.9987571239471436, 2.2644143104553223, 2.530071496963501, 2.7957286834716797, 3.0613861083984375, 3.327043294906616, 3.592700481414795, 3.8583579063415527, 4.124014854431152, 4.38967227935791, 4.655329704284668, 4.920986652374268, 5.186644077301025, 5.452301025390625, 5.717958450317383, 5.983615875244141, 6.249273300170898, 6.514930248260498, 6.780587673187256, 7.0462446212768555, 7.311902046203613, 7.577559471130371, 7.843216419219971, 8.10887336730957, 8.374530792236328, 8.640188217163086]}, "eval/loss": 4.305517673492432, "eval/wer": 1.9549980166600556, "eval/runtime": 784.9234, "eval/samples_per_second": 3.366, "eval/steps_per_second": 0.282, "train/train_runtime": 6633.4843, "train/train_samples_per_second": 4.302, "train/train_steps_per_second": 0.179, "train/total_flos": 0.0, "train/train_loss": 4.355411059521546} \ No newline at end of file +{"train/loss": 4.7853, "train/learning_rate": 5.805515239477504e-07, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 7866, "_timestamp": 1646187247, "_step": 1192, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 21.0, 31.0, 147.0, 519.0, 207.0, 32.0, 21.0, 12.0, 6.0, 4.0, 4.0], "bins": [-485.33099365234375, -476.75994873046875, -468.1888732910156, -459.6178283691406, -451.0467834472656, -442.4757385253906, -433.9046630859375, -425.3336181640625, -416.7625732421875, -408.1915283203125, -399.6204528808594, -391.0494079589844, -382.4783630371094, -373.9073181152344, -365.33624267578125, -356.76519775390625, -348.19415283203125, -339.62310791015625, -331.0520324707031, -322.4809875488281, -313.9099426269531, -305.3388977050781, -296.767822265625, -288.19677734375, -279.6257019042969, -271.0546569824219, -262.48358154296875, -253.91253662109375, -245.34149169921875, -236.7704315185547, -228.19937133789062, -219.62832641601562, -211.0572967529297, -202.48623657226562, -193.91519165039062, -185.34413146972656, -176.77308654785156, -168.2020263671875, -159.6309814453125, -151.05992126464844, -142.48887634277344, -133.91781616210938, -125.34677124023438, -116.77571105957031, -108.20466613769531, -99.63360595703125, -91.06255340576172, -82.49150085449219, -73.92044067382812, -65.3493881225586, -56.77833557128906, -48.207279205322266, -39.636226654052734, -31.065174102783203, -22.494117736816406, -13.923065185546875, -5.352016448974609, 3.2190370559692383, 11.790090560913086, 20.36114501953125, 28.93219757080078, 37.50325012207031, 46.07430648803711, 54.64535903930664, 63.21641159057617]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 5.0, 0.0, 6.0, 4.0, 3.0, 4.0, 8.0, 10.0, 8.0, 15.0, 15.0, 23.0, 15.0, 22.0, 28.0, 21.0, 33.0, 43.0, 50.0, 59.0, 73.0, 74.0, 62.0, 69.0, 55.0, 48.0, 32.0, 32.0, 32.0, 22.0, 16.0, 22.0, 18.0, 14.0, 16.0, 7.0, 13.0, 6.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.59696960449219, -117.4406509399414, -113.28433227539062, -109.12801361083984, -104.97169494628906, -100.81536865234375, -96.65904998779297, -92.50273132324219, -88.3464126586914, -84.19009399414062, -80.03377532958984, -75.87745666503906, -71.72113037109375, -67.5648193359375, -63.40849304199219, -59.252174377441406, -55.095855712890625, -50.939537048339844, -46.78321838378906, -42.626895904541016, -38.470577239990234, -34.31425857543945, -30.15793800354004, -26.001617431640625, -21.845298767089844, -17.688980102539062, -13.532659530639648, -9.37633991241455, -5.220020294189453, -1.0637016296386719, 3.092618942260742, 7.248939514160156, 11.405258178710938, 15.561577796936035, 19.717897415161133, 23.874217987060547, 28.030536651611328, 32.18685531616211, 36.343177795410156, 40.49949645996094, 44.65581512451172, 48.8121337890625, 52.96845245361328, 57.12477493286133, 61.28109359741211, 65.43740844726562, 69.59373474121094, 73.75005340576172, 77.9063720703125, 82.06269073486328, 86.21900939941406, 90.37532806396484, 94.53164672851562, 98.68797302246094, 102.84429168701172, 107.0006103515625, 111.15692901611328, 115.31324768066406, 119.46956634521484, 123.62588500976562, 127.78221130371094, 131.9385223388672, 136.0948486328125, 140.25115966796875, 144.40748596191406]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 7.0, 11.0, 13.0, 8.0, 11.0, 23.0, 19.0, 16.0, 17.0, 40.0, 45.0, 60.0, 86.0, 108.0, 101.0, 73.0, 57.0, 41.0, 43.0, 29.0, 21.0, 22.0, 17.0, 14.0, 19.0, 10.0, 10.0, 14.0, 9.0, 6.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.10400390625, -8.7939453125, -8.48388671875, -8.173828125, -7.86376953125, -7.5537109375, -7.24365234375, -6.93359375, -6.62353515625, -6.3134765625, -6.00341796875, -5.693359375, -5.38330078125, -5.0732421875, -4.76318359375, -4.453125, -4.14306640625, -3.8330078125, -3.52294921875, -3.212890625, -2.90283203125, -2.5927734375, -2.28271484375, -1.97265625, -1.66259765625, -1.3525390625, -1.04248046875, -0.732421875, -0.42236328125, -0.1123046875, 0.19775390625, 0.5078125, 0.81787109375, 1.1279296875, 1.43798828125, 1.748046875, 2.05810546875, 2.3681640625, 2.67822265625, 2.98828125, 3.29833984375, 3.6083984375, 3.91845703125, 4.228515625, 4.53857421875, 4.8486328125, 5.15869140625, 5.46875, 5.77880859375, 6.0888671875, 6.39892578125, 6.708984375, 7.01904296875, 7.3291015625, 7.63916015625, 7.94921875, 8.25927734375, 8.5693359375, 8.87939453125, 9.189453125, 9.49951171875, 9.8095703125, 10.11962890625, 10.4296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 9.0, 11.0, 15.0, 29.0, 44.0, 54.0, 80.0, 105.0, 128.0, 156.0, 270.0, 398.0, 602.0, 878.0, 1353.0, 2231.0, 3736.0, 6684.0, 13309.0, 37672.0, 481680.0, 3393357.0, 195460.0, 27874.0, 11931.0, 6384.0, 3601.0, 2235.0, 1322.0, 900.0, 554.0, 390.0, 257.0, 175.0, 112.0, 85.0, 44.0, 43.0, 22.0, 26.0, 14.0, 14.0, 10.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.3125, -28.34716796875, -27.3818359375, -26.41650390625, -25.451171875, -24.48583984375, -23.5205078125, -22.55517578125, -21.58984375, -20.62451171875, -19.6591796875, -18.69384765625, -17.728515625, -16.76318359375, -15.7978515625, -14.83251953125, -13.8671875, -12.90185546875, -11.9365234375, -10.97119140625, -10.005859375, -9.04052734375, -8.0751953125, -7.10986328125, -6.14453125, -5.17919921875, -4.2138671875, -3.24853515625, -2.283203125, -1.31787109375, -0.3525390625, 0.61279296875, 1.578125, 2.54345703125, 3.5087890625, 4.47412109375, 5.439453125, 6.40478515625, 7.3701171875, 8.33544921875, 9.30078125, 10.26611328125, 11.2314453125, 12.19677734375, 13.162109375, 14.12744140625, 15.0927734375, 16.05810546875, 17.0234375, 17.98876953125, 18.9541015625, 19.91943359375, 20.884765625, 21.85009765625, 22.8154296875, 23.78076171875, 24.74609375, 25.71142578125, 26.6767578125, 27.64208984375, 28.607421875, 29.57275390625, 30.5380859375, 31.50341796875, 32.46875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 6.0, 20.0, 12.0, 18.0, 25.0, 31.0, 49.0, 52.0, 46.0, 88.0, 109.0, 236.0, 401.0, 660.0, 783.0, 593.0, 324.0, 186.0, 89.0, 63.0, 40.0, 42.0, 26.0, 26.0, 15.0, 23.0, 15.0, 18.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.46875, -27.5576171875, -26.646484375, -25.7353515625, -24.82421875, -23.9130859375, -23.001953125, -22.0908203125, -21.1796875, -20.2685546875, -19.357421875, -18.4462890625, -17.53515625, -16.6240234375, -15.712890625, -14.8017578125, -13.890625, -12.9794921875, -12.068359375, -11.1572265625, -10.24609375, -9.3349609375, -8.423828125, -7.5126953125, -6.6015625, -5.6904296875, -4.779296875, -3.8681640625, -2.95703125, -2.0458984375, -1.134765625, -0.2236328125, 0.6875, 1.5986328125, 2.509765625, 3.4208984375, 4.33203125, 5.2431640625, 6.154296875, 7.0654296875, 7.9765625, 8.8876953125, 9.798828125, 10.7099609375, 11.62109375, 12.5322265625, 13.443359375, 14.3544921875, 15.265625, 16.1767578125, 17.087890625, 17.9990234375, 18.91015625, 19.8212890625, 20.732421875, 21.6435546875, 22.5546875, 23.4658203125, 24.376953125, 25.2880859375, 26.19921875, 27.1103515625, 28.021484375, 28.9326171875, 29.84375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 11.0, 17.0, 8.0, 20.0, 26.0, 20.0, 25.0, 53.0, 40.0, 71.0, 119.0, 124.0, 227.0, 391.0, 848.0, 2284.0, 6817.0, 26358.0, 165688.0, 3781773.0, 171036.0, 27069.0, 6961.0, 2279.0, 863.0, 371.0, 221.0, 138.0, 76.0, 59.0, 55.0, 51.0, 41.0, 28.0, 17.0, 22.0, 8.0, 6.0, 6.0, 6.0, 9.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-81.625, -79.0341796875, -76.443359375, -73.8525390625, -71.26171875, -68.6708984375, -66.080078125, -63.4892578125, -60.8984375, -58.3076171875, -55.716796875, -53.1259765625, -50.53515625, -47.9443359375, -45.353515625, -42.7626953125, -40.171875, -37.5810546875, -34.990234375, -32.3994140625, -29.80859375, -27.2177734375, -24.626953125, -22.0361328125, -19.4453125, -16.8544921875, -14.263671875, -11.6728515625, -9.08203125, -6.4912109375, -3.900390625, -1.3095703125, 1.28125, 3.8720703125, 6.462890625, 9.0537109375, 11.64453125, 14.2353515625, 16.826171875, 19.4169921875, 22.0078125, 24.5986328125, 27.189453125, 29.7802734375, 32.37109375, 34.9619140625, 37.552734375, 40.1435546875, 42.734375, 45.3251953125, 47.916015625, 50.5068359375, 53.09765625, 55.6884765625, 58.279296875, 60.8701171875, 63.4609375, 66.0517578125, 68.642578125, 71.2333984375, 73.82421875, 76.4150390625, 79.005859375, 81.5966796875, 84.1875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 9.0, 26.0, 22.0, 56.0, 85.0, 184.0, 248.0, 152.0, 102.0, 46.0, 31.0, 23.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.32012939453125, -82.11811065673828, -77.91609191894531, -73.71407318115234, -69.51205444335938, -65.31004333496094, -61.10802459716797, -56.906005859375, -52.70398712158203, -48.50196838378906, -44.299949645996094, -40.09793472290039, -35.89591598510742, -31.693897247314453, -27.491880416870117, -23.28986358642578, -19.087844848632812, -14.88582706451416, -10.683809280395508, -6.4817914962768555, -2.279773712158203, 1.9222450256347656, 6.124261856079102, 10.326278686523438, 14.528297424316406, 18.730316162109375, 22.93233299255371, 27.134349822998047, 31.336368560791016, 35.538387298583984, 39.74040222167969, 43.942420959472656, 48.144439697265625, 52.346458435058594, 56.54847717285156, 60.750492095947266, 64.9525146484375, 69.15452575683594, 73.3565444946289, 77.55856323242188, 81.76058197021484, 85.96260070800781, 90.16461944580078, 94.36663818359375, 98.56864929199219, 102.77067565917969, 106.97268676757812, 111.1747055053711, 115.37672424316406, 119.57874298095703, 123.78076171875, 127.98278045654297, 132.18479919433594, 136.38681030273438, 140.58883666992188, 144.7908477783203, 148.99285888671875, 153.1948699951172, 157.3968963623047, 161.59890747070312, 165.80093383789062, 170.00294494628906, 174.20497131347656, 178.406982421875, 182.6090087890625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 14.0, 6.0, 13.0, 22.0, 14.0, 21.0, 31.0, 25.0, 24.0, 29.0, 31.0, 31.0, 52.0, 38.0, 40.0, 49.0, 51.0, 47.0, 34.0, 36.0, 34.0, 39.0, 44.0, 37.0, 29.0, 24.0, 26.0, 23.0, 20.0, 18.0, 17.0, 13.0, 17.0, 5.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-98.53227233886719, -95.51553344726562, -92.49879455566406, -89.4820556640625, -86.46531677246094, -83.4485855102539, -80.43184661865234, -77.41510772705078, -74.39836883544922, -71.38162994384766, -68.3648910522461, -65.34815216064453, -62.331417083740234, -59.31467819213867, -56.297943115234375, -53.28120422363281, -50.26446533203125, -47.24772644042969, -44.230987548828125, -41.21425247192383, -38.197513580322266, -35.1807746887207, -32.164039611816406, -29.147300720214844, -26.13056182861328, -23.11382293701172, -20.09708595275879, -17.08034896850586, -14.063610076904297, -11.04687213897705, -8.030134201049805, -5.013397216796875, -1.9966583251953125, 1.0200796127319336, 4.03681755065918, 7.053555488586426, 10.070293426513672, 13.087031364440918, 16.103769302368164, 19.120506286621094, 22.137245178222656, 25.15398406982422, 28.17072105407715, 31.187458038330078, 34.20419692993164, 37.2209358215332, 40.2376708984375, 43.25440979003906, 46.271148681640625, 49.28788757324219, 52.30462646484375, 55.32136154174805, 58.33810043334961, 61.35483932495117, 64.37157440185547, 67.38831329345703, 70.4050521850586, 73.42179107666016, 76.43852996826172, 79.45526885986328, 82.47200012207031, 85.48873901367188, 88.50547790527344, 91.522216796875, 94.53895568847656]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 13.0, 31.0, 28.0, 34.0, 30.0, 57.0, 62.0, 60.0, 75.0, 74.0, 66.0, 60.0, 61.0, 55.0, 27.0, 33.0, 35.0, 20.0, 20.0, 19.0, 13.0, 20.0, 9.0, 8.0, 4.0, 4.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.287841796875, -9.94287109375, -9.597900390625, -9.2529296875, -8.907958984375, -8.56298828125, -8.218017578125, -7.873046875, -7.528076171875, -7.18310546875, -6.838134765625, -6.4931640625, -6.148193359375, -5.80322265625, -5.458251953125, -5.11328125, -4.768310546875, -4.42333984375, -4.078369140625, -3.7333984375, -3.388427734375, -3.04345703125, -2.698486328125, -2.353515625, -2.008544921875, -1.66357421875, -1.318603515625, -0.9736328125, -0.628662109375, -0.28369140625, 0.061279296875, 0.40625, 0.751220703125, 1.09619140625, 1.441162109375, 1.7861328125, 2.131103515625, 2.47607421875, 2.821044921875, 3.166015625, 3.510986328125, 3.85595703125, 4.200927734375, 4.5458984375, 4.890869140625, 5.23583984375, 5.580810546875, 5.92578125, 6.270751953125, 6.61572265625, 6.960693359375, 7.3056640625, 7.650634765625, 7.99560546875, 8.340576171875, 8.685546875, 9.030517578125, 9.37548828125, 9.720458984375, 10.0654296875, 10.410400390625, 10.75537109375, 11.100341796875, 11.4453125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 14.0, 17.0, 42.0, 39.0, 57.0, 94.0, 121.0, 171.0, 277.0, 344.0, 493.0, 667.0, 920.0, 1331.0, 1903.0, 2991.0, 4489.0, 6866.0, 10835.0, 18452.0, 32866.0, 64598.0, 148587.0, 325822.0, 225996.0, 93543.0, 44193.0, 23773.0, 13738.0, 8494.0, 5386.0, 3556.0, 2406.0, 1620.0, 1072.0, 831.0, 534.0, 422.0, 279.0, 183.0, 164.0, 107.0, 76.0, 53.0, 46.0, 20.0, 16.0, 12.0, 13.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.0390625, -1.006317138671875, -0.97357177734375, -0.940826416015625, -0.9080810546875, -0.875335693359375, -0.84259033203125, -0.809844970703125, -0.777099609375, -0.744354248046875, -0.71160888671875, -0.678863525390625, -0.6461181640625, -0.613372802734375, -0.58062744140625, -0.547882080078125, -0.51513671875, -0.482391357421875, -0.44964599609375, -0.416900634765625, -0.3841552734375, -0.351409912109375, -0.31866455078125, -0.285919189453125, -0.253173828125, -0.220428466796875, -0.18768310546875, -0.154937744140625, -0.1221923828125, -0.089447021484375, -0.05670166015625, -0.023956298828125, 0.0087890625, 0.041534423828125, 0.07427978515625, 0.107025146484375, 0.1397705078125, 0.172515869140625, 0.20526123046875, 0.238006591796875, 0.270751953125, 0.303497314453125, 0.33624267578125, 0.368988037109375, 0.4017333984375, 0.434478759765625, 0.46722412109375, 0.499969482421875, 0.53271484375, 0.565460205078125, 0.59820556640625, 0.630950927734375, 0.6636962890625, 0.696441650390625, 0.72918701171875, 0.761932373046875, 0.794677734375, 0.827423095703125, 0.86016845703125, 0.892913818359375, 0.9256591796875, 0.958404541015625, 0.99114990234375, 1.023895263671875, 1.056640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 8.0, 6.0, 10.0, 6.0, 12.0, 8.0, 23.0, 21.0, 16.0, 22.0, 23.0, 20.0, 19.0, 33.0, 26.0, 37.0, 27.0, 40.0, 36.0, 39.0, 39.0, 1056.0, 35.0, 45.0, 40.0, 42.0, 41.0, 32.0, 21.0, 19.0, 20.0, 25.0, 21.0, 15.0, 21.0, 19.0, 18.0, 12.0, 11.0, 10.0, 5.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-5.01171875, -4.8643798828125, -4.717041015625, -4.5697021484375, -4.42236328125, -4.2750244140625, -4.127685546875, -3.9803466796875, -3.8330078125, -3.6856689453125, -3.538330078125, -3.3909912109375, -3.24365234375, -3.0963134765625, -2.948974609375, -2.8016357421875, -2.654296875, -2.5069580078125, -2.359619140625, -2.2122802734375, -2.06494140625, -1.9176025390625, -1.770263671875, -1.6229248046875, -1.4755859375, -1.3282470703125, -1.180908203125, -1.0335693359375, -0.88623046875, -0.7388916015625, -0.591552734375, -0.4442138671875, -0.296875, -0.1495361328125, -0.002197265625, 0.1451416015625, 0.29248046875, 0.4398193359375, 0.587158203125, 0.7344970703125, 0.8818359375, 1.0291748046875, 1.176513671875, 1.3238525390625, 1.47119140625, 1.6185302734375, 1.765869140625, 1.9132080078125, 2.060546875, 2.2078857421875, 2.355224609375, 2.5025634765625, 2.64990234375, 2.7972412109375, 2.944580078125, 3.0919189453125, 3.2392578125, 3.3865966796875, 3.533935546875, 3.6812744140625, 3.82861328125, 3.9759521484375, 4.123291015625, 4.2706298828125, 4.41796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 12.0, 31.0, 55.0, 76.0, 116.0, 174.0, 259.0, 400.0, 579.0, 855.0, 1238.0, 1783.0, 2665.0, 3875.0, 5694.0, 8397.0, 12192.0, 18147.0, 26811.0, 40711.0, 64764.0, 106952.0, 202669.0, 1231618.0, 136620.0, 80462.0, 49767.0, 32694.0, 21568.0, 14531.0, 9897.0, 6739.0, 4687.0, 3225.0, 2187.0, 1521.0, 1016.0, 714.0, 464.0, 328.0, 204.0, 143.0, 93.0, 60.0, 43.0, 23.0, 17.0, 11.0, 7.0, 5.0, 8.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.416015625, -0.402252197265625, -0.38848876953125, -0.374725341796875, -0.3609619140625, -0.347198486328125, -0.33343505859375, -0.319671630859375, -0.305908203125, -0.292144775390625, -0.27838134765625, -0.264617919921875, -0.2508544921875, -0.237091064453125, -0.22332763671875, -0.209564208984375, -0.19580078125, -0.182037353515625, -0.16827392578125, -0.154510498046875, -0.1407470703125, -0.126983642578125, -0.11322021484375, -0.099456787109375, -0.085693359375, -0.071929931640625, -0.05816650390625, -0.044403076171875, -0.0306396484375, -0.016876220703125, -0.00311279296875, 0.010650634765625, 0.0244140625, 0.038177490234375, 0.05194091796875, 0.065704345703125, 0.0794677734375, 0.093231201171875, 0.10699462890625, 0.120758056640625, 0.134521484375, 0.148284912109375, 0.16204833984375, 0.175811767578125, 0.1895751953125, 0.203338623046875, 0.21710205078125, 0.230865478515625, 0.24462890625, 0.258392333984375, 0.27215576171875, 0.285919189453125, 0.2996826171875, 0.313446044921875, 0.32720947265625, 0.340972900390625, 0.354736328125, 0.368499755859375, 0.38226318359375, 0.396026611328125, 0.4097900390625, 0.423553466796875, 0.43731689453125, 0.451080322265625, 0.46484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 7.0, 10.0, 12.0, 15.0, 16.0, 19.0, 20.0, 18.0, 24.0, 32.0, 31.0, 34.0, 40.0, 37.0, 33.0, 36.0, 38.0, 44.0, 46.0, 41.0, 48.0, 37.0, 46.0, 33.0, 37.0, 31.0, 36.0, 28.0, 29.0, 14.0, 17.0, 13.0, 16.0, 5.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0209808349609375, -0.020348072052001953, -0.019715309143066406, -0.01908254623413086, -0.018449783325195312, -0.017817020416259766, -0.01718425750732422, -0.016551494598388672, -0.015918731689453125, -0.015285968780517578, -0.014653205871582031, -0.014020442962646484, -0.013387680053710938, -0.01275491714477539, -0.012122154235839844, -0.011489391326904297, -0.01085662841796875, -0.010223865509033203, -0.009591102600097656, -0.00895833969116211, -0.008325576782226562, -0.007692813873291016, -0.007060050964355469, -0.006427288055419922, -0.005794525146484375, -0.005161762237548828, -0.004528999328613281, -0.0038962364196777344, -0.0032634735107421875, -0.0026307106018066406, -0.0019979476928710938, -0.0013651847839355469, -0.000732421875, -9.965896606445312e-05, 0.0005331039428710938, 0.0011658668518066406, 0.0017986297607421875, 0.0024313926696777344, 0.0030641555786132812, 0.003696918487548828, 0.004329681396484375, 0.004962444305419922, 0.005595207214355469, 0.006227970123291016, 0.0068607330322265625, 0.007493495941162109, 0.008126258850097656, 0.008759021759033203, 0.00939178466796875, 0.010024547576904297, 0.010657310485839844, 0.01129007339477539, 0.011922836303710938, 0.012555599212646484, 0.013188362121582031, 0.013821125030517578, 0.014453887939453125, 0.015086650848388672, 0.01571941375732422, 0.016352176666259766, 0.016984939575195312, 0.01761770248413086, 0.018250465393066406, 0.018883228302001953, 0.0195159912109375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 12.0, 13.0, 6.0, 13.0, 20.0, 21.0, 27.0, 42.0, 54.0, 65.0, 111.0, 159.0, 211.0, 314.0, 496.0, 988.0, 1004028.0, 39967.0, 627.0, 393.0, 287.0, 190.0, 128.0, 92.0, 51.0, 40.0, 48.0, 22.0, 24.0, 16.0, 17.0, 13.0, 10.0, 6.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5166015625, -0.4998321533203125, -0.483062744140625, -0.4662933349609375, -0.44952392578125, -0.4327545166015625, -0.415985107421875, -0.3992156982421875, -0.3824462890625, -0.3656768798828125, -0.348907470703125, -0.3321380615234375, -0.31536865234375, -0.2985992431640625, -0.281829833984375, -0.2650604248046875, -0.248291015625, -0.2315216064453125, -0.214752197265625, -0.1979827880859375, -0.18121337890625, -0.1644439697265625, -0.147674560546875, -0.1309051513671875, -0.1141357421875, -0.0973663330078125, -0.080596923828125, -0.0638275146484375, -0.04705810546875, -0.0302886962890625, -0.013519287109375, 0.0032501220703125, 0.02001953125, 0.0367889404296875, 0.053558349609375, 0.0703277587890625, 0.08709716796875, 0.1038665771484375, 0.120635986328125, 0.1374053955078125, 0.1541748046875, 0.1709442138671875, 0.187713623046875, 0.2044830322265625, 0.22125244140625, 0.2380218505859375, 0.254791259765625, 0.2715606689453125, 0.288330078125, 0.3050994873046875, 0.321868896484375, 0.3386383056640625, 0.35540771484375, 0.3721771240234375, 0.388946533203125, 0.4057159423828125, 0.4224853515625, 0.4392547607421875, 0.456024169921875, 0.4727935791015625, 0.48956298828125, 0.5063323974609375, 0.523101806640625, 0.5398712158203125, 0.556640625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 929.0, 84.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5500984191894531, -0.527895450592041, -0.5056924819946289, -0.4834895431995392, -0.4612865746021271, -0.43908363580703735, -0.41688066720962524, -0.39467769861221313, -0.372474730014801, -0.3502717614173889, -0.3280688226222992, -0.3058658540248871, -0.283662885427475, -0.26145994663238525, -0.23925697803497314, -0.21705400943756104, -0.1948510706424713, -0.1726481169462204, -0.1504451483488083, -0.12824219465255737, -0.10603923350572586, -0.08383627235889435, -0.06163331866264343, -0.03943035006523132, -0.017227396368980408, 0.0049755629152059555, 0.02717852219939232, 0.04938147962093353, 0.07158444076776505, 0.09378740191459656, 0.11599035561084747, 0.13819332420825958, 0.1603962779045105, 0.1825992316007614, 0.20480220019817352, 0.22700515389442444, 0.24920812249183655, 0.27141106128692627, 0.2936140298843384, 0.3158169984817505, 0.3380199670791626, 0.3602229356765747, 0.38242587447166443, 0.40462884306907654, 0.42683181166648865, 0.44903475046157837, 0.4712377190589905, 0.4934406876564026, 0.5156435966491699, 0.537846565246582, 0.5600495338439941, 0.5822525024414062, 0.6044554114341736, 0.6266583800315857, 0.6488613486289978, 0.6710643172264099, 0.693267285823822, 0.7154702544212341, 0.7376732230186462, 0.7598761320114136, 0.7820791006088257, 0.8042820692062378, 0.8264850378036499, 0.848688006401062, 0.8708909749984741]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 7.0, 11.0, 7.0, 17.0, 22.0, 25.0, 39.0, 64.0, 46.0, 39.0, 70.0, 71.0, 54.0, 59.0, 66.0, 57.0, 63.0, 61.0, 56.0, 44.0, 32.0, 26.0, 22.0, 12.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1001366376876831, -0.09781963378190994, -0.09550262987613678, -0.09318562597036362, -0.09086862206459045, -0.08855162560939789, -0.08623462170362473, -0.08391761779785156, -0.0816006138920784, -0.07928360998630524, -0.07696660608053207, -0.07464960217475891, -0.07233260571956635, -0.07001560181379318, -0.06769859790802002, -0.06538159400224686, -0.0630645900964737, -0.06074758619070053, -0.05843058228492737, -0.056113582104444504, -0.05379657819867134, -0.05147957429289818, -0.049162574112415314, -0.04684557020664215, -0.04452856630086899, -0.042211562395095825, -0.03989455848932266, -0.0375775583088398, -0.035260554403066635, -0.03294355049729347, -0.03062654845416546, -0.028309546411037445, -0.025992542505264282, -0.02367553859949112, -0.021358536556363106, -0.019041534513235092, -0.01672453060746193, -0.014407527633011341, -0.012090524658560753, -0.00977352261543274, -0.007456518709659576, -0.005139515735208988, -0.0028225127607584, -0.0005055097863078117, 0.0018114931881427765, 0.004128496162593365, 0.006445499137043953, 0.008762501180171967, 0.01107950508594513, 0.013396508060395718, 0.015713511034846306, 0.01803051307797432, 0.020347516983747482, 0.022664520889520645, 0.02498152293264866, 0.027298524975776672, 0.029615528881549835, 0.031932532787323, 0.03424953669309616, 0.036566536873579025, 0.03888354077935219, 0.04120054468512535, 0.043517544865608215, 0.04583454877138138, 0.04815155267715454]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 12.0, 32.0, 28.0, 34.0, 30.0, 57.0, 62.0, 60.0, 75.0, 74.0, 66.0, 60.0, 61.0, 55.0, 27.0, 33.0, 35.0, 20.0, 20.0, 19.0, 13.0, 20.0, 9.0, 8.0, 4.0, 4.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.287841796875, -9.94287109375, -9.597900390625, -9.2529296875, -8.907958984375, -8.56298828125, -8.218017578125, -7.873046875, -7.528076171875, -7.18310546875, -6.838134765625, -6.4931640625, -6.148193359375, -5.80322265625, -5.458251953125, -5.11328125, -4.768310546875, -4.42333984375, -4.078369140625, -3.7333984375, -3.388427734375, -3.04345703125, -2.698486328125, -2.353515625, -2.008544921875, -1.66357421875, -1.318603515625, -0.9736328125, -0.628662109375, -0.28369140625, 0.061279296875, 0.40625, 0.751220703125, 1.09619140625, 1.441162109375, 1.7861328125, 2.131103515625, 2.47607421875, 2.821044921875, 3.166015625, 3.510986328125, 3.85595703125, 4.200927734375, 4.5458984375, 4.890869140625, 5.23583984375, 5.580810546875, 5.92578125, 6.270751953125, 6.61572265625, 6.960693359375, 7.3056640625, 7.650634765625, 7.99560546875, 8.340576171875, 8.685546875, 9.030517578125, 9.37548828125, 9.720458984375, 10.0654296875, 10.410400390625, 10.75537109375, 11.100341796875, 11.4453125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 9.0, 21.0, 26.0, 27.0, 47.0, 77.0, 84.0, 109.0, 186.0, 245.0, 370.0, 503.0, 849.0, 1229.0, 2019.0, 3340.0, 6277.0, 13250.0, 39339.0, 327918.0, 570727.0, 49799.0, 15466.0, 6798.0, 3676.0, 2077.0, 1313.0, 893.0, 564.0, 398.0, 258.0, 171.0, 150.0, 90.0, 59.0, 55.0, 48.0, 21.0, 17.0, 12.0, 13.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.453125, -30.407470703125, -29.36181640625, -28.316162109375, -27.2705078125, -26.224853515625, -25.17919921875, -24.133544921875, -23.087890625, -22.042236328125, -20.99658203125, -19.950927734375, -18.9052734375, -17.859619140625, -16.81396484375, -15.768310546875, -14.72265625, -13.677001953125, -12.63134765625, -11.585693359375, -10.5400390625, -9.494384765625, -8.44873046875, -7.403076171875, -6.357421875, -5.311767578125, -4.26611328125, -3.220458984375, -2.1748046875, -1.129150390625, -0.08349609375, 0.962158203125, 2.0078125, 3.053466796875, 4.09912109375, 5.144775390625, 6.1904296875, 7.236083984375, 8.28173828125, 9.327392578125, 10.373046875, 11.418701171875, 12.46435546875, 13.510009765625, 14.5556640625, 15.601318359375, 16.64697265625, 17.692626953125, 18.73828125, 19.783935546875, 20.82958984375, 21.875244140625, 22.9208984375, 23.966552734375, 25.01220703125, 26.057861328125, 27.103515625, 28.149169921875, 29.19482421875, 30.240478515625, 31.2861328125, 32.331787109375, 33.37744140625, 34.423095703125, 35.46875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 11.0, 9.0, 21.0, 15.0, 19.0, 26.0, 23.0, 28.0, 29.0, 37.0, 33.0, 37.0, 52.0, 66.0, 84.0, 136.0, 1698.0, 172.0, 80.0, 61.0, 54.0, 42.0, 24.0, 27.0, 42.0, 20.0, 31.0, 25.0, 21.0, 19.0, 11.0, 6.0, 15.0, 10.0, 6.0, 6.0, 5.0, 7.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-29.6875, -28.804443359375, -27.92138671875, -27.038330078125, -26.1552734375, -25.272216796875, -24.38916015625, -23.506103515625, -22.623046875, -21.739990234375, -20.85693359375, -19.973876953125, -19.0908203125, -18.207763671875, -17.32470703125, -16.441650390625, -15.55859375, -14.675537109375, -13.79248046875, -12.909423828125, -12.0263671875, -11.143310546875, -10.26025390625, -9.377197265625, -8.494140625, -7.611083984375, -6.72802734375, -5.844970703125, -4.9619140625, -4.078857421875, -3.19580078125, -2.312744140625, -1.4296875, -0.546630859375, 0.33642578125, 1.219482421875, 2.1025390625, 2.985595703125, 3.86865234375, 4.751708984375, 5.634765625, 6.517822265625, 7.40087890625, 8.283935546875, 9.1669921875, 10.050048828125, 10.93310546875, 11.816162109375, 12.69921875, 13.582275390625, 14.46533203125, 15.348388671875, 16.2314453125, 17.114501953125, 17.99755859375, 18.880615234375, 19.763671875, 20.646728515625, 21.52978515625, 22.412841796875, 23.2958984375, 24.178955078125, 25.06201171875, 25.945068359375, 26.828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 7.0, 5.0, 9.0, 15.0, 5.0, 17.0, 20.0, 21.0, 20.0, 16.0, 34.0, 32.0, 36.0, 59.0, 118.0, 175.0, 519.0, 4826.0, 3073946.0, 63939.0, 1080.0, 300.0, 122.0, 76.0, 55.0, 38.0, 33.0, 25.0, 19.0, 22.0, 20.0, 15.0, 8.0, 12.0, 8.0, 7.0, 5.0, 8.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.5, -123.3515625, -119.203125, -115.0546875, -110.90625, -106.7578125, -102.609375, -98.4609375, -94.3125, -90.1640625, -86.015625, -81.8671875, -77.71875, -73.5703125, -69.421875, -65.2734375, -61.125, -56.9765625, -52.828125, -48.6796875, -44.53125, -40.3828125, -36.234375, -32.0859375, -27.9375, -23.7890625, -19.640625, -15.4921875, -11.34375, -7.1953125, -3.046875, 1.1015625, 5.25, 9.3984375, 13.546875, 17.6953125, 21.84375, 25.9921875, 30.140625, 34.2890625, 38.4375, 42.5859375, 46.734375, 50.8828125, 55.03125, 59.1796875, 63.328125, 67.4765625, 71.625, 75.7734375, 79.921875, 84.0703125, 88.21875, 92.3671875, 96.515625, 100.6640625, 104.8125, 108.9609375, 113.109375, 117.2578125, 121.40625, 125.5546875, 129.703125, 133.8515625, 138.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 971.0, 42.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-937.2486572265625, -917.9788818359375, -898.7090454101562, -879.4392700195312, -860.16943359375, -840.899658203125, -821.6298217773438, -802.3600463867188, -783.0902099609375, -763.8204345703125, -744.5505981445312, -725.2808227539062, -706.010986328125, -686.7412109375, -667.4713745117188, -648.2015991210938, -628.9318237304688, -609.6620483398438, -590.3922119140625, -571.1224365234375, -551.8526000976562, -532.5828247070312, -513.31298828125, -494.043212890625, -474.7734069824219, -455.50360107421875, -436.2337951660156, -416.9639892578125, -397.6942138671875, -378.42437744140625, -359.15460205078125, -339.8847961425781, -320.6149597167969, -301.34515380859375, -282.0753479003906, -262.8055419921875, -243.53575134277344, -224.2659454345703, -204.99615478515625, -185.72634887695312, -166.45654296875, -147.18673706054688, -127.91693878173828, -108.64714050292969, -89.37733459472656, -70.10752868652344, -50.837730407714844, -31.56793212890625, -12.298126220703125, 6.971675872802734, 26.241477966308594, 45.51128005981445, 64.78108215332031, 84.05088806152344, 103.32068634033203, 122.59048461914062, 141.86029052734375, 161.13009643554688, 180.39990234375, 199.66969299316406, 218.9394989013672, 238.2093048095703, 257.4790954589844, 276.7489013671875, 296.0187072753906]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 4.0, 9.0, 7.0, 11.0, 13.0, 17.0, 14.0, 14.0, 22.0, 24.0, 35.0, 25.0, 29.0, 21.0, 31.0, 36.0, 43.0, 38.0, 35.0, 47.0, 31.0, 41.0, 47.0, 41.0, 27.0, 37.0, 32.0, 24.0, 40.0, 38.0, 24.0, 25.0, 13.0, 11.0, 10.0, 13.0, 15.0, 12.0, 6.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.83245086669922, -90.99108123779297, -88.14971923828125, -85.308349609375, -82.46697998046875, -79.62561798095703, -76.78424835205078, -73.94288635253906, -71.10151672363281, -68.26014709472656, -65.41878509521484, -62.577415466308594, -59.73604965209961, -56.894683837890625, -54.053314208984375, -51.21194839477539, -48.370582580566406, -45.52921676635742, -42.68785095214844, -39.84648132324219, -37.0051155090332, -34.16374969482422, -31.3223819732666, -28.481014251708984, -25.6396484375, -22.798282623291016, -19.9569149017334, -17.11554718017578, -14.274181365966797, -11.432814598083496, -8.591447830200195, -5.750080108642578, -2.908721923828125, -0.06735515594482422, 2.7740116119384766, 5.615378379821777, 8.456745147705078, 11.298111915588379, 14.13947868347168, 16.980846405029297, 19.82221221923828, 22.663578033447266, 25.504945755004883, 28.3463134765625, 31.187679290771484, 34.02904510498047, 36.87041473388672, 39.7117805480957, 42.55314636230469, 45.39451217651367, 48.235877990722656, 51.077247619628906, 53.91861343383789, 56.759979248046875, 59.601348876953125, 62.44271469116211, 65.2840805053711, 68.12545013427734, 70.96681213378906, 73.80818176269531, 76.64955139160156, 79.49091339111328, 82.33228302001953, 85.17364501953125, 88.0150146484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 5.0, 6.0, 14.0, 14.0, 12.0, 21.0, 33.0, 36.0, 31.0, 40.0, 53.0, 65.0, 66.0, 76.0, 84.0, 69.0, 61.0, 46.0, 34.0, 38.0, 32.0, 24.0, 21.0, 19.0, 15.0, 21.0, 12.0, 9.0, 1.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1953125, -10.8250732421875, -10.454833984375, -10.0845947265625, -9.71435546875, -9.3441162109375, -8.973876953125, -8.6036376953125, -8.2333984375, -7.8631591796875, -7.492919921875, -7.1226806640625, -6.75244140625, -6.3822021484375, -6.011962890625, -5.6417236328125, -5.271484375, -4.9012451171875, -4.531005859375, -4.1607666015625, -3.79052734375, -3.4202880859375, -3.050048828125, -2.6798095703125, -2.3095703125, -1.9393310546875, -1.569091796875, -1.1988525390625, -0.82861328125, -0.4583740234375, -0.088134765625, 0.2821044921875, 0.65234375, 1.0225830078125, 1.392822265625, 1.7630615234375, 2.13330078125, 2.5035400390625, 2.873779296875, 3.2440185546875, 3.6142578125, 3.9844970703125, 4.354736328125, 4.7249755859375, 5.09521484375, 5.4654541015625, 5.835693359375, 6.2059326171875, 6.576171875, 6.9464111328125, 7.316650390625, 7.6868896484375, 8.05712890625, 8.4273681640625, 8.797607421875, 9.1678466796875, 9.5380859375, 9.9083251953125, 10.278564453125, 10.6488037109375, 11.01904296875, 11.3892822265625, 11.759521484375, 12.1297607421875, 12.5]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 10.0, 15.0, 22.0, 23.0, 41.0, 45.0, 74.0, 99.0, 186.0, 251.0, 462.0, 722.0, 1303.0, 2501.0, 5252.0, 12910.0, 54356.0, 2474029.0, 1576471.0, 41683.0, 12439.0, 5330.0, 2612.0, 1367.0, 757.0, 499.0, 264.0, 178.0, 121.0, 71.0, 46.0, 37.0, 25.0, 18.0, 19.0, 8.0, 13.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.78515625, -37.4453125, -36.10546875, -34.765625, -33.42578125, -32.0859375, -30.74609375, -29.40625, -28.06640625, -26.7265625, -25.38671875, -24.046875, -22.70703125, -21.3671875, -20.02734375, -18.6875, -17.34765625, -16.0078125, -14.66796875, -13.328125, -11.98828125, -10.6484375, -9.30859375, -7.96875, -6.62890625, -5.2890625, -3.94921875, -2.609375, -1.26953125, 0.0703125, 1.41015625, 2.75, 4.08984375, 5.4296875, 6.76953125, 8.109375, 9.44921875, 10.7890625, 12.12890625, 13.46875, 14.80859375, 16.1484375, 17.48828125, 18.828125, 20.16796875, 21.5078125, 22.84765625, 24.1875, 25.52734375, 26.8671875, 28.20703125, 29.546875, 30.88671875, 32.2265625, 33.56640625, 34.90625, 36.24609375, 37.5859375, 38.92578125, 40.265625, 41.60546875, 42.9453125, 44.28515625, 45.625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 5.0, 8.0, 12.0, 12.0, 12.0, 19.0, 17.0, 22.0, 23.0, 27.0, 55.0, 59.0, 88.0, 151.0, 313.0, 528.0, 756.0, 758.0, 417.0, 287.0, 155.0, 65.0, 59.0, 35.0, 30.0, 30.0, 20.0, 14.0, 10.0, 10.0, 8.0, 9.0, 8.0, 9.0, 3.0, 3.0, 5.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-28.828125, -27.924072265625, -27.02001953125, -26.115966796875, -25.2119140625, -24.307861328125, -23.40380859375, -22.499755859375, -21.595703125, -20.691650390625, -19.78759765625, -18.883544921875, -17.9794921875, -17.075439453125, -16.17138671875, -15.267333984375, -14.36328125, -13.459228515625, -12.55517578125, -11.651123046875, -10.7470703125, -9.843017578125, -8.93896484375, -8.034912109375, -7.130859375, -6.226806640625, -5.32275390625, -4.418701171875, -3.5146484375, -2.610595703125, -1.70654296875, -0.802490234375, 0.1015625, 1.005615234375, 1.90966796875, 2.813720703125, 3.7177734375, 4.621826171875, 5.52587890625, 6.429931640625, 7.333984375, 8.238037109375, 9.14208984375, 10.046142578125, 10.9501953125, 11.854248046875, 12.75830078125, 13.662353515625, 14.56640625, 15.470458984375, 16.37451171875, 17.278564453125, 18.1826171875, 19.086669921875, 19.99072265625, 20.894775390625, 21.798828125, 22.702880859375, 23.60693359375, 24.510986328125, 25.4150390625, 26.319091796875, 27.22314453125, 28.127197265625, 29.03125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 9.0, 4.0, 6.0, 10.0, 10.0, 21.0, 34.0, 39.0, 45.0, 67.0, 105.0, 171.0, 263.0, 410.0, 730.0, 1127.0, 1890.0, 3069.0, 5297.0, 9380.0, 17635.0, 36546.0, 97020.0, 940385.0, 2811242.0, 169229.0, 49047.0, 22540.0, 11639.0, 6560.0, 3831.0, 2250.0, 1274.0, 816.0, 539.0, 388.0, 236.0, 146.0, 106.0, 71.0, 45.0, 23.0, 14.0, 4.0, 11.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.953125, -32.65625, -31.359375, -30.0625, -28.765625, -27.46875, -26.171875, -24.875, -23.578125, -22.28125, -20.984375, -19.6875, -18.390625, -17.09375, -15.796875, -14.5, -13.203125, -11.90625, -10.609375, -9.3125, -8.015625, -6.71875, -5.421875, -4.125, -2.828125, -1.53125, -0.234375, 1.0625, 2.359375, 3.65625, 4.953125, 6.25, 7.546875, 8.84375, 10.140625, 11.4375, 12.734375, 14.03125, 15.328125, 16.625, 17.921875, 19.21875, 20.515625, 21.8125, 23.109375, 24.40625, 25.703125, 27.0, 28.296875, 29.59375, 30.890625, 32.1875, 33.484375, 34.78125, 36.078125, 37.375, 38.671875, 39.96875, 41.265625, 42.5625, 43.859375, 45.15625, 46.453125, 47.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 12.0, 16.0, 25.0, 55.0, 83.0, 221.0, 277.0, 155.0, 69.0, 39.0, 21.0, 12.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-302.0759582519531, -296.0727233886719, -290.0694580078125, -284.06622314453125, -278.0629577636719, -272.0597229003906, -266.05645751953125, -260.05322265625, -254.0499725341797, -248.04672241210938, -242.04347229003906, -236.04022216796875, -230.0369873046875, -224.0337371826172, -218.03048706054688, -212.02723693847656, -206.02398681640625, -200.02073669433594, -194.01748657226562, -188.0142364501953, -182.010986328125, -176.00775146484375, -170.00450134277344, -164.00125122070312, -157.9980010986328, -151.9947509765625, -145.9915008544922, -139.98825073242188, -133.98501586914062, -127.98175811767578, -121.978515625, -115.97526550292969, -109.97200775146484, -103.96875762939453, -97.96551513671875, -91.96226501464844, -85.95901489257812, -79.95576477050781, -73.9525146484375, -67.94927215576172, -61.946022033691406, -55.942771911621094, -49.93952560424805, -43.936279296875, -37.93302917480469, -31.929780960083008, -25.926532745361328, -19.92328643798828, -13.920036315917969, -7.916788101196289, -1.9135398864746094, 4.08970832824707, 10.09295654296875, 16.09620475769043, 22.09945297241211, 28.102699279785156, 34.10594940185547, 40.10919952392578, 46.11244583129883, 52.115692138671875, 58.11894226074219, 64.1221923828125, 70.12544250488281, 76.1286849975586, 82.1319351196289]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 12.0, 6.0, 12.0, 12.0, 18.0, 18.0, 25.0, 27.0, 29.0, 21.0, 34.0, 34.0, 38.0, 39.0, 43.0, 37.0, 42.0, 39.0, 34.0, 58.0, 50.0, 51.0, 37.0, 23.0, 19.0, 28.0, 28.0, 24.0, 32.0, 19.0, 16.0, 18.0, 12.0, 10.0, 11.0, 6.0, 13.0, 11.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-99.378662109375, -96.53338623046875, -93.68810272216797, -90.84281921386719, -87.99754333496094, -85.15226745605469, -82.3069839477539, -79.46170043945312, -76.61642456054688, -73.77114868164062, -70.92586517333984, -68.08058166503906, -65.23530578613281, -62.3900260925293, -59.54474639892578, -56.699466705322266, -53.85418701171875, -51.008907318115234, -48.16362762451172, -45.3183479309082, -42.47306823730469, -39.62778854370117, -36.782508850097656, -33.93722915649414, -31.091949462890625, -28.24666976928711, -25.401390075683594, -22.556110382080078, -19.710830688476562, -16.865550994873047, -14.020271301269531, -11.174991607666016, -8.3297119140625, -5.484432220458984, -2.6391525268554688, 0.20612716674804688, 3.0514068603515625, 5.896686553955078, 8.741966247558594, 11.58724594116211, 14.432525634765625, 17.27780532836914, 20.123085021972656, 22.968364715576172, 25.813644409179688, 28.658924102783203, 31.50420379638672, 34.349483489990234, 37.19476318359375, 40.040042877197266, 42.88532257080078, 45.7306022644043, 48.57588195800781, 51.42116165161133, 54.266441345214844, 57.11172103881836, 59.957000732421875, 62.80228042602539, 65.6475601196289, 68.49284362792969, 71.33811950683594, 74.18339538574219, 77.02867889404297, 79.87396240234375, 82.71923828125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 12.0, 9.0, 19.0, 16.0, 26.0, 38.0, 34.0, 39.0, 45.0, 58.0, 58.0, 63.0, 55.0, 43.0, 60.0, 63.0, 47.0, 48.0, 35.0, 41.0, 38.0, 17.0, 15.0, 16.0, 15.0, 16.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.25048828125, -10.8759765625, -10.50146484375, -10.126953125, -9.75244140625, -9.3779296875, -9.00341796875, -8.62890625, -8.25439453125, -7.8798828125, -7.50537109375, -7.130859375, -6.75634765625, -6.3818359375, -6.00732421875, -5.6328125, -5.25830078125, -4.8837890625, -4.50927734375, -4.134765625, -3.76025390625, -3.3857421875, -3.01123046875, -2.63671875, -2.26220703125, -1.8876953125, -1.51318359375, -1.138671875, -0.76416015625, -0.3896484375, -0.01513671875, 0.359375, 0.73388671875, 1.1083984375, 1.48291015625, 1.857421875, 2.23193359375, 2.6064453125, 2.98095703125, 3.35546875, 3.72998046875, 4.1044921875, 4.47900390625, 4.853515625, 5.22802734375, 5.6025390625, 5.97705078125, 6.3515625, 6.72607421875, 7.1005859375, 7.47509765625, 7.849609375, 8.22412109375, 8.5986328125, 8.97314453125, 9.34765625, 9.72216796875, 10.0966796875, 10.47119140625, 10.845703125, 11.22021484375, 11.5947265625, 11.96923828125, 12.34375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 9.0, 13.0, 20.0, 26.0, 30.0, 65.0, 67.0, 98.0, 175.0, 270.0, 421.0, 657.0, 1032.0, 1558.0, 2585.0, 4188.0, 7074.0, 12257.0, 22600.0, 42976.0, 90700.0, 223307.0, 348733.0, 150069.0, 65281.0, 32348.0, 17409.0, 9684.0, 5719.0, 3433.0, 2083.0, 1246.0, 911.0, 525.0, 331.0, 238.0, 134.0, 89.0, 55.0, 39.0, 45.0, 17.0, 24.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2451171875, -1.2065582275390625, -1.167999267578125, -1.1294403076171875, -1.09088134765625, -1.0523223876953125, -1.013763427734375, -0.9752044677734375, -0.9366455078125, -0.8980865478515625, -0.859527587890625, -0.8209686279296875, -0.78240966796875, -0.7438507080078125, -0.705291748046875, -0.6667327880859375, -0.628173828125, -0.5896148681640625, -0.551055908203125, -0.5124969482421875, -0.47393798828125, -0.4353790283203125, -0.396820068359375, -0.3582611083984375, -0.3197021484375, -0.2811431884765625, -0.242584228515625, -0.2040252685546875, -0.16546630859375, -0.1269073486328125, -0.088348388671875, -0.0497894287109375, -0.01123046875, 0.0273284912109375, 0.065887451171875, 0.1044464111328125, 0.14300537109375, 0.1815643310546875, 0.220123291015625, 0.2586822509765625, 0.2972412109375, 0.3358001708984375, 0.374359130859375, 0.4129180908203125, 0.45147705078125, 0.4900360107421875, 0.528594970703125, 0.5671539306640625, 0.605712890625, 0.6442718505859375, 0.682830810546875, 0.7213897705078125, 0.75994873046875, 0.7985076904296875, 0.837066650390625, 0.8756256103515625, 0.9141845703125, 0.9527435302734375, 0.991302490234375, 1.0298614501953125, 1.06842041015625, 1.1069793701171875, 1.145538330078125, 1.1840972900390625, 1.22265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 6.0, 13.0, 10.0, 13.0, 8.0, 12.0, 20.0, 19.0, 22.0, 29.0, 50.0, 27.0, 35.0, 40.0, 47.0, 51.0, 52.0, 35.0, 1064.0, 37.0, 45.0, 48.0, 42.0, 43.0, 39.0, 28.0, 26.0, 23.0, 21.0, 22.0, 15.0, 15.0, 11.0, 14.0, 18.0, 7.0, 5.0, 6.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.86114501953125, -7.6441650390625, -7.42718505859375, -7.210205078125, -6.99322509765625, -6.7762451171875, -6.55926513671875, -6.34228515625, -6.12530517578125, -5.9083251953125, -5.69134521484375, -5.474365234375, -5.25738525390625, -5.0404052734375, -4.82342529296875, -4.6064453125, -4.38946533203125, -4.1724853515625, -3.95550537109375, -3.738525390625, -3.52154541015625, -3.3045654296875, -3.08758544921875, -2.87060546875, -2.65362548828125, -2.4366455078125, -2.21966552734375, -2.002685546875, -1.78570556640625, -1.5687255859375, -1.35174560546875, -1.134765625, -0.91778564453125, -0.7008056640625, -0.48382568359375, -0.266845703125, -0.04986572265625, 0.1671142578125, 0.38409423828125, 0.60107421875, 0.81805419921875, 1.0350341796875, 1.25201416015625, 1.468994140625, 1.68597412109375, 1.9029541015625, 2.11993408203125, 2.3369140625, 2.55389404296875, 2.7708740234375, 2.98785400390625, 3.204833984375, 3.42181396484375, 3.6387939453125, 3.85577392578125, 4.07275390625, 4.28973388671875, 4.5067138671875, 4.72369384765625, 4.940673828125, 5.15765380859375, 5.3746337890625, 5.59161376953125, 5.80859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 8.0, 17.0, 19.0, 16.0, 37.0, 37.0, 37.0, 97.0, 159.0, 256.0, 347.0, 649.0, 956.0, 1532.0, 2323.0, 3495.0, 5331.0, 8102.0, 12556.0, 19505.0, 32014.0, 54838.0, 98969.0, 188949.0, 1299646.0, 158256.0, 83730.0, 47685.0, 28437.0, 17474.0, 10990.0, 7183.0, 4692.0, 3165.0, 1980.0, 1358.0, 820.0, 495.0, 347.0, 245.0, 142.0, 75.0, 61.0, 30.0, 28.0, 16.0, 15.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.5156021118164062, -0.4960479736328125, -0.47649383544921875, -0.456939697265625, -0.43738555908203125, -0.4178314208984375, -0.39827728271484375, -0.37872314453125, -0.35916900634765625, -0.3396148681640625, -0.32006072998046875, -0.300506591796875, -0.28095245361328125, -0.2613983154296875, -0.24184417724609375, -0.2222900390625, -0.20273590087890625, -0.1831817626953125, -0.16362762451171875, -0.144073486328125, -0.12451934814453125, -0.1049652099609375, -0.08541107177734375, -0.06585693359375, -0.04630279541015625, -0.0267486572265625, -0.00719451904296875, 0.012359619140625, 0.03191375732421875, 0.0514678955078125, 0.07102203369140625, 0.090576171875, 0.11013031005859375, 0.1296844482421875, 0.14923858642578125, 0.168792724609375, 0.18834686279296875, 0.2079010009765625, 0.22745513916015625, 0.24700927734375, 0.26656341552734375, 0.2861175537109375, 0.30567169189453125, 0.325225830078125, 0.34477996826171875, 0.3643341064453125, 0.38388824462890625, 0.4034423828125, 0.42299652099609375, 0.4425506591796875, 0.46210479736328125, 0.481658935546875, 0.5012130737304688, 0.5207672119140625, 0.5403213500976562, 0.55987548828125, 0.5794296264648438, 0.5989837646484375, 0.6185379028320312, 0.638092041015625, 0.6576461791992188, 0.6772003173828125, 0.6967544555664062, 0.71630859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 9.0, 11.0, 9.0, 12.0, 15.0, 16.0, 26.0, 37.0, 35.0, 40.0, 37.0, 38.0, 35.0, 53.0, 49.0, 50.0, 49.0, 70.0, 53.0, 51.0, 42.0, 46.0, 25.0, 31.0, 26.0, 13.0, 15.0, 14.0, 16.0, 10.0, 12.0, 7.0, 8.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.016937255859375, -0.016445398330688477, -0.015953540802001953, -0.01546168327331543, -0.014969825744628906, -0.014477968215942383, -0.01398611068725586, -0.013494253158569336, -0.013002395629882812, -0.012510538101196289, -0.012018680572509766, -0.011526823043823242, -0.011034965515136719, -0.010543107986450195, -0.010051250457763672, -0.009559392929077148, -0.009067535400390625, -0.008575677871704102, -0.008083820343017578, -0.007591962814331055, -0.007100105285644531, -0.006608247756958008, -0.006116390228271484, -0.005624532699584961, -0.0051326751708984375, -0.004640817642211914, -0.004148960113525391, -0.003657102584838867, -0.0031652450561523438, -0.0026733875274658203, -0.002181529998779297, -0.0016896724700927734, -0.00119781494140625, -0.0007059574127197266, -0.00021409988403320312, 0.0002777576446533203, 0.0007696151733398438, 0.0012614727020263672, 0.0017533302307128906, 0.002245187759399414, 0.0027370452880859375, 0.003228902816772461, 0.0037207603454589844, 0.004212617874145508, 0.004704475402832031, 0.005196332931518555, 0.005688190460205078, 0.0061800479888916016, 0.006671905517578125, 0.0071637630462646484, 0.007655620574951172, 0.008147478103637695, 0.008639335632324219, 0.009131193161010742, 0.009623050689697266, 0.010114908218383789, 0.010606765747070312, 0.011098623275756836, 0.01159048080444336, 0.012082338333129883, 0.012574195861816406, 0.01306605339050293, 0.013557910919189453, 0.014049768447875977, 0.0145416259765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 0.0, 6.0, 3.0, 12.0, 13.0, 8.0, 25.0, 17.0, 10.0, 26.0, 33.0, 37.0, 29.0, 47.0, 77.0, 82.0, 121.0, 224.0, 502.0, 117316.0, 928720.0, 516.0, 215.0, 112.0, 73.0, 53.0, 38.0, 50.0, 37.0, 36.0, 17.0, 14.0, 15.0, 13.0, 12.0, 13.0, 8.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.513671875, -0.49658203125, -0.4794921875, -0.46240234375, -0.4453125, -0.42822265625, -0.4111328125, -0.39404296875, -0.376953125, -0.35986328125, -0.3427734375, -0.32568359375, -0.30859375, -0.29150390625, -0.2744140625, -0.25732421875, -0.240234375, -0.22314453125, -0.2060546875, -0.18896484375, -0.171875, -0.15478515625, -0.1376953125, -0.12060546875, -0.103515625, -0.08642578125, -0.0693359375, -0.05224609375, -0.03515625, -0.01806640625, -0.0009765625, 0.01611328125, 0.033203125, 0.05029296875, 0.0673828125, 0.08447265625, 0.1015625, 0.11865234375, 0.1357421875, 0.15283203125, 0.169921875, 0.18701171875, 0.2041015625, 0.22119140625, 0.23828125, 0.25537109375, 0.2724609375, 0.28955078125, 0.306640625, 0.32373046875, 0.3408203125, 0.35791015625, 0.375, 0.39208984375, 0.4091796875, 0.42626953125, 0.443359375, 0.46044921875, 0.4775390625, 0.49462890625, 0.51171875, 0.52880859375, 0.5458984375, 0.56298828125, 0.580078125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1012.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007155167404562235, 0.007726811338216066, 0.022608790546655655, 0.03749076649546623, 0.05237274616956711, 0.06725472956895828, 0.08213670551776886, 0.09701868891716003, 0.11190066486597061, 0.1267826408147812, 0.14166462421417236, 0.15654659271240234, 0.17142857611179352, 0.1863105595111847, 0.20119252800941467, 0.21607452630996704, 0.23095649480819702, 0.2458384782075882, 0.26072046160697937, 0.27560243010520935, 0.29048439860343933, 0.3053663969039917, 0.3202483654022217, 0.33513033390045166, 0.35001233220100403, 0.364894300699234, 0.3797762989997864, 0.39465826749801636, 0.40954023599624634, 0.4244222342967987, 0.4393042027950287, 0.45418620109558105, 0.46906813979148865, 0.48395010828971863, 0.498832106590271, 0.513714075088501, 0.528596043586731, 0.5434780120849609, 0.5583599805831909, 0.5732420086860657, 0.5881239771842957, 0.6030059456825256, 0.6178879141807556, 0.6327699422836304, 0.6476519107818604, 0.6625338792800903, 0.6774158477783203, 0.6922978162765503, 0.7071797847747803, 0.7220617532730103, 0.7369437217712402, 0.7518256902694702, 0.766707718372345, 0.781589686870575, 0.7964716553688049, 0.8113536238670349, 0.8262356519699097, 0.8411176204681396, 0.8559995889663696, 0.8708815574645996, 0.8857635855674744, 0.9006455540657043, 0.9155275225639343, 0.9304094910621643, 0.9452914595603943]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 18.0, 19.0, 15.0, 16.0, 28.0, 26.0, 33.0, 30.0, 40.0, 33.0, 46.0, 45.0, 53.0, 47.0, 49.0, 61.0, 47.0, 43.0, 44.0, 58.0, 38.0, 38.0, 29.0, 32.0, 24.0, 10.0, 23.0, 8.0, 12.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05142170190811157, -0.0501592755317688, -0.048896849155426025, -0.04763442650437355, -0.04637200012803078, -0.045109573751688004, -0.04384715110063553, -0.042584724724292755, -0.04132229834794998, -0.04005987197160721, -0.038797445595264435, -0.03753502294421196, -0.036272596567869186, -0.03501017019152641, -0.03374774754047394, -0.032485321164131165, -0.03122289478778839, -0.029960468411445618, -0.028698043897747993, -0.02743561938405037, -0.026173193007707596, -0.024910766631364822, -0.023648342117667198, -0.022385917603969574, -0.0211234912276268, -0.019861064851284027, -0.018598640337586403, -0.01733621582388878, -0.016073789447546005, -0.014811364002525806, -0.013548938557505608, -0.012286513112485409, -0.01102408766746521, -0.009761662222445011, -0.008499236777424812, -0.0072368113324046135, -0.005974385887384415, -0.004711960442364216, -0.003449534997344017, -0.002187109552323818, -0.0009246841073036194, 0.00033774133771657944, 0.0016001667827367783, 0.002862592227756977, 0.004125017672777176, 0.005387443117797375, 0.0066498685628175735, 0.007912294007837772, 0.009174719452857971, 0.01043714489787817, 0.011699570342898369, 0.012961995787918568, 0.014224421232938766, 0.015486846677958965, 0.016749272122979164, 0.01801169663667679, 0.019274123013019562, 0.020536549389362335, 0.02179897390305996, 0.023061398416757584, 0.024323824793100357, 0.02558625116944313, 0.026848675683140755, 0.02811110019683838, 0.029373526573181152]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 12.0, 9.0, 19.0, 16.0, 26.0, 38.0, 34.0, 39.0, 45.0, 58.0, 58.0, 63.0, 55.0, 43.0, 60.0, 63.0, 48.0, 47.0, 35.0, 41.0, 38.0, 17.0, 15.0, 16.0, 15.0, 16.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.25048828125, -10.8759765625, -10.50146484375, -10.126953125, -9.75244140625, -9.3779296875, -9.00341796875, -8.62890625, -8.25439453125, -7.8798828125, -7.50537109375, -7.130859375, -6.75634765625, -6.3818359375, -6.00732421875, -5.6328125, -5.25830078125, -4.8837890625, -4.50927734375, -4.134765625, -3.76025390625, -3.3857421875, -3.01123046875, -2.63671875, -2.26220703125, -1.8876953125, -1.51318359375, -1.138671875, -0.76416015625, -0.3896484375, -0.01513671875, 0.359375, 0.73388671875, 1.1083984375, 1.48291015625, 1.857421875, 2.23193359375, 2.6064453125, 2.98095703125, 3.35546875, 3.72998046875, 4.1044921875, 4.47900390625, 4.853515625, 5.22802734375, 5.6025390625, 5.97705078125, 6.3515625, 6.72607421875, 7.1005859375, 7.47509765625, 7.849609375, 8.22412109375, 8.5986328125, 8.97314453125, 9.34765625, 9.72216796875, 10.0966796875, 10.47119140625, 10.845703125, 11.22021484375, 11.5947265625, 11.96923828125, 12.34375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 5.0, 15.0, 20.0, 29.0, 39.0, 44.0, 65.0, 94.0, 165.0, 197.0, 318.0, 553.0, 1065.0, 1991.0, 4532.0, 12482.0, 44583.0, 266744.0, 596431.0, 85712.0, 20666.0, 6867.0, 2719.0, 1299.0, 712.0, 371.0, 260.0, 153.0, 125.0, 83.0, 51.0, 45.0, 30.0, 19.0, 21.0, 11.0, 10.0, 4.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.2996826171875, -9.958740234375, -9.6177978515625, -9.27685546875, -8.9359130859375, -8.594970703125, -8.2540283203125, -7.9130859375, -7.5721435546875, -7.231201171875, -6.8902587890625, -6.54931640625, -6.2083740234375, -5.867431640625, -5.5264892578125, -5.185546875, -4.8446044921875, -4.503662109375, -4.1627197265625, -3.82177734375, -3.4808349609375, -3.139892578125, -2.7989501953125, -2.4580078125, -2.1170654296875, -1.776123046875, -1.4351806640625, -1.09423828125, -0.7532958984375, -0.412353515625, -0.0714111328125, 0.26953125, 0.6104736328125, 0.951416015625, 1.2923583984375, 1.63330078125, 1.9742431640625, 2.315185546875, 2.6561279296875, 2.9970703125, 3.3380126953125, 3.678955078125, 4.0198974609375, 4.36083984375, 4.7017822265625, 5.042724609375, 5.3836669921875, 5.724609375, 6.0655517578125, 6.406494140625, 6.7474365234375, 7.08837890625, 7.4293212890625, 7.770263671875, 8.1112060546875, 8.4521484375, 8.7930908203125, 9.134033203125, 9.4749755859375, 9.81591796875, 10.1568603515625, 10.497802734375, 10.8387451171875, 11.1796875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 2.0, 5.0, 8.0, 9.0, 9.0, 8.0, 14.0, 13.0, 14.0, 24.0, 15.0, 39.0, 25.0, 41.0, 31.0, 34.0, 47.0, 49.0, 55.0, 64.0, 1865.0, 188.0, 66.0, 53.0, 35.0, 45.0, 29.0, 32.0, 23.0, 36.0, 25.0, 20.0, 18.0, 18.0, 19.0, 13.0, 8.0, 9.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-41.0, -39.8544921875, -38.708984375, -37.5634765625, -36.41796875, -35.2724609375, -34.126953125, -32.9814453125, -31.8359375, -30.6904296875, -29.544921875, -28.3994140625, -27.25390625, -26.1083984375, -24.962890625, -23.8173828125, -22.671875, -21.5263671875, -20.380859375, -19.2353515625, -18.08984375, -16.9443359375, -15.798828125, -14.6533203125, -13.5078125, -12.3623046875, -11.216796875, -10.0712890625, -8.92578125, -7.7802734375, -6.634765625, -5.4892578125, -4.34375, -3.1982421875, -2.052734375, -0.9072265625, 0.23828125, 1.3837890625, 2.529296875, 3.6748046875, 4.8203125, 5.9658203125, 7.111328125, 8.2568359375, 9.40234375, 10.5478515625, 11.693359375, 12.8388671875, 13.984375, 15.1298828125, 16.275390625, 17.4208984375, 18.56640625, 19.7119140625, 20.857421875, 22.0029296875, 23.1484375, 24.2939453125, 25.439453125, 26.5849609375, 27.73046875, 28.8759765625, 30.021484375, 31.1669921875, 32.3125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 11.0, 7.0, 13.0, 16.0, 21.0, 19.0, 20.0, 28.0, 47.0, 38.0, 55.0, 64.0, 104.0, 199.0, 450.0, 1436.0, 28177.0, 3106234.0, 6901.0, 904.0, 335.0, 174.0, 80.0, 63.0, 59.0, 36.0, 46.0, 18.0, 29.0, 15.0, 10.0, 19.0, 9.0, 9.0, 8.0, 5.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7255859375, -68.138671875, -65.5517578125, -62.96484375, -60.3779296875, -57.791015625, -55.2041015625, -52.6171875, -50.0302734375, -47.443359375, -44.8564453125, -42.26953125, -39.6826171875, -37.095703125, -34.5087890625, -31.921875, -29.3349609375, -26.748046875, -24.1611328125, -21.57421875, -18.9873046875, -16.400390625, -13.8134765625, -11.2265625, -8.6396484375, -6.052734375, -3.4658203125, -0.87890625, 1.7080078125, 4.294921875, 6.8818359375, 9.46875, 12.0556640625, 14.642578125, 17.2294921875, 19.81640625, 22.4033203125, 24.990234375, 27.5771484375, 30.1640625, 32.7509765625, 35.337890625, 37.9248046875, 40.51171875, 43.0986328125, 45.685546875, 48.2724609375, 50.859375, 53.4462890625, 56.033203125, 58.6201171875, 61.20703125, 63.7939453125, 66.380859375, 68.9677734375, 71.5546875, 74.1416015625, 76.728515625, 79.3154296875, 81.90234375, 84.4892578125, 87.076171875, 89.6630859375, 92.25]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 164.0, 857.0], "bins": [-921.3816528320312, -906.7872924804688, -892.1929321289062, -877.5985717773438, -863.004150390625, -848.4097900390625, -833.8154296875, -819.2210693359375, -804.626708984375, -790.0323486328125, -775.43798828125, -760.8436279296875, -746.249267578125, -731.6548461914062, -717.0604858398438, -702.4661254882812, -687.8717651367188, -673.2774047851562, -658.6830444335938, -644.0886840820312, -629.4942626953125, -614.89990234375, -600.3055419921875, -585.711181640625, -571.1168212890625, -556.5224609375, -541.9281005859375, -527.333740234375, -512.7393798828125, -498.1449890136719, -483.55059814453125, -468.95623779296875, -454.36187744140625, -439.76751708984375, -425.17315673828125, -410.5787658691406, -395.9844055175781, -381.3900451660156, -366.795654296875, -352.2012939453125, -337.60693359375, -323.0125732421875, -308.418212890625, -293.8238220214844, -279.2294616699219, -264.6351013183594, -250.0407257080078, -235.44635009765625, -220.85198974609375, -206.25762939453125, -191.6632537841797, -177.06887817382812, -162.47451782226562, -147.88015747070312, -133.28578186035156, -118.69141387939453, -104.0970458984375, -89.50267791748047, -74.90830993652344, -60.313941955566406, -45.719573974609375, -31.125205993652344, -16.530838012695312, -1.9364700317382812, 12.657898902893066]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 5.0, 5.0, 14.0, 9.0, 18.0, 11.0, 20.0, 21.0, 20.0, 18.0, 33.0, 33.0, 32.0, 31.0, 44.0, 35.0, 34.0, 33.0, 45.0, 58.0, 41.0, 37.0, 35.0, 37.0, 32.0, 23.0, 33.0, 33.0, 39.0, 21.0, 26.0, 23.0, 22.0, 15.0, 6.0, 7.0, 12.0, 7.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-106.93266296386719, -103.48381042480469, -100.03496551513672, -96.58611297607422, -93.13726806640625, -89.68841552734375, -86.23956298828125, -82.79071807861328, -79.34187316894531, -75.89302062988281, -72.44417572021484, -68.99532318115234, -65.54647827148438, -62.097625732421875, -58.64877700805664, -55.199928283691406, -51.751075744628906, -48.30222702026367, -44.85337829589844, -41.40452575683594, -37.95568084716797, -34.50682830810547, -31.057979583740234, -27.609130859375, -24.160282135009766, -20.71143341064453, -17.262584686279297, -13.81373405456543, -10.364885330200195, -6.916036605834961, -3.4671859741210938, -0.018337249755859375, 3.4305038452148438, 6.879353046417236, 10.328202247619629, 13.77705192565918, 17.225900650024414, 20.67474937438965, 24.123600006103516, 27.57244873046875, 31.021297454833984, 34.47014617919922, 37.91899490356445, 41.36784362792969, 44.81669616699219, 48.265541076660156, 51.714393615722656, 55.16324234008789, 58.612091064453125, 62.06093978881836, 65.5097885131836, 68.9586410522461, 72.40748596191406, 75.85633850097656, 79.30519104003906, 82.75403594970703, 86.202880859375, 89.6517333984375, 93.10057830810547, 96.54943084716797, 99.99827575683594, 103.44712829589844, 106.89598083496094, 110.3448257446289, 113.7936782836914]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 10.0, 11.0, 10.0, 9.0, 16.0, 22.0, 24.0, 32.0, 39.0, 39.0, 40.0, 49.0, 65.0, 63.0, 57.0, 52.0, 61.0, 63.0, 44.0, 41.0, 46.0, 38.0, 33.0, 22.0, 20.0, 10.0, 18.0, 16.0, 7.0, 8.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0390625, -11.6522216796875, -11.265380859375, -10.8785400390625, -10.49169921875, -10.1048583984375, -9.718017578125, -9.3311767578125, -8.9443359375, -8.5574951171875, -8.170654296875, -7.7838134765625, -7.39697265625, -7.0101318359375, -6.623291015625, -6.2364501953125, -5.849609375, -5.4627685546875, -5.075927734375, -4.6890869140625, -4.30224609375, -3.9154052734375, -3.528564453125, -3.1417236328125, -2.7548828125, -2.3680419921875, -1.981201171875, -1.5943603515625, -1.20751953125, -0.8206787109375, -0.433837890625, -0.0469970703125, 0.33984375, 0.7266845703125, 1.113525390625, 1.5003662109375, 1.88720703125, 2.2740478515625, 2.660888671875, 3.0477294921875, 3.4345703125, 3.8214111328125, 4.208251953125, 4.5950927734375, 4.98193359375, 5.3687744140625, 5.755615234375, 6.1424560546875, 6.529296875, 6.9161376953125, 7.302978515625, 7.6898193359375, 8.07666015625, 8.4635009765625, 8.850341796875, 9.2371826171875, 9.6240234375, 10.0108642578125, 10.397705078125, 10.7845458984375, 11.17138671875, 11.5582275390625, 11.945068359375, 12.3319091796875, 12.71875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 11.0, 16.0, 24.0, 32.0, 44.0, 65.0, 131.0, 226.0, 335.0, 572.0, 1241.0, 2543.0, 5728.0, 16076.0, 187857.0, 3871790.0, 84485.0, 13119.0, 5010.0, 2276.0, 1161.0, 621.0, 373.0, 198.0, 111.0, 68.0, 46.0, 34.0, 15.0, 19.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.5, -51.796875, -50.09375, -48.390625, -46.6875, -44.984375, -43.28125, -41.578125, -39.875, -38.171875, -36.46875, -34.765625, -33.0625, -31.359375, -29.65625, -27.953125, -26.25, -24.546875, -22.84375, -21.140625, -19.4375, -17.734375, -16.03125, -14.328125, -12.625, -10.921875, -9.21875, -7.515625, -5.8125, -4.109375, -2.40625, -0.703125, 1.0, 2.703125, 4.40625, 6.109375, 7.8125, 9.515625, 11.21875, 12.921875, 14.625, 16.328125, 18.03125, 19.734375, 21.4375, 23.140625, 24.84375, 26.546875, 28.25, 29.953125, 31.65625, 33.359375, 35.0625, 36.765625, 38.46875, 40.171875, 41.875, 43.578125, 45.28125, 46.984375, 48.6875, 50.390625, 52.09375, 53.796875, 55.5]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 10.0, 15.0, 14.0, 23.0, 21.0, 21.0, 34.0, 29.0, 59.0, 107.0, 222.0, 385.0, 733.0, 882.0, 668.0, 310.0, 170.0, 93.0, 59.0, 33.0, 32.0, 23.0, 14.0, 8.0, 9.0, 8.0, 11.0, 6.0, 8.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.84375, -27.86083984375, -26.8779296875, -25.89501953125, -24.912109375, -23.92919921875, -22.9462890625, -21.96337890625, -20.98046875, -19.99755859375, -19.0146484375, -18.03173828125, -17.048828125, -16.06591796875, -15.0830078125, -14.10009765625, -13.1171875, -12.13427734375, -11.1513671875, -10.16845703125, -9.185546875, -8.20263671875, -7.2197265625, -6.23681640625, -5.25390625, -4.27099609375, -3.2880859375, -2.30517578125, -1.322265625, -0.33935546875, 0.6435546875, 1.62646484375, 2.609375, 3.59228515625, 4.5751953125, 5.55810546875, 6.541015625, 7.52392578125, 8.5068359375, 9.48974609375, 10.47265625, 11.45556640625, 12.4384765625, 13.42138671875, 14.404296875, 15.38720703125, 16.3701171875, 17.35302734375, 18.3359375, 19.31884765625, 20.3017578125, 21.28466796875, 22.267578125, 23.25048828125, 24.2333984375, 25.21630859375, 26.19921875, 27.18212890625, 28.1650390625, 29.14794921875, 30.130859375, 31.11376953125, 32.0966796875, 33.07958984375, 34.0625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 11.0, 3.0, 7.0, 9.0, 16.0, 29.0, 37.0, 50.0, 60.0, 102.0, 115.0, 172.0, 226.0, 340.0, 487.0, 666.0, 1002.0, 1420.0, 2092.0, 3205.0, 4710.0, 7480.0, 12036.0, 20583.0, 40210.0, 113751.0, 1051310.0, 2608134.0, 206224.0, 53991.0, 25447.0, 14428.0, 8786.0, 5526.0, 3690.0, 2435.0, 1655.0, 1115.0, 793.0, 551.0, 369.0, 295.0, 185.0, 166.0, 113.0, 61.0, 47.0, 34.0, 22.0, 21.0, 21.0, 18.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0], "bins": [-35.25, -34.1875, -33.125, -32.0625, -31.0, -29.9375, -28.875, -27.8125, -26.75, -25.6875, -24.625, -23.5625, -22.5, -21.4375, -20.375, -19.3125, -18.25, -17.1875, -16.125, -15.0625, -14.0, -12.9375, -11.875, -10.8125, -9.75, -8.6875, -7.625, -6.5625, -5.5, -4.4375, -3.375, -2.3125, -1.25, -0.1875, 0.875, 1.9375, 3.0, 4.0625, 5.125, 6.1875, 7.25, 8.3125, 9.375, 10.4375, 11.5, 12.5625, 13.625, 14.6875, 15.75, 16.8125, 17.875, 18.9375, 20.0, 21.0625, 22.125, 23.1875, 24.25, 25.3125, 26.375, 27.4375, 28.5, 29.5625, 30.625, 31.6875, 32.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 23.0, 45.0, 60.0, 144.0, 306.0, 215.0, 103.0, 51.0, 24.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-384.76837158203125, -377.0287170410156, -369.2890625, -361.54937744140625, -353.8097229003906, -346.070068359375, -338.3304138183594, -330.59075927734375, -322.85107421875, -315.1114196777344, -307.37176513671875, -299.632080078125, -291.8924255371094, -284.15277099609375, -276.4131164550781, -268.6734619140625, -260.9338073730469, -253.19415283203125, -245.45448303222656, -237.71482849121094, -229.97515869140625, -222.23550415039062, -214.495849609375, -206.75619506835938, -199.0165252685547, -191.27687072753906, -183.53720092773438, -175.79754638671875, -168.05789184570312, -160.31822204589844, -152.5785675048828, -144.83889770507812, -137.09925842285156, -129.35960388183594, -121.61993408203125, -113.88027954101562, -106.14061737060547, -98.40095520019531, -90.66130065917969, -82.92163848876953, -75.18197631835938, -67.44231414794922, -59.70265579223633, -51.96299743652344, -44.22333526611328, -36.483673095703125, -28.744014739990234, -21.004356384277344, -13.264694213867188, -5.525033950805664, 2.2146263122558594, 9.954286575317383, 17.693946838378906, 25.433609008789062, 33.17326736450195, 40.912925720214844, 48.652587890625, 56.392250061035156, 64.13191223144531, 71.87156677246094, 79.6112289428711, 87.35089111328125, 95.09054565429688, 102.83020782470703, 110.56986999511719]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 10.0, 10.0, 15.0, 15.0, 19.0, 17.0, 25.0, 27.0, 20.0, 15.0, 32.0, 41.0, 39.0, 32.0, 32.0, 31.0, 44.0, 33.0, 33.0, 39.0, 41.0, 52.0, 39.0, 43.0, 30.0, 28.0, 30.0, 24.0, 28.0, 22.0, 16.0, 19.0, 14.0, 17.0, 8.0, 8.0, 8.0, 11.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-87.39977264404297, -84.71659851074219, -82.03343200683594, -79.35026550292969, -76.6670913696289, -73.98391723632812, -71.30075073242188, -68.61758422851562, -65.93441009521484, -63.25123977661133, -60.56806945800781, -57.8848991394043, -55.20172882080078, -52.518558502197266, -49.83538818359375, -47.152217864990234, -44.46904754638672, -41.7858772277832, -39.10270690917969, -36.41953659057617, -33.736366271972656, -31.05319595336914, -28.370025634765625, -25.68685531616211, -23.003684997558594, -20.320514678955078, -17.637344360351562, -14.954174041748047, -12.271003723144531, -9.587833404541016, -6.9046630859375, -4.221492767333984, -1.5383148193359375, 1.1448554992675781, 3.8280258178710938, 6.511196136474609, 9.194366455078125, 11.87753677368164, 14.560707092285156, 17.243877410888672, 19.927047729492188, 22.610218048095703, 25.29338836669922, 27.976558685302734, 30.65972900390625, 33.342899322509766, 36.02606964111328, 38.7092399597168, 41.39241027832031, 44.07558059692383, 46.758750915527344, 49.44192123413086, 52.125091552734375, 54.80826187133789, 57.491432189941406, 60.17460250854492, 62.85777282714844, 65.54093933105469, 68.22411346435547, 70.90728759765625, 73.5904541015625, 76.27362060546875, 78.95679473876953, 81.63996887207031, 84.32313537597656]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 2.0, 4.0, 8.0, 6.0, 6.0, 6.0, 18.0, 17.0, 17.0, 15.0, 32.0, 20.0, 36.0, 39.0, 31.0, 50.0, 55.0, 58.0, 65.0, 56.0, 58.0, 40.0, 52.0, 47.0, 36.0, 26.0, 27.0, 34.0, 31.0, 18.0, 12.0, 15.0, 18.0, 7.0, 5.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.0955810546875, -10.730224609375, -10.3648681640625, -9.99951171875, -9.6341552734375, -9.268798828125, -8.9034423828125, -8.5380859375, -8.1727294921875, -7.807373046875, -7.4420166015625, -7.07666015625, -6.7113037109375, -6.345947265625, -5.9805908203125, -5.615234375, -5.2498779296875, -4.884521484375, -4.5191650390625, -4.15380859375, -3.7884521484375, -3.423095703125, -3.0577392578125, -2.6923828125, -2.3270263671875, -1.961669921875, -1.5963134765625, -1.23095703125, -0.8656005859375, -0.500244140625, -0.1348876953125, 0.23046875, 0.5958251953125, 0.961181640625, 1.3265380859375, 1.69189453125, 2.0572509765625, 2.422607421875, 2.7879638671875, 3.1533203125, 3.5186767578125, 3.884033203125, 4.2493896484375, 4.61474609375, 4.9801025390625, 5.345458984375, 5.7108154296875, 6.076171875, 6.4415283203125, 6.806884765625, 7.1722412109375, 7.53759765625, 7.9029541015625, 8.268310546875, 8.6336669921875, 8.9990234375, 9.3643798828125, 9.729736328125, 10.0950927734375, 10.46044921875, 10.8258056640625, 11.191162109375, 11.5565185546875, 11.921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 13.0, 11.0, 9.0, 33.0, 37.0, 47.0, 82.0, 123.0, 185.0, 237.0, 370.0, 495.0, 727.0, 1025.0, 1598.0, 2362.0, 3592.0, 5670.0, 9006.0, 14921.0, 24869.0, 43867.0, 84457.0, 178833.0, 304704.0, 178403.0, 84017.0, 43960.0, 24737.0, 14612.0, 8967.0, 5615.0, 3610.0, 2351.0, 1591.0, 1080.0, 753.0, 503.0, 303.0, 248.0, 176.0, 103.0, 76.0, 56.0, 40.0, 28.0, 25.0, 16.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.119140625, -1.0847015380859375, -1.050262451171875, -1.0158233642578125, -0.98138427734375, -0.9469451904296875, -0.912506103515625, -0.8780670166015625, -0.8436279296875, -0.8091888427734375, -0.774749755859375, -0.7403106689453125, -0.70587158203125, -0.6714324951171875, -0.636993408203125, -0.6025543212890625, -0.568115234375, -0.5336761474609375, -0.499237060546875, -0.4647979736328125, -0.43035888671875, -0.3959197998046875, -0.361480712890625, -0.3270416259765625, -0.2926025390625, -0.2581634521484375, -0.223724365234375, -0.1892852783203125, -0.15484619140625, -0.1204071044921875, -0.085968017578125, -0.0515289306640625, -0.01708984375, 0.0173492431640625, 0.051788330078125, 0.0862274169921875, 0.12066650390625, 0.1551055908203125, 0.189544677734375, 0.2239837646484375, 0.2584228515625, 0.2928619384765625, 0.327301025390625, 0.3617401123046875, 0.39617919921875, 0.4306182861328125, 0.465057373046875, 0.4994964599609375, 0.533935546875, 0.5683746337890625, 0.602813720703125, 0.6372528076171875, 0.67169189453125, 0.7061309814453125, 0.740570068359375, 0.7750091552734375, 0.8094482421875, 0.8438873291015625, 0.878326416015625, 0.9127655029296875, 0.94720458984375, 0.9816436767578125, 1.016082763671875, 1.0505218505859375, 1.0849609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 4.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 12.0, 11.0, 16.0, 21.0, 21.0, 12.0, 27.0, 25.0, 42.0, 28.0, 35.0, 41.0, 32.0, 36.0, 39.0, 47.0, 1079.0, 36.0, 33.0, 36.0, 29.0, 35.0, 33.0, 25.0, 28.0, 26.0, 29.0, 27.0, 19.0, 16.0, 16.0, 10.0, 10.0, 16.0, 6.0, 5.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.86688232421875, -5.6673583984375, -5.46783447265625, -5.268310546875, -5.06878662109375, -4.8692626953125, -4.66973876953125, -4.47021484375, -4.27069091796875, -4.0711669921875, -3.87164306640625, -3.672119140625, -3.47259521484375, -3.2730712890625, -3.07354736328125, -2.8740234375, -2.67449951171875, -2.4749755859375, -2.27545166015625, -2.075927734375, -1.87640380859375, -1.6768798828125, -1.47735595703125, -1.27783203125, -1.07830810546875, -0.8787841796875, -0.67926025390625, -0.479736328125, -0.28021240234375, -0.0806884765625, 0.11883544921875, 0.318359375, 0.51788330078125, 0.7174072265625, 0.91693115234375, 1.116455078125, 1.31597900390625, 1.5155029296875, 1.71502685546875, 1.91455078125, 2.11407470703125, 2.3135986328125, 2.51312255859375, 2.712646484375, 2.91217041015625, 3.1116943359375, 3.31121826171875, 3.5107421875, 3.71026611328125, 3.9097900390625, 4.10931396484375, 4.308837890625, 4.50836181640625, 4.7078857421875, 4.90740966796875, 5.10693359375, 5.30645751953125, 5.5059814453125, 5.70550537109375, 5.905029296875, 6.10455322265625, 6.3040771484375, 6.50360107421875, 6.703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 14.0, 16.0, 30.0, 67.0, 94.0, 143.0, 201.0, 283.0, 424.0, 605.0, 939.0, 1322.0, 2057.0, 3098.0, 4697.0, 6991.0, 10652.0, 16160.0, 24753.0, 39659.0, 67568.0, 119524.0, 317240.0, 1155977.0, 130534.0, 73189.0, 43345.0, 26832.0, 17116.0, 11157.0, 7344.0, 4958.0, 3259.0, 2366.0, 1444.0, 1045.0, 679.0, 435.0, 298.0, 203.0, 135.0, 93.0, 57.0, 35.0, 27.0, 16.0, 13.0, 13.0, 3.0, 5.0, 4.0, 4.0], "bins": [-0.673828125, -0.6546173095703125, -0.635406494140625, -0.6161956787109375, -0.59698486328125, -0.5777740478515625, -0.558563232421875, -0.5393524169921875, -0.5201416015625, -0.5009307861328125, -0.481719970703125, -0.4625091552734375, -0.44329833984375, -0.4240875244140625, -0.404876708984375, -0.3856658935546875, -0.366455078125, -0.3472442626953125, -0.328033447265625, -0.3088226318359375, -0.28961181640625, -0.2704010009765625, -0.251190185546875, -0.2319793701171875, -0.2127685546875, -0.1935577392578125, -0.174346923828125, -0.1551361083984375, -0.13592529296875, -0.1167144775390625, -0.097503662109375, -0.0782928466796875, -0.05908203125, -0.0398712158203125, -0.020660400390625, -0.0014495849609375, 0.01776123046875, 0.0369720458984375, 0.056182861328125, 0.0753936767578125, 0.0946044921875, 0.1138153076171875, 0.133026123046875, 0.1522369384765625, 0.17144775390625, 0.1906585693359375, 0.209869384765625, 0.2290802001953125, 0.248291015625, 0.2675018310546875, 0.286712646484375, 0.3059234619140625, 0.32513427734375, 0.3443450927734375, 0.363555908203125, 0.3827667236328125, 0.4019775390625, 0.4211883544921875, 0.440399169921875, 0.4596099853515625, 0.47882080078125, 0.4980316162109375, 0.517242431640625, 0.5364532470703125, 0.5556640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 6.0, 6.0, 13.0, 8.0, 7.0, 16.0, 15.0, 18.0, 20.0, 19.0, 31.0, 32.0, 41.0, 60.0, 62.0, 95.0, 76.0, 85.0, 59.0, 64.0, 51.0, 35.0, 29.0, 20.0, 31.0, 13.0, 5.0, 16.0, 9.0, 11.0, 11.0, 7.0, 6.0, 4.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.019631385803222656, -0.018968582153320312, -0.01830577850341797, -0.017642974853515625, -0.01698017120361328, -0.016317367553710938, -0.015654563903808594, -0.01499176025390625, -0.014328956604003906, -0.013666152954101562, -0.013003349304199219, -0.012340545654296875, -0.011677742004394531, -0.011014938354492188, -0.010352134704589844, -0.0096893310546875, -0.009026527404785156, -0.008363723754882812, -0.007700920104980469, -0.007038116455078125, -0.006375312805175781, -0.0057125091552734375, -0.005049705505371094, -0.00438690185546875, -0.0037240982055664062, -0.0030612945556640625, -0.0023984909057617188, -0.001735687255859375, -0.0010728836059570312, -0.0004100799560546875, 0.00025272369384765625, 0.00091552734375, 0.0015783309936523438, 0.0022411346435546875, 0.0029039382934570312, 0.003566741943359375, 0.004229545593261719, 0.0048923492431640625, 0.005555152893066406, 0.00621795654296875, 0.006880760192871094, 0.0075435638427734375, 0.008206367492675781, 0.008869171142578125, 0.009531974792480469, 0.010194778442382812, 0.010857582092285156, 0.0115203857421875, 0.012183189392089844, 0.012845993041992188, 0.013508796691894531, 0.014171600341796875, 0.014834403991699219, 0.015497207641601562, 0.016160011291503906, 0.01682281494140625, 0.017485618591308594, 0.018148422241210938, 0.01881122589111328, 0.019474029541015625, 0.02013683319091797, 0.020799636840820312, 0.021462440490722656, 0.022125244140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 6.0, 8.0, 10.0, 10.0, 13.0, 14.0, 6.0, 16.0, 28.0, 26.0, 25.0, 37.0, 69.0, 104.0, 163.0, 594.0, 32613.0, 1012452.0, 1635.0, 275.0, 132.0, 65.0, 46.0, 22.0, 26.0, 29.0, 19.0, 18.0, 20.0, 12.0, 8.0, 9.0, 14.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63818359375, -0.6183624267578125, -0.598541259765625, -0.5787200927734375, -0.55889892578125, -0.5390777587890625, -0.519256591796875, -0.4994354248046875, -0.4796142578125, -0.4597930908203125, -0.439971923828125, -0.4201507568359375, -0.40032958984375, -0.3805084228515625, -0.360687255859375, -0.3408660888671875, -0.321044921875, -0.3012237548828125, -0.281402587890625, -0.2615814208984375, -0.24176025390625, -0.2219390869140625, -0.202117919921875, -0.1822967529296875, -0.1624755859375, -0.1426544189453125, -0.122833251953125, -0.1030120849609375, -0.08319091796875, -0.0633697509765625, -0.043548583984375, -0.0237274169921875, -0.00390625, 0.0159149169921875, 0.035736083984375, 0.0555572509765625, 0.07537841796875, 0.0951995849609375, 0.115020751953125, 0.1348419189453125, 0.1546630859375, 0.1744842529296875, 0.194305419921875, 0.2141265869140625, 0.23394775390625, 0.2537689208984375, 0.273590087890625, 0.2934112548828125, 0.313232421875, 0.3330535888671875, 0.352874755859375, 0.3726959228515625, 0.39251708984375, 0.4123382568359375, 0.432159423828125, 0.4519805908203125, 0.4718017578125, 0.4916229248046875, 0.511444091796875, 0.5312652587890625, 0.55108642578125, 0.5709075927734375, 0.590728759765625, 0.6105499267578125, 0.63037109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [34.0, 851.0, 127.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018961401656270027, -0.007432793267071247, 0.004095815122127533, 0.015624424442648888, 0.027153031900525093, 0.03868164122104645, 0.05021025240421295, 0.06173885613679886, 0.07326746731996536, 0.08479607850313187, 0.09632468223571777, 0.10785329341888428, 0.11938190460205078, 0.13091051578521729, 0.1424391269683838, 0.1539677232503891, 0.1654963344335556, 0.1770249456167221, 0.1885535567998886, 0.20008215308189392, 0.21161076426506042, 0.22313937544822693, 0.23466798663139343, 0.24619659781455994, 0.25772520899772644, 0.26925382018089294, 0.28078243136405945, 0.29231104254722595, 0.30383965373039246, 0.3153682351112366, 0.3268968462944031, 0.3384254574775696, 0.3499540388584137, 0.3614826500415802, 0.3730112612247467, 0.3845398724079132, 0.3960684835910797, 0.40759706497192383, 0.41912567615509033, 0.43065428733825684, 0.44218289852142334, 0.45371150970458984, 0.46524012088775635, 0.47676873207092285, 0.48829734325408936, 0.49982595443725586, 0.5113545656204224, 0.5228831768035889, 0.5344117879867554, 0.5459403991699219, 0.5574690103530884, 0.5689976215362549, 0.5805262327194214, 0.5920548439025879, 0.6035834550857544, 0.6151120662689209, 0.6266406178474426, 0.6381692290306091, 0.6496978402137756, 0.6612264513969421, 0.6727550625801086, 0.6842836737632751, 0.6958122849464417, 0.7073408961296082, 0.7188695073127747]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 7.0, 12.0, 10.0, 6.0, 23.0, 18.0, 12.0, 19.0, 15.0, 24.0, 20.0, 28.0, 40.0, 31.0, 42.0, 41.0, 39.0, 42.0, 35.0, 46.0, 43.0, 36.0, 43.0, 41.0, 42.0, 32.0, 29.0, 25.0, 41.0, 23.0, 19.0, 16.0, 14.0, 20.0, 16.0, 12.0, 8.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.04014807939529419, -0.03895947337150574, -0.037770871073007584, -0.03658226877450943, -0.03539366275072098, -0.034205056726932526, -0.03301645442843437, -0.03182785212993622, -0.030639246106147766, -0.029450641945004463, -0.02826203778386116, -0.027073433622717857, -0.025884829461574554, -0.02469622530043125, -0.02350762113928795, -0.022319016978144646, -0.021130412817001343, -0.01994180865585804, -0.018753204494714737, -0.017564600333571434, -0.01637599617242813, -0.015187392011284828, -0.013998787850141525, -0.012810183688998222, -0.01162157952785492, -0.010432975366711617, -0.009244371205568314, -0.00805576704442501, -0.006867162883281708, -0.005678558722138405, -0.004489954560995102, -0.003301350399851799, -0.002112746238708496, -0.0009241420775651932, 0.00026446208357810974, 0.0014530662447214127, 0.0026416704058647156, 0.0038302745670080185, 0.005018878728151321, 0.006207482889294624, 0.007396087050437927, 0.00858469121158123, 0.009773295372724533, 0.010961899533867836, 0.012150503695011139, 0.013339107856154442, 0.014527712017297745, 0.015716316178441048, 0.01690492033958435, 0.018093524500727654, 0.019282128661870956, 0.02047073282301426, 0.021659336984157562, 0.022847941145300865, 0.024036545306444168, 0.02522514946758747, 0.026413753628730774, 0.027602357789874077, 0.02879096195101738, 0.029979566112160683, 0.031168170273303986, 0.03235677629709244, 0.03354537859559059, 0.034733980894088745, 0.0359225869178772]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 2.0, 4.0, 8.0, 6.0, 6.0, 6.0, 19.0, 16.0, 17.0, 15.0, 32.0, 20.0, 36.0, 39.0, 31.0, 50.0, 55.0, 58.0, 65.0, 56.0, 58.0, 40.0, 52.0, 47.0, 36.0, 26.0, 27.0, 34.0, 31.0, 18.0, 12.0, 15.0, 18.0, 7.0, 5.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.0955810546875, -10.730224609375, -10.3648681640625, -9.99951171875, -9.6341552734375, -9.268798828125, -8.9034423828125, -8.5380859375, -8.1727294921875, -7.807373046875, -7.4420166015625, -7.07666015625, -6.7113037109375, -6.345947265625, -5.9805908203125, -5.615234375, -5.2498779296875, -4.884521484375, -4.5191650390625, -4.15380859375, -3.7884521484375, -3.423095703125, -3.0577392578125, -2.6923828125, -2.3270263671875, -1.961669921875, -1.5963134765625, -1.23095703125, -0.8656005859375, -0.500244140625, -0.1348876953125, 0.23046875, 0.5958251953125, 0.961181640625, 1.3265380859375, 1.69189453125, 2.0572509765625, 2.422607421875, 2.7879638671875, 3.1533203125, 3.5186767578125, 3.884033203125, 4.2493896484375, 4.61474609375, 4.9801025390625, 5.345458984375, 5.7108154296875, 6.076171875, 6.4415283203125, 6.806884765625, 7.1722412109375, 7.53759765625, 7.9029541015625, 8.268310546875, 8.6336669921875, 8.9990234375, 9.3643798828125, 9.729736328125, 10.0950927734375, 10.46044921875, 10.8258056640625, 11.191162109375, 11.5565185546875, 11.921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 12.0, 7.0, 15.0, 20.0, 25.0, 38.0, 43.0, 73.0, 83.0, 123.0, 188.0, 267.0, 372.0, 512.0, 882.0, 1433.0, 2624.0, 5438.0, 13326.0, 42394.0, 190395.0, 606277.0, 130529.0, 32001.0, 10921.0, 4587.0, 2258.0, 1252.0, 783.0, 469.0, 321.0, 231.0, 162.0, 134.0, 78.0, 76.0, 53.0, 34.0, 20.0, 26.0, 17.0, 14.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.4453125, -8.1845703125, -7.923828125, -7.6630859375, -7.40234375, -7.1416015625, -6.880859375, -6.6201171875, -6.359375, -6.0986328125, -5.837890625, -5.5771484375, -5.31640625, -5.0556640625, -4.794921875, -4.5341796875, -4.2734375, -4.0126953125, -3.751953125, -3.4912109375, -3.23046875, -2.9697265625, -2.708984375, -2.4482421875, -2.1875, -1.9267578125, -1.666015625, -1.4052734375, -1.14453125, -0.8837890625, -0.623046875, -0.3623046875, -0.1015625, 0.1591796875, 0.419921875, 0.6806640625, 0.94140625, 1.2021484375, 1.462890625, 1.7236328125, 1.984375, 2.2451171875, 2.505859375, 2.7666015625, 3.02734375, 3.2880859375, 3.548828125, 3.8095703125, 4.0703125, 4.3310546875, 4.591796875, 4.8525390625, 5.11328125, 5.3740234375, 5.634765625, 5.8955078125, 6.15625, 6.4169921875, 6.677734375, 6.9384765625, 7.19921875, 7.4599609375, 7.720703125, 7.9814453125, 8.2421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 5.0, 11.0, 8.0, 15.0, 16.0, 19.0, 31.0, 33.0, 22.0, 30.0, 25.0, 38.0, 30.0, 47.0, 34.0, 42.0, 77.0, 266.0, 1730.0, 94.0, 51.0, 37.0, 44.0, 32.0, 34.0, 37.0, 29.0, 24.0, 28.0, 16.0, 22.0, 15.0, 14.0, 11.0, 15.0, 11.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-35.15625, -34.02734375, -32.8984375, -31.76953125, -30.640625, -29.51171875, -28.3828125, -27.25390625, -26.125, -24.99609375, -23.8671875, -22.73828125, -21.609375, -20.48046875, -19.3515625, -18.22265625, -17.09375, -15.96484375, -14.8359375, -13.70703125, -12.578125, -11.44921875, -10.3203125, -9.19140625, -8.0625, -6.93359375, -5.8046875, -4.67578125, -3.546875, -2.41796875, -1.2890625, -0.16015625, 0.96875, 2.09765625, 3.2265625, 4.35546875, 5.484375, 6.61328125, 7.7421875, 8.87109375, 10.0, 11.12890625, 12.2578125, 13.38671875, 14.515625, 15.64453125, 16.7734375, 17.90234375, 19.03125, 20.16015625, 21.2890625, 22.41796875, 23.546875, 24.67578125, 25.8046875, 26.93359375, 28.0625, 29.19140625, 30.3203125, 31.44921875, 32.578125, 33.70703125, 34.8359375, 35.96484375, 37.09375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 13.0, 19.0, 11.0, 10.0, 22.0, 16.0, 30.0, 41.0, 38.0, 58.0, 70.0, 114.0, 174.0, 331.0, 833.0, 5113.0, 1908376.0, 1223594.0, 5021.0, 756.0, 382.0, 193.0, 94.0, 80.0, 50.0, 40.0, 28.0, 34.0, 33.0, 20.0, 18.0, 7.0, 15.0, 12.0, 5.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-62.84375, -60.93896484375, -59.0341796875, -57.12939453125, -55.224609375, -53.31982421875, -51.4150390625, -49.51025390625, -47.60546875, -45.70068359375, -43.7958984375, -41.89111328125, -39.986328125, -38.08154296875, -36.1767578125, -34.27197265625, -32.3671875, -30.46240234375, -28.5576171875, -26.65283203125, -24.748046875, -22.84326171875, -20.9384765625, -19.03369140625, -17.12890625, -15.22412109375, -13.3193359375, -11.41455078125, -9.509765625, -7.60498046875, -5.7001953125, -3.79541015625, -1.890625, 0.01416015625, 1.9189453125, 3.82373046875, 5.728515625, 7.63330078125, 9.5380859375, 11.44287109375, 13.34765625, 15.25244140625, 17.1572265625, 19.06201171875, 20.966796875, 22.87158203125, 24.7763671875, 26.68115234375, 28.5859375, 30.49072265625, 32.3955078125, 34.30029296875, 36.205078125, 38.10986328125, 40.0146484375, 41.91943359375, 43.82421875, 45.72900390625, 47.6337890625, 49.53857421875, 51.443359375, 53.34814453125, 55.2529296875, 57.15771484375, 59.0625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 20.0, 840.0, 160.0], "bins": [-659.6683959960938, -649.1531982421875, -638.637939453125, -628.1227416992188, -617.6075439453125, -607.09228515625, -596.5770874023438, -586.0618896484375, -575.5466918945312, -565.031494140625, -554.5162353515625, -544.0010375976562, -533.48583984375, -522.9705810546875, -512.4553833007812, -501.940185546875, -491.4249267578125, -480.9096984863281, -470.3945007324219, -459.8792724609375, -449.36407470703125, -438.8488464355469, -428.3336181640625, -417.81842041015625, -407.30322265625, -396.7879943847656, -386.2727966308594, -375.757568359375, -365.24237060546875, -354.7271423339844, -344.2119140625, -333.69671630859375, -323.1814880371094, -312.666259765625, -302.15106201171875, -291.6358337402344, -281.1206359863281, -270.60540771484375, -260.0902099609375, -249.57498168945312, -239.0597686767578, -228.5445556640625, -218.0293426513672, -207.51412963867188, -196.9989013671875, -186.4836883544922, -175.96847534179688, -165.4532470703125, -154.93804931640625, -144.42283630371094, -133.90762329101562, -123.39240264892578, -112.87718200683594, -102.36196899414062, -91.84675598144531, -81.33153533935547, -70.81632232666016, -60.30110549926758, -49.785888671875, -39.27067565917969, -28.75545883178711, -18.24024200439453, -7.725028991699219, 2.790191650390625, 13.305407524108887]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 8.0, 6.0, 11.0, 15.0, 16.0, 16.0, 20.0, 19.0, 17.0, 25.0, 24.0, 30.0, 39.0, 38.0, 34.0, 41.0, 33.0, 39.0, 33.0, 48.0, 49.0, 49.0, 49.0, 46.0, 36.0, 29.0, 28.0, 34.0, 19.0, 27.0, 19.0, 22.0, 11.0, 13.0, 12.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-133.70159912109375, -129.6881866455078, -125.67477416992188, -121.66136169433594, -117.64794921875, -113.63453674316406, -109.62113189697266, -105.60771942138672, -101.59430694580078, -97.58089447021484, -93.5674819946289, -89.55406951904297, -85.54066467285156, -81.52725219726562, -77.51383972167969, -73.50042724609375, -69.48701477050781, -65.47360229492188, -61.46018981933594, -57.446781158447266, -53.43336868286133, -49.41995620727539, -45.40654754638672, -41.39313507080078, -37.379722595214844, -33.366310119628906, -29.3528995513916, -25.339488983154297, -21.32607650756836, -17.312664031982422, -13.299253463745117, -9.285842895507812, -5.2724456787109375, -1.2590341567993164, 2.7543773651123047, 6.767788887023926, 10.781200408935547, 14.794612884521484, 18.80802345275879, 22.821434020996094, 26.83484649658203, 30.84825897216797, 34.861671447753906, 38.87508010864258, 42.888492584228516, 46.90190505981445, 50.915313720703125, 54.92872619628906, 58.942138671875, 62.95555114746094, 66.96896362304688, 70.98237609863281, 74.99578857421875, 79.00920104980469, 83.0226058959961, 87.03601837158203, 91.04943084716797, 95.0628433227539, 99.07625579833984, 103.08966827392578, 107.10307312011719, 111.11648559570312, 115.12989807128906, 119.143310546875, 123.15672302246094]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 6.0, 4.0, 6.0, 7.0, 10.0, 19.0, 13.0, 17.0, 22.0, 23.0, 42.0, 34.0, 28.0, 34.0, 54.0, 49.0, 69.0, 67.0, 53.0, 51.0, 61.0, 44.0, 43.0, 37.0, 18.0, 38.0, 23.0, 31.0, 13.0, 15.0, 17.0, 9.0, 7.0, 4.0, 9.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.96875, -11.582275390625, -11.19580078125, -10.809326171875, -10.4228515625, -10.036376953125, -9.64990234375, -9.263427734375, -8.876953125, -8.490478515625, -8.10400390625, -7.717529296875, -7.3310546875, -6.944580078125, -6.55810546875, -6.171630859375, -5.78515625, -5.398681640625, -5.01220703125, -4.625732421875, -4.2392578125, -3.852783203125, -3.46630859375, -3.079833984375, -2.693359375, -2.306884765625, -1.92041015625, -1.533935546875, -1.1474609375, -0.760986328125, -0.37451171875, 0.011962890625, 0.3984375, 0.784912109375, 1.17138671875, 1.557861328125, 1.9443359375, 2.330810546875, 2.71728515625, 3.103759765625, 3.490234375, 3.876708984375, 4.26318359375, 4.649658203125, 5.0361328125, 5.422607421875, 5.80908203125, 6.195556640625, 6.58203125, 6.968505859375, 7.35498046875, 7.741455078125, 8.1279296875, 8.514404296875, 8.90087890625, 9.287353515625, 9.673828125, 10.060302734375, 10.44677734375, 10.833251953125, 11.2197265625, 11.606201171875, 11.99267578125, 12.379150390625, 12.765625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 3.0, 4.0, 11.0, 12.0, 18.0, 27.0, 24.0, 38.0, 61.0, 111.0, 192.0, 351.0, 771.0, 2086.0, 6530.0, 36187.0, 4021071.0, 112608.0, 9279.0, 2844.0, 1045.0, 425.0, 230.0, 91.0, 72.0, 47.0, 35.0, 22.0, 11.0, 24.0, 5.0, 9.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.0, -68.681640625, -66.36328125, -64.044921875, -61.7265625, -59.408203125, -57.08984375, -54.771484375, -52.453125, -50.134765625, -47.81640625, -45.498046875, -43.1796875, -40.861328125, -38.54296875, -36.224609375, -33.90625, -31.587890625, -29.26953125, -26.951171875, -24.6328125, -22.314453125, -19.99609375, -17.677734375, -15.359375, -13.041015625, -10.72265625, -8.404296875, -6.0859375, -3.767578125, -1.44921875, 0.869140625, 3.1875, 5.505859375, 7.82421875, 10.142578125, 12.4609375, 14.779296875, 17.09765625, 19.416015625, 21.734375, 24.052734375, 26.37109375, 28.689453125, 31.0078125, 33.326171875, 35.64453125, 37.962890625, 40.28125, 42.599609375, 44.91796875, 47.236328125, 49.5546875, 51.873046875, 54.19140625, 56.509765625, 58.828125, 61.146484375, 63.46484375, 65.783203125, 68.1015625, 70.419921875, 72.73828125, 75.056640625, 77.375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 4.0, 3.0, 3.0, 9.0, 8.0, 5.0, 13.0, 15.0, 20.0, 36.0, 37.0, 56.0, 117.0, 217.0, 446.0, 811.0, 926.0, 611.0, 296.0, 171.0, 71.0, 45.0, 25.0, 19.0, 12.0, 12.0, 10.0, 12.0, 7.0, 7.0, 8.0, 4.0, 5.0, 9.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.9375, -27.98095703125, -27.0244140625, -26.06787109375, -25.111328125, -24.15478515625, -23.1982421875, -22.24169921875, -21.28515625, -20.32861328125, -19.3720703125, -18.41552734375, -17.458984375, -16.50244140625, -15.5458984375, -14.58935546875, -13.6328125, -12.67626953125, -11.7197265625, -10.76318359375, -9.806640625, -8.85009765625, -7.8935546875, -6.93701171875, -5.98046875, -5.02392578125, -4.0673828125, -3.11083984375, -2.154296875, -1.19775390625, -0.2412109375, 0.71533203125, 1.671875, 2.62841796875, 3.5849609375, 4.54150390625, 5.498046875, 6.45458984375, 7.4111328125, 8.36767578125, 9.32421875, 10.28076171875, 11.2373046875, 12.19384765625, 13.150390625, 14.10693359375, 15.0634765625, 16.02001953125, 16.9765625, 17.93310546875, 18.8896484375, 19.84619140625, 20.802734375, 21.75927734375, 22.7158203125, 23.67236328125, 24.62890625, 25.58544921875, 26.5419921875, 27.49853515625, 28.455078125, 29.41162109375, 30.3681640625, 31.32470703125, 32.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 11.0, 13.0, 22.0, 33.0, 57.0, 86.0, 155.0, 249.0, 430.0, 736.0, 1313.0, 2326.0, 4302.0, 8370.0, 18175.0, 52113.0, 638659.0, 3298913.0, 115672.0, 27938.0, 11777.0, 5725.0, 3145.0, 1718.0, 969.0, 581.0, 306.0, 177.0, 102.0, 77.0, 47.0, 27.0, 17.0, 13.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-56.5, -54.7998046875, -53.099609375, -51.3994140625, -49.69921875, -47.9990234375, -46.298828125, -44.5986328125, -42.8984375, -41.1982421875, -39.498046875, -37.7978515625, -36.09765625, -34.3974609375, -32.697265625, -30.9970703125, -29.296875, -27.5966796875, -25.896484375, -24.1962890625, -22.49609375, -20.7958984375, -19.095703125, -17.3955078125, -15.6953125, -13.9951171875, -12.294921875, -10.5947265625, -8.89453125, -7.1943359375, -5.494140625, -3.7939453125, -2.09375, -0.3935546875, 1.306640625, 3.0068359375, 4.70703125, 6.4072265625, 8.107421875, 9.8076171875, 11.5078125, 13.2080078125, 14.908203125, 16.6083984375, 18.30859375, 20.0087890625, 21.708984375, 23.4091796875, 25.109375, 26.8095703125, 28.509765625, 30.2099609375, 31.91015625, 33.6103515625, 35.310546875, 37.0107421875, 38.7109375, 40.4111328125, 42.111328125, 43.8115234375, 45.51171875, 47.2119140625, 48.912109375, 50.6123046875, 52.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 12.0, 17.0, 24.0, 41.0, 63.0, 99.0, 176.0, 204.0, 142.0, 90.0, 51.0, 26.0, 24.0, 11.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-244.9332733154297, -239.7628936767578, -234.59251403808594, -229.42213439941406, -224.2517547607422, -219.0813751220703, -213.91099548339844, -208.74063110351562, -203.57025146484375, -198.39987182617188, -193.2294921875, -188.05911254882812, -182.88873291015625, -177.71835327148438, -172.5479736328125, -167.37759399414062, -162.20721435546875, -157.03683471679688, -151.866455078125, -146.69607543945312, -141.52569580078125, -136.35531616210938, -131.1849365234375, -126.01456451416016, -120.84418487548828, -115.6738052368164, -110.50342559814453, -105.33304595947266, -100.16267395019531, -94.99229431152344, -89.82191467285156, -84.65153503417969, -79.48117065429688, -74.310791015625, -69.14041137695312, -63.970035552978516, -58.79965591430664, -53.629276275634766, -48.458900451660156, -43.28852081298828, -38.118141174316406, -32.94776153564453, -27.77738380432129, -22.607006072998047, -17.436626434326172, -12.266246795654297, -7.095869064331055, -1.9254913330078125, 3.2448883056640625, 8.415266990661621, 13.58564567565918, 18.756023406982422, 23.926403045654297, 29.096782684326172, 34.26715850830078, 39.437538146972656, 44.60791778564453, 49.778297424316406, 54.94867706298828, 60.11905288696289, 65.2894287109375, 70.45980834960938, 75.63018798828125, 80.80056762695312, 85.970947265625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 8.0, 7.0, 5.0, 6.0, 20.0, 13.0, 24.0, 18.0, 15.0, 25.0, 23.0, 23.0, 26.0, 32.0, 33.0, 30.0, 41.0, 40.0, 38.0, 43.0, 41.0, 31.0, 39.0, 45.0, 39.0, 44.0, 31.0, 37.0, 27.0, 31.0, 14.0, 21.0, 18.0, 16.0, 19.0, 10.0, 13.0, 8.0, 9.0, 7.0, 6.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.24476623535156, -66.90499877929688, -64.56523132324219, -62.225460052490234, -59.88569259643555, -57.545921325683594, -55.206153869628906, -52.86638641357422, -50.52661895751953, -48.186851501464844, -45.84708023071289, -43.5073127746582, -41.167545318603516, -38.82777404785156, -36.488006591796875, -34.14823913574219, -31.808467864990234, -29.468698501586914, -27.128931045532227, -24.789161682128906, -22.44939422607422, -20.1096248626709, -17.769855499267578, -15.43008804321289, -13.09031867980957, -10.750550270080566, -8.410781860351562, -6.071012496948242, -3.7312440872192383, -1.3914756774902344, 0.9482936859130859, 3.2880611419677734, 5.627830505371094, 7.967598915100098, 10.307367324829102, 12.647136688232422, 14.986905097961426, 17.32667350769043, 19.66644287109375, 22.006210327148438, 24.345979690551758, 26.685749053955078, 29.025516510009766, 31.365285873413086, 33.705055236816406, 36.044822692871094, 38.38459014892578, 40.72435760498047, 43.06412887573242, 45.40389633178711, 47.74366760253906, 50.08343505859375, 52.42320251464844, 54.762969970703125, 57.10274124145508, 59.442508697509766, 61.78227996826172, 64.1220474243164, 66.4618148803711, 68.80158996582031, 71.141357421875, 73.48112487792969, 75.82089233398438, 78.16065979003906, 80.50042724609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 8.0, 6.0, 14.0, 12.0, 12.0, 21.0, 19.0, 25.0, 37.0, 31.0, 35.0, 30.0, 31.0, 49.0, 55.0, 54.0, 46.0, 57.0, 39.0, 48.0, 36.0, 39.0, 35.0, 33.0, 35.0, 32.0, 18.0, 25.0, 18.0, 19.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.899658203125, -10.53369140625, -10.167724609375, -9.8017578125, -9.435791015625, -9.06982421875, -8.703857421875, -8.337890625, -7.971923828125, -7.60595703125, -7.239990234375, -6.8740234375, -6.508056640625, -6.14208984375, -5.776123046875, -5.41015625, -5.044189453125, -4.67822265625, -4.312255859375, -3.9462890625, -3.580322265625, -3.21435546875, -2.848388671875, -2.482421875, -2.116455078125, -1.75048828125, -1.384521484375, -1.0185546875, -0.652587890625, -0.28662109375, 0.079345703125, 0.4453125, 0.811279296875, 1.17724609375, 1.543212890625, 1.9091796875, 2.275146484375, 2.64111328125, 3.007080078125, 3.373046875, 3.739013671875, 4.10498046875, 4.470947265625, 4.8369140625, 5.202880859375, 5.56884765625, 5.934814453125, 6.30078125, 6.666748046875, 7.03271484375, 7.398681640625, 7.7646484375, 8.130615234375, 8.49658203125, 8.862548828125, 9.228515625, 9.594482421875, 9.96044921875, 10.326416015625, 10.6923828125, 11.058349609375, 11.42431640625, 11.790283203125, 12.15625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 15.0, 18.0, 13.0, 29.0, 48.0, 68.0, 104.0, 129.0, 196.0, 268.0, 329.0, 546.0, 796.0, 1149.0, 1507.0, 2400.0, 3448.0, 5343.0, 8116.0, 12790.0, 20371.0, 33655.0, 58089.0, 108637.0, 222712.0, 262609.0, 132377.0, 68256.0, 39022.0, 23346.0, 14478.0, 9293.0, 6023.0, 3916.0, 2655.0, 1831.0, 1149.0, 808.0, 607.0, 405.0, 315.0, 213.0, 136.0, 97.0, 73.0, 51.0, 30.0, 33.0, 24.0, 16.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0784759521484375, -1.042694091796875, -1.0069122314453125, -0.97113037109375, -0.9353485107421875, -0.899566650390625, -0.8637847900390625, -0.8280029296875, -0.7922210693359375, -0.756439208984375, -0.7206573486328125, -0.68487548828125, -0.6490936279296875, -0.613311767578125, -0.5775299072265625, -0.541748046875, -0.5059661865234375, -0.470184326171875, -0.4344024658203125, -0.39862060546875, -0.3628387451171875, -0.327056884765625, -0.2912750244140625, -0.2554931640625, -0.2197113037109375, -0.183929443359375, -0.1481475830078125, -0.11236572265625, -0.0765838623046875, -0.040802001953125, -0.0050201416015625, 0.03076171875, 0.0665435791015625, 0.102325439453125, 0.1381072998046875, 0.17388916015625, 0.2096710205078125, 0.245452880859375, 0.2812347412109375, 0.3170166015625, 0.3527984619140625, 0.388580322265625, 0.4243621826171875, 0.46014404296875, 0.4959259033203125, 0.531707763671875, 0.5674896240234375, 0.603271484375, 0.6390533447265625, 0.674835205078125, 0.7106170654296875, 0.74639892578125, 0.7821807861328125, 0.817962646484375, 0.8537445068359375, 0.8895263671875, 0.9253082275390625, 0.961090087890625, 0.9968719482421875, 1.03265380859375, 1.0684356689453125, 1.104217529296875, 1.1399993896484375, 1.17578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 9.0, 5.0, 4.0, 11.0, 16.0, 16.0, 16.0, 18.0, 31.0, 27.0, 26.0, 22.0, 31.0, 39.0, 24.0, 25.0, 36.0, 31.0, 40.0, 51.0, 1054.0, 42.0, 44.0, 33.0, 38.0, 30.0, 29.0, 33.0, 38.0, 30.0, 30.0, 23.0, 17.0, 17.0, 17.0, 14.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0234375, -5.8134765625, -5.603515625, -5.3935546875, -5.18359375, -4.9736328125, -4.763671875, -4.5537109375, -4.34375, -4.1337890625, -3.923828125, -3.7138671875, -3.50390625, -3.2939453125, -3.083984375, -2.8740234375, -2.6640625, -2.4541015625, -2.244140625, -2.0341796875, -1.82421875, -1.6142578125, -1.404296875, -1.1943359375, -0.984375, -0.7744140625, -0.564453125, -0.3544921875, -0.14453125, 0.0654296875, 0.275390625, 0.4853515625, 0.6953125, 0.9052734375, 1.115234375, 1.3251953125, 1.53515625, 1.7451171875, 1.955078125, 2.1650390625, 2.375, 2.5849609375, 2.794921875, 3.0048828125, 3.21484375, 3.4248046875, 3.634765625, 3.8447265625, 4.0546875, 4.2646484375, 4.474609375, 4.6845703125, 4.89453125, 5.1044921875, 5.314453125, 5.5244140625, 5.734375, 5.9443359375, 6.154296875, 6.3642578125, 6.57421875, 6.7841796875, 6.994140625, 7.2041015625, 7.4140625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 17.0, 16.0, 37.0, 49.0, 87.0, 116.0, 160.0, 279.0, 413.0, 685.0, 995.0, 1577.0, 2530.0, 3840.0, 6088.0, 9694.0, 15455.0, 24680.0, 40913.0, 69615.0, 124625.0, 683999.0, 806968.0, 126088.0, 69611.0, 40639.0, 25077.0, 15711.0, 9997.0, 6267.0, 3951.0, 2468.0, 1559.0, 1033.0, 643.0, 453.0, 270.0, 150.0, 125.0, 89.0, 56.0, 33.0, 20.0, 14.0, 8.0, 9.0, 4.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.767578125, -0.7456512451171875, -0.723724365234375, -0.7017974853515625, -0.67987060546875, -0.6579437255859375, -0.636016845703125, -0.6140899658203125, -0.5921630859375, -0.5702362060546875, -0.548309326171875, -0.5263824462890625, -0.50445556640625, -0.4825286865234375, -0.460601806640625, -0.4386749267578125, -0.416748046875, -0.3948211669921875, -0.372894287109375, -0.3509674072265625, -0.32904052734375, -0.3071136474609375, -0.285186767578125, -0.2632598876953125, -0.2413330078125, -0.2194061279296875, -0.197479248046875, -0.1755523681640625, -0.15362548828125, -0.1316986083984375, -0.109771728515625, -0.0878448486328125, -0.06591796875, -0.0439910888671875, -0.022064208984375, -0.0001373291015625, 0.02178955078125, 0.0437164306640625, 0.065643310546875, 0.0875701904296875, 0.1094970703125, 0.1314239501953125, 0.153350830078125, 0.1752777099609375, 0.19720458984375, 0.2191314697265625, 0.241058349609375, 0.2629852294921875, 0.284912109375, 0.3068389892578125, 0.328765869140625, 0.3506927490234375, 0.37261962890625, 0.3945465087890625, 0.416473388671875, 0.4384002685546875, 0.4603271484375, 0.4822540283203125, 0.504180908203125, 0.5261077880859375, 0.54803466796875, 0.5699615478515625, 0.591888427734375, 0.6138153076171875, 0.6357421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 2.0, 5.0, 10.0, 8.0, 13.0, 10.0, 9.0, 11.0, 18.0, 16.0, 18.0, 25.0, 28.0, 35.0, 39.0, 49.0, 62.0, 67.0, 72.0, 68.0, 72.0, 54.0, 47.0, 31.0, 38.0, 22.0, 25.0, 16.0, 19.0, 19.0, 12.0, 10.0, 13.0, 2.0, 4.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01110076904296875, -0.010750174522399902, -0.010399580001831055, -0.010048985481262207, -0.00969839096069336, -0.009347796440124512, -0.008997201919555664, -0.008646607398986816, -0.008296012878417969, -0.007945418357849121, -0.0075948238372802734, -0.007244229316711426, -0.006893634796142578, -0.0065430402755737305, -0.006192445755004883, -0.005841851234436035, -0.0054912567138671875, -0.00514066219329834, -0.004790067672729492, -0.0044394731521606445, -0.004088878631591797, -0.0037382841110229492, -0.0033876895904541016, -0.003037095069885254, -0.0026865005493164062, -0.0023359060287475586, -0.001985311508178711, -0.0016347169876098633, -0.0012841224670410156, -0.000933527946472168, -0.0005829334259033203, -0.00023233890533447266, 0.000118255615234375, 0.00046885013580322266, 0.0008194446563720703, 0.001170039176940918, 0.0015206336975097656, 0.0018712282180786133, 0.002221822738647461, 0.0025724172592163086, 0.0029230117797851562, 0.003273606300354004, 0.0036242008209228516, 0.003974795341491699, 0.004325389862060547, 0.0046759843826293945, 0.005026578903198242, 0.00537717342376709, 0.0057277679443359375, 0.006078362464904785, 0.006428956985473633, 0.0067795515060424805, 0.007130146026611328, 0.007480740547180176, 0.007831335067749023, 0.008181929588317871, 0.008532524108886719, 0.008883118629455566, 0.009233713150024414, 0.009584307670593262, 0.00993490219116211, 0.010285496711730957, 0.010636091232299805, 0.010986685752868652, 0.0113372802734375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 8.0, 10.0, 10.0, 10.0, 23.0, 27.0, 29.0, 28.0, 52.0, 79.0, 114.0, 154.0, 272.0, 743.0, 6406.0, 884851.0, 151469.0, 2998.0, 514.0, 235.0, 105.0, 101.0, 64.0, 44.0, 39.0, 30.0, 32.0, 23.0, 17.0, 9.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.5537109375, -0.5373573303222656, -0.5210037231445312, -0.5046501159667969, -0.4882965087890625, -0.4719429016113281, -0.45558929443359375, -0.4392356872558594, -0.422882080078125, -0.4065284729003906, -0.39017486572265625, -0.3738212585449219, -0.3574676513671875, -0.3411140441894531, -0.32476043701171875, -0.3084068298339844, -0.29205322265625, -0.2756996154785156, -0.25934600830078125, -0.24299240112304688, -0.2266387939453125, -0.21028518676757812, -0.19393157958984375, -0.17757797241210938, -0.161224365234375, -0.14487075805664062, -0.12851715087890625, -0.11216354370117188, -0.0958099365234375, -0.07945632934570312, -0.06310272216796875, -0.046749114990234375, -0.0303955078125, -0.014041900634765625, 0.00231170654296875, 0.018665313720703125, 0.0350189208984375, 0.051372528076171875, 0.06772613525390625, 0.08407974243164062, 0.100433349609375, 0.11678695678710938, 0.13314056396484375, 0.14949417114257812, 0.1658477783203125, 0.18220138549804688, 0.19855499267578125, 0.21490859985351562, 0.23126220703125, 0.24761581420898438, 0.26396942138671875, 0.2803230285644531, 0.2966766357421875, 0.3130302429199219, 0.32938385009765625, 0.3457374572753906, 0.362091064453125, 0.3784446716308594, 0.39479827880859375, 0.4111518859863281, 0.4275054931640625, 0.4438591003417969, 0.46021270751953125, 0.4765663146972656, 0.492919921875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 14.0, 46.0, 226.0, 550.0, 136.0, 29.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033143263310194016, -0.025342797860503197, -0.017542332410812378, -0.009741868823766708, -0.0019414033740758896, 0.005859062075614929, 0.013659525662660599, 0.021459992974996567, 0.029260456562042236, 0.037060920149087906, 0.044861387461423874, 0.05266185104846954, 0.06046231836080551, 0.06826278567314148, 0.07606324553489685, 0.08386371284723282, 0.09166418015956879, 0.09946464747190475, 0.10726510733366013, 0.1150655746459961, 0.12286604195833206, 0.13066650927066803, 0.1384669691324234, 0.14626744389533997, 0.15406790375709534, 0.1618683636188507, 0.16966883838176727, 0.17746929824352264, 0.18526975810527802, 0.19307023286819458, 0.20087069272994995, 0.20867115259170532, 0.2164716273546219, 0.22427208721637726, 0.23207256197929382, 0.2398730218410492, 0.24767348170280457, 0.25547394156455994, 0.2632744312286377, 0.27107489109039307, 0.27887535095214844, 0.2866758108139038, 0.2944762706756592, 0.30227673053741455, 0.3100772202014923, 0.3178776800632477, 0.32567813992500305, 0.3334785997867584, 0.3412790596485138, 0.34907951951026917, 0.35687997937202454, 0.3646804690361023, 0.37248092889785767, 0.38028138875961304, 0.3880818486213684, 0.3958823084831238, 0.40368279814720154, 0.4114832580089569, 0.4192837178707123, 0.42708420753479004, 0.4348846673965454, 0.4426851272583008, 0.45048558712005615, 0.4582860469818115, 0.4660865068435669]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 8.0, 7.0, 13.0, 11.0, 14.0, 14.0, 17.0, 20.0, 15.0, 11.0, 22.0, 29.0, 25.0, 41.0, 35.0, 35.0, 36.0, 37.0, 45.0, 40.0, 43.0, 39.0, 42.0, 38.0, 34.0, 29.0, 37.0, 30.0, 23.0, 27.0, 32.0, 22.0, 22.0, 15.0, 15.0, 22.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.013226926326751709, -0.01282772421836853, -0.012428522109985352, -0.012029320001602173, -0.011630117893218994, -0.011230915784835815, -0.010831713676452637, -0.010432511568069458, -0.01003330945968628, -0.0096341073513031, -0.009234905242919922, -0.008835703134536743, -0.008436501026153564, -0.008037298917770386, -0.007638096809387207, -0.007238894701004028, -0.00683969259262085, -0.006440490484237671, -0.006041288375854492, -0.0056420862674713135, -0.005242884159088135, -0.004843682050704956, -0.004444479942321777, -0.004045277833938599, -0.00364607572555542, -0.003246873617172241, -0.0028476715087890625, -0.002448469400405884, -0.002049267292022705, -0.0016500651836395264, -0.0012508630752563477, -0.0008516609668731689, -0.00045245885848999023, -5.3256750106811523e-05, 0.0003459453582763672, 0.0007451474666595459, 0.0011443495750427246, 0.0015435516834259033, 0.001942753791809082, 0.0023419559001922607, 0.0027411580085754395, 0.003140360116958618, 0.003539562225341797, 0.003938764333724976, 0.004337966442108154, 0.004737168550491333, 0.005136370658874512, 0.00553557276725769, 0.005934774875640869, 0.006333976984024048, 0.0067331790924072266, 0.007132381200790405, 0.007531583309173584, 0.007930785417556763, 0.008329987525939941, 0.00872918963432312, 0.009128391742706299, 0.009527593851089478, 0.009926795959472656, 0.010325998067855835, 0.010725200176239014, 0.011124402284622192, 0.011523604393005371, 0.01192280650138855, 0.012322008609771729]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 8.0, 6.0, 15.0, 11.0, 12.0, 21.0, 19.0, 25.0, 37.0, 31.0, 35.0, 30.0, 31.0, 49.0, 55.0, 54.0, 46.0, 57.0, 39.0, 48.0, 36.0, 39.0, 35.0, 33.0, 35.0, 32.0, 18.0, 25.0, 18.0, 19.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.899658203125, -10.53369140625, -10.167724609375, -9.8017578125, -9.435791015625, -9.06982421875, -8.703857421875, -8.337890625, -7.971923828125, -7.60595703125, -7.239990234375, -6.8740234375, -6.508056640625, -6.14208984375, -5.776123046875, -5.41015625, -5.044189453125, -4.67822265625, -4.312255859375, -3.9462890625, -3.580322265625, -3.21435546875, -2.848388671875, -2.482421875, -2.116455078125, -1.75048828125, -1.384521484375, -1.0185546875, -0.652587890625, -0.28662109375, 0.079345703125, 0.4453125, 0.811279296875, 1.17724609375, 1.543212890625, 1.9091796875, 2.275146484375, 2.64111328125, 3.007080078125, 3.373046875, 3.739013671875, 4.10498046875, 4.470947265625, 4.8369140625, 5.202880859375, 5.56884765625, 5.934814453125, 6.30078125, 6.666748046875, 7.03271484375, 7.398681640625, 7.7646484375, 8.130615234375, 8.49658203125, 8.862548828125, 9.228515625, 9.594482421875, 9.96044921875, 10.326416015625, 10.6923828125, 11.058349609375, 11.42431640625, 11.790283203125, 12.15625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 13.0, 12.0, 12.0, 23.0, 30.0, 43.0, 59.0, 95.0, 108.0, 187.0, 237.0, 402.0, 593.0, 1053.0, 1863.0, 3594.0, 7412.0, 17179.0, 47684.0, 163485.0, 533642.0, 183643.0, 52206.0, 18566.0, 7611.0, 3629.0, 2009.0, 1122.0, 688.0, 410.0, 290.0, 182.0, 141.0, 95.0, 58.0, 46.0, 29.0, 20.0, 16.0, 18.0, 7.0, 7.0, 4.0, 6.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.06640625, -4.8948974609375, -4.723388671875, -4.5518798828125, -4.38037109375, -4.2088623046875, -4.037353515625, -3.8658447265625, -3.6943359375, -3.5228271484375, -3.351318359375, -3.1798095703125, -3.00830078125, -2.8367919921875, -2.665283203125, -2.4937744140625, -2.322265625, -2.1507568359375, -1.979248046875, -1.8077392578125, -1.63623046875, -1.4647216796875, -1.293212890625, -1.1217041015625, -0.9501953125, -0.7786865234375, -0.607177734375, -0.4356689453125, -0.26416015625, -0.0926513671875, 0.078857421875, 0.2503662109375, 0.421875, 0.5933837890625, 0.764892578125, 0.9364013671875, 1.10791015625, 1.2794189453125, 1.450927734375, 1.6224365234375, 1.7939453125, 1.9654541015625, 2.136962890625, 2.3084716796875, 2.47998046875, 2.6514892578125, 2.822998046875, 2.9945068359375, 3.166015625, 3.3375244140625, 3.509033203125, 3.6805419921875, 3.85205078125, 4.0235595703125, 4.195068359375, 4.3665771484375, 4.5380859375, 4.7095947265625, 4.881103515625, 5.0526123046875, 5.22412109375, 5.3956298828125, 5.567138671875, 5.7386474609375, 5.91015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 7.0, 5.0, 5.0, 12.0, 8.0, 7.0, 15.0, 15.0, 19.0, 29.0, 19.0, 25.0, 25.0, 25.0, 34.0, 32.0, 34.0, 32.0, 44.0, 55.0, 206.0, 1890.0, 70.0, 40.0, 24.0, 44.0, 26.0, 33.0, 33.0, 28.0, 28.0, 16.0, 27.0, 22.0, 16.0, 16.0, 19.0, 10.0, 10.0, 11.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-39.46875, -38.27880859375, -37.0888671875, -35.89892578125, -34.708984375, -33.51904296875, -32.3291015625, -31.13916015625, -29.94921875, -28.75927734375, -27.5693359375, -26.37939453125, -25.189453125, -23.99951171875, -22.8095703125, -21.61962890625, -20.4296875, -19.23974609375, -18.0498046875, -16.85986328125, -15.669921875, -14.47998046875, -13.2900390625, -12.10009765625, -10.91015625, -9.72021484375, -8.5302734375, -7.34033203125, -6.150390625, -4.96044921875, -3.7705078125, -2.58056640625, -1.390625, -0.20068359375, 0.9892578125, 2.17919921875, 3.369140625, 4.55908203125, 5.7490234375, 6.93896484375, 8.12890625, 9.31884765625, 10.5087890625, 11.69873046875, 12.888671875, 14.07861328125, 15.2685546875, 16.45849609375, 17.6484375, 18.83837890625, 20.0283203125, 21.21826171875, 22.408203125, 23.59814453125, 24.7880859375, 25.97802734375, 27.16796875, 28.35791015625, 29.5478515625, 30.73779296875, 31.927734375, 33.11767578125, 34.3076171875, 35.49755859375, 36.6875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 10.0, 6.0, 15.0, 19.0, 14.0, 19.0, 21.0, 29.0, 25.0, 44.0, 55.0, 64.0, 117.0, 132.0, 213.0, 352.0, 664.0, 2958.0, 3031486.0, 106462.0, 1466.0, 528.0, 312.0, 199.0, 110.0, 79.0, 51.0, 40.0, 36.0, 23.0, 28.0, 22.0, 18.0, 15.0, 8.0, 8.0, 7.0, 6.0, 6.0, 7.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.1875, -58.2353515625, -56.283203125, -54.3310546875, -52.37890625, -50.4267578125, -48.474609375, -46.5224609375, -44.5703125, -42.6181640625, -40.666015625, -38.7138671875, -36.76171875, -34.8095703125, -32.857421875, -30.9052734375, -28.953125, -27.0009765625, -25.048828125, -23.0966796875, -21.14453125, -19.1923828125, -17.240234375, -15.2880859375, -13.3359375, -11.3837890625, -9.431640625, -7.4794921875, -5.52734375, -3.5751953125, -1.623046875, 0.3291015625, 2.28125, 4.2333984375, 6.185546875, 8.1376953125, 10.08984375, 12.0419921875, 13.994140625, 15.9462890625, 17.8984375, 19.8505859375, 21.802734375, 23.7548828125, 25.70703125, 27.6591796875, 29.611328125, 31.5634765625, 33.515625, 35.4677734375, 37.419921875, 39.3720703125, 41.32421875, 43.2763671875, 45.228515625, 47.1806640625, 49.1328125, 51.0849609375, 53.037109375, 54.9892578125, 56.94140625, 58.8935546875, 60.845703125, 62.7978515625, 64.75]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 412.0, 606.0, 1.0, 1.0, 2.0], "bins": [-669.5501708984375, -658.401123046875, -647.2520751953125, -636.10302734375, -624.9539794921875, -613.8049926757812, -602.6559448242188, -591.5068969726562, -580.3578491210938, -569.2088012695312, -558.0597534179688, -546.9107055664062, -535.7616577148438, -524.6126708984375, -513.463623046875, -502.3145751953125, -491.16552734375, -480.0164794921875, -468.867431640625, -457.7184143066406, -446.5693664550781, -435.4203186035156, -424.2712707519531, -413.12225341796875, -401.9731750488281, -390.8241271972656, -379.6750793457031, -368.52606201171875, -357.37701416015625, -346.22796630859375, -335.07891845703125, -323.92987060546875, -312.78082275390625, -301.63177490234375, -290.48272705078125, -279.3337097167969, -268.1846618652344, -257.0356140136719, -245.88656616210938, -234.73753356933594, -223.5885009765625, -212.439453125, -201.29042053222656, -190.14137268066406, -178.99234008789062, -167.84329223632812, -156.69424438476562, -145.5452117919922, -134.39617919921875, -123.24713897705078, -112.09809875488281, -100.94905090332031, -89.80001831054688, -78.65097045898438, -67.5019302368164, -56.35289001464844, -45.20384216308594, -34.05480194091797, -22.905759811401367, -11.756717681884766, -0.6076774597167969, 10.541362762451172, 21.690406799316406, 32.839447021484375, 43.988487243652344]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 5.0, 10.0, 6.0, 6.0, 10.0, 14.0, 11.0, 12.0, 24.0, 26.0, 21.0, 26.0, 20.0, 28.0, 31.0, 42.0, 32.0, 34.0, 40.0, 30.0, 36.0, 46.0, 40.0, 35.0, 29.0, 25.0, 32.0, 33.0, 41.0, 32.0, 23.0, 22.0, 21.0, 16.0, 23.0, 12.0, 17.0, 9.0, 17.0, 11.0, 6.0, 10.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-127.93402099609375, -124.18264770507812, -120.43128204345703, -116.67991638183594, -112.92854309082031, -109.17716979980469, -105.4258041381836, -101.6744384765625, -97.92306518554688, -94.17169189453125, -90.42032623291016, -86.66896057128906, -82.91758728027344, -79.16621398925781, -75.41484832763672, -71.66348266601562, -67.912109375, -64.16073608398438, -60.40937042236328, -56.65800094604492, -52.90663146972656, -49.1552619934082, -45.403892517089844, -41.652523040771484, -37.901153564453125, -34.149784088134766, -30.398414611816406, -26.647045135498047, -22.895675659179688, -19.144306182861328, -15.392936706542969, -11.64156723022461, -7.89019775390625, -4.138828277587891, -0.38745880126953125, 3.363910675048828, 7.1152801513671875, 10.866649627685547, 14.618019104003906, 18.369388580322266, 22.120758056640625, 25.872127532958984, 29.623497009277344, 33.3748664855957, 37.12623596191406, 40.87760543823242, 44.62897491455078, 48.38034439086914, 52.1317138671875, 55.88308334350586, 59.63445281982422, 63.38582229614258, 67.13719177246094, 70.88856506347656, 74.63993072509766, 78.39129638671875, 82.14266967773438, 85.89404296875, 89.6454086303711, 93.39677429199219, 97.14814758300781, 100.89952087402344, 104.65088653564453, 108.40225219726562, 112.15362548828125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 6.0, 10.0, 14.0, 9.0, 13.0, 20.0, 11.0, 27.0, 34.0, 35.0, 28.0, 29.0, 37.0, 38.0, 54.0, 54.0, 47.0, 55.0, 42.0, 47.0, 39.0, 41.0, 32.0, 40.0, 30.0, 36.0, 23.0, 18.0, 24.0, 18.0, 14.0, 21.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.3828125, -11.017822265625, -10.65283203125, -10.287841796875, -9.9228515625, -9.557861328125, -9.19287109375, -8.827880859375, -8.462890625, -8.097900390625, -7.73291015625, -7.367919921875, -7.0029296875, -6.637939453125, -6.27294921875, -5.907958984375, -5.54296875, -5.177978515625, -4.81298828125, -4.447998046875, -4.0830078125, -3.718017578125, -3.35302734375, -2.988037109375, -2.623046875, -2.258056640625, -1.89306640625, -1.528076171875, -1.1630859375, -0.798095703125, -0.43310546875, -0.068115234375, 0.296875, 0.661865234375, 1.02685546875, 1.391845703125, 1.7568359375, 2.121826171875, 2.48681640625, 2.851806640625, 3.216796875, 3.581787109375, 3.94677734375, 4.311767578125, 4.6767578125, 5.041748046875, 5.40673828125, 5.771728515625, 6.13671875, 6.501708984375, 6.86669921875, 7.231689453125, 7.5966796875, 7.961669921875, 8.32666015625, 8.691650390625, 9.056640625, 9.421630859375, 9.78662109375, 10.151611328125, 10.5166015625, 10.881591796875, 11.24658203125, 11.611572265625, 11.9765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 9.0, 13.0, 9.0, 21.0, 31.0, 38.0, 44.0, 75.0, 85.0, 130.0, 147.0, 213.0, 336.0, 425.0, 713.0, 936.0, 1508.0, 2239.0, 3688.0, 6241.0, 11755.0, 47183.0, 1004766.0, 2944907.0, 131017.0, 17568.0, 7864.0, 4526.0, 2674.0, 1695.0, 1070.0, 743.0, 475.0, 330.0, 233.0, 158.0, 120.0, 79.0, 63.0, 38.0, 33.0, 23.0, 14.0, 7.0, 16.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-32.84375, -31.85400390625, -30.8642578125, -29.87451171875, -28.884765625, -27.89501953125, -26.9052734375, -25.91552734375, -24.92578125, -23.93603515625, -22.9462890625, -21.95654296875, -20.966796875, -19.97705078125, -18.9873046875, -17.99755859375, -17.0078125, -16.01806640625, -15.0283203125, -14.03857421875, -13.048828125, -12.05908203125, -11.0693359375, -10.07958984375, -9.08984375, -8.10009765625, -7.1103515625, -6.12060546875, -5.130859375, -4.14111328125, -3.1513671875, -2.16162109375, -1.171875, -0.18212890625, 0.8076171875, 1.79736328125, 2.787109375, 3.77685546875, 4.7666015625, 5.75634765625, 6.74609375, 7.73583984375, 8.7255859375, 9.71533203125, 10.705078125, 11.69482421875, 12.6845703125, 13.67431640625, 14.6640625, 15.65380859375, 16.6435546875, 17.63330078125, 18.623046875, 19.61279296875, 20.6025390625, 21.59228515625, 22.58203125, 23.57177734375, 24.5615234375, 25.55126953125, 26.541015625, 27.53076171875, 28.5205078125, 29.51025390625, 30.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 6.0, 10.0, 11.0, 12.0, 10.0, 12.0, 19.0, 32.0, 30.0, 72.0, 126.0, 274.0, 530.0, 929.0, 877.0, 507.0, 245.0, 118.0, 61.0, 36.0, 29.0, 13.0, 16.0, 9.0, 13.0, 10.0, 4.0, 9.0, 6.0, 4.0, 9.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.375, -33.361572265625, -32.34814453125, -31.334716796875, -30.3212890625, -29.307861328125, -28.29443359375, -27.281005859375, -26.267578125, -25.254150390625, -24.24072265625, -23.227294921875, -22.2138671875, -21.200439453125, -20.18701171875, -19.173583984375, -18.16015625, -17.146728515625, -16.13330078125, -15.119873046875, -14.1064453125, -13.093017578125, -12.07958984375, -11.066162109375, -10.052734375, -9.039306640625, -8.02587890625, -7.012451171875, -5.9990234375, -4.985595703125, -3.97216796875, -2.958740234375, -1.9453125, -0.931884765625, 0.08154296875, 1.094970703125, 2.1083984375, 3.121826171875, 4.13525390625, 5.148681640625, 6.162109375, 7.175537109375, 8.18896484375, 9.202392578125, 10.2158203125, 11.229248046875, 12.24267578125, 13.256103515625, 14.26953125, 15.282958984375, 16.29638671875, 17.309814453125, 18.3232421875, 19.336669921875, 20.35009765625, 21.363525390625, 22.376953125, 23.390380859375, 24.40380859375, 25.417236328125, 26.4306640625, 27.444091796875, 28.45751953125, 29.470947265625, 30.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 26.0, 21.0, 42.0, 67.0, 95.0, 143.0, 231.0, 316.0, 466.0, 726.0, 1139.0, 1694.0, 2780.0, 4390.0, 7326.0, 12642.0, 24948.0, 69090.0, 735850.0, 3090272.0, 162153.0, 37933.0, 17192.0, 9504.0, 5550.0, 3464.0, 2169.0, 1379.0, 915.0, 597.0, 370.0, 260.0, 160.0, 110.0, 65.0, 55.0, 45.0, 19.0, 15.0, 12.0, 12.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.03125, -36.6845703125, -35.337890625, -33.9912109375, -32.64453125, -31.2978515625, -29.951171875, -28.6044921875, -27.2578125, -25.9111328125, -24.564453125, -23.2177734375, -21.87109375, -20.5244140625, -19.177734375, -17.8310546875, -16.484375, -15.1376953125, -13.791015625, -12.4443359375, -11.09765625, -9.7509765625, -8.404296875, -7.0576171875, -5.7109375, -4.3642578125, -3.017578125, -1.6708984375, -0.32421875, 1.0224609375, 2.369140625, 3.7158203125, 5.0625, 6.4091796875, 7.755859375, 9.1025390625, 10.44921875, 11.7958984375, 13.142578125, 14.4892578125, 15.8359375, 17.1826171875, 18.529296875, 19.8759765625, 21.22265625, 22.5693359375, 23.916015625, 25.2626953125, 26.609375, 27.9560546875, 29.302734375, 30.6494140625, 31.99609375, 33.3427734375, 34.689453125, 36.0361328125, 37.3828125, 38.7294921875, 40.076171875, 41.4228515625, 42.76953125, 44.1162109375, 45.462890625, 46.8095703125, 48.15625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 21.0, 48.0, 92.0, 255.0, 344.0, 132.0, 51.0, 23.0, 17.0, 7.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.1599578857422, -126.76881408691406, -116.37767028808594, -105.98652648925781, -95.59538269042969, -85.20423889160156, -74.81310272216797, -64.42195892333984, -54.03081512451172, -43.639671325683594, -33.24852752685547, -22.85738754272461, -12.466243743896484, -2.0750999450683594, 8.3160400390625, 18.707183837890625, 29.09832763671875, 39.489471435546875, 49.880615234375, 60.27175521850586, 70.66290283203125, 81.05404663085938, 91.44518280029297, 101.8363265991211, 112.22747039794922, 122.61861419677734, 133.00975036621094, 143.40089416503906, 153.7920379638672, 164.1831817626953, 174.57432556152344, 184.96546936035156, 195.35659790039062, 205.74774169921875, 216.13888549804688, 226.530029296875, 236.92117309570312, 247.31231689453125, 257.7034606933594, 268.0946044921875, 278.4857482910156, 288.87689208984375, 299.2680358886719, 309.6591796875, 320.0503234863281, 330.44146728515625, 340.8326110839844, 351.2237548828125, 361.6148681640625, 372.0060119628906, 382.39715576171875, 392.7882995605469, 403.179443359375, 413.5705871582031, 423.96173095703125, 434.3528747558594, 444.7440185546875, 455.1351623535156, 465.52630615234375, 475.9174499511719, 486.30859375, 496.6997375488281, 507.09088134765625, 517.4819946289062, 527.8731689453125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 10.0, 14.0, 13.0, 20.0, 27.0, 16.0, 27.0, 23.0, 23.0, 25.0, 31.0, 34.0, 37.0, 35.0, 51.0, 42.0, 44.0, 49.0, 43.0, 55.0, 38.0, 41.0, 28.0, 32.0, 31.0, 24.0, 26.0, 31.0, 20.0, 17.0, 17.0, 11.0, 17.0, 6.0, 7.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.45968627929688, -81.68390655517578, -78.90812683105469, -76.13233947753906, -73.35655975341797, -70.58078002929688, -67.80500030517578, -65.02922058105469, -62.25343704223633, -59.477657318115234, -56.701873779296875, -53.92609405517578, -51.15031433105469, -48.37453079223633, -45.598751068115234, -42.822967529296875, -40.04718780517578, -37.27140808105469, -34.49562454223633, -31.719844818115234, -28.944063186645508, -26.16828155517578, -23.392501831054688, -20.61672019958496, -17.840938568115234, -15.065156936645508, -12.289376258850098, -9.513595581054688, -6.737813949584961, -3.9620323181152344, -1.1862525939941406, 1.589529037475586, 4.365318298339844, 7.141099452972412, 9.91688060760498, 12.69266128540039, 15.468442916870117, 18.244224548339844, 21.020004272460938, 23.795785903930664, 26.57156753540039, 29.347349166870117, 32.123130798339844, 34.89891052246094, 37.67469024658203, 40.45047378540039, 43.226253509521484, 46.002037048339844, 48.77781677246094, 51.55359649658203, 54.32938003540039, 57.105159759521484, 59.880943298339844, 62.65672302246094, 65.43250274658203, 68.20828247070312, 70.98406982421875, 73.75984954833984, 76.53562927246094, 79.31141662597656, 82.08719635009766, 84.86297607421875, 87.63875579833984, 90.41453552246094, 93.19031524658203]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 10.0, 6.0, 11.0, 10.0, 16.0, 14.0, 16.0, 32.0, 28.0, 31.0, 45.0, 34.0, 40.0, 36.0, 31.0, 55.0, 41.0, 60.0, 47.0, 52.0, 45.0, 31.0, 36.0, 27.0, 39.0, 34.0, 24.0, 24.0, 21.0, 19.0, 16.0, 12.0, 6.0, 7.0, 6.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.5615234375, -11.177734375, -10.7939453125, -10.41015625, -10.0263671875, -9.642578125, -9.2587890625, -8.875, -8.4912109375, -8.107421875, -7.7236328125, -7.33984375, -6.9560546875, -6.572265625, -6.1884765625, -5.8046875, -5.4208984375, -5.037109375, -4.6533203125, -4.26953125, -3.8857421875, -3.501953125, -3.1181640625, -2.734375, -2.3505859375, -1.966796875, -1.5830078125, -1.19921875, -0.8154296875, -0.431640625, -0.0478515625, 0.3359375, 0.7197265625, 1.103515625, 1.4873046875, 1.87109375, 2.2548828125, 2.638671875, 3.0224609375, 3.40625, 3.7900390625, 4.173828125, 4.5576171875, 4.94140625, 5.3251953125, 5.708984375, 6.0927734375, 6.4765625, 6.8603515625, 7.244140625, 7.6279296875, 8.01171875, 8.3955078125, 8.779296875, 9.1630859375, 9.546875, 9.9306640625, 10.314453125, 10.6982421875, 11.08203125, 11.4658203125, 11.849609375, 12.2333984375, 12.6171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 9.0, 4.0, 8.0, 9.0, 15.0, 34.0, 45.0, 64.0, 87.0, 138.0, 217.0, 265.0, 417.0, 672.0, 955.0, 1425.0, 2226.0, 3324.0, 5263.0, 9029.0, 14632.0, 25552.0, 45476.0, 87416.0, 182913.0, 296389.0, 178301.0, 85298.0, 44912.0, 25034.0, 14708.0, 8532.0, 5386.0, 3397.0, 2124.0, 1389.0, 921.0, 626.0, 422.0, 290.0, 201.0, 134.0, 90.0, 82.0, 40.0, 29.0, 21.0, 14.0, 12.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2529296875, -1.213134765625, -1.17333984375, -1.133544921875, -1.09375, -1.053955078125, -1.01416015625, -0.974365234375, -0.9345703125, -0.894775390625, -0.85498046875, -0.815185546875, -0.775390625, -0.735595703125, -0.69580078125, -0.656005859375, -0.6162109375, -0.576416015625, -0.53662109375, -0.496826171875, -0.45703125, -0.417236328125, -0.37744140625, -0.337646484375, -0.2978515625, -0.258056640625, -0.21826171875, -0.178466796875, -0.138671875, -0.098876953125, -0.05908203125, -0.019287109375, 0.0205078125, 0.060302734375, 0.10009765625, 0.139892578125, 0.1796875, 0.219482421875, 0.25927734375, 0.299072265625, 0.3388671875, 0.378662109375, 0.41845703125, 0.458251953125, 0.498046875, 0.537841796875, 0.57763671875, 0.617431640625, 0.6572265625, 0.697021484375, 0.73681640625, 0.776611328125, 0.81640625, 0.856201171875, 0.89599609375, 0.935791015625, 0.9755859375, 1.015380859375, 1.05517578125, 1.094970703125, 1.134765625, 1.174560546875, 1.21435546875, 1.254150390625, 1.2939453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 11.0, 6.0, 16.0, 14.0, 21.0, 25.0, 18.0, 25.0, 36.0, 30.0, 33.0, 41.0, 35.0, 48.0, 42.0, 34.0, 49.0, 1063.0, 43.0, 35.0, 50.0, 31.0, 34.0, 25.0, 35.0, 20.0, 33.0, 31.0, 31.0, 19.0, 15.0, 5.0, 11.0, 7.0, 9.0, 11.0, 4.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.7265625, -8.49481201171875, -8.2630615234375, -8.03131103515625, -7.799560546875, -7.56781005859375, -7.3360595703125, -7.10430908203125, -6.87255859375, -6.64080810546875, -6.4090576171875, -6.17730712890625, -5.945556640625, -5.71380615234375, -5.4820556640625, -5.25030517578125, -5.0185546875, -4.78680419921875, -4.5550537109375, -4.32330322265625, -4.091552734375, -3.85980224609375, -3.6280517578125, -3.39630126953125, -3.16455078125, -2.93280029296875, -2.7010498046875, -2.46929931640625, -2.237548828125, -2.00579833984375, -1.7740478515625, -1.54229736328125, -1.310546875, -1.07879638671875, -0.8470458984375, -0.61529541015625, -0.383544921875, -0.15179443359375, 0.0799560546875, 0.31170654296875, 0.54345703125, 0.77520751953125, 1.0069580078125, 1.23870849609375, 1.470458984375, 1.70220947265625, 1.9339599609375, 2.16571044921875, 2.3974609375, 2.62921142578125, 2.8609619140625, 3.09271240234375, 3.324462890625, 3.55621337890625, 3.7879638671875, 4.01971435546875, 4.25146484375, 4.48321533203125, 4.7149658203125, 4.94671630859375, 5.178466796875, 5.41021728515625, 5.6419677734375, 5.87371826171875, 6.10546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 11.0, 17.0, 16.0, 21.0, 54.0, 64.0, 132.0, 198.0, 297.0, 435.0, 696.0, 1140.0, 1791.0, 2708.0, 4280.0, 6849.0, 10664.0, 17273.0, 28949.0, 48769.0, 87465.0, 169389.0, 1312293.0, 179893.0, 92804.0, 51473.0, 30167.0, 18515.0, 11451.0, 7153.0, 4303.0, 2769.0, 1811.0, 1175.0, 760.0, 502.0, 298.0, 206.0, 146.0, 71.0, 32.0, 27.0, 18.0, 10.0, 17.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.6426849365234375, -0.619354248046875, -0.5960235595703125, -0.57269287109375, -0.5493621826171875, -0.526031494140625, -0.5027008056640625, -0.4793701171875, -0.4560394287109375, -0.432708740234375, -0.4093780517578125, -0.38604736328125, -0.3627166748046875, -0.339385986328125, -0.3160552978515625, -0.292724609375, -0.2693939208984375, -0.246063232421875, -0.2227325439453125, -0.19940185546875, -0.1760711669921875, -0.152740478515625, -0.1294097900390625, -0.1060791015625, -0.0827484130859375, -0.059417724609375, -0.0360870361328125, -0.01275634765625, 0.0105743408203125, 0.033905029296875, 0.0572357177734375, 0.08056640625, 0.1038970947265625, 0.127227783203125, 0.1505584716796875, 0.17388916015625, 0.1972198486328125, 0.220550537109375, 0.2438812255859375, 0.2672119140625, 0.2905426025390625, 0.313873291015625, 0.3372039794921875, 0.36053466796875, 0.3838653564453125, 0.407196044921875, 0.4305267333984375, 0.453857421875, 0.4771881103515625, 0.500518798828125, 0.5238494873046875, 0.54718017578125, 0.5705108642578125, 0.593841552734375, 0.6171722412109375, 0.6405029296875, 0.6638336181640625, 0.687164306640625, 0.7104949951171875, 0.73382568359375, 0.7571563720703125, 0.780487060546875, 0.8038177490234375, 0.8271484375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 10.0, 6.0, 8.0, 9.0, 16.0, 13.0, 12.0, 20.0, 21.0, 19.0, 33.0, 35.0, 43.0, 44.0, 49.0, 50.0, 84.0, 78.0, 72.0, 71.0, 50.0, 48.0, 28.0, 29.0, 31.0, 20.0, 18.0, 14.0, 12.0, 9.0, 11.0, 8.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0106048583984375, -0.010184049606323242, -0.009763240814208984, -0.009342432022094727, -0.008921623229980469, -0.008500814437866211, -0.008080005645751953, -0.007659196853637695, -0.0072383880615234375, -0.00681757926940918, -0.006396770477294922, -0.005975961685180664, -0.005555152893066406, -0.0051343441009521484, -0.004713535308837891, -0.004292726516723633, -0.003871917724609375, -0.003451108932495117, -0.0030303001403808594, -0.0026094913482666016, -0.0021886825561523438, -0.001767873764038086, -0.0013470649719238281, -0.0009262561798095703, -0.0005054473876953125, -8.463859558105469e-05, 0.0003361701965332031, 0.0007569789886474609, 0.0011777877807617188, 0.0015985965728759766, 0.0020194053649902344, 0.002440214157104492, 0.00286102294921875, 0.003281831741333008, 0.0037026405334472656, 0.0041234493255615234, 0.004544258117675781, 0.004965066909790039, 0.005385875701904297, 0.005806684494018555, 0.0062274932861328125, 0.00664830207824707, 0.007069110870361328, 0.007489919662475586, 0.007910728454589844, 0.008331537246704102, 0.00875234603881836, 0.009173154830932617, 0.009593963623046875, 0.010014772415161133, 0.01043558120727539, 0.010856389999389648, 0.011277198791503906, 0.011698007583618164, 0.012118816375732422, 0.01253962516784668, 0.012960433959960938, 0.013381242752075195, 0.013802051544189453, 0.014222860336303711, 0.014643669128417969, 0.015064477920532227, 0.015485286712646484, 0.015906095504760742, 0.016326904296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 8.0, 16.0, 22.0, 21.0, 19.0, 28.0, 30.0, 40.0, 55.0, 76.0, 125.0, 298.0, 1491.0, 25166.0, 1006211.0, 13133.0, 1069.0, 229.0, 119.0, 76.0, 50.0, 38.0, 28.0, 33.0, 21.0, 20.0, 13.0, 18.0, 12.0, 11.0, 13.0, 12.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4375, -0.4247894287109375, -0.412078857421875, -0.3993682861328125, -0.38665771484375, -0.3739471435546875, -0.361236572265625, -0.3485260009765625, -0.3358154296875, -0.3231048583984375, -0.310394287109375, -0.2976837158203125, -0.28497314453125, -0.2722625732421875, -0.259552001953125, -0.2468414306640625, -0.234130859375, -0.2214202880859375, -0.208709716796875, -0.1959991455078125, -0.18328857421875, -0.1705780029296875, -0.157867431640625, -0.1451568603515625, -0.1324462890625, -0.1197357177734375, -0.107025146484375, -0.0943145751953125, -0.08160400390625, -0.0688934326171875, -0.056182861328125, -0.0434722900390625, -0.03076171875, -0.0180511474609375, -0.005340576171875, 0.0073699951171875, 0.02008056640625, 0.0327911376953125, 0.045501708984375, 0.0582122802734375, 0.0709228515625, 0.0836334228515625, 0.096343994140625, 0.1090545654296875, 0.12176513671875, 0.1344757080078125, 0.147186279296875, 0.1598968505859375, 0.172607421875, 0.1853179931640625, 0.198028564453125, 0.2107391357421875, 0.22344970703125, 0.2361602783203125, 0.248870849609375, 0.2615814208984375, 0.2742919921875, 0.2870025634765625, 0.299713134765625, 0.3124237060546875, 0.32513427734375, 0.3378448486328125, 0.350555419921875, 0.3632659912109375, 0.3759765625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 16.0, 38.0, 94.0, 330.0, 350.0, 103.0, 36.0, 20.0, 11.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035230644047260284, -0.03170756995677948, -0.028184499591588974, -0.02466142736375332, -0.021138355135917664, -0.01761528290808201, -0.014092210680246353, -0.010569138452410698, -0.007046066224575043, -0.0035229939967393875, 7.82310962677002e-08, 0.003523150458931923, 0.007046222686767578, 0.010569294914603233, 0.014092367142438889, 0.017615439370274544, 0.0211385115981102, 0.024661583825945854, 0.02818465605378151, 0.031707726418972015, 0.03523080050945282, 0.038753874599933624, 0.04227694496512413, 0.045800015330314636, 0.04932308942079544, 0.052846163511276245, 0.05636923387646675, 0.05989230424165726, 0.06341537833213806, 0.06693845242261887, 0.07046152651309967, 0.07398459315299988, 0.07750765979290009, 0.08103073388338089, 0.0845538079738617, 0.0880768746137619, 0.0915999487042427, 0.09512302279472351, 0.09864608943462372, 0.10216916352510452, 0.10569223761558533, 0.10921531170606613, 0.11273838579654694, 0.11626145243644714, 0.11978452652692795, 0.12330760061740875, 0.12683066725730896, 0.13035374879837036, 0.13387681543827057, 0.13739988207817078, 0.14092296361923218, 0.14444603025913239, 0.1479690968990326, 0.151492178440094, 0.1550152450799942, 0.1585383266210556, 0.1620613932609558, 0.16558445990085602, 0.16910754144191742, 0.17263060808181763, 0.17615368962287903, 0.17967675626277924, 0.18319982290267944, 0.18672290444374084, 0.19024597108364105]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 14.0, 10.0, 9.0, 20.0, 15.0, 24.0, 18.0, 18.0, 20.0, 20.0, 23.0, 34.0, 23.0, 20.0, 41.0, 38.0, 41.0, 44.0, 45.0, 37.0, 29.0, 38.0, 36.0, 43.0, 40.0, 53.0, 31.0, 34.0, 20.0, 27.0, 19.0, 16.0, 15.0, 15.0, 15.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020763278007507324, -0.020069709047675133, -0.01937614008784294, -0.01868257112801075, -0.01798900216817856, -0.017295433208346367, -0.016601864248514175, -0.015908295288681984, -0.015214726328849792, -0.014521157369017601, -0.01382758840918541, -0.013134019449353218, -0.012440450489521027, -0.011746881529688835, -0.011053312569856644, -0.010359743610024452, -0.00966617465019226, -0.00897260569036007, -0.008279036730527878, -0.007585467770695686, -0.006891898810863495, -0.006198329851031303, -0.005504760891199112, -0.0048111919313669205, -0.004117622971534729, -0.0034240540117025375, -0.002730485051870346, -0.0020369160920381546, -0.0013433471322059631, -0.0006497781723737717, 4.37907874584198e-05, 0.0007373597472906113, 0.0014309287071228027, 0.002124497666954994, 0.0028180666267871857, 0.003511635586619377, 0.004205204546451569, 0.00489877350628376, 0.0055923424661159515, 0.006285911425948143, 0.0069794803857803345, 0.007673049345612526, 0.008366618305444717, 0.009060187265276909, 0.0097537562251091, 0.010447325184941292, 0.011140894144773483, 0.011834463104605675, 0.012528032064437866, 0.013221601024270058, 0.01391516998410225, 0.01460873894393444, 0.015302307903766632, 0.015995876863598824, 0.016689445823431015, 0.017383014783263206, 0.018076583743095398, 0.01877015270292759, 0.01946372166275978, 0.020157290622591972, 0.020850859582424164, 0.021544428542256355, 0.022237997502088547, 0.022931566461920738, 0.02362513542175293]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 10.0, 6.0, 11.0, 10.0, 16.0, 14.0, 16.0, 32.0, 28.0, 31.0, 45.0, 34.0, 39.0, 37.0, 31.0, 55.0, 41.0, 60.0, 47.0, 52.0, 45.0, 31.0, 36.0, 27.0, 39.0, 34.0, 24.0, 25.0, 20.0, 19.0, 16.0, 12.0, 6.0, 7.0, 6.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.5615234375, -11.177734375, -10.7939453125, -10.41015625, -10.0263671875, -9.642578125, -9.2587890625, -8.875, -8.4912109375, -8.107421875, -7.7236328125, -7.33984375, -6.9560546875, -6.572265625, -6.1884765625, -5.8046875, -5.4208984375, -5.037109375, -4.6533203125, -4.26953125, -3.8857421875, -3.501953125, -3.1181640625, -2.734375, -2.3505859375, -1.966796875, -1.5830078125, -1.19921875, -0.8154296875, -0.431640625, -0.0478515625, 0.3359375, 0.7197265625, 1.103515625, 1.4873046875, 1.87109375, 2.2548828125, 2.638671875, 3.0224609375, 3.40625, 3.7900390625, 4.173828125, 4.5576171875, 4.94140625, 5.3251953125, 5.708984375, 6.0927734375, 6.4765625, 6.8603515625, 7.244140625, 7.6279296875, 8.01171875, 8.3955078125, 8.779296875, 9.1630859375, 9.546875, 9.9306640625, 10.314453125, 10.6982421875, 11.08203125, 11.4658203125, 11.849609375, 12.2333984375, 12.6171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 3.0, 8.0, 16.0, 6.0, 12.0, 18.0, 23.0, 38.0, 52.0, 108.0, 150.0, 276.0, 537.0, 1150.0, 2762.0, 7288.0, 21371.0, 71480.0, 297407.0, 480472.0, 115230.0, 32470.0, 10693.0, 3811.0, 1578.0, 719.0, 342.0, 197.0, 89.0, 60.0, 64.0, 32.0, 24.0, 19.0, 7.0, 10.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.181884765625, -5.97705078125, -5.772216796875, -5.5673828125, -5.362548828125, -5.15771484375, -4.952880859375, -4.748046875, -4.543212890625, -4.33837890625, -4.133544921875, -3.9287109375, -3.723876953125, -3.51904296875, -3.314208984375, -3.109375, -2.904541015625, -2.69970703125, -2.494873046875, -2.2900390625, -2.085205078125, -1.88037109375, -1.675537109375, -1.470703125, -1.265869140625, -1.06103515625, -0.856201171875, -0.6513671875, -0.446533203125, -0.24169921875, -0.036865234375, 0.16796875, 0.372802734375, 0.57763671875, 0.782470703125, 0.9873046875, 1.192138671875, 1.39697265625, 1.601806640625, 1.806640625, 2.011474609375, 2.21630859375, 2.421142578125, 2.6259765625, 2.830810546875, 3.03564453125, 3.240478515625, 3.4453125, 3.650146484375, 3.85498046875, 4.059814453125, 4.2646484375, 4.469482421875, 4.67431640625, 4.879150390625, 5.083984375, 5.288818359375, 5.49365234375, 5.698486328125, 5.9033203125, 6.108154296875, 6.31298828125, 6.517822265625, 6.72265625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 4.0, 4.0, 6.0, 5.0, 12.0, 13.0, 13.0, 11.0, 19.0, 18.0, 20.0, 20.0, 31.0, 24.0, 36.0, 35.0, 32.0, 36.0, 40.0, 41.0, 68.0, 1762.0, 315.0, 62.0, 40.0, 23.0, 41.0, 31.0, 33.0, 43.0, 26.0, 34.0, 26.0, 26.0, 18.0, 15.0, 10.0, 9.0, 7.0, 13.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.21875, -39.92626953125, -38.6337890625, -37.34130859375, -36.048828125, -34.75634765625, -33.4638671875, -32.17138671875, -30.87890625, -29.58642578125, -28.2939453125, -27.00146484375, -25.708984375, -24.41650390625, -23.1240234375, -21.83154296875, -20.5390625, -19.24658203125, -17.9541015625, -16.66162109375, -15.369140625, -14.07666015625, -12.7841796875, -11.49169921875, -10.19921875, -8.90673828125, -7.6142578125, -6.32177734375, -5.029296875, -3.73681640625, -2.4443359375, -1.15185546875, 0.140625, 1.43310546875, 2.7255859375, 4.01806640625, 5.310546875, 6.60302734375, 7.8955078125, 9.18798828125, 10.48046875, 11.77294921875, 13.0654296875, 14.35791015625, 15.650390625, 16.94287109375, 18.2353515625, 19.52783203125, 20.8203125, 22.11279296875, 23.4052734375, 24.69775390625, 25.990234375, 27.28271484375, 28.5751953125, 29.86767578125, 31.16015625, 32.45263671875, 33.7451171875, 35.03759765625, 36.330078125, 37.62255859375, 38.9150390625, 40.20751953125, 41.5]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 10.0, 7.0, 10.0, 11.0, 15.0, 19.0, 32.0, 36.0, 45.0, 45.0, 66.0, 91.0, 100.0, 205.0, 274.0, 536.0, 1568.0, 224126.0, 2914490.0, 2316.0, 629.0, 313.0, 189.0, 135.0, 102.0, 74.0, 40.0, 45.0, 21.0, 20.0, 22.0, 18.0, 15.0, 10.0, 15.0, 10.0, 5.0, 6.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.5625, -65.4580078125, -63.353515625, -61.2490234375, -59.14453125, -57.0400390625, -54.935546875, -52.8310546875, -50.7265625, -48.6220703125, -46.517578125, -44.4130859375, -42.30859375, -40.2041015625, -38.099609375, -35.9951171875, -33.890625, -31.7861328125, -29.681640625, -27.5771484375, -25.47265625, -23.3681640625, -21.263671875, -19.1591796875, -17.0546875, -14.9501953125, -12.845703125, -10.7412109375, -8.63671875, -6.5322265625, -4.427734375, -2.3232421875, -0.21875, 1.8857421875, 3.990234375, 6.0947265625, 8.19921875, 10.3037109375, 12.408203125, 14.5126953125, 16.6171875, 18.7216796875, 20.826171875, 22.9306640625, 25.03515625, 27.1396484375, 29.244140625, 31.3486328125, 33.453125, 35.5576171875, 37.662109375, 39.7666015625, 41.87109375, 43.9755859375, 46.080078125, 48.1845703125, 50.2890625, 52.3935546875, 54.498046875, 56.6025390625, 58.70703125, 60.8115234375, 62.916015625, 65.0205078125, 67.125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [47.0, 850.0, 116.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.709879875183105, -4.412458419799805, 2.884963035583496, 10.182385444641113, 17.47980499267578, 24.777225494384766, 32.074649810791016, 39.3720703125, 46.669490814208984, 53.96691131591797, 61.26433563232422, 68.56175231933594, 75.85917663574219, 83.15660095214844, 90.45402526855469, 97.7514419555664, 105.04886627197266, 112.3462905883789, 119.64370727539062, 126.94113159179688, 134.23855590820312, 141.53598022460938, 148.83340454101562, 156.1308135986328, 163.42823791503906, 170.7256622314453, 178.02308654785156, 185.32049560546875, 192.617919921875, 199.91534423828125, 207.2127685546875, 214.51019287109375, 221.8076171875, 229.10504150390625, 236.4024658203125, 243.69989013671875, 250.99729919433594, 258.29473876953125, 265.5921630859375, 272.8895568847656, 280.1869812011719, 287.4844055175781, 294.7818298339844, 302.0792541503906, 309.3766784667969, 316.674072265625, 323.97149658203125, 331.2689208984375, 338.56634521484375, 345.86376953125, 353.16119384765625, 360.4586181640625, 367.75604248046875, 375.053466796875, 382.35089111328125, 389.6482849121094, 396.94573974609375, 404.2431640625, 411.54058837890625, 418.8380126953125, 426.13543701171875, 433.432861328125, 440.73028564453125, 448.0276794433594, 455.3251037597656]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 6.0, 7.0, 8.0, 3.0, 15.0, 13.0, 17.0, 19.0, 17.0, 21.0, 33.0, 21.0, 21.0, 48.0, 38.0, 28.0, 40.0, 34.0, 47.0, 42.0, 46.0, 47.0, 38.0, 43.0, 41.0, 34.0, 38.0, 31.0, 34.0, 27.0, 22.0, 14.0, 13.0, 14.0, 19.0, 4.0, 13.0, 11.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-133.54962158203125, -129.2626953125, -124.97576904296875, -120.6888427734375, -116.40191650390625, -112.114990234375, -107.82806396484375, -103.5411376953125, -99.25421142578125, -94.96728515625, -90.68035888671875, -86.3934326171875, -82.10650634765625, -77.819580078125, -73.53265380859375, -69.2457275390625, -64.95879364013672, -60.67186737060547, -56.38494110107422, -52.09801483154297, -47.81108856201172, -43.52416229248047, -39.23723220825195, -34.9503059387207, -30.663379669189453, -26.376453399658203, -22.089527130126953, -17.80259895324707, -13.51567268371582, -9.22874641418457, -4.9418182373046875, -0.6548919677734375, 3.6320343017578125, 7.918961048126221, 12.205887794494629, 16.492815017700195, 20.779741287231445, 25.066667556762695, 29.353595733642578, 33.64052200317383, 37.92744827270508, 42.21437454223633, 46.50130081176758, 50.788230895996094, 55.075157165527344, 59.362083435058594, 63.649009704589844, 67.9359359741211, 72.22286224365234, 76.5097885131836, 80.79671478271484, 85.0836410522461, 89.37056732177734, 93.6574935913086, 97.94442749023438, 102.23135375976562, 106.51828002929688, 110.80520629882812, 115.09213256835938, 119.37905883789062, 123.66598510742188, 127.95291137695312, 132.23983764648438, 136.52676391601562, 140.81369018554688]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 5.0, 10.0, 10.0, 12.0, 15.0, 17.0, 16.0, 36.0, 25.0, 45.0, 34.0, 29.0, 48.0, 35.0, 47.0, 39.0, 52.0, 64.0, 47.0, 51.0, 33.0, 33.0, 37.0, 31.0, 37.0, 27.0, 25.0, 23.0, 23.0, 15.0, 13.0, 9.0, 6.0, 7.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.692138671875, -11.29833984375, -10.904541015625, -10.5107421875, -10.116943359375, -9.72314453125, -9.329345703125, -8.935546875, -8.541748046875, -8.14794921875, -7.754150390625, -7.3603515625, -6.966552734375, -6.57275390625, -6.178955078125, -5.78515625, -5.391357421875, -4.99755859375, -4.603759765625, -4.2099609375, -3.816162109375, -3.42236328125, -3.028564453125, -2.634765625, -2.240966796875, -1.84716796875, -1.453369140625, -1.0595703125, -0.665771484375, -0.27197265625, 0.121826171875, 0.515625, 0.909423828125, 1.30322265625, 1.697021484375, 2.0908203125, 2.484619140625, 2.87841796875, 3.272216796875, 3.666015625, 4.059814453125, 4.45361328125, 4.847412109375, 5.2412109375, 5.635009765625, 6.02880859375, 6.422607421875, 6.81640625, 7.210205078125, 7.60400390625, 7.997802734375, 8.3916015625, 8.785400390625, 9.17919921875, 9.572998046875, 9.966796875, 10.360595703125, 10.75439453125, 11.148193359375, 11.5419921875, 11.935791015625, 12.32958984375, 12.723388671875, 13.1171875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 13.0, 14.0, 18.0, 20.0, 40.0, 58.0, 63.0, 121.0, 176.0, 245.0, 408.0, 645.0, 1020.0, 1872.0, 3459.0, 7205.0, 18453.0, 302157.0, 3660086.0, 169411.0, 15287.0, 6334.0, 3016.0, 1641.0, 921.0, 552.0, 353.0, 221.0, 143.0, 86.0, 75.0, 35.0, 45.0, 20.0, 15.0, 7.0, 16.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.41064453125, -38.0712890625, -36.73193359375, -35.392578125, -34.05322265625, -32.7138671875, -31.37451171875, -30.03515625, -28.69580078125, -27.3564453125, -26.01708984375, -24.677734375, -23.33837890625, -21.9990234375, -20.65966796875, -19.3203125, -17.98095703125, -16.6416015625, -15.30224609375, -13.962890625, -12.62353515625, -11.2841796875, -9.94482421875, -8.60546875, -7.26611328125, -5.9267578125, -4.58740234375, -3.248046875, -1.90869140625, -0.5693359375, 0.77001953125, 2.109375, 3.44873046875, 4.7880859375, 6.12744140625, 7.466796875, 8.80615234375, 10.1455078125, 11.48486328125, 12.82421875, 14.16357421875, 15.5029296875, 16.84228515625, 18.181640625, 19.52099609375, 20.8603515625, 22.19970703125, 23.5390625, 24.87841796875, 26.2177734375, 27.55712890625, 28.896484375, 30.23583984375, 31.5751953125, 32.91455078125, 34.25390625, 35.59326171875, 36.9326171875, 38.27197265625, 39.611328125, 40.95068359375, 42.2900390625, 43.62939453125, 44.96875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 8.0, 6.0, 6.0, 3.0, 6.0, 5.0, 11.0, 9.0, 17.0, 17.0, 18.0, 38.0, 39.0, 69.0, 136.0, 350.0, 689.0, 1022.0, 805.0, 366.0, 186.0, 91.0, 49.0, 29.0, 25.0, 13.0, 14.0, 4.0, 5.0, 3.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.7685546875, -31.662109375, -30.5556640625, -29.44921875, -28.3427734375, -27.236328125, -26.1298828125, -25.0234375, -23.9169921875, -22.810546875, -21.7041015625, -20.59765625, -19.4912109375, -18.384765625, -17.2783203125, -16.171875, -15.0654296875, -13.958984375, -12.8525390625, -11.74609375, -10.6396484375, -9.533203125, -8.4267578125, -7.3203125, -6.2138671875, -5.107421875, -4.0009765625, -2.89453125, -1.7880859375, -0.681640625, 0.4248046875, 1.53125, 2.6376953125, 3.744140625, 4.8505859375, 5.95703125, 7.0634765625, 8.169921875, 9.2763671875, 10.3828125, 11.4892578125, 12.595703125, 13.7021484375, 14.80859375, 15.9150390625, 17.021484375, 18.1279296875, 19.234375, 20.3408203125, 21.447265625, 22.5537109375, 23.66015625, 24.7666015625, 25.873046875, 26.9794921875, 28.0859375, 29.1923828125, 30.298828125, 31.4052734375, 32.51171875, 33.6181640625, 34.724609375, 35.8310546875, 36.9375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 3.0, 10.0, 13.0, 17.0, 21.0, 28.0, 42.0, 62.0, 76.0, 121.0, 196.0, 249.0, 370.0, 554.0, 797.0, 1192.0, 1786.0, 2772.0, 4311.0, 7119.0, 12531.0, 24062.0, 59384.0, 374635.0, 3268337.0, 325281.0, 56228.0, 22948.0, 11877.0, 6889.0, 4175.0, 2691.0, 1798.0, 1104.0, 840.0, 519.0, 371.0, 255.0, 184.0, 134.0, 77.0, 63.0, 46.0, 27.0, 24.0, 18.0, 5.0, 14.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 4.0], "bins": [-40.78125, -39.56298828125, -38.3447265625, -37.12646484375, -35.908203125, -34.68994140625, -33.4716796875, -32.25341796875, -31.03515625, -29.81689453125, -28.5986328125, -27.38037109375, -26.162109375, -24.94384765625, -23.7255859375, -22.50732421875, -21.2890625, -20.07080078125, -18.8525390625, -17.63427734375, -16.416015625, -15.19775390625, -13.9794921875, -12.76123046875, -11.54296875, -10.32470703125, -9.1064453125, -7.88818359375, -6.669921875, -5.45166015625, -4.2333984375, -3.01513671875, -1.796875, -0.57861328125, 0.6396484375, 1.85791015625, 3.076171875, 4.29443359375, 5.5126953125, 6.73095703125, 7.94921875, 9.16748046875, 10.3857421875, 11.60400390625, 12.822265625, 14.04052734375, 15.2587890625, 16.47705078125, 17.6953125, 18.91357421875, 20.1318359375, 21.35009765625, 22.568359375, 23.78662109375, 25.0048828125, 26.22314453125, 27.44140625, 28.65966796875, 29.8779296875, 31.09619140625, 32.314453125, 33.53271484375, 34.7509765625, 35.96923828125, 37.1875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 13.0, 13.0, 15.0, 21.0, 26.0, 54.0, 76.0, 108.0, 168.0, 184.0, 109.0, 78.0, 38.0, 32.0, 22.0, 8.0, 9.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.85140228271484, -115.04425048828125, -110.23709869384766, -105.42994689941406, -100.62278747558594, -95.81563568115234, -91.00848388671875, -86.20132446289062, -81.39418029785156, -76.58702850341797, -71.77987670898438, -66.97271728515625, -62.165565490722656, -57.35841369628906, -52.55126190185547, -47.74410629272461, -42.93695068359375, -38.129798889160156, -33.3226432800293, -28.515491485595703, -23.708337783813477, -18.90118408203125, -14.094032287597656, -9.286876678466797, -4.479724884033203, 0.32742834091186523, 5.134581565856934, 9.941734313964844, 14.74888801574707, 19.556041717529297, 24.36319351196289, 29.17034912109375, 33.977508544921875, 38.78466033935547, 43.59181594848633, 48.39896774291992, 53.20612335205078, 58.013275146484375, 62.82042694091797, 67.62757873535156, 72.43473815917969, 77.24188995361328, 82.04904174804688, 86.856201171875, 91.6633529663086, 96.47050476074219, 101.27765655517578, 106.08480834960938, 110.89196014404297, 115.69911193847656, 120.50626373291016, 125.31341552734375, 130.12057495117188, 134.927734375, 139.73487854003906, 144.5420379638672, 149.34918212890625, 154.15634155273438, 158.96348571777344, 163.77064514160156, 168.57778930664062, 173.38494873046875, 178.19210815429688, 182.99925231933594, 187.80641174316406]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 8.0, 7.0, 12.0, 15.0, 12.0, 17.0, 23.0, 30.0, 30.0, 26.0, 25.0, 30.0, 32.0, 45.0, 41.0, 44.0, 43.0, 38.0, 41.0, 45.0, 36.0, 48.0, 38.0, 39.0, 37.0, 35.0, 27.0, 26.0, 21.0, 28.0, 11.0, 14.0, 14.0, 12.0, 11.0, 5.0, 7.0, 2.0, 6.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.74385070800781, -74.01144409179688, -71.2790298461914, -68.54662322998047, -65.814208984375, -63.0817985534668, -60.349388122558594, -57.616981506347656, -54.88456726074219, -52.152156829833984, -49.41974639892578, -46.68733596801758, -43.954925537109375, -41.22251510620117, -38.49010467529297, -35.75769805908203, -33.02528762817383, -30.292877197265625, -27.560466766357422, -24.82805633544922, -22.095645904541016, -19.363235473632812, -16.630826950073242, -13.898416519165039, -11.166006088256836, -8.433595657348633, -5.701185703277588, -2.968775749206543, -0.23636531829833984, 2.4960451126098633, 5.22845458984375, 7.960865020751953, 10.693275451660156, 13.42568588256836, 16.158096313476562, 18.890506744384766, 21.62291717529297, 24.355327606201172, 27.087736129760742, 29.820146560668945, 32.55255889892578, 35.284969329833984, 38.01737976074219, 40.74979019165039, 43.482200622558594, 46.2146110534668, 48.947021484375, 51.67942810058594, 54.41183853149414, 57.144248962402344, 59.87665939331055, 62.60906982421875, 65.34147644042969, 68.07389068603516, 70.8062973022461, 73.53871154785156, 76.2711181640625, 79.00352478027344, 81.7359390258789, 84.46834564208984, 87.20075988769531, 89.93316650390625, 92.66558074951172, 95.39798736572266, 98.13040161132812]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 11.0, 8.0, 17.0, 16.0, 24.0, 19.0, 24.0, 27.0, 29.0, 35.0, 43.0, 42.0, 38.0, 45.0, 42.0, 51.0, 40.0, 35.0, 40.0, 32.0, 40.0, 40.0, 39.0, 40.0, 40.0, 25.0, 24.0, 13.0, 12.0, 25.0, 8.0, 13.0, 9.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.888671875, -11.49609375, -11.103515625, -10.7109375, -10.318359375, -9.92578125, -9.533203125, -9.140625, -8.748046875, -8.35546875, -7.962890625, -7.5703125, -7.177734375, -6.78515625, -6.392578125, -6.0, -5.607421875, -5.21484375, -4.822265625, -4.4296875, -4.037109375, -3.64453125, -3.251953125, -2.859375, -2.466796875, -2.07421875, -1.681640625, -1.2890625, -0.896484375, -0.50390625, -0.111328125, 0.28125, 0.673828125, 1.06640625, 1.458984375, 1.8515625, 2.244140625, 2.63671875, 3.029296875, 3.421875, 3.814453125, 4.20703125, 4.599609375, 4.9921875, 5.384765625, 5.77734375, 6.169921875, 6.5625, 6.955078125, 7.34765625, 7.740234375, 8.1328125, 8.525390625, 8.91796875, 9.310546875, 9.703125, 10.095703125, 10.48828125, 10.880859375, 11.2734375, 11.666015625, 12.05859375, 12.451171875, 12.84375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 11.0, 12.0, 26.0, 21.0, 35.0, 46.0, 89.0, 117.0, 184.0, 260.0, 417.0, 611.0, 960.0, 1489.0, 2291.0, 3483.0, 5391.0, 8445.0, 13249.0, 21438.0, 35901.0, 62797.0, 120206.0, 238125.0, 244648.0, 125714.0, 65248.0, 36803.0, 22330.0, 13668.0, 8680.0, 5492.0, 3627.0, 2383.0, 1434.0, 986.0, 660.0, 425.0, 263.0, 183.0, 121.0, 102.0, 56.0, 46.0, 35.0, 9.0, 15.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.52734375, -1.4796600341796875, -1.431976318359375, -1.3842926025390625, -1.33660888671875, -1.2889251708984375, -1.241241455078125, -1.1935577392578125, -1.1458740234375, -1.0981903076171875, -1.050506591796875, -1.0028228759765625, -0.95513916015625, -0.9074554443359375, -0.859771728515625, -0.8120880126953125, -0.764404296875, -0.7167205810546875, -0.669036865234375, -0.6213531494140625, -0.57366943359375, -0.5259857177734375, -0.478302001953125, -0.4306182861328125, -0.3829345703125, -0.3352508544921875, -0.287567138671875, -0.2398834228515625, -0.19219970703125, -0.1445159912109375, -0.096832275390625, -0.0491485595703125, -0.00146484375, 0.0462188720703125, 0.093902587890625, 0.1415863037109375, 0.18927001953125, 0.2369537353515625, 0.284637451171875, 0.3323211669921875, 0.3800048828125, 0.4276885986328125, 0.475372314453125, 0.5230560302734375, 0.57073974609375, 0.6184234619140625, 0.666107177734375, 0.7137908935546875, 0.761474609375, 0.8091583251953125, 0.856842041015625, 0.9045257568359375, 0.95220947265625, 0.9998931884765625, 1.047576904296875, 1.0952606201171875, 1.1429443359375, 1.1906280517578125, 1.238311767578125, 1.2859954833984375, 1.33367919921875, 1.3813629150390625, 1.429046630859375, 1.4767303466796875, 1.5244140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 10.0, 6.0, 7.0, 15.0, 11.0, 12.0, 8.0, 18.0, 29.0, 27.0, 27.0, 26.0, 38.0, 31.0, 27.0, 38.0, 40.0, 36.0, 40.0, 45.0, 1063.0, 36.0, 43.0, 40.0, 31.0, 37.0, 21.0, 25.0, 38.0, 32.0, 24.0, 19.0, 17.0, 11.0, 15.0, 19.0, 14.0, 6.0, 9.0, 2.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.8125, -7.5848388671875, -7.357177734375, -7.1295166015625, -6.90185546875, -6.6741943359375, -6.446533203125, -6.2188720703125, -5.9912109375, -5.7635498046875, -5.535888671875, -5.3082275390625, -5.08056640625, -4.8529052734375, -4.625244140625, -4.3975830078125, -4.169921875, -3.9422607421875, -3.714599609375, -3.4869384765625, -3.25927734375, -3.0316162109375, -2.803955078125, -2.5762939453125, -2.3486328125, -2.1209716796875, -1.893310546875, -1.6656494140625, -1.43798828125, -1.2103271484375, -0.982666015625, -0.7550048828125, -0.52734375, -0.2996826171875, -0.072021484375, 0.1556396484375, 0.38330078125, 0.6109619140625, 0.838623046875, 1.0662841796875, 1.2939453125, 1.5216064453125, 1.749267578125, 1.9769287109375, 2.20458984375, 2.4322509765625, 2.659912109375, 2.8875732421875, 3.115234375, 3.3428955078125, 3.570556640625, 3.7982177734375, 4.02587890625, 4.2535400390625, 4.481201171875, 4.7088623046875, 4.9365234375, 5.1641845703125, 5.391845703125, 5.6195068359375, 5.84716796875, 6.0748291015625, 6.302490234375, 6.5301513671875, 6.7578125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 12.0, 13.0, 20.0, 24.0, 44.0, 73.0, 115.0, 155.0, 196.0, 358.0, 600.0, 903.0, 1483.0, 2206.0, 3641.0, 5753.0, 9301.0, 14710.0, 24215.0, 40801.0, 71404.0, 130713.0, 1146535.0, 356218.0, 121711.0, 66563.0, 38656.0, 23115.0, 14109.0, 8651.0, 5437.0, 3438.0, 2082.0, 1375.0, 915.0, 568.0, 347.0, 211.0, 163.0, 111.0, 64.0, 54.0, 23.0, 13.0, 10.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6920318603515625, -0.667266845703125, -0.6425018310546875, -0.61773681640625, -0.5929718017578125, -0.568206787109375, -0.5434417724609375, -0.5186767578125, -0.4939117431640625, -0.469146728515625, -0.4443817138671875, -0.41961669921875, -0.3948516845703125, -0.370086669921875, -0.3453216552734375, -0.320556640625, -0.2957916259765625, -0.271026611328125, -0.2462615966796875, -0.22149658203125, -0.1967315673828125, -0.171966552734375, -0.1472015380859375, -0.1224365234375, -0.0976715087890625, -0.072906494140625, -0.0481414794921875, -0.02337646484375, 0.0013885498046875, 0.026153564453125, 0.0509185791015625, 0.07568359375, 0.1004486083984375, 0.125213623046875, 0.1499786376953125, 0.17474365234375, 0.1995086669921875, 0.224273681640625, 0.2490386962890625, 0.2738037109375, 0.2985687255859375, 0.323333740234375, 0.3480987548828125, 0.37286376953125, 0.3976287841796875, 0.422393798828125, 0.4471588134765625, 0.471923828125, 0.4966888427734375, 0.521453857421875, 0.5462188720703125, 0.57098388671875, 0.5957489013671875, 0.620513916015625, 0.6452789306640625, 0.6700439453125, 0.6948089599609375, 0.719573974609375, 0.7443389892578125, 0.76910400390625, 0.7938690185546875, 0.818634033203125, 0.8433990478515625, 0.8681640625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 8.0, 4.0, 6.0, 3.0, 5.0, 12.0, 14.0, 20.0, 32.0, 28.0, 90.0, 145.0, 159.0, 158.0, 92.0, 52.0, 32.0, 34.0, 13.0, 17.0, 2.0, 7.0, 10.0, 6.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04541015625, -0.0439763069152832, -0.042542457580566406, -0.04110860824584961, -0.03967475891113281, -0.038240909576416016, -0.03680706024169922, -0.03537321090698242, -0.033939361572265625, -0.03250551223754883, -0.03107166290283203, -0.029637813568115234, -0.028203964233398438, -0.02677011489868164, -0.025336265563964844, -0.023902416229248047, -0.02246856689453125, -0.021034717559814453, -0.019600868225097656, -0.01816701889038086, -0.016733169555664062, -0.015299320220947266, -0.013865470886230469, -0.012431621551513672, -0.010997772216796875, -0.009563922882080078, -0.008130073547363281, -0.006696224212646484, -0.0052623748779296875, -0.0038285255432128906, -0.0023946762084960938, -0.0009608268737792969, 0.0004730224609375, 0.0019068717956542969, 0.0033407211303710938, 0.004774570465087891, 0.0062084197998046875, 0.007642269134521484, 0.009076118469238281, 0.010509967803955078, 0.011943817138671875, 0.013377666473388672, 0.014811515808105469, 0.016245365142822266, 0.017679214477539062, 0.01911306381225586, 0.020546913146972656, 0.021980762481689453, 0.02341461181640625, 0.024848461151123047, 0.026282310485839844, 0.02771615982055664, 0.029150009155273438, 0.030583858489990234, 0.03201770782470703, 0.03345155715942383, 0.034885406494140625, 0.03631925582885742, 0.03775310516357422, 0.039186954498291016, 0.04062080383300781, 0.04205465316772461, 0.043488502502441406, 0.0449223518371582, 0.046356201171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 11.0, 31.0, 30.0, 54.0, 70.0, 106.0, 173.0, 1188.0, 45064.0, 993602.0, 7277.0, 472.0, 146.0, 100.0, 58.0, 34.0, 34.0, 22.0, 15.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1376953125, -1.1024627685546875, -1.067230224609375, -1.0319976806640625, -0.99676513671875, -0.9615325927734375, -0.926300048828125, -0.8910675048828125, -0.8558349609375, -0.8206024169921875, -0.785369873046875, -0.7501373291015625, -0.71490478515625, -0.6796722412109375, -0.644439697265625, -0.6092071533203125, -0.573974609375, -0.5387420654296875, -0.503509521484375, -0.4682769775390625, -0.43304443359375, -0.3978118896484375, -0.362579345703125, -0.3273468017578125, -0.2921142578125, -0.2568817138671875, -0.221649169921875, -0.1864166259765625, -0.15118408203125, -0.1159515380859375, -0.080718994140625, -0.0454864501953125, -0.01025390625, 0.0249786376953125, 0.060211181640625, 0.0954437255859375, 0.13067626953125, 0.1659088134765625, 0.201141357421875, 0.2363739013671875, 0.2716064453125, 0.3068389892578125, 0.342071533203125, 0.3773040771484375, 0.41253662109375, 0.4477691650390625, 0.483001708984375, 0.5182342529296875, 0.553466796875, 0.5886993408203125, 0.623931884765625, 0.6591644287109375, 0.69439697265625, 0.7296295166015625, 0.764862060546875, 0.8000946044921875, 0.8353271484375, 0.8705596923828125, 0.905792236328125, 0.9410247802734375, 0.97625732421875, 1.0114898681640625, 1.046722412109375, 1.0819549560546875, 1.1171875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 15.0, 17.0, 34.0, 69.0, 121.0, 264.0, 240.0, 95.0, 64.0, 26.0, 21.0, 11.0, 8.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11927410215139389, -0.11261456459760666, -0.10595502704381943, -0.09929549694061279, -0.09263595938682556, -0.08597642183303833, -0.0793168842792511, -0.07265734672546387, -0.06599780917167664, -0.059338271617889404, -0.05267873778939247, -0.04601920023560524, -0.03935966640710831, -0.032700128853321075, -0.026040591299533844, -0.01938105747103691, -0.012721523642539978, -0.0060619874857366085, 0.000597548671066761, 0.007257085293531418, 0.0139166209846735, 0.020576156675815582, 0.027235694229602814, 0.03389522805809975, 0.04055476561188698, 0.04721430316567421, 0.05387383699417114, 0.060533374547958374, 0.0671929121017456, 0.07385244965553284, 0.08051198720932007, 0.0871715173125267, 0.09383104741573334, 0.10049058496952057, 0.1071501225233078, 0.11380966007709503, 0.12046919018030167, 0.1271287202835083, 0.13378825783729553, 0.14044779539108276, 0.14710733294487, 0.15376687049865723, 0.16042640805244446, 0.1670859456062317, 0.17374548316001892, 0.18040502071380615, 0.18706455826759338, 0.19372408092021942, 0.20038363337516785, 0.20704317092895508, 0.2137027084827423, 0.22036224603652954, 0.22702178359031677, 0.233681321144104, 0.24034085869789124, 0.24700038135051727, 0.2536599040031433, 0.26031944155693054, 0.2669789791107178, 0.273638516664505, 0.28029805421829224, 0.28695759177207947, 0.2936171293258667, 0.30027666687965393, 0.30693620443344116]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 8.0, 10.0, 11.0, 16.0, 13.0, 14.0, 21.0, 19.0, 26.0, 21.0, 19.0, 35.0, 41.0, 21.0, 31.0, 47.0, 31.0, 39.0, 35.0, 36.0, 39.0, 38.0, 38.0, 33.0, 46.0, 42.0, 29.0, 29.0, 21.0, 26.0, 31.0, 21.0, 17.0, 17.0, 15.0, 10.0, 6.0, 12.0, 8.0, 4.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020572364330291748, -0.019920574501156807, -0.019268784672021866, -0.018616994842886925, -0.017965205013751984, -0.017313415184617043, -0.0166616253554821, -0.01600983552634716, -0.01535804569721222, -0.014706255868077278, -0.014054466038942337, -0.013402676209807396, -0.012750886380672455, -0.012099096551537514, -0.011447306722402573, -0.010795516893267632, -0.01014372706413269, -0.00949193723499775, -0.008840147405862808, -0.008188357576727867, -0.007536567747592926, -0.006884777918457985, -0.006232988089323044, -0.005581198260188103, -0.004929408431053162, -0.0042776186019182205, -0.0036258287727832794, -0.0029740389436483383, -0.002322249114513397, -0.0016704592853784561, -0.001018669456243515, -0.0003668796271085739, 0.0002849102020263672, 0.0009367000311613083, 0.0015884898602962494, 0.0022402796894311905, 0.0028920695185661316, 0.0035438593477010727, 0.004195649176836014, 0.004847439005970955, 0.005499228835105896, 0.006151018664240837, 0.006802808493375778, 0.007454598322510719, 0.00810638815164566, 0.008758177980780602, 0.009409967809915543, 0.010061757639050484, 0.010713547468185425, 0.011365337297320366, 0.012017127126455307, 0.012668916955590248, 0.01332070678472519, 0.01397249661386013, 0.014624286442995071, 0.015276076272130013, 0.015927866101264954, 0.016579655930399895, 0.017231445759534836, 0.017883235588669777, 0.018535025417804718, 0.01918681524693966, 0.0198386050760746, 0.02049039490520954, 0.021142184734344482]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 11.0, 8.0, 17.0, 16.0, 24.0, 19.0, 24.0, 27.0, 29.0, 36.0, 42.0, 42.0, 38.0, 45.0, 42.0, 51.0, 40.0, 35.0, 40.0, 33.0, 39.0, 39.0, 40.0, 40.0, 40.0, 25.0, 24.0, 13.0, 12.0, 25.0, 8.0, 13.0, 9.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.888671875, -11.49609375, -11.103515625, -10.7109375, -10.318359375, -9.92578125, -9.533203125, -9.140625, -8.748046875, -8.35546875, -7.962890625, -7.5703125, -7.177734375, -6.78515625, -6.392578125, -6.0, -5.607421875, -5.21484375, -4.822265625, -4.4296875, -4.037109375, -3.64453125, -3.251953125, -2.859375, -2.466796875, -2.07421875, -1.681640625, -1.2890625, -0.896484375, -0.50390625, -0.111328125, 0.28125, 0.673828125, 1.06640625, 1.458984375, 1.8515625, 2.244140625, 2.63671875, 3.029296875, 3.421875, 3.814453125, 4.20703125, 4.599609375, 4.9921875, 5.384765625, 5.77734375, 6.169921875, 6.5625, 6.955078125, 7.34765625, 7.740234375, 8.1328125, 8.525390625, 8.91796875, 9.310546875, 9.703125, 10.095703125, 10.48828125, 10.880859375, 11.2734375, 11.666015625, 12.05859375, 12.451171875, 12.84375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 6.0, 4.0, 9.0, 13.0, 16.0, 20.0, 33.0, 53.0, 61.0, 72.0, 121.0, 158.0, 219.0, 341.0, 473.0, 695.0, 946.0, 1585.0, 2795.0, 5517.0, 18934.0, 177877.0, 761669.0, 56649.0, 10249.0, 3818.0, 2135.0, 1269.0, 877.0, 563.0, 415.0, 275.0, 185.0, 154.0, 108.0, 66.0, 52.0, 43.0, 17.0, 23.0, 12.0, 15.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.828125, -17.27587890625, -16.7236328125, -16.17138671875, -15.619140625, -15.06689453125, -14.5146484375, -13.96240234375, -13.41015625, -12.85791015625, -12.3056640625, -11.75341796875, -11.201171875, -10.64892578125, -10.0966796875, -9.54443359375, -8.9921875, -8.43994140625, -7.8876953125, -7.33544921875, -6.783203125, -6.23095703125, -5.6787109375, -5.12646484375, -4.57421875, -4.02197265625, -3.4697265625, -2.91748046875, -2.365234375, -1.81298828125, -1.2607421875, -0.70849609375, -0.15625, 0.39599609375, 0.9482421875, 1.50048828125, 2.052734375, 2.60498046875, 3.1572265625, 3.70947265625, 4.26171875, 4.81396484375, 5.3662109375, 5.91845703125, 6.470703125, 7.02294921875, 7.5751953125, 8.12744140625, 8.6796875, 9.23193359375, 9.7841796875, 10.33642578125, 10.888671875, 11.44091796875, 11.9931640625, 12.54541015625, 13.09765625, 13.64990234375, 14.2021484375, 14.75439453125, 15.306640625, 15.85888671875, 16.4111328125, 16.96337890625, 17.515625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 8.0, 17.0, 15.0, 13.0, 12.0, 23.0, 24.0, 27.0, 31.0, 28.0, 33.0, 33.0, 34.0, 41.0, 35.0, 43.0, 103.0, 1950.0, 101.0, 40.0, 46.0, 33.0, 39.0, 40.0, 33.0, 20.0, 25.0, 25.0, 30.0, 18.0, 17.0, 14.0, 9.0, 15.0, 10.0, 6.0, 4.0, 6.0, 5.0, 5.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-38.375, -37.19482421875, -36.0146484375, -34.83447265625, -33.654296875, -32.47412109375, -31.2939453125, -30.11376953125, -28.93359375, -27.75341796875, -26.5732421875, -25.39306640625, -24.212890625, -23.03271484375, -21.8525390625, -20.67236328125, -19.4921875, -18.31201171875, -17.1318359375, -15.95166015625, -14.771484375, -13.59130859375, -12.4111328125, -11.23095703125, -10.05078125, -8.87060546875, -7.6904296875, -6.51025390625, -5.330078125, -4.14990234375, -2.9697265625, -1.78955078125, -0.609375, 0.57080078125, 1.7509765625, 2.93115234375, 4.111328125, 5.29150390625, 6.4716796875, 7.65185546875, 8.83203125, 10.01220703125, 11.1923828125, 12.37255859375, 13.552734375, 14.73291015625, 15.9130859375, 17.09326171875, 18.2734375, 19.45361328125, 20.6337890625, 21.81396484375, 22.994140625, 24.17431640625, 25.3544921875, 26.53466796875, 27.71484375, 28.89501953125, 30.0751953125, 31.25537109375, 32.435546875, 33.61572265625, 34.7958984375, 35.97607421875, 37.15625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 8.0, 7.0, 6.0, 7.0, 13.0, 16.0, 16.0, 25.0, 26.0, 48.0, 56.0, 62.0, 109.0, 162.0, 317.0, 711.0, 2232.0, 11178.0, 3103699.0, 22132.0, 2988.0, 851.0, 384.0, 203.0, 124.0, 78.0, 55.0, 39.0, 31.0, 19.0, 18.0, 24.0, 9.0, 6.0, 12.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.875, -69.3623046875, -66.849609375, -64.3369140625, -61.82421875, -59.3115234375, -56.798828125, -54.2861328125, -51.7734375, -49.2607421875, -46.748046875, -44.2353515625, -41.72265625, -39.2099609375, -36.697265625, -34.1845703125, -31.671875, -29.1591796875, -26.646484375, -24.1337890625, -21.62109375, -19.1083984375, -16.595703125, -14.0830078125, -11.5703125, -9.0576171875, -6.544921875, -4.0322265625, -1.51953125, 0.9931640625, 3.505859375, 6.0185546875, 8.53125, 11.0439453125, 13.556640625, 16.0693359375, 18.58203125, 21.0947265625, 23.607421875, 26.1201171875, 28.6328125, 31.1455078125, 33.658203125, 36.1708984375, 38.68359375, 41.1962890625, 43.708984375, 46.2216796875, 48.734375, 51.2470703125, 53.759765625, 56.2724609375, 58.78515625, 61.2978515625, 63.810546875, 66.3232421875, 68.8359375, 71.3486328125, 73.861328125, 76.3740234375, 78.88671875, 81.3994140625, 83.912109375, 86.4248046875, 88.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 11.0, 26.0, 44.0, 92.0, 108.0, 154.0, 206.0, 161.0, 89.0, 64.0, 23.0, 11.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.517452239990234, -53.011497497558594, -51.50553894042969, -49.99958419799805, -48.493629455566406, -46.9876708984375, -45.48171615600586, -43.97576141357422, -42.46980285644531, -40.96384811401367, -39.457889556884766, -37.951934814453125, -36.44597625732422, -34.94002151489258, -33.43406677246094, -31.928110122680664, -30.42215347290039, -28.916196823120117, -27.410240173339844, -25.904285430908203, -24.39832878112793, -22.892372131347656, -21.386417388916016, -19.880460739135742, -18.37450408935547, -16.868547439575195, -15.362591743469238, -13.856636047363281, -12.350679397583008, -10.844722747802734, -9.338767051696777, -7.83281135559082, -6.326854705810547, -4.820898532867432, -3.3149423599243164, -1.8089861869812012, -0.30303001403808594, 1.2029261589050293, 2.7088823318481445, 4.214838027954102, 5.720794677734375, 7.22675085067749, 8.732707023620605, 10.238662719726562, 11.744619369506836, 13.25057601928711, 14.756531715393066, 16.262487411499023, 17.768444061279297, 19.27440071105957, 20.780357360839844, 22.286312103271484, 23.792268753051758, 25.29822540283203, 26.804180145263672, 28.310136795043945, 29.81609344482422, 31.322050094604492, 32.828006744384766, 34.333961486816406, 35.83992004394531, 37.34587478637695, 38.851829528808594, 40.3577880859375, 41.86374282836914]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 9.0, 14.0, 19.0, 19.0, 10.0, 33.0, 22.0, 32.0, 32.0, 35.0, 38.0, 38.0, 39.0, 41.0, 31.0, 49.0, 62.0, 37.0, 37.0, 41.0, 44.0, 38.0, 31.0, 32.0, 33.0, 29.0, 26.0, 14.0, 28.0, 18.0, 12.0, 11.0, 6.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.0409698486328, -124.08228302001953, -120.12360382080078, -116.1649169921875, -112.20623779296875, -108.24755096435547, -104.28886413574219, -100.33018493652344, -96.37149810791016, -92.41281127929688, -88.45413208007812, -84.49544525146484, -80.53675842285156, -76.57807922363281, -72.61939239501953, -68.66070556640625, -64.7020263671875, -60.743343353271484, -56.78466033935547, -52.82597351074219, -48.86729049682617, -44.908607482910156, -40.949920654296875, -36.99123764038086, -33.032554626464844, -29.073871612548828, -25.11518669128418, -21.15650177001953, -17.197818756103516, -13.2391357421875, -9.280450820922852, -5.321765899658203, -1.3630828857421875, 2.5956010818481445, 6.554285049438477, 10.512969017028809, 14.47165298461914, 18.430335998535156, 22.389020919799805, 26.347705841064453, 30.30638885498047, 34.265071868896484, 38.2237548828125, 42.18244171142578, 46.1411247253418, 50.09980773925781, 54.058494567871094, 58.01717758178711, 61.975860595703125, 65.9345474243164, 69.89322662353516, 73.85191345214844, 77.81059265136719, 81.76927947998047, 85.72796630859375, 89.6866455078125, 93.64533233642578, 97.60401916503906, 101.56269836425781, 105.5213851928711, 109.48007202148438, 113.43875122070312, 117.3974380493164, 121.35612487792969, 125.31480407714844]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 9.0, 5.0, 17.0, 21.0, 19.0, 13.0, 28.0, 29.0, 28.0, 32.0, 51.0, 44.0, 33.0, 43.0, 50.0, 46.0, 41.0, 42.0, 31.0, 42.0, 37.0, 34.0, 46.0, 40.0, 35.0, 32.0, 15.0, 14.0, 14.0, 19.0, 11.0, 15.0, 8.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.609375, -12.2059326171875, -11.802490234375, -11.3990478515625, -10.99560546875, -10.5921630859375, -10.188720703125, -9.7852783203125, -9.3818359375, -8.9783935546875, -8.574951171875, -8.1715087890625, -7.76806640625, -7.3646240234375, -6.961181640625, -6.5577392578125, -6.154296875, -5.7508544921875, -5.347412109375, -4.9439697265625, -4.54052734375, -4.1370849609375, -3.733642578125, -3.3302001953125, -2.9267578125, -2.5233154296875, -2.119873046875, -1.7164306640625, -1.31298828125, -0.9095458984375, -0.506103515625, -0.1026611328125, 0.30078125, 0.7042236328125, 1.107666015625, 1.5111083984375, 1.91455078125, 2.3179931640625, 2.721435546875, 3.1248779296875, 3.5283203125, 3.9317626953125, 4.335205078125, 4.7386474609375, 5.14208984375, 5.5455322265625, 5.948974609375, 6.3524169921875, 6.755859375, 7.1593017578125, 7.562744140625, 7.9661865234375, 8.36962890625, 8.7730712890625, 9.176513671875, 9.5799560546875, 9.9833984375, 10.3868408203125, 10.790283203125, 11.1937255859375, 11.59716796875, 12.0006103515625, 12.404052734375, 12.8074951171875, 13.2109375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 10.0, 2.0, 6.0, 7.0, 13.0, 21.0, 26.0, 28.0, 56.0, 74.0, 152.0, 240.0, 413.0, 655.0, 1126.0, 2000.0, 3791.0, 7390.0, 17567.0, 266943.0, 3569451.0, 290294.0, 18004.0, 7270.0, 3684.0, 2085.0, 1209.0, 698.0, 403.0, 237.0, 154.0, 80.0, 68.0, 34.0, 21.0, 20.0, 17.0, 10.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.625, -41.31396484375, -40.0029296875, -38.69189453125, -37.380859375, -36.06982421875, -34.7587890625, -33.44775390625, -32.13671875, -30.82568359375, -29.5146484375, -28.20361328125, -26.892578125, -25.58154296875, -24.2705078125, -22.95947265625, -21.6484375, -20.33740234375, -19.0263671875, -17.71533203125, -16.404296875, -15.09326171875, -13.7822265625, -12.47119140625, -11.16015625, -9.84912109375, -8.5380859375, -7.22705078125, -5.916015625, -4.60498046875, -3.2939453125, -1.98291015625, -0.671875, 0.63916015625, 1.9501953125, 3.26123046875, 4.572265625, 5.88330078125, 7.1943359375, 8.50537109375, 9.81640625, 11.12744140625, 12.4384765625, 13.74951171875, 15.060546875, 16.37158203125, 17.6826171875, 18.99365234375, 20.3046875, 21.61572265625, 22.9267578125, 24.23779296875, 25.548828125, 26.85986328125, 28.1708984375, 29.48193359375, 30.79296875, 32.10400390625, 33.4150390625, 34.72607421875, 36.037109375, 37.34814453125, 38.6591796875, 39.97021484375, 41.28125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 9.0, 5.0, 6.0, 6.0, 10.0, 8.0, 11.0, 18.0, 33.0, 51.0, 87.0, 177.0, 480.0, 931.0, 1041.0, 581.0, 283.0, 121.0, 61.0, 36.0, 28.0, 12.0, 21.0, 15.0, 3.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.0, -37.75048828125, -36.5009765625, -35.25146484375, -34.001953125, -32.75244140625, -31.5029296875, -30.25341796875, -29.00390625, -27.75439453125, -26.5048828125, -25.25537109375, -24.005859375, -22.75634765625, -21.5068359375, -20.25732421875, -19.0078125, -17.75830078125, -16.5087890625, -15.25927734375, -14.009765625, -12.76025390625, -11.5107421875, -10.26123046875, -9.01171875, -7.76220703125, -6.5126953125, -5.26318359375, -4.013671875, -2.76416015625, -1.5146484375, -0.26513671875, 0.984375, 2.23388671875, 3.4833984375, 4.73291015625, 5.982421875, 7.23193359375, 8.4814453125, 9.73095703125, 10.98046875, 12.22998046875, 13.4794921875, 14.72900390625, 15.978515625, 17.22802734375, 18.4775390625, 19.72705078125, 20.9765625, 22.22607421875, 23.4755859375, 24.72509765625, 25.974609375, 27.22412109375, 28.4736328125, 29.72314453125, 30.97265625, 32.22216796875, 33.4716796875, 34.72119140625, 35.970703125, 37.22021484375, 38.4697265625, 39.71923828125, 40.96875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 11.0, 12.0, 21.0, 35.0, 40.0, 79.0, 111.0, 129.0, 212.0, 322.0, 509.0, 800.0, 1142.0, 1812.0, 2926.0, 4846.0, 8742.0, 17545.0, 45119.0, 307881.0, 3448619.0, 271582.0, 43565.0, 16886.0, 8460.0, 4815.0, 2853.0, 1811.0, 1183.0, 715.0, 455.0, 350.0, 223.0, 174.0, 113.0, 50.0, 30.0, 23.0, 25.0, 18.0, 13.0, 7.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.21875, -39.71875, -38.21875, -36.71875, -35.21875, -33.71875, -32.21875, -30.71875, -29.21875, -27.71875, -26.21875, -24.71875, -23.21875, -21.71875, -20.21875, -18.71875, -17.21875, -15.71875, -14.21875, -12.71875, -11.21875, -9.71875, -8.21875, -6.71875, -5.21875, -3.71875, -2.21875, -0.71875, 0.78125, 2.28125, 3.78125, 5.28125, 6.78125, 8.28125, 9.78125, 11.28125, 12.78125, 14.28125, 15.78125, 17.28125, 18.78125, 20.28125, 21.78125, 23.28125, 24.78125, 26.28125, 27.78125, 29.28125, 30.78125, 32.28125, 33.78125, 35.28125, 36.78125, 38.28125, 39.78125, 41.28125, 42.78125, 44.28125, 45.78125, 47.28125, 48.78125, 50.28125, 51.78125, 53.28125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 8.0, 8.0, 6.0, 7.0, 6.0, 14.0, 17.0, 18.0, 39.0, 44.0, 61.0, 96.0, 119.0, 125.0, 115.0, 85.0, 56.0, 43.0, 30.0, 13.0, 17.0, 18.0, 12.0, 7.0, 8.0, 11.0, 1.0, 5.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-121.70426177978516, -117.93956756591797, -114.17488098144531, -110.41018676757812, -106.64549255371094, -102.88079833984375, -99.11610412597656, -95.3514175415039, -91.58672332763672, -87.82202911376953, -84.05734252929688, -80.29264831542969, -76.5279541015625, -72.76325988769531, -68.99856567382812, -65.23387908935547, -61.46918487548828, -57.704490661621094, -53.93980026245117, -50.17510986328125, -46.41041564941406, -42.645721435546875, -38.88103103637695, -35.11634063720703, -31.351646423339844, -27.58695411682129, -23.822261810302734, -20.05756950378418, -16.292877197265625, -12.52818489074707, -8.763492584228516, -4.998800277709961, -1.2341079711914062, 2.5305843353271484, 6.295276641845703, 10.059968948364258, 13.824661254882812, 17.589353561401367, 21.354045867919922, 25.118738174438477, 28.88343048095703, 32.64812469482422, 36.41281509399414, 40.17750549316406, 43.94219970703125, 47.70689392089844, 51.47158432006836, 55.23627471923828, 59.00096893310547, 62.765663146972656, 66.53034973144531, 70.2950439453125, 74.05973815917969, 77.82443237304688, 81.58912658691406, 85.35381317138672, 89.1185073852539, 92.8832015991211, 96.64788818359375, 100.41258239746094, 104.17727661132812, 107.94197082519531, 111.7066650390625, 115.47135162353516, 119.23604583740234]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 10.0, 10.0, 7.0, 11.0, 13.0, 15.0, 22.0, 20.0, 23.0, 21.0, 30.0, 28.0, 31.0, 29.0, 28.0, 41.0, 50.0, 44.0, 52.0, 35.0, 54.0, 50.0, 46.0, 37.0, 34.0, 31.0, 32.0, 26.0, 34.0, 24.0, 16.0, 18.0, 14.0, 10.0, 10.0, 12.0, 8.0, 9.0, 5.0, 2.0, 0.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.22354125976562, -81.3347396850586, -78.44593048095703, -75.55712890625, -72.66832733154297, -69.77952575683594, -66.89071655273438, -64.00191497802734, -61.11310958862305, -58.22430419921875, -55.33550262451172, -52.44669723510742, -49.557891845703125, -46.669090270996094, -43.7802848815918, -40.8914794921875, -38.00267791748047, -35.11387252807617, -32.22507095336914, -29.336265563964844, -26.44746208190918, -23.558658599853516, -20.66985321044922, -17.781049728393555, -14.89224624633789, -12.003442764282227, -9.114638328552246, -6.225833892822266, -3.3370304107666016, -0.4482269287109375, 2.4405784606933594, 5.329381942749023, 8.218185424804688, 11.106988906860352, 13.995793342590332, 16.884597778320312, 19.773401260375977, 22.66220474243164, 25.551010131835938, 28.4398136138916, 31.328617095947266, 34.21742248535156, 37.106224060058594, 39.99502944946289, 42.88383483886719, 45.77263641357422, 48.661441802978516, 51.55024719238281, 54.439048767089844, 57.32785415649414, 60.21665573120117, 63.10546112060547, 65.9942626953125, 68.88307189941406, 71.7718734741211, 74.66067504882812, 77.54948425292969, 80.43828582763672, 83.32709503173828, 86.21589660644531, 89.10469818115234, 91.99349975585938, 94.88230895996094, 97.77111053466797, 100.659912109375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 9.0, 13.0, 10.0, 16.0, 19.0, 22.0, 24.0, 40.0, 29.0, 35.0, 30.0, 35.0, 36.0, 54.0, 54.0, 44.0, 44.0, 39.0, 42.0, 43.0, 43.0, 36.0, 40.0, 28.0, 30.0, 31.0, 20.0, 14.0, 21.0, 9.0, 12.0, 12.0, 12.0, 12.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.083984375, -13.66015625, -13.236328125, -12.8125, -12.388671875, -11.96484375, -11.541015625, -11.1171875, -10.693359375, -10.26953125, -9.845703125, -9.421875, -8.998046875, -8.57421875, -8.150390625, -7.7265625, -7.302734375, -6.87890625, -6.455078125, -6.03125, -5.607421875, -5.18359375, -4.759765625, -4.3359375, -3.912109375, -3.48828125, -3.064453125, -2.640625, -2.216796875, -1.79296875, -1.369140625, -0.9453125, -0.521484375, -0.09765625, 0.326171875, 0.75, 1.173828125, 1.59765625, 2.021484375, 2.4453125, 2.869140625, 3.29296875, 3.716796875, 4.140625, 4.564453125, 4.98828125, 5.412109375, 5.8359375, 6.259765625, 6.68359375, 7.107421875, 7.53125, 7.955078125, 8.37890625, 8.802734375, 9.2265625, 9.650390625, 10.07421875, 10.498046875, 10.921875, 11.345703125, 11.76953125, 12.193359375, 12.6171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 16.0, 20.0, 21.0, 40.0, 46.0, 75.0, 109.0, 204.0, 306.0, 501.0, 783.0, 1315.0, 2224.0, 3715.0, 6279.0, 10634.0, 18509.0, 32781.0, 62056.0, 130434.0, 288271.0, 254085.0, 111762.0, 54668.0, 29391.0, 16475.0, 9680.0, 5749.0, 3242.0, 2017.0, 1195.0, 746.0, 419.0, 296.0, 152.0, 126.0, 78.0, 36.0, 33.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7900390625, -1.73211669921875, -1.6741943359375, -1.61627197265625, -1.558349609375, -1.50042724609375, -1.4425048828125, -1.38458251953125, -1.32666015625, -1.26873779296875, -1.2108154296875, -1.15289306640625, -1.094970703125, -1.03704833984375, -0.9791259765625, -0.92120361328125, -0.86328125, -0.80535888671875, -0.7474365234375, -0.68951416015625, -0.631591796875, -0.57366943359375, -0.5157470703125, -0.45782470703125, -0.39990234375, -0.34197998046875, -0.2840576171875, -0.22613525390625, -0.168212890625, -0.11029052734375, -0.0523681640625, 0.00555419921875, 0.0634765625, 0.12139892578125, 0.1793212890625, 0.23724365234375, 0.295166015625, 0.35308837890625, 0.4110107421875, 0.46893310546875, 0.52685546875, 0.58477783203125, 0.6427001953125, 0.70062255859375, 0.758544921875, 0.81646728515625, 0.8743896484375, 0.93231201171875, 0.990234375, 1.04815673828125, 1.1060791015625, 1.16400146484375, 1.221923828125, 1.27984619140625, 1.3377685546875, 1.39569091796875, 1.45361328125, 1.51153564453125, 1.5694580078125, 1.62738037109375, 1.685302734375, 1.74322509765625, 1.8011474609375, 1.85906982421875, 1.9169921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 6.0, 8.0, 10.0, 9.0, 11.0, 17.0, 22.0, 26.0, 22.0, 28.0, 26.0, 25.0, 34.0, 30.0, 32.0, 26.0, 44.0, 43.0, 36.0, 1065.0, 35.0, 50.0, 45.0, 34.0, 43.0, 24.0, 30.0, 24.0, 26.0, 40.0, 21.0, 14.0, 19.0, 20.0, 12.0, 7.0, 15.0, 9.0, 7.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.0390625, -7.792236328125, -7.54541015625, -7.298583984375, -7.0517578125, -6.804931640625, -6.55810546875, -6.311279296875, -6.064453125, -5.817626953125, -5.57080078125, -5.323974609375, -5.0771484375, -4.830322265625, -4.58349609375, -4.336669921875, -4.08984375, -3.843017578125, -3.59619140625, -3.349365234375, -3.1025390625, -2.855712890625, -2.60888671875, -2.362060546875, -2.115234375, -1.868408203125, -1.62158203125, -1.374755859375, -1.1279296875, -0.881103515625, -0.63427734375, -0.387451171875, -0.140625, 0.106201171875, 0.35302734375, 0.599853515625, 0.8466796875, 1.093505859375, 1.34033203125, 1.587158203125, 1.833984375, 2.080810546875, 2.32763671875, 2.574462890625, 2.8212890625, 3.068115234375, 3.31494140625, 3.561767578125, 3.80859375, 4.055419921875, 4.30224609375, 4.549072265625, 4.7958984375, 5.042724609375, 5.28955078125, 5.536376953125, 5.783203125, 6.030029296875, 6.27685546875, 6.523681640625, 6.7705078125, 7.017333984375, 7.26416015625, 7.510986328125, 7.7578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 18.0, 16.0, 37.0, 66.0, 96.0, 152.0, 210.0, 326.0, 446.0, 727.0, 1000.0, 1507.0, 2221.0, 3435.0, 5141.0, 7787.0, 11880.0, 17991.0, 28046.0, 45058.0, 75261.0, 132252.0, 1183360.0, 276062.0, 119283.0, 68693.0, 41181.0, 25713.0, 16424.0, 10920.0, 7192.0, 4871.0, 3214.0, 2218.0, 1410.0, 996.0, 612.0, 429.0, 320.0, 174.0, 117.0, 89.0, 60.0, 41.0, 23.0, 12.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7437820434570312, -0.7204742431640625, -0.6971664428710938, -0.673858642578125, -0.6505508422851562, -0.6272430419921875, -0.6039352416992188, -0.58062744140625, -0.5573196411132812, -0.5340118408203125, -0.5107040405273438, -0.487396240234375, -0.46408843994140625, -0.4407806396484375, -0.41747283935546875, -0.3941650390625, -0.37085723876953125, -0.3475494384765625, -0.32424163818359375, -0.300933837890625, -0.27762603759765625, -0.2543182373046875, -0.23101043701171875, -0.20770263671875, -0.18439483642578125, -0.1610870361328125, -0.13777923583984375, -0.114471435546875, -0.09116363525390625, -0.0678558349609375, -0.04454803466796875, -0.021240234375, 0.00206756591796875, 0.0253753662109375, 0.04868316650390625, 0.071990966796875, 0.09529876708984375, 0.1186065673828125, 0.14191436767578125, 0.16522216796875, 0.18852996826171875, 0.2118377685546875, 0.23514556884765625, 0.258453369140625, 0.28176116943359375, 0.3050689697265625, 0.32837677001953125, 0.3516845703125, 0.37499237060546875, 0.3983001708984375, 0.42160797119140625, 0.444915771484375, 0.46822357177734375, 0.4915313720703125, 0.5148391723632812, 0.53814697265625, 0.5614547729492188, 0.5847625732421875, 0.6080703735351562, 0.631378173828125, 0.6546859741210938, 0.6779937744140625, 0.7013015747070312, 0.724609375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 10.0, 11.0, 18.0, 20.0, 25.0, 43.0, 59.0, 72.0, 131.0, 190.0, 122.0, 77.0, 68.0, 41.0, 36.0, 24.0, 12.0, 9.0, 4.0, 1.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.031502723693847656, -0.030504226684570312, -0.02950572967529297, -0.028507232666015625, -0.02750873565673828, -0.026510238647460938, -0.025511741638183594, -0.02451324462890625, -0.023514747619628906, -0.022516250610351562, -0.02151775360107422, -0.020519256591796875, -0.01952075958251953, -0.018522262573242188, -0.017523765563964844, -0.0165252685546875, -0.015526771545410156, -0.014528274536132812, -0.013529777526855469, -0.012531280517578125, -0.011532783508300781, -0.010534286499023438, -0.009535789489746094, -0.00853729248046875, -0.007538795471191406, -0.0065402984619140625, -0.005541801452636719, -0.004543304443359375, -0.0035448074340820312, -0.0025463104248046875, -0.0015478134155273438, -0.00054931640625, 0.00044918060302734375, 0.0014476776123046875, 0.0024461746215820312, 0.003444671630859375, 0.004443168640136719, 0.0054416656494140625, 0.006440162658691406, 0.00743865966796875, 0.008437156677246094, 0.009435653686523438, 0.010434150695800781, 0.011432647705078125, 0.012431144714355469, 0.013429641723632812, 0.014428138732910156, 0.0154266357421875, 0.016425132751464844, 0.017423629760742188, 0.01842212677001953, 0.019420623779296875, 0.02041912078857422, 0.021417617797851562, 0.022416114807128906, 0.02341461181640625, 0.024413108825683594, 0.025411605834960938, 0.02641010284423828, 0.027408599853515625, 0.02840709686279297, 0.029405593872070312, 0.030404090881347656, 0.031402587890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 5.0, 14.0, 18.0, 21.0, 32.0, 33.0, 46.0, 67.0, 106.0, 123.0, 199.0, 347.0, 800.0, 3335.0, 25974.0, 921342.0, 87163.0, 6444.0, 1329.0, 438.0, 206.0, 123.0, 95.0, 62.0, 53.0, 29.0, 23.0, 25.0, 18.0, 13.0, 9.0, 5.0, 11.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49320220947265625, -0.4771270751953125, -0.46105194091796875, -0.444976806640625, -0.42890167236328125, -0.4128265380859375, -0.39675140380859375, -0.38067626953125, -0.36460113525390625, -0.3485260009765625, -0.33245086669921875, -0.316375732421875, -0.30030059814453125, -0.2842254638671875, -0.26815032958984375, -0.2520751953125, -0.23600006103515625, -0.2199249267578125, -0.20384979248046875, -0.187774658203125, -0.17169952392578125, -0.1556243896484375, -0.13954925537109375, -0.12347412109375, -0.10739898681640625, -0.0913238525390625, -0.07524871826171875, -0.059173583984375, -0.04309844970703125, -0.0270233154296875, -0.01094818115234375, 0.005126953125, 0.02120208740234375, 0.0372772216796875, 0.05335235595703125, 0.069427490234375, 0.08550262451171875, 0.1015777587890625, 0.11765289306640625, 0.13372802734375, 0.14980316162109375, 0.1658782958984375, 0.18195343017578125, 0.198028564453125, 0.21410369873046875, 0.2301788330078125, 0.24625396728515625, 0.2623291015625, 0.27840423583984375, 0.2944793701171875, 0.31055450439453125, 0.326629638671875, 0.34270477294921875, 0.3587799072265625, 0.37485504150390625, 0.39093017578125, 0.40700531005859375, 0.4230804443359375, 0.43915557861328125, 0.455230712890625, 0.47130584716796875, 0.4873809814453125, 0.5034561157226562, 0.51953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 16.0, 66.0, 250.0, 454.0, 128.0, 52.0, 16.0, 12.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2257242053747177, -0.21600471436977386, -0.20628522336483002, -0.19656573235988617, -0.18684624135494232, -0.17712675034999847, -0.16740724444389343, -0.15768775343894958, -0.14796826243400574, -0.1382487714290619, -0.12852928042411804, -0.1188097894191742, -0.10909029841423035, -0.0993708074092865, -0.08965130895376205, -0.0799318179488182, -0.07021233439445496, -0.06049284338951111, -0.05077335238456726, -0.041053857654333115, -0.03133436664938927, -0.02161487564444542, -0.011895380914211273, -0.0021758899092674255, 0.007543601095676422, 0.01726309210062027, 0.026982584968209267, 0.036702077835798264, 0.04642156884074211, 0.05614105984568596, 0.0658605545759201, 0.07558004558086395, 0.0852995216846466, 0.09501901268959045, 0.1047385036945343, 0.11445799469947815, 0.124177485704422, 0.13389697670936584, 0.1436164677143097, 0.15333595871925354, 0.1630554497241974, 0.17277494072914124, 0.18249443173408508, 0.19221392273902893, 0.20193341374397278, 0.21165290474891663, 0.22137239575386047, 0.23109188675880432, 0.24081139266490936, 0.2505308985710144, 0.26025038957595825, 0.2699698805809021, 0.27968937158584595, 0.2894088625907898, 0.29912835359573364, 0.3088478446006775, 0.31856733560562134, 0.3282868266105652, 0.33800631761550903, 0.3477258086204529, 0.35744529962539673, 0.3671647906303406, 0.3768842816352844, 0.38660377264022827, 0.3963232636451721]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 21.0, 13.0, 20.0, 18.0, 16.0, 21.0, 34.0, 33.0, 26.0, 31.0, 31.0, 39.0, 48.0, 46.0, 39.0, 32.0, 43.0, 32.0, 36.0, 37.0, 41.0, 30.0, 26.0, 20.0, 37.0, 29.0, 28.0, 23.0, 21.0, 16.0, 13.0, 11.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01572597026824951, -0.015226421877741814, -0.014726873487234116, -0.014227325096726418, -0.01372777670621872, -0.013228228315711021, -0.012728679925203323, -0.012229131534695625, -0.011729583144187927, -0.01123003475368023, -0.010730486363172531, -0.010230937972664833, -0.009731389582157135, -0.009231841191649437, -0.008732292801141739, -0.00823274441063404, -0.007733196020126343, -0.007233647629618645, -0.006734099239110947, -0.006234550848603249, -0.0057350024580955505, -0.0052354540675878525, -0.004735905677080154, -0.004236357286572456, -0.0037368088960647583, -0.0032372605055570602, -0.002737712115049362, -0.002238163724541664, -0.001738615334033966, -0.001239066943526268, -0.00073951855301857, -0.0002399701625108719, 0.00025957822799682617, 0.0007591266185045242, 0.0012586750090122223, 0.0017582233995199203, 0.0022577717900276184, 0.0027573201805353165, 0.0032568685710430145, 0.0037564169615507126, 0.004255965352058411, 0.004755513742566109, 0.005255062133073807, 0.005754610523581505, 0.006254158914089203, 0.006753707304596901, 0.007253255695104599, 0.007752804085612297, 0.008252352476119995, 0.008751900866627693, 0.009251449257135391, 0.00975099764764309, 0.010250546038150787, 0.010750094428658485, 0.011249642819166183, 0.011749191209673882, 0.01224873960018158, 0.012748287990689278, 0.013247836381196976, 0.013747384771704674, 0.014246933162212372, 0.01474648155272007, 0.015246029943227768, 0.015745578333735466, 0.016245126724243164]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 9.0, 13.0, 11.0, 15.0, 20.0, 21.0, 25.0, 40.0, 31.0, 34.0, 28.0, 35.0, 36.0, 54.0, 55.0, 44.0, 44.0, 38.0, 44.0, 42.0, 43.0, 35.0, 40.0, 30.0, 28.0, 32.0, 19.0, 15.0, 20.0, 9.0, 13.0, 12.0, 11.0, 12.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5, -14.076171875, -13.65234375, -13.228515625, -12.8046875, -12.380859375, -11.95703125, -11.533203125, -11.109375, -10.685546875, -10.26171875, -9.837890625, -9.4140625, -8.990234375, -8.56640625, -8.142578125, -7.71875, -7.294921875, -6.87109375, -6.447265625, -6.0234375, -5.599609375, -5.17578125, -4.751953125, -4.328125, -3.904296875, -3.48046875, -3.056640625, -2.6328125, -2.208984375, -1.78515625, -1.361328125, -0.9375, -0.513671875, -0.08984375, 0.333984375, 0.7578125, 1.181640625, 1.60546875, 2.029296875, 2.453125, 2.876953125, 3.30078125, 3.724609375, 4.1484375, 4.572265625, 4.99609375, 5.419921875, 5.84375, 6.267578125, 6.69140625, 7.115234375, 7.5390625, 7.962890625, 8.38671875, 8.810546875, 9.234375, 9.658203125, 10.08203125, 10.505859375, 10.9296875, 11.353515625, 11.77734375, 12.201171875, 12.625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 8.0, 12.0, 11.0, 15.0, 16.0, 28.0, 41.0, 54.0, 70.0, 106.0, 209.0, 316.0, 566.0, 1085.0, 2319.0, 5073.0, 12701.0, 36259.0, 129081.0, 522457.0, 246274.0, 58576.0, 19358.0, 7454.0, 3147.0, 1481.0, 746.0, 416.0, 219.0, 145.0, 78.0, 50.0, 37.0, 37.0, 35.0, 15.0, 17.0, 13.0, 7.0, 8.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5625, -8.3157958984375, -8.069091796875, -7.8223876953125, -7.57568359375, -7.3289794921875, -7.082275390625, -6.8355712890625, -6.5888671875, -6.3421630859375, -6.095458984375, -5.8487548828125, -5.60205078125, -5.3553466796875, -5.108642578125, -4.8619384765625, -4.615234375, -4.3685302734375, -4.121826171875, -3.8751220703125, -3.62841796875, -3.3817138671875, -3.135009765625, -2.8883056640625, -2.6416015625, -2.3948974609375, -2.148193359375, -1.9014892578125, -1.65478515625, -1.4080810546875, -1.161376953125, -0.9146728515625, -0.66796875, -0.4212646484375, -0.174560546875, 0.0721435546875, 0.31884765625, 0.5655517578125, 0.812255859375, 1.0589599609375, 1.3056640625, 1.5523681640625, 1.799072265625, 2.0457763671875, 2.29248046875, 2.5391845703125, 2.785888671875, 3.0325927734375, 3.279296875, 3.5260009765625, 3.772705078125, 4.0194091796875, 4.26611328125, 4.5128173828125, 4.759521484375, 5.0062255859375, 5.2529296875, 5.4996337890625, 5.746337890625, 5.9930419921875, 6.23974609375, 6.4864501953125, 6.733154296875, 6.9798583984375, 7.2265625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 6.0, 8.0, 13.0, 10.0, 10.0, 11.0, 18.0, 25.0, 27.0, 27.0, 33.0, 25.0, 44.0, 37.0, 48.0, 32.0, 37.0, 53.0, 150.0, 1888.0, 108.0, 40.0, 38.0, 31.0, 33.0, 43.0, 31.0, 28.0, 31.0, 29.0, 22.0, 16.0, 16.0, 13.0, 10.0, 9.0, 7.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.4375, -41.08642578125, -39.7353515625, -38.38427734375, -37.033203125, -35.68212890625, -34.3310546875, -32.97998046875, -31.62890625, -30.27783203125, -28.9267578125, -27.57568359375, -26.224609375, -24.87353515625, -23.5224609375, -22.17138671875, -20.8203125, -19.46923828125, -18.1181640625, -16.76708984375, -15.416015625, -14.06494140625, -12.7138671875, -11.36279296875, -10.01171875, -8.66064453125, -7.3095703125, -5.95849609375, -4.607421875, -3.25634765625, -1.9052734375, -0.55419921875, 0.796875, 2.14794921875, 3.4990234375, 4.85009765625, 6.201171875, 7.55224609375, 8.9033203125, 10.25439453125, 11.60546875, 12.95654296875, 14.3076171875, 15.65869140625, 17.009765625, 18.36083984375, 19.7119140625, 21.06298828125, 22.4140625, 23.76513671875, 25.1162109375, 26.46728515625, 27.818359375, 29.16943359375, 30.5205078125, 31.87158203125, 33.22265625, 34.57373046875, 35.9248046875, 37.27587890625, 38.626953125, 39.97802734375, 41.3291015625, 42.68017578125, 44.03125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 6.0, 10.0, 16.0, 18.0, 11.0, 25.0, 28.0, 37.0, 56.0, 58.0, 93.0, 111.0, 125.0, 186.0, 355.0, 794.0, 5153.0, 3109949.0, 25971.0, 1271.0, 417.0, 217.0, 199.0, 114.0, 98.0, 72.0, 61.0, 50.0, 37.0, 29.0, 29.0, 11.0, 10.0, 14.0, 10.0, 7.0, 8.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-89.5, -86.841796875, -84.18359375, -81.525390625, -78.8671875, -76.208984375, -73.55078125, -70.892578125, -68.234375, -65.576171875, -62.91796875, -60.259765625, -57.6015625, -54.943359375, -52.28515625, -49.626953125, -46.96875, -44.310546875, -41.65234375, -38.994140625, -36.3359375, -33.677734375, -31.01953125, -28.361328125, -25.703125, -23.044921875, -20.38671875, -17.728515625, -15.0703125, -12.412109375, -9.75390625, -7.095703125, -4.4375, -1.779296875, 0.87890625, 3.537109375, 6.1953125, 8.853515625, 11.51171875, 14.169921875, 16.828125, 19.486328125, 22.14453125, 24.802734375, 27.4609375, 30.119140625, 32.77734375, 35.435546875, 38.09375, 40.751953125, 43.41015625, 46.068359375, 48.7265625, 51.384765625, 54.04296875, 56.701171875, 59.359375, 62.017578125, 64.67578125, 67.333984375, 69.9921875, 72.650390625, 75.30859375, 77.966796875, 80.625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 535.0, 480.0], "bins": [-804.3517456054688, -791.5792236328125, -778.806640625, -766.0341186523438, -753.2615966796875, -740.489013671875, -727.7164916992188, -714.9439697265625, -702.1714477539062, -689.39892578125, -676.6263427734375, -663.8538208007812, -651.081298828125, -638.3087158203125, -625.5361938476562, -612.763671875, -599.9910888671875, -587.2185668945312, -574.4459838867188, -561.6734619140625, -548.9009399414062, -536.12841796875, -523.3558349609375, -510.58331298828125, -497.810791015625, -485.0382385253906, -472.2657165527344, -459.4931640625, -446.72064208984375, -433.9480895996094, -421.175537109375, -408.40301513671875, -395.6304626464844, -382.85791015625, -370.08538818359375, -357.3128356933594, -344.5403137207031, -331.76776123046875, -318.9952392578125, -306.2226867675781, -293.45013427734375, -280.6775817871094, -267.9050598144531, -255.13250732421875, -242.35997009277344, -229.58743286132812, -216.8148956298828, -204.0423583984375, -191.2698211669922, -178.49728393554688, -165.72474670410156, -152.95220947265625, -140.17965698242188, -127.40711975097656, -114.63458251953125, -101.8620376586914, -89.08950805664062, -76.31697082519531, -63.54442596435547, -50.771888732910156, -37.99934768676758, -25.226806640625, -12.454269409179688, 0.31827545166015625, 13.090814590454102]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 3.0, 3.0, 9.0, 7.0, 8.0, 10.0, 8.0, 12.0, 8.0, 19.0, 12.0, 23.0, 13.0, 25.0, 29.0, 31.0, 34.0, 39.0, 38.0, 30.0, 38.0, 37.0, 37.0, 52.0, 49.0, 47.0, 31.0, 45.0, 39.0, 32.0, 27.0, 32.0, 26.0, 23.0, 19.0, 18.0, 12.0, 15.0, 12.0, 11.0, 13.0, 6.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-108.20925903320312, -104.6911392211914, -101.17302703857422, -97.6549072265625, -94.13679504394531, -90.6186752319336, -87.10055541992188, -83.58244323730469, -80.0643310546875, -76.54621124267578, -73.0280990600586, -69.50997924804688, -65.99186706542969, -62.47374725341797, -58.955631256103516, -55.43751525878906, -51.919395446777344, -48.40127944946289, -44.88316345214844, -41.36504364013672, -37.84693145751953, -34.32881164550781, -30.81069564819336, -27.292579650878906, -23.774463653564453, -20.25634765625, -16.738231658935547, -13.220113754272461, -9.701997756958008, -6.183881759643555, -2.6657638549804688, 0.8523521423339844, 4.370460510253906, 7.888576984405518, 11.406693458557129, 14.924810409545898, 18.44292640686035, 21.961042404174805, 25.47916030883789, 28.997276306152344, 32.5153923034668, 36.03350830078125, 39.5516242980957, 43.069740295410156, 46.587860107421875, 50.10597229003906, 53.62409210205078, 57.142208099365234, 60.66032409667969, 64.1784439086914, 67.6965560913086, 71.21467590332031, 74.7327880859375, 78.25090789794922, 81.76902770996094, 85.28713989257812, 88.80525207519531, 92.32337188720703, 95.84148406982422, 99.35960388183594, 102.87771606445312, 106.39583587646484, 109.91395568847656, 113.43206787109375, 116.95018768310547]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 10.0, 10.0, 15.0, 8.0, 19.0, 22.0, 25.0, 39.0, 27.0, 43.0, 31.0, 30.0, 38.0, 42.0, 54.0, 52.0, 48.0, 36.0, 44.0, 43.0, 37.0, 46.0, 41.0, 28.0, 23.0, 26.0, 25.0, 17.0, 20.0, 9.0, 13.0, 16.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.578125, -14.15380859375, -13.7294921875, -13.30517578125, -12.880859375, -12.45654296875, -12.0322265625, -11.60791015625, -11.18359375, -10.75927734375, -10.3349609375, -9.91064453125, -9.486328125, -9.06201171875, -8.6376953125, -8.21337890625, -7.7890625, -7.36474609375, -6.9404296875, -6.51611328125, -6.091796875, -5.66748046875, -5.2431640625, -4.81884765625, -4.39453125, -3.97021484375, -3.5458984375, -3.12158203125, -2.697265625, -2.27294921875, -1.8486328125, -1.42431640625, -1.0, -0.57568359375, -0.1513671875, 0.27294921875, 0.697265625, 1.12158203125, 1.5458984375, 1.97021484375, 2.39453125, 2.81884765625, 3.2431640625, 3.66748046875, 4.091796875, 4.51611328125, 4.9404296875, 5.36474609375, 5.7890625, 6.21337890625, 6.6376953125, 7.06201171875, 7.486328125, 7.91064453125, 8.3349609375, 8.75927734375, 9.18359375, 9.60791015625, 10.0322265625, 10.45654296875, 10.880859375, 11.30517578125, 11.7294921875, 12.15380859375, 12.578125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 12.0, 15.0, 12.0, 16.0, 19.0, 27.0, 48.0, 65.0, 102.0, 134.0, 239.0, 396.0, 758.0, 1507.0, 3345.0, 8351.0, 38971.0, 3227112.0, 881874.0, 19818.0, 6058.0, 2613.0, 1215.0, 631.0, 332.0, 196.0, 115.0, 77.0, 52.0, 41.0, 27.0, 13.0, 11.0, 13.0, 17.0, 8.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.375, -58.5908203125, -56.806640625, -55.0224609375, -53.23828125, -51.4541015625, -49.669921875, -47.8857421875, -46.1015625, -44.3173828125, -42.533203125, -40.7490234375, -38.96484375, -37.1806640625, -35.396484375, -33.6123046875, -31.828125, -30.0439453125, -28.259765625, -26.4755859375, -24.69140625, -22.9072265625, -21.123046875, -19.3388671875, -17.5546875, -15.7705078125, -13.986328125, -12.2021484375, -10.41796875, -8.6337890625, -6.849609375, -5.0654296875, -3.28125, -1.4970703125, 0.287109375, 2.0712890625, 3.85546875, 5.6396484375, 7.423828125, 9.2080078125, 10.9921875, 12.7763671875, 14.560546875, 16.3447265625, 18.12890625, 19.9130859375, 21.697265625, 23.4814453125, 25.265625, 27.0498046875, 28.833984375, 30.6181640625, 32.40234375, 34.1865234375, 35.970703125, 37.7548828125, 39.5390625, 41.3232421875, 43.107421875, 44.8916015625, 46.67578125, 48.4599609375, 50.244140625, 52.0283203125, 53.8125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 4.0, 5.0, 9.0, 7.0, 9.0, 7.0, 12.0, 11.0, 17.0, 17.0, 25.0, 28.0, 49.0, 79.0, 178.0, 327.0, 641.0, 879.0, 764.0, 422.0, 222.0, 129.0, 69.0, 26.0, 21.0, 18.0, 14.0, 14.0, 12.0, 5.0, 5.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.40625, -34.38671875, -33.3671875, -32.34765625, -31.328125, -30.30859375, -29.2890625, -28.26953125, -27.25, -26.23046875, -25.2109375, -24.19140625, -23.171875, -22.15234375, -21.1328125, -20.11328125, -19.09375, -18.07421875, -17.0546875, -16.03515625, -15.015625, -13.99609375, -12.9765625, -11.95703125, -10.9375, -9.91796875, -8.8984375, -7.87890625, -6.859375, -5.83984375, -4.8203125, -3.80078125, -2.78125, -1.76171875, -0.7421875, 0.27734375, 1.296875, 2.31640625, 3.3359375, 4.35546875, 5.375, 6.39453125, 7.4140625, 8.43359375, 9.453125, 10.47265625, 11.4921875, 12.51171875, 13.53125, 14.55078125, 15.5703125, 16.58984375, 17.609375, 18.62890625, 19.6484375, 20.66796875, 21.6875, 22.70703125, 23.7265625, 24.74609375, 25.765625, 26.78515625, 27.8046875, 28.82421875, 29.84375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 9.0, 7.0, 7.0, 23.0, 35.0, 75.0, 149.0, 247.0, 449.0, 839.0, 1760.0, 3441.0, 7470.0, 17801.0, 57515.0, 1956658.0, 2057528.0, 57897.0, 17732.0, 7434.0, 3519.0, 1732.0, 886.0, 478.0, 250.0, 129.0, 66.0, 57.0, 22.0, 19.0, 5.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.65625, -59.45458984375, -57.2529296875, -55.05126953125, -52.849609375, -50.64794921875, -48.4462890625, -46.24462890625, -44.04296875, -41.84130859375, -39.6396484375, -37.43798828125, -35.236328125, -33.03466796875, -30.8330078125, -28.63134765625, -26.4296875, -24.22802734375, -22.0263671875, -19.82470703125, -17.623046875, -15.42138671875, -13.2197265625, -11.01806640625, -8.81640625, -6.61474609375, -4.4130859375, -2.21142578125, -0.009765625, 2.19189453125, 4.3935546875, 6.59521484375, 8.796875, 10.99853515625, 13.2001953125, 15.40185546875, 17.603515625, 19.80517578125, 22.0068359375, 24.20849609375, 26.41015625, 28.61181640625, 30.8134765625, 33.01513671875, 35.216796875, 37.41845703125, 39.6201171875, 41.82177734375, 44.0234375, 46.22509765625, 48.4267578125, 50.62841796875, 52.830078125, 55.03173828125, 57.2333984375, 59.43505859375, 61.63671875, 63.83837890625, 66.0400390625, 68.24169921875, 70.443359375, 72.64501953125, 74.8466796875, 77.04833984375, 79.25]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 6.0, 12.0, 17.0, 23.0, 51.0, 63.0, 101.0, 167.0, 157.0, 135.0, 75.0, 51.0, 37.0, 22.0, 14.0, 14.0, 10.0, 11.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.67414855957031, -104.3000717163086, -98.92598724365234, -93.55191040039062, -88.17782592773438, -82.80374908447266, -77.42967224121094, -72.05558776855469, -66.68151092529297, -61.307430267333984, -55.933349609375, -50.55927276611328, -45.1851921081543, -39.81111145019531, -34.437034606933594, -29.06295394897461, -23.688873291015625, -18.31479263305664, -12.940713882446289, -7.5666351318359375, -2.192554473876953, 3.1815261840820312, 8.55560302734375, 13.929683685302734, 19.30376434326172, 24.677845001220703, 30.051923751831055, 35.426002502441406, 40.80008316040039, 46.174163818359375, 51.548240661621094, 56.92232131958008, 62.296417236328125, 67.67049407958984, 73.0445785522461, 78.41865539550781, 83.79273986816406, 89.16681671142578, 94.5408935546875, 99.91497802734375, 105.28905487060547, 110.66313171386719, 116.03721618652344, 121.41129302978516, 126.78536987304688, 132.15945434570312, 137.53353881835938, 142.90760803222656, 148.2816925048828, 153.65577697753906, 159.02984619140625, 164.4039306640625, 169.77801513671875, 175.152099609375, 180.5261688232422, 185.90025329589844, 191.27432250976562, 196.64840698242188, 202.02247619628906, 207.3965606689453, 212.77064514160156, 218.14471435546875, 223.518798828125, 228.89288330078125, 234.2669677734375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 7.0, 8.0, 20.0, 21.0, 14.0, 21.0, 17.0, 11.0, 26.0, 28.0, 30.0, 30.0, 30.0, 42.0, 45.0, 39.0, 52.0, 43.0, 41.0, 33.0, 38.0, 35.0, 41.0, 32.0, 33.0, 33.0, 35.0, 24.0, 18.0, 16.0, 17.0, 20.0, 12.0, 13.0, 15.0, 13.0, 4.0, 9.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-88.70303344726562, -85.9404525756836, -83.17787170410156, -80.41529846191406, -77.65271759033203, -74.89013671875, -72.12755584716797, -69.36497497558594, -66.60240173339844, -63.839820861816406, -61.07724380493164, -58.31466293334961, -55.552085876464844, -52.78950500488281, -50.02692413330078, -47.26434326171875, -44.50176239013672, -41.73918151855469, -38.97660446166992, -36.21402359008789, -33.451446533203125, -30.688865661621094, -27.926284790039062, -25.163705825805664, -22.401126861572266, -19.638547897338867, -16.87596893310547, -14.113388061523438, -11.350809097290039, -8.58823013305664, -5.825649261474609, -3.063070297241211, -0.30049896240234375, 2.462080478668213, 5.2246599197387695, 7.987239837646484, 10.749818801879883, 13.512397766113281, 16.274978637695312, 19.03755760192871, 21.80013656616211, 24.562715530395508, 27.325294494628906, 30.087875366210938, 32.85045623779297, 35.613033294677734, 38.375614166259766, 41.13819122314453, 43.90077209472656, 46.663352966308594, 49.42593002319336, 52.18851089477539, 54.951087951660156, 57.71366882324219, 60.47624969482422, 63.23883056640625, 66.00140380859375, 68.76398468017578, 71.52656555175781, 74.28913879394531, 77.05171966552734, 79.81430053710938, 82.5768814086914, 85.33946228027344, 88.10204315185547]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 14.0, 8.0, 18.0, 18.0, 11.0, 23.0, 21.0, 31.0, 37.0, 44.0, 26.0, 40.0, 31.0, 40.0, 58.0, 47.0, 47.0, 40.0, 44.0, 36.0, 31.0, 39.0, 36.0, 28.0, 27.0, 28.0, 27.0, 25.0, 19.0, 13.0, 15.0, 8.0, 12.0, 6.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.9375, -13.5235595703125, -13.109619140625, -12.6956787109375, -12.28173828125, -11.8677978515625, -11.453857421875, -11.0399169921875, -10.6259765625, -10.2120361328125, -9.798095703125, -9.3841552734375, -8.97021484375, -8.5562744140625, -8.142333984375, -7.7283935546875, -7.314453125, -6.9005126953125, -6.486572265625, -6.0726318359375, -5.65869140625, -5.2447509765625, -4.830810546875, -4.4168701171875, -4.0029296875, -3.5889892578125, -3.175048828125, -2.7611083984375, -2.34716796875, -1.9332275390625, -1.519287109375, -1.1053466796875, -0.69140625, -0.2774658203125, 0.136474609375, 0.5504150390625, 0.96435546875, 1.3782958984375, 1.792236328125, 2.2061767578125, 2.6201171875, 3.0340576171875, 3.447998046875, 3.8619384765625, 4.27587890625, 4.6898193359375, 5.103759765625, 5.5177001953125, 5.931640625, 6.3455810546875, 6.759521484375, 7.1734619140625, 7.58740234375, 8.0013427734375, 8.415283203125, 8.8292236328125, 9.2431640625, 9.6571044921875, 10.071044921875, 10.4849853515625, 10.89892578125, 11.3128662109375, 11.726806640625, 12.1407470703125, 12.5546875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 5.0, 6.0, 16.0, 18.0, 27.0, 46.0, 68.0, 106.0, 169.0, 265.0, 363.0, 569.0, 782.0, 1159.0, 1752.0, 2398.0, 3775.0, 5636.0, 8416.0, 13411.0, 20949.0, 33847.0, 56956.0, 101411.0, 190447.0, 249411.0, 150500.0, 80700.0, 46652.0, 27766.0, 17628.0, 11219.0, 7398.0, 4822.0, 3235.0, 2176.0, 1470.0, 953.0, 671.0, 410.0, 270.0, 230.0, 150.0, 93.0, 57.0, 46.0, 48.0, 28.0, 12.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.44549560546875, -1.4007568359375, -1.35601806640625, -1.311279296875, -1.26654052734375, -1.2218017578125, -1.17706298828125, -1.13232421875, -1.08758544921875, -1.0428466796875, -0.99810791015625, -0.953369140625, -0.90863037109375, -0.8638916015625, -0.81915283203125, -0.7744140625, -0.72967529296875, -0.6849365234375, -0.64019775390625, -0.595458984375, -0.55072021484375, -0.5059814453125, -0.46124267578125, -0.41650390625, -0.37176513671875, -0.3270263671875, -0.28228759765625, -0.237548828125, -0.19281005859375, -0.1480712890625, -0.10333251953125, -0.05859375, -0.01385498046875, 0.0308837890625, 0.07562255859375, 0.120361328125, 0.16510009765625, 0.2098388671875, 0.25457763671875, 0.29931640625, 0.34405517578125, 0.3887939453125, 0.43353271484375, 0.478271484375, 0.52301025390625, 0.5677490234375, 0.61248779296875, 0.6572265625, 0.70196533203125, 0.7467041015625, 0.79144287109375, 0.836181640625, 0.88092041015625, 0.9256591796875, 0.97039794921875, 1.01513671875, 1.05987548828125, 1.1046142578125, 1.14935302734375, 1.194091796875, 1.23883056640625, 1.2835693359375, 1.32830810546875, 1.373046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 15.0, 8.0, 6.0, 11.0, 9.0, 19.0, 16.0, 15.0, 18.0, 37.0, 34.0, 42.0, 40.0, 46.0, 39.0, 46.0, 46.0, 1059.0, 32.0, 55.0, 34.0, 38.0, 36.0, 42.0, 37.0, 30.0, 37.0, 30.0, 24.0, 23.0, 15.0, 21.0, 13.0, 10.0, 12.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -7.994384765625, -7.70751953125, -7.420654296875, -7.1337890625, -6.846923828125, -6.56005859375, -6.273193359375, -5.986328125, -5.699462890625, -5.41259765625, -5.125732421875, -4.8388671875, -4.552001953125, -4.26513671875, -3.978271484375, -3.69140625, -3.404541015625, -3.11767578125, -2.830810546875, -2.5439453125, -2.257080078125, -1.97021484375, -1.683349609375, -1.396484375, -1.109619140625, -0.82275390625, -0.535888671875, -0.2490234375, 0.037841796875, 0.32470703125, 0.611572265625, 0.8984375, 1.185302734375, 1.47216796875, 1.759033203125, 2.0458984375, 2.332763671875, 2.61962890625, 2.906494140625, 3.193359375, 3.480224609375, 3.76708984375, 4.053955078125, 4.3408203125, 4.627685546875, 4.91455078125, 5.201416015625, 5.48828125, 5.775146484375, 6.06201171875, 6.348876953125, 6.6357421875, 6.922607421875, 7.20947265625, 7.496337890625, 7.783203125, 8.070068359375, 8.35693359375, 8.643798828125, 8.9306640625, 9.217529296875, 9.50439453125, 9.791259765625, 10.078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 10.0, 6.0, 11.0, 26.0, 23.0, 34.0, 51.0, 95.0, 141.0, 208.0, 353.0, 531.0, 779.0, 1158.0, 1703.0, 2637.0, 4079.0, 6391.0, 9630.0, 15220.0, 23818.0, 39471.0, 67695.0, 122264.0, 325804.0, 1158663.0, 131262.0, 72534.0, 42149.0, 25421.0, 15888.0, 10039.0, 6544.0, 4345.0, 2797.0, 1869.0, 1224.0, 773.0, 498.0, 325.0, 210.0, 146.0, 101.0, 66.0, 51.0, 34.0, 23.0, 12.0, 16.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.861328125, -0.8352737426757812, -0.8092193603515625, -0.7831649780273438, -0.757110595703125, -0.7310562133789062, -0.7050018310546875, -0.6789474487304688, -0.65289306640625, -0.6268386840820312, -0.6007843017578125, -0.5747299194335938, -0.548675537109375, -0.5226211547851562, -0.4965667724609375, -0.47051239013671875, -0.4444580078125, -0.41840362548828125, -0.3923492431640625, -0.36629486083984375, -0.340240478515625, -0.31418609619140625, -0.2881317138671875, -0.26207733154296875, -0.23602294921875, -0.20996856689453125, -0.1839141845703125, -0.15785980224609375, -0.131805419921875, -0.10575103759765625, -0.0796966552734375, -0.05364227294921875, -0.027587890625, -0.00153350830078125, 0.0245208740234375, 0.05057525634765625, 0.076629638671875, 0.10268402099609375, 0.1287384033203125, 0.15479278564453125, 0.18084716796875, 0.20690155029296875, 0.2329559326171875, 0.25901031494140625, 0.285064697265625, 0.31111907958984375, 0.3371734619140625, 0.36322784423828125, 0.3892822265625, 0.41533660888671875, 0.4413909912109375, 0.46744537353515625, 0.493499755859375, 0.5195541381835938, 0.5456085205078125, 0.5716629028320312, 0.59771728515625, 0.6237716674804688, 0.6498260498046875, 0.6758804321289062, 0.701934814453125, 0.7279891967773438, 0.7540435791015625, 0.7800979614257812, 0.80615234375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 10.0, 9.0, 10.0, 14.0, 15.0, 19.0, 18.0, 21.0, 22.0, 52.0, 74.0, 77.0, 117.0, 121.0, 88.0, 55.0, 52.0, 30.0, 35.0, 22.0, 18.0, 16.0, 7.0, 11.0, 10.0, 2.0, 5.0, 4.0, 8.0, 5.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0207366943359375, -0.02004241943359375, -0.01934814453125, -0.01865386962890625, -0.0179595947265625, -0.01726531982421875, -0.016571044921875, -0.01587677001953125, -0.0151824951171875, -0.01448822021484375, -0.0137939453125, -0.01309967041015625, -0.0124053955078125, -0.01171112060546875, -0.011016845703125, -0.01032257080078125, -0.0096282958984375, -0.00893402099609375, -0.00823974609375, -0.00754547119140625, -0.0068511962890625, -0.00615692138671875, -0.005462646484375, -0.00476837158203125, -0.0040740966796875, -0.00337982177734375, -0.002685546875, -0.00199127197265625, -0.0012969970703125, -0.00060272216796875, 9.1552734375e-05, 0.00078582763671875, 0.0014801025390625, 0.00217437744140625, 0.00286865234375, 0.00356292724609375, 0.0042572021484375, 0.00495147705078125, 0.005645751953125, 0.00634002685546875, 0.0070343017578125, 0.00772857666015625, 0.0084228515625, 0.00911712646484375, 0.0098114013671875, 0.01050567626953125, 0.011199951171875, 0.01189422607421875, 0.0125885009765625, 0.01328277587890625, 0.01397705078125, 0.01467132568359375, 0.0153656005859375, 0.01605987548828125, 0.016754150390625, 0.01744842529296875, 0.0181427001953125, 0.01883697509765625, 0.01953125, 0.02022552490234375, 0.0209197998046875, 0.02161407470703125, 0.022308349609375, 0.02300262451171875, 0.0236968994140625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 4.0, 7.0, 8.0, 10.0, 11.0, 7.0, 19.0, 22.0, 15.0, 21.0, 24.0, 36.0, 45.0, 50.0, 88.0, 142.0, 218.0, 466.0, 1381.0, 7823.0, 170629.0, 842964.0, 20502.0, 2552.0, 650.0, 236.0, 162.0, 84.0, 67.0, 45.0, 45.0, 37.0, 30.0, 33.0, 26.0, 22.0, 12.0, 12.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.416259765625, -0.4040870666503906, -0.39191436767578125, -0.3797416687011719, -0.3675689697265625, -0.3553962707519531, -0.34322357177734375, -0.3310508728027344, -0.318878173828125, -0.3067054748535156, -0.29453277587890625, -0.2823600769042969, -0.2701873779296875, -0.2580146789550781, -0.24584197998046875, -0.23366928100585938, -0.22149658203125, -0.20932388305664062, -0.19715118408203125, -0.18497848510742188, -0.1728057861328125, -0.16063308715820312, -0.14846038818359375, -0.13628768920898438, -0.124114990234375, -0.11194229125976562, -0.09976959228515625, -0.08759689331054688, -0.0754241943359375, -0.06325149536132812, -0.05107879638671875, -0.038906097412109375, -0.0267333984375, -0.014560699462890625, -0.00238800048828125, 0.009784698486328125, 0.0219573974609375, 0.034130096435546875, 0.04630279541015625, 0.058475494384765625, 0.070648193359375, 0.08282089233398438, 0.09499359130859375, 0.10716629028320312, 0.1193389892578125, 0.13151168823242188, 0.14368438720703125, 0.15585708618164062, 0.16802978515625, 0.18020248413085938, 0.19237518310546875, 0.20454788208007812, 0.2167205810546875, 0.22889328002929688, 0.24106597900390625, 0.2532386779785156, 0.265411376953125, 0.2775840759277344, 0.28975677490234375, 0.3019294738769531, 0.3141021728515625, 0.3262748718261719, 0.33844757080078125, 0.3506202697753906, 0.36279296875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 16.0, 56.0, 218.0, 495.0, 120.0, 57.0, 18.0, 12.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10337348282337189, -0.09560608118772507, -0.08783868700265884, -0.08007128536701202, -0.0723038911819458, -0.06453648954629898, -0.05676908791065216, -0.04900169000029564, -0.04123429208993912, -0.033466894179582596, -0.025699494406580925, -0.017932094633579254, -0.010164696723222733, -0.002397298812866211, 0.005370102822780609, 0.01313750073313713, 0.020904898643493652, 0.028672296553850174, 0.036439694464206696, 0.044207096099853516, 0.05197449401021004, 0.05974189192056656, 0.06750929355621338, 0.0752766877412796, 0.08304408937692642, 0.09081149101257324, 0.09857888519763947, 0.10634628683328629, 0.1141136884689331, 0.12188108265399933, 0.12964847683906555, 0.13741588592529297, 0.14518329501152039, 0.1529506891965866, 0.16071809828281403, 0.16848549246788025, 0.17625288665294647, 0.1840202808380127, 0.1917876899242401, 0.19955508410930634, 0.20732247829437256, 0.21508987247943878, 0.2228572815656662, 0.23062467575073242, 0.23839206993579865, 0.24615946412086487, 0.2539268732070923, 0.2616942822933197, 0.2694616913795471, 0.27722910046577454, 0.28499647974967957, 0.292763888835907, 0.3005312979221344, 0.30829867720603943, 0.31606608629226685, 0.32383349537849426, 0.3316008746623993, 0.3393682837486267, 0.34713566303253174, 0.35490307211875916, 0.3626704812049866, 0.3704378604888916, 0.378205269575119, 0.38597267866134644, 0.39374005794525146]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 6.0, 4.0, 4.0, 6.0, 16.0, 9.0, 10.0, 12.0, 17.0, 12.0, 22.0, 23.0, 26.0, 20.0, 22.0, 33.0, 35.0, 26.0, 38.0, 30.0, 44.0, 32.0, 30.0, 35.0, 49.0, 26.0, 36.0, 35.0, 43.0, 32.0, 15.0, 31.0, 39.0, 23.0, 20.0, 22.0, 22.0, 16.0, 17.0, 9.0, 10.0, 15.0, 9.0, 3.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.02029484510421753, -0.01967526413500309, -0.01905568316578865, -0.01843610219657421, -0.01781652122735977, -0.017196940258145332, -0.016577359288930893, -0.015957778319716454, -0.015338197350502014, -0.014718616381287575, -0.014099035412073135, -0.013479454442858696, -0.012859873473644257, -0.012240292504429817, -0.011620711535215378, -0.011001130566000938, -0.010381549596786499, -0.00976196862757206, -0.00914238765835762, -0.00852280668914318, -0.007903225719928741, -0.007283644750714302, -0.006664063781499863, -0.006044482812285423, -0.005424901843070984, -0.0048053208738565445, -0.004185739904642105, -0.0035661589354276657, -0.0029465779662132263, -0.002326996996998787, -0.0017074160277843475, -0.0010878350585699081, -0.00046825408935546875, 0.00015132687985897064, 0.00077090784907341, 0.0013904888182878494, 0.002010069787502289, 0.002629650756716728, 0.0032492317259311676, 0.003868812695145607, 0.004488393664360046, 0.005107974633574486, 0.005727555602788925, 0.0063471365720033646, 0.006966717541217804, 0.007586298510432243, 0.008205879479646683, 0.008825460448861122, 0.009445041418075562, 0.010064622387290001, 0.01068420335650444, 0.01130378432571888, 0.011923365294933319, 0.012542946264147758, 0.013162527233362198, 0.013782108202576637, 0.014401689171791077, 0.015021270141005516, 0.015640851110219955, 0.016260432079434395, 0.016880013048648834, 0.017499594017863274, 0.018119174987077713, 0.018738755956292152, 0.019358336925506592]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 14.0, 9.0, 17.0, 18.0, 12.0, 22.0, 22.0, 30.0, 37.0, 44.0, 27.0, 39.0, 33.0, 38.0, 59.0, 46.0, 47.0, 41.0, 45.0, 34.0, 32.0, 39.0, 35.0, 28.0, 27.0, 28.0, 27.0, 25.0, 19.0, 13.0, 15.0, 8.0, 12.0, 6.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.9296875, -13.515869140625, -13.10205078125, -12.688232421875, -12.2744140625, -11.860595703125, -11.44677734375, -11.032958984375, -10.619140625, -10.205322265625, -9.79150390625, -9.377685546875, -8.9638671875, -8.550048828125, -8.13623046875, -7.722412109375, -7.30859375, -6.894775390625, -6.48095703125, -6.067138671875, -5.6533203125, -5.239501953125, -4.82568359375, -4.411865234375, -3.998046875, -3.584228515625, -3.17041015625, -2.756591796875, -2.3427734375, -1.928955078125, -1.51513671875, -1.101318359375, -0.6875, -0.273681640625, 0.14013671875, 0.553955078125, 0.9677734375, 1.381591796875, 1.79541015625, 2.209228515625, 2.623046875, 3.036865234375, 3.45068359375, 3.864501953125, 4.2783203125, 4.692138671875, 5.10595703125, 5.519775390625, 5.93359375, 6.347412109375, 6.76123046875, 7.175048828125, 7.5888671875, 8.002685546875, 8.41650390625, 8.830322265625, 9.244140625, 9.657958984375, 10.07177734375, 10.485595703125, 10.8994140625, 11.313232421875, 11.72705078125, 12.140869140625, 12.5546875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 11.0, 25.0, 40.0, 59.0, 77.0, 174.0, 306.0, 432.0, 816.0, 1622.0, 3248.0, 7765.0, 21845.0, 71718.0, 294335.0, 486593.0, 108760.0, 31273.0, 10740.0, 4227.0, 2037.0, 1044.0, 520.0, 346.0, 194.0, 102.0, 67.0, 35.0, 32.0, 20.0, 13.0, 15.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.66192626953125, -6.4410400390625, -6.22015380859375, -5.999267578125, -5.77838134765625, -5.5574951171875, -5.33660888671875, -5.11572265625, -4.89483642578125, -4.6739501953125, -4.45306396484375, -4.232177734375, -4.01129150390625, -3.7904052734375, -3.56951904296875, -3.3486328125, -3.12774658203125, -2.9068603515625, -2.68597412109375, -2.465087890625, -2.24420166015625, -2.0233154296875, -1.80242919921875, -1.58154296875, -1.36065673828125, -1.1397705078125, -0.91888427734375, -0.697998046875, -0.47711181640625, -0.2562255859375, -0.03533935546875, 0.185546875, 0.40643310546875, 0.6273193359375, 0.84820556640625, 1.069091796875, 1.28997802734375, 1.5108642578125, 1.73175048828125, 1.95263671875, 2.17352294921875, 2.3944091796875, 2.61529541015625, 2.836181640625, 3.05706787109375, 3.2779541015625, 3.49884033203125, 3.7197265625, 3.94061279296875, 4.1614990234375, 4.38238525390625, 4.603271484375, 4.82415771484375, 5.0450439453125, 5.26593017578125, 5.48681640625, 5.70770263671875, 5.9285888671875, 6.14947509765625, 6.370361328125, 6.59124755859375, 6.8121337890625, 7.03302001953125, 7.25390625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 6.0, 10.0, 12.0, 13.0, 21.0, 20.0, 25.0, 16.0, 25.0, 30.0, 32.0, 36.0, 34.0, 33.0, 41.0, 48.0, 61.0, 1650.0, 431.0, 65.0, 36.0, 33.0, 40.0, 30.0, 35.0, 33.0, 24.0, 34.0, 23.0, 25.0, 12.0, 20.0, 16.0, 14.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.84375, -38.5146484375, -37.185546875, -35.8564453125, -34.52734375, -33.1982421875, -31.869140625, -30.5400390625, -29.2109375, -27.8818359375, -26.552734375, -25.2236328125, -23.89453125, -22.5654296875, -21.236328125, -19.9072265625, -18.578125, -17.2490234375, -15.919921875, -14.5908203125, -13.26171875, -11.9326171875, -10.603515625, -9.2744140625, -7.9453125, -6.6162109375, -5.287109375, -3.9580078125, -2.62890625, -1.2998046875, 0.029296875, 1.3583984375, 2.6875, 4.0166015625, 5.345703125, 6.6748046875, 8.00390625, 9.3330078125, 10.662109375, 11.9912109375, 13.3203125, 14.6494140625, 15.978515625, 17.3076171875, 18.63671875, 19.9658203125, 21.294921875, 22.6240234375, 23.953125, 25.2822265625, 26.611328125, 27.9404296875, 29.26953125, 30.5986328125, 31.927734375, 33.2568359375, 34.5859375, 35.9150390625, 37.244140625, 38.5732421875, 39.90234375, 41.2314453125, 42.560546875, 43.8896484375, 45.21875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 8.0, 10.0, 9.0, 16.0, 14.0, 27.0, 17.0, 30.0, 27.0, 61.0, 70.0, 78.0, 108.0, 136.0, 191.0, 270.0, 492.0, 1531.0, 64718.0, 3071773.0, 4114.0, 759.0, 355.0, 187.0, 143.0, 119.0, 104.0, 70.0, 60.0, 37.0, 29.0, 37.0, 20.0, 15.0, 13.0, 16.0, 7.0, 7.0, 10.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-80.75, -78.390625, -76.03125, -73.671875, -71.3125, -68.953125, -66.59375, -64.234375, -61.875, -59.515625, -57.15625, -54.796875, -52.4375, -50.078125, -47.71875, -45.359375, -43.0, -40.640625, -38.28125, -35.921875, -33.5625, -31.203125, -28.84375, -26.484375, -24.125, -21.765625, -19.40625, -17.046875, -14.6875, -12.328125, -9.96875, -7.609375, -5.25, -2.890625, -0.53125, 1.828125, 4.1875, 6.546875, 8.90625, 11.265625, 13.625, 15.984375, 18.34375, 20.703125, 23.0625, 25.421875, 27.78125, 30.140625, 32.5, 34.859375, 37.21875, 39.578125, 41.9375, 44.296875, 46.65625, 49.015625, 51.375, 53.734375, 56.09375, 58.453125, 60.8125, 63.171875, 65.53125, 67.890625, 70.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 12.0, 24.0, 103.0, 255.0, 284.0, 207.0, 88.0, 30.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.617923736572266, -20.640039443969727, -18.662155151367188, -16.684268951416016, -14.706384658813477, -12.728500366210938, -10.750615119934082, -8.772729873657227, -6.7948455810546875, -4.81696081161499, -2.839076042175293, -0.8611912727355957, 1.1166934967041016, 3.0945777893066406, 5.072463035583496, 7.050348281860352, 9.02823257446289, 11.00611686706543, 12.984002113342285, 14.96188735961914, 16.93977165222168, 18.91765594482422, 20.89554214477539, 22.87342643737793, 24.85131072998047, 26.829195022583008, 28.807079315185547, 30.78496551513672, 32.762847900390625, 34.7407341003418, 36.71862030029297, 38.696502685546875, 40.67439270019531, 42.652278900146484, 44.63016128540039, 46.60804748535156, 48.58592987060547, 50.56381607055664, 52.54170227050781, 54.51958465576172, 56.49747085571289, 58.47535705566406, 60.45323944091797, 62.43112564086914, 64.40901184082031, 66.38689422607422, 68.36477661132812, 70.34266662597656, 72.32054901123047, 74.29843139648438, 76.27632141113281, 78.25420379638672, 80.23208618164062, 82.20997619628906, 84.18785858154297, 86.16574096679688, 88.14363098144531, 90.12151336669922, 92.09940338134766, 94.07728576660156, 96.05516815185547, 98.03305053710938, 100.01094055175781, 101.98882293701172, 103.96670532226562]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 1.0, 10.0, 5.0, 8.0, 6.0, 13.0, 15.0, 10.0, 22.0, 29.0, 16.0, 29.0, 24.0, 27.0, 34.0, 41.0, 44.0, 33.0, 38.0, 45.0, 49.0, 37.0, 43.0, 39.0, 42.0, 25.0, 36.0, 31.0, 28.0, 33.0, 27.0, 21.0, 32.0, 16.0, 18.0, 17.0, 8.0, 11.0, 12.0, 6.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-128.55751037597656, -124.38248443603516, -120.20745086669922, -116.03242492675781, -111.85739135742188, -107.68236541748047, -103.50733947753906, -99.33230590820312, -95.15727996826172, -90.98225402832031, -86.80722045898438, -82.63219451904297, -78.45716857910156, -74.28213500976562, -70.10710906982422, -65.93208312988281, -61.757049560546875, -57.5820198059082, -53.40699005126953, -49.231964111328125, -45.05693435668945, -40.88190460205078, -36.706878662109375, -32.5318489074707, -28.35681915283203, -24.18178939819336, -20.00676155090332, -15.831732749938965, -11.65670394897461, -7.4816741943359375, -3.3066463470458984, 0.8683815002441406, 5.043426513671875, 9.21845531463623, 13.393484115600586, 17.568511962890625, 21.743541717529297, 25.91857147216797, 30.093599319458008, 34.26862716674805, 38.44365692138672, 42.61868667602539, 46.79371643066406, 50.96874237060547, 55.14377212524414, 59.31880187988281, 63.49382781982422, 67.66885375976562, 71.84388732910156, 76.01891326904297, 80.1939468383789, 84.36897277832031, 88.54400634765625, 92.71903228759766, 96.89405822753906, 101.069091796875, 105.2441177368164, 109.41914367675781, 113.59417724609375, 117.76920318603516, 121.94422912597656, 126.1192626953125, 130.29429626464844, 134.4693145751953, 138.64434814453125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 5.0, 5.0, 7.0, 9.0, 14.0, 13.0, 20.0, 15.0, 23.0, 28.0, 26.0, 35.0, 47.0, 25.0, 40.0, 33.0, 46.0, 59.0, 51.0, 34.0, 49.0, 35.0, 34.0, 34.0, 39.0, 38.0, 23.0, 32.0, 26.0, 28.0, 23.0, 15.0, 12.0, 11.0, 12.0, 8.0, 10.0, 7.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.0546875, -13.6337890625, -13.212890625, -12.7919921875, -12.37109375, -11.9501953125, -11.529296875, -11.1083984375, -10.6875, -10.2666015625, -9.845703125, -9.4248046875, -9.00390625, -8.5830078125, -8.162109375, -7.7412109375, -7.3203125, -6.8994140625, -6.478515625, -6.0576171875, -5.63671875, -5.2158203125, -4.794921875, -4.3740234375, -3.953125, -3.5322265625, -3.111328125, -2.6904296875, -2.26953125, -1.8486328125, -1.427734375, -1.0068359375, -0.5859375, -0.1650390625, 0.255859375, 0.6767578125, 1.09765625, 1.5185546875, 1.939453125, 2.3603515625, 2.78125, 3.2021484375, 3.623046875, 4.0439453125, 4.46484375, 4.8857421875, 5.306640625, 5.7275390625, 6.1484375, 6.5693359375, 6.990234375, 7.4111328125, 7.83203125, 8.2529296875, 8.673828125, 9.0947265625, 9.515625, 9.9365234375, 10.357421875, 10.7783203125, 11.19921875, 11.6201171875, 12.041015625, 12.4619140625, 12.8828125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 8.0, 12.0, 15.0, 22.0, 29.0, 34.0, 45.0, 80.0, 118.0, 161.0, 236.0, 417.0, 830.0, 1586.0, 3121.0, 7385.0, 24870.0, 2289261.0, 1828677.0, 23115.0, 7147.0, 3138.0, 1679.0, 930.0, 502.0, 263.0, 156.0, 128.0, 87.0, 66.0, 38.0, 28.0, 19.0, 12.0, 20.0, 12.0, 11.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.125, -64.234375, -62.34375, -60.453125, -58.5625, -56.671875, -54.78125, -52.890625, -51.0, -49.109375, -47.21875, -45.328125, -43.4375, -41.546875, -39.65625, -37.765625, -35.875, -33.984375, -32.09375, -30.203125, -28.3125, -26.421875, -24.53125, -22.640625, -20.75, -18.859375, -16.96875, -15.078125, -13.1875, -11.296875, -9.40625, -7.515625, -5.625, -3.734375, -1.84375, 0.046875, 1.9375, 3.828125, 5.71875, 7.609375, 9.5, 11.390625, 13.28125, 15.171875, 17.0625, 18.953125, 20.84375, 22.734375, 24.625, 26.515625, 28.40625, 30.296875, 32.1875, 34.078125, 35.96875, 37.859375, 39.75, 41.640625, 43.53125, 45.421875, 47.3125, 49.203125, 51.09375, 52.984375, 54.875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 12.0, 7.0, 13.0, 18.0, 12.0, 33.0, 44.0, 64.0, 118.0, 292.0, 626.0, 1064.0, 865.0, 422.0, 202.0, 90.0, 49.0, 36.0, 21.0, 14.0, 12.0, 7.0, 7.0, 9.0, 3.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -36.92578125, -35.7265625, -34.52734375, -33.328125, -32.12890625, -30.9296875, -29.73046875, -28.53125, -27.33203125, -26.1328125, -24.93359375, -23.734375, -22.53515625, -21.3359375, -20.13671875, -18.9375, -17.73828125, -16.5390625, -15.33984375, -14.140625, -12.94140625, -11.7421875, -10.54296875, -9.34375, -8.14453125, -6.9453125, -5.74609375, -4.546875, -3.34765625, -2.1484375, -0.94921875, 0.25, 1.44921875, 2.6484375, 3.84765625, 5.046875, 6.24609375, 7.4453125, 8.64453125, 9.84375, 11.04296875, 12.2421875, 13.44140625, 14.640625, 15.83984375, 17.0390625, 18.23828125, 19.4375, 20.63671875, 21.8359375, 23.03515625, 24.234375, 25.43359375, 26.6328125, 27.83203125, 29.03125, 30.23046875, 31.4296875, 32.62890625, 33.828125, 35.02734375, 36.2265625, 37.42578125, 38.625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 10.0, 7.0, 11.0, 13.0, 35.0, 51.0, 66.0, 113.0, 186.0, 282.0, 480.0, 763.0, 1284.0, 2206.0, 4084.0, 8124.0, 18193.0, 56896.0, 931847.0, 3030367.0, 93566.0, 24080.0, 10158.0, 4860.0, 2772.0, 1513.0, 869.0, 542.0, 336.0, 203.0, 139.0, 72.0, 52.0, 33.0, 25.0, 17.0, 12.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.0625, -53.349609375, -51.63671875, -49.923828125, -48.2109375, -46.498046875, -44.78515625, -43.072265625, -41.359375, -39.646484375, -37.93359375, -36.220703125, -34.5078125, -32.794921875, -31.08203125, -29.369140625, -27.65625, -25.943359375, -24.23046875, -22.517578125, -20.8046875, -19.091796875, -17.37890625, -15.666015625, -13.953125, -12.240234375, -10.52734375, -8.814453125, -7.1015625, -5.388671875, -3.67578125, -1.962890625, -0.25, 1.462890625, 3.17578125, 4.888671875, 6.6015625, 8.314453125, 10.02734375, 11.740234375, 13.453125, 15.166015625, 16.87890625, 18.591796875, 20.3046875, 22.017578125, 23.73046875, 25.443359375, 27.15625, 28.869140625, 30.58203125, 32.294921875, 34.0078125, 35.720703125, 37.43359375, 39.146484375, 40.859375, 42.572265625, 44.28515625, 45.998046875, 47.7109375, 49.423828125, 51.13671875, 52.849609375, 54.5625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 13.0, 21.0, 21.0, 36.0, 65.0, 80.0, 130.0, 165.0, 150.0, 97.0, 58.0, 40.0, 24.0, 16.0, 19.0, 8.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.1263427734375, -152.4529266357422, -147.7794952392578, -143.1060791015625, -138.43264770507812, -133.7592315673828, -129.0858154296875, -124.41238403320312, -119.73896789550781, -115.06554412841797, -110.39212036132812, -105.71870422363281, -101.04528045654297, -96.37185668945312, -91.69843292236328, -87.02500915527344, -82.3515853881836, -77.67816162109375, -73.0047378540039, -68.33131408691406, -63.65789794921875, -58.984474182128906, -54.31105041503906, -49.637630462646484, -44.96420669555664, -40.2907829284668, -35.61736297607422, -30.943939208984375, -26.270517349243164, -21.597095489501953, -16.92367172241211, -12.250251770019531, -7.5768280029296875, -2.9034056663513184, 1.7700166702270508, 6.443439483642578, 11.116861343383789, 15.790283203125, 20.463706970214844, 25.137126922607422, 29.810550689697266, 34.48397445678711, 39.15739440917969, 43.83081817626953, 48.504241943359375, 53.17766189575195, 57.8510856628418, 62.524505615234375, 67.19792938232422, 71.87135314941406, 76.5447769165039, 81.21820068359375, 85.89161682128906, 90.5650405883789, 95.23846435546875, 99.91188049316406, 104.58531188964844, 109.25873565673828, 113.93215942382812, 118.60557556152344, 123.27899932861328, 127.95242309570312, 132.6258544921875, 137.2992706298828, 141.97268676757812]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 12.0, 15.0, 13.0, 16.0, 16.0, 21.0, 17.0, 36.0, 39.0, 35.0, 36.0, 36.0, 60.0, 39.0, 44.0, 49.0, 38.0, 41.0, 42.0, 41.0, 40.0, 56.0, 31.0, 30.0, 28.0, 23.0, 17.0, 23.0, 22.0, 9.0, 17.0, 16.0, 9.0, 10.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.65242004394531, -82.71452331542969, -79.77661895751953, -76.8387222290039, -73.90081787109375, -70.96292114257812, -68.0250244140625, -65.08712005615234, -62.14921951293945, -59.21131896972656, -56.27341842651367, -53.33551788330078, -50.397621154785156, -47.459716796875, -44.521820068359375, -41.583919525146484, -38.646018981933594, -35.7081184387207, -32.77021789550781, -29.832319259643555, -26.894418716430664, -23.956518173217773, -21.018619537353516, -18.080718994140625, -15.142818450927734, -12.204917907714844, -9.26701831817627, -6.329118728637695, -3.3912181854248047, -0.45331764221191406, 2.4845809936523438, 5.422481536865234, 8.360374450683594, 11.298274993896484, 14.236174583435059, 17.174074172973633, 20.111974716186523, 23.049875259399414, 25.987773895263672, 28.925674438476562, 31.863574981689453, 34.801475524902344, 37.739376068115234, 40.677276611328125, 43.61517333984375, 46.553077697753906, 49.49097442626953, 52.42887496948242, 55.36677551269531, 58.3046760559082, 61.242576599121094, 64.18047332763672, 67.11837768554688, 70.0562744140625, 72.99417114257812, 75.93207550048828, 78.86997985839844, 81.80787658691406, 84.74578094482422, 87.68367767333984, 90.62158203125, 93.55947875976562, 96.49737548828125, 99.4352798461914, 102.37317657470703]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 9.0, 7.0, 9.0, 13.0, 24.0, 17.0, 16.0, 20.0, 29.0, 34.0, 30.0, 36.0, 31.0, 44.0, 47.0, 49.0, 44.0, 47.0, 55.0, 32.0, 37.0, 53.0, 50.0, 23.0, 29.0, 29.0, 30.0, 20.0, 20.0, 16.0, 13.0, 15.0, 19.0, 13.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.0758056640625, -13.643798828125, -13.2117919921875, -12.77978515625, -12.3477783203125, -11.915771484375, -11.4837646484375, -11.0517578125, -10.6197509765625, -10.187744140625, -9.7557373046875, -9.32373046875, -8.8917236328125, -8.459716796875, -8.0277099609375, -7.595703125, -7.1636962890625, -6.731689453125, -6.2996826171875, -5.86767578125, -5.4356689453125, -5.003662109375, -4.5716552734375, -4.1396484375, -3.7076416015625, -3.275634765625, -2.8436279296875, -2.41162109375, -1.9796142578125, -1.547607421875, -1.1156005859375, -0.68359375, -0.2515869140625, 0.180419921875, 0.6124267578125, 1.04443359375, 1.4764404296875, 1.908447265625, 2.3404541015625, 2.7724609375, 3.2044677734375, 3.636474609375, 4.0684814453125, 4.50048828125, 4.9324951171875, 5.364501953125, 5.7965087890625, 6.228515625, 6.6605224609375, 7.092529296875, 7.5245361328125, 7.95654296875, 8.3885498046875, 8.820556640625, 9.2525634765625, 9.6845703125, 10.1165771484375, 10.548583984375, 10.9805908203125, 11.41259765625, 11.8446044921875, 12.276611328125, 12.7086181640625, 13.140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 15.0, 19.0, 19.0, 47.0, 62.0, 92.0, 160.0, 226.0, 347.0, 516.0, 808.0, 1274.0, 1894.0, 3005.0, 4650.0, 7343.0, 11551.0, 18735.0, 31086.0, 53804.0, 101014.0, 199439.0, 267719.0, 154495.0, 78863.0, 43218.0, 25488.0, 15359.0, 9957.0, 6070.0, 3967.0, 2606.0, 1674.0, 1044.0, 696.0, 417.0, 314.0, 179.0, 123.0, 81.0, 59.0, 37.0, 27.0, 17.0, 13.0, 7.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5966796875, -1.545684814453125, -1.49468994140625, -1.443695068359375, -1.3927001953125, -1.341705322265625, -1.29071044921875, -1.239715576171875, -1.188720703125, -1.137725830078125, -1.08673095703125, -1.035736083984375, -0.9847412109375, -0.933746337890625, -0.88275146484375, -0.831756591796875, -0.78076171875, -0.729766845703125, -0.67877197265625, -0.627777099609375, -0.5767822265625, -0.525787353515625, -0.47479248046875, -0.423797607421875, -0.372802734375, -0.321807861328125, -0.27081298828125, -0.219818115234375, -0.1688232421875, -0.117828369140625, -0.06683349609375, -0.015838623046875, 0.03515625, 0.086151123046875, 0.13714599609375, 0.188140869140625, 0.2391357421875, 0.290130615234375, 0.34112548828125, 0.392120361328125, 0.443115234375, 0.494110107421875, 0.54510498046875, 0.596099853515625, 0.6470947265625, 0.698089599609375, 0.74908447265625, 0.800079345703125, 0.85107421875, 0.902069091796875, 0.95306396484375, 1.004058837890625, 1.0550537109375, 1.106048583984375, 1.15704345703125, 1.208038330078125, 1.259033203125, 1.310028076171875, 1.36102294921875, 1.412017822265625, 1.4630126953125, 1.514007568359375, 1.56500244140625, 1.615997314453125, 1.6669921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 12.0, 1.0, 11.0, 13.0, 9.0, 19.0, 19.0, 14.0, 14.0, 28.0, 25.0, 33.0, 25.0, 35.0, 27.0, 41.0, 28.0, 24.0, 33.0, 41.0, 1070.0, 44.0, 36.0, 37.0, 40.0, 28.0, 35.0, 31.0, 24.0, 32.0, 35.0, 23.0, 21.0, 15.0, 16.0, 9.0, 15.0, 6.0, 6.0, 9.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.0703125, -6.8367919921875, -6.603271484375, -6.3697509765625, -6.13623046875, -5.9027099609375, -5.669189453125, -5.4356689453125, -5.2021484375, -4.9686279296875, -4.735107421875, -4.5015869140625, -4.26806640625, -4.0345458984375, -3.801025390625, -3.5675048828125, -3.333984375, -3.1004638671875, -2.866943359375, -2.6334228515625, -2.39990234375, -2.1663818359375, -1.932861328125, -1.6993408203125, -1.4658203125, -1.2322998046875, -0.998779296875, -0.7652587890625, -0.53173828125, -0.2982177734375, -0.064697265625, 0.1688232421875, 0.40234375, 0.6358642578125, 0.869384765625, 1.1029052734375, 1.33642578125, 1.5699462890625, 1.803466796875, 2.0369873046875, 2.2705078125, 2.5040283203125, 2.737548828125, 2.9710693359375, 3.20458984375, 3.4381103515625, 3.671630859375, 3.9051513671875, 4.138671875, 4.3721923828125, 4.605712890625, 4.8392333984375, 5.07275390625, 5.3062744140625, 5.539794921875, 5.7733154296875, 6.0068359375, 6.2403564453125, 6.473876953125, 6.7073974609375, 6.94091796875, 7.1744384765625, 7.407958984375, 7.6414794921875, 7.875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 12.0, 11.0, 19.0, 22.0, 28.0, 53.0, 87.0, 132.0, 235.0, 316.0, 505.0, 750.0, 1246.0, 1986.0, 2771.0, 4439.0, 6654.0, 10150.0, 15848.0, 24633.0, 40037.0, 68162.0, 119303.0, 260851.0, 1204070.0, 135753.0, 76914.0, 44762.0, 27460.0, 17520.0, 11225.0, 7361.0, 4905.0, 3044.0, 2113.0, 1365.0, 848.0, 526.0, 369.0, 230.0, 167.0, 90.0, 67.0, 36.0, 20.0, 18.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7356338500976562, -0.7119903564453125, -0.6883468627929688, -0.664703369140625, -0.6410598754882812, -0.6174163818359375, -0.5937728881835938, -0.57012939453125, -0.5464859008789062, -0.5228424072265625, -0.49919891357421875, -0.475555419921875, -0.45191192626953125, -0.4282684326171875, -0.40462493896484375, -0.3809814453125, -0.35733795166015625, -0.3336944580078125, -0.31005096435546875, -0.286407470703125, -0.26276397705078125, -0.2391204833984375, -0.21547698974609375, -0.19183349609375, -0.16819000244140625, -0.1445465087890625, -0.12090301513671875, -0.097259521484375, -0.07361602783203125, -0.0499725341796875, -0.02632904052734375, -0.002685546875, 0.02095794677734375, 0.0446014404296875, 0.06824493408203125, 0.091888427734375, 0.11553192138671875, 0.1391754150390625, 0.16281890869140625, 0.18646240234375, 0.21010589599609375, 0.2337493896484375, 0.25739288330078125, 0.281036376953125, 0.30467987060546875, 0.3283233642578125, 0.35196685791015625, 0.3756103515625, 0.39925384521484375, 0.4228973388671875, 0.44654083251953125, 0.470184326171875, 0.49382781982421875, 0.5174713134765625, 0.5411148071289062, 0.56475830078125, 0.5884017944335938, 0.6120452880859375, 0.6356887817382812, 0.659332275390625, 0.6829757690429688, 0.7066192626953125, 0.7302627563476562, 0.75390625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 6.0, 6.0, 12.0, 11.0, 14.0, 14.0, 18.0, 48.0, 46.0, 51.0, 59.0, 76.0, 104.0, 76.0, 78.0, 68.0, 66.0, 67.0, 42.0, 33.0, 28.0, 13.0, 12.0, 5.0, 11.0, 8.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022979736328125, -0.02219676971435547, -0.021413803100585938, -0.020630836486816406, -0.019847869873046875, -0.019064903259277344, -0.018281936645507812, -0.01749897003173828, -0.01671600341796875, -0.01593303680419922, -0.015150070190429688, -0.014367103576660156, -0.013584136962890625, -0.012801170349121094, -0.012018203735351562, -0.011235237121582031, -0.0104522705078125, -0.009669303894042969, -0.008886337280273438, -0.008103370666503906, -0.007320404052734375, -0.006537437438964844, -0.0057544708251953125, -0.004971504211425781, -0.00418853759765625, -0.0034055709838867188, -0.0026226043701171875, -0.0018396377563476562, -0.001056671142578125, -0.00027370452880859375, 0.0005092620849609375, 0.0012922286987304688, 0.0020751953125, 0.0028581619262695312, 0.0036411285400390625, 0.004424095153808594, 0.005207061767578125, 0.005990028381347656, 0.0067729949951171875, 0.007555961608886719, 0.00833892822265625, 0.009121894836425781, 0.009904861450195312, 0.010687828063964844, 0.011470794677734375, 0.012253761291503906, 0.013036727905273438, 0.013819694519042969, 0.0146026611328125, 0.015385627746582031, 0.016168594360351562, 0.016951560974121094, 0.017734527587890625, 0.018517494201660156, 0.019300460815429688, 0.02008342742919922, 0.02086639404296875, 0.02164936065673828, 0.022432327270507812, 0.023215293884277344, 0.023998260498046875, 0.024781227111816406, 0.025564193725585938, 0.02634716033935547, 0.027130126953125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 2.0, 17.0, 20.0, 23.0, 33.0, 36.0, 33.0, 71.0, 90.0, 123.0, 242.0, 436.0, 1011.0, 3184.0, 23254.0, 909347.0, 101162.0, 6413.0, 1591.0, 591.0, 303.0, 160.0, 132.0, 66.0, 48.0, 32.0, 33.0, 18.0, 16.0, 12.0, 8.0, 10.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4522895812988281, -0.43802642822265625, -0.4237632751464844, -0.4095001220703125, -0.3952369689941406, -0.38097381591796875, -0.3667106628417969, -0.352447509765625, -0.3381843566894531, -0.32392120361328125, -0.3096580505371094, -0.2953948974609375, -0.2811317443847656, -0.26686859130859375, -0.2526054382324219, -0.23834228515625, -0.22407913208007812, -0.20981597900390625, -0.19555282592773438, -0.1812896728515625, -0.16702651977539062, -0.15276336669921875, -0.13850021362304688, -0.124237060546875, -0.10997390747070312, -0.09571075439453125, -0.08144760131835938, -0.0671844482421875, -0.052921295166015625, -0.03865814208984375, -0.024394989013671875, -0.0101318359375, 0.004131317138671875, 0.01839447021484375, 0.032657623291015625, 0.0469207763671875, 0.061183929443359375, 0.07544708251953125, 0.08971023559570312, 0.103973388671875, 0.11823654174804688, 0.13249969482421875, 0.14676284790039062, 0.1610260009765625, 0.17528915405273438, 0.18955230712890625, 0.20381546020507812, 0.21807861328125, 0.23234176635742188, 0.24660491943359375, 0.2608680725097656, 0.2751312255859375, 0.2893943786621094, 0.30365753173828125, 0.3179206848144531, 0.332183837890625, 0.3464469909667969, 0.36071014404296875, 0.3749732971191406, 0.3892364501953125, 0.4034996032714844, 0.41776275634765625, 0.4320259094238281, 0.4462890625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 10.0, 28.0, 68.0, 203.0, 412.0, 153.0, 63.0, 33.0, 12.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0875474140048027, -0.0810135081410408, -0.0744796097278595, -0.0679457038640976, -0.06141179800033569, -0.05487789586186409, -0.04834399372339249, -0.041810087859630585, -0.03527618572115898, -0.02874228172004223, -0.022208377718925476, -0.015674475580453873, -0.00914057157933712, -0.0026066675782203674, 0.003927234560251236, 0.010461140424013138, 0.01699504256248474, 0.023528946563601494, 0.030062850564718246, 0.03659675270318985, 0.04313065856695175, 0.049664560705423355, 0.05619846284389496, 0.06273236870765686, 0.06926627457141876, 0.07580018043518066, 0.08233407884836197, 0.08886798471212387, 0.09540189057588577, 0.10193578898906708, 0.10846969485282898, 0.11500360071659088, 0.12153749167919159, 0.1280713975429535, 0.1346053034067154, 0.1411392092704773, 0.147673100233078, 0.1542070060968399, 0.1607409119606018, 0.1672748178243637, 0.1738087236881256, 0.1803426295518875, 0.18687653541564941, 0.19341042637825012, 0.19994433224201202, 0.20647823810577393, 0.21301214396953583, 0.21954604983329773, 0.22607994079589844, 0.23261384665966034, 0.23914775252342224, 0.24568164348602295, 0.25221556425094604, 0.25874945521354675, 0.26528334617614746, 0.27181726694107056, 0.27835118770599365, 0.28488507866859436, 0.29141899943351746, 0.29795289039611816, 0.30448681116104126, 0.31102070212364197, 0.3175545930862427, 0.32408851385116577, 0.3306224048137665]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 12.0, 13.0, 15.0, 11.0, 14.0, 20.0, 17.0, 17.0, 16.0, 23.0, 26.0, 37.0, 28.0, 39.0, 44.0, 39.0, 31.0, 43.0, 44.0, 42.0, 37.0, 38.0, 34.0, 34.0, 33.0, 34.0, 33.0, 24.0, 18.0, 32.0, 25.0, 18.0, 17.0, 17.0, 17.0, 11.0, 7.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.027836382389068604, -0.027014771476387978, -0.02619316056370735, -0.025371549651026726, -0.0245499387383461, -0.023728327825665474, -0.022906716912984848, -0.022085106000304222, -0.021263495087623596, -0.02044188417494297, -0.019620273262262344, -0.01879866234958172, -0.017977051436901093, -0.017155440524220467, -0.01633382961153984, -0.015512218698859215, -0.014690607786178589, -0.013868996873497963, -0.013047385960817337, -0.012225775048136711, -0.011404164135456085, -0.01058255322277546, -0.009760942310094833, -0.008939331397414207, -0.008117720484733582, -0.007296109572052956, -0.00647449865937233, -0.005652887746691704, -0.004831276834011078, -0.004009665921330452, -0.003188055008649826, -0.0023664440959692, -0.0015448331832885742, -0.0007232222706079483, 9.838864207267761e-05, 0.0009199995547533035, 0.0017416104674339294, 0.0025632213801145554, 0.0033848322927951813, 0.004206443205475807, 0.005028054118156433, 0.005849665030837059, 0.006671275943517685, 0.007492886856198311, 0.008314497768878937, 0.009136108681559563, 0.009957719594240189, 0.010779330506920815, 0.01160094141960144, 0.012422552332282066, 0.013244163244962692, 0.014065774157643318, 0.014887385070323944, 0.01570899598300457, 0.016530606895685196, 0.017352217808365822, 0.018173828721046448, 0.018995439633727074, 0.0198170505464077, 0.020638661459088326, 0.02146027237176895, 0.022281883284449577, 0.023103494197130203, 0.02392510510981083, 0.024746716022491455]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 9.0, 7.0, 7.0, 15.0, 24.0, 16.0, 17.0, 19.0, 30.0, 34.0, 30.0, 35.0, 32.0, 44.0, 47.0, 49.0, 44.0, 47.0, 55.0, 31.0, 38.0, 53.0, 48.0, 25.0, 28.0, 30.0, 30.0, 20.0, 20.0, 16.0, 13.0, 15.0, 19.0, 13.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.08349609375, -13.6513671875, -13.21923828125, -12.787109375, -12.35498046875, -11.9228515625, -11.49072265625, -11.05859375, -10.62646484375, -10.1943359375, -9.76220703125, -9.330078125, -8.89794921875, -8.4658203125, -8.03369140625, -7.6015625, -7.16943359375, -6.7373046875, -6.30517578125, -5.873046875, -5.44091796875, -5.0087890625, -4.57666015625, -4.14453125, -3.71240234375, -3.2802734375, -2.84814453125, -2.416015625, -1.98388671875, -1.5517578125, -1.11962890625, -0.6875, -0.25537109375, 0.1767578125, 0.60888671875, 1.041015625, 1.47314453125, 1.9052734375, 2.33740234375, 2.76953125, 3.20166015625, 3.6337890625, 4.06591796875, 4.498046875, 4.93017578125, 5.3623046875, 5.79443359375, 6.2265625, 6.65869140625, 7.0908203125, 7.52294921875, 7.955078125, 8.38720703125, 8.8193359375, 9.25146484375, 9.68359375, 10.11572265625, 10.5478515625, 10.97998046875, 11.412109375, 11.84423828125, 12.2763671875, 12.70849609375, 13.140625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 10.0, 17.0, 20.0, 26.0, 45.0, 46.0, 70.0, 100.0, 157.0, 227.0, 332.0, 639.0, 1069.0, 2064.0, 4333.0, 10008.0, 26216.0, 75178.0, 251741.0, 449274.0, 148791.0, 47257.0, 17170.0, 6853.0, 3075.0, 1561.0, 850.0, 498.0, 311.0, 174.0, 114.0, 93.0, 68.0, 49.0, 27.0, 17.0, 18.0, 14.0, 13.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5390625, -7.298095703125, -7.05712890625, -6.816162109375, -6.5751953125, -6.334228515625, -6.09326171875, -5.852294921875, -5.611328125, -5.370361328125, -5.12939453125, -4.888427734375, -4.6474609375, -4.406494140625, -4.16552734375, -3.924560546875, -3.68359375, -3.442626953125, -3.20166015625, -2.960693359375, -2.7197265625, -2.478759765625, -2.23779296875, -1.996826171875, -1.755859375, -1.514892578125, -1.27392578125, -1.032958984375, -0.7919921875, -0.551025390625, -0.31005859375, -0.069091796875, 0.171875, 0.412841796875, 0.65380859375, 0.894775390625, 1.1357421875, 1.376708984375, 1.61767578125, 1.858642578125, 2.099609375, 2.340576171875, 2.58154296875, 2.822509765625, 3.0634765625, 3.304443359375, 3.54541015625, 3.786376953125, 4.02734375, 4.268310546875, 4.50927734375, 4.750244140625, 4.9912109375, 5.232177734375, 5.47314453125, 5.714111328125, 5.955078125, 6.196044921875, 6.43701171875, 6.677978515625, 6.9189453125, 7.159912109375, 7.40087890625, 7.641845703125, 7.8828125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 7.0, 7.0, 16.0, 16.0, 14.0, 21.0, 18.0, 21.0, 24.0, 24.0, 38.0, 32.0, 40.0, 52.0, 37.0, 49.0, 58.0, 130.0, 1807.0, 148.0, 76.0, 40.0, 35.0, 37.0, 33.0, 34.0, 36.0, 43.0, 27.0, 16.0, 14.0, 20.0, 9.0, 11.0, 14.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.875, -36.5947265625, -35.314453125, -34.0341796875, -32.75390625, -31.4736328125, -30.193359375, -28.9130859375, -27.6328125, -26.3525390625, -25.072265625, -23.7919921875, -22.51171875, -21.2314453125, -19.951171875, -18.6708984375, -17.390625, -16.1103515625, -14.830078125, -13.5498046875, -12.26953125, -10.9892578125, -9.708984375, -8.4287109375, -7.1484375, -5.8681640625, -4.587890625, -3.3076171875, -2.02734375, -0.7470703125, 0.533203125, 1.8134765625, 3.09375, 4.3740234375, 5.654296875, 6.9345703125, 8.21484375, 9.4951171875, 10.775390625, 12.0556640625, 13.3359375, 14.6162109375, 15.896484375, 17.1767578125, 18.45703125, 19.7373046875, 21.017578125, 22.2978515625, 23.578125, 24.8583984375, 26.138671875, 27.4189453125, 28.69921875, 29.9794921875, 31.259765625, 32.5400390625, 33.8203125, 35.1005859375, 36.380859375, 37.6611328125, 38.94140625, 40.2216796875, 41.501953125, 42.7822265625, 44.0625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 7.0, 8.0, 9.0, 17.0, 30.0, 30.0, 46.0, 57.0, 123.0, 176.0, 242.0, 599.0, 1898.0, 16542.0, 3109646.0, 13283.0, 1714.0, 535.0, 243.0, 191.0, 105.0, 58.0, 42.0, 32.0, 29.0, 19.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.75, -125.345703125, -120.94140625, -116.537109375, -112.1328125, -107.728515625, -103.32421875, -98.919921875, -94.515625, -90.111328125, -85.70703125, -81.302734375, -76.8984375, -72.494140625, -68.08984375, -63.685546875, -59.28125, -54.876953125, -50.47265625, -46.068359375, -41.6640625, -37.259765625, -32.85546875, -28.451171875, -24.046875, -19.642578125, -15.23828125, -10.833984375, -6.4296875, -2.025390625, 2.37890625, 6.783203125, 11.1875, 15.591796875, 19.99609375, 24.400390625, 28.8046875, 33.208984375, 37.61328125, 42.017578125, 46.421875, 50.826171875, 55.23046875, 59.634765625, 64.0390625, 68.443359375, 72.84765625, 77.251953125, 81.65625, 86.060546875, 90.46484375, 94.869140625, 99.2734375, 103.677734375, 108.08203125, 112.486328125, 116.890625, 121.294921875, 125.69921875, 130.103515625, 134.5078125, 138.912109375, 143.31640625, 147.720703125, 152.125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 33.0, 943.0, 45.0], "bins": [-1874.1378173828125, -1844.176513671875, -1814.215087890625, -1784.2537841796875, -1754.2923583984375, -1724.3310546875, -1694.36962890625, -1664.4083251953125, -1634.4468994140625, -1604.485595703125, -1574.524169921875, -1544.5628662109375, -1514.6014404296875, -1484.64013671875, -1454.6787109375, -1424.7174072265625, -1394.7559814453125, -1364.794677734375, -1334.833251953125, -1304.8719482421875, -1274.9105224609375, -1244.94921875, -1214.98779296875, -1185.0264892578125, -1155.0650634765625, -1125.103759765625, -1095.142333984375, -1065.1810302734375, -1035.2196044921875, -1005.2582397460938, -975.296875, -945.3355102539062, -915.3742065429688, -885.412841796875, -855.4514770507812, -825.4901123046875, -795.5287475585938, -765.5673828125, -735.6060180664062, -705.6446533203125, -675.683349609375, -645.7219848632812, -615.7606201171875, -585.7992553710938, -555.837890625, -525.8765258789062, -495.9151611328125, -465.95379638671875, -435.992431640625, -406.03106689453125, -376.0697021484375, -346.10833740234375, -316.14697265625, -286.18560791015625, -256.2242431640625, -226.2628936767578, -196.301513671875, -166.34014892578125, -136.3787841796875, -106.41742706298828, -76.45606231689453, -46.49470520019531, -16.533340454101562, 13.428024291992188, 43.38938903808594]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 3.0, 12.0, 14.0, 18.0, 18.0, 16.0, 20.0, 24.0, 30.0, 22.0, 22.0, 32.0, 40.0, 35.0, 45.0, 51.0, 50.0, 43.0, 45.0, 43.0, 49.0, 40.0, 38.0, 33.0, 22.0, 34.0, 32.0, 20.0, 13.0, 27.0, 23.0, 16.0, 14.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-125.19329071044922, -121.64056396484375, -118.08784484863281, -114.53511810302734, -110.9823989868164, -107.42967224121094, -103.876953125, -100.32422637939453, -96.77149963378906, -93.2187728881836, -89.66605377197266, -86.11332702636719, -82.56060791015625, -79.00788116455078, -75.45515441894531, -71.90243530273438, -68.34971618652344, -64.79698944091797, -61.24427032470703, -57.69154357910156, -54.138824462890625, -50.586097717285156, -47.03337478637695, -43.48065185546875, -39.92792892456055, -36.375205993652344, -32.82248306274414, -29.269758224487305, -25.7170352935791, -22.1643123626709, -18.611587524414062, -15.05886459350586, -11.506134033203125, -7.953410625457764, -4.400687217712402, -0.8479633331298828, 2.7047595977783203, 6.257482528686523, 9.81020736694336, 13.362930297851562, 16.915653228759766, 20.46837615966797, 24.021099090576172, 27.573823928833008, 31.12654685974121, 34.67926788330078, 38.23199462890625, 41.78471755981445, 45.337440490722656, 48.89016342163086, 52.44288635253906, 55.99561309814453, 59.54833221435547, 63.10105895996094, 66.65377807617188, 70.20650482177734, 73.75923156738281, 77.31195831298828, 80.86467742919922, 84.41740417480469, 87.97012329101562, 91.5228500366211, 95.07557678222656, 98.6282958984375, 102.18101501464844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 0.0, 3.0, 5.0, 15.0, 6.0, 10.0, 13.0, 16.0, 17.0, 13.0, 23.0, 23.0, 32.0, 28.0, 46.0, 36.0, 34.0, 45.0, 40.0, 51.0, 50.0, 51.0, 52.0, 40.0, 49.0, 28.0, 34.0, 26.0, 40.0, 23.0, 23.0, 22.0, 13.0, 23.0, 7.0, 19.0, 12.0, 10.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.1875, -14.73974609375, -14.2919921875, -13.84423828125, -13.396484375, -12.94873046875, -12.5009765625, -12.05322265625, -11.60546875, -11.15771484375, -10.7099609375, -10.26220703125, -9.814453125, -9.36669921875, -8.9189453125, -8.47119140625, -8.0234375, -7.57568359375, -7.1279296875, -6.68017578125, -6.232421875, -5.78466796875, -5.3369140625, -4.88916015625, -4.44140625, -3.99365234375, -3.5458984375, -3.09814453125, -2.650390625, -2.20263671875, -1.7548828125, -1.30712890625, -0.859375, -0.41162109375, 0.0361328125, 0.48388671875, 0.931640625, 1.37939453125, 1.8271484375, 2.27490234375, 2.72265625, 3.17041015625, 3.6181640625, 4.06591796875, 4.513671875, 4.96142578125, 5.4091796875, 5.85693359375, 6.3046875, 6.75244140625, 7.2001953125, 7.64794921875, 8.095703125, 8.54345703125, 8.9912109375, 9.43896484375, 9.88671875, 10.33447265625, 10.7822265625, 11.22998046875, 11.677734375, 12.12548828125, 12.5732421875, 13.02099609375, 13.46875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 13.0, 10.0, 21.0, 19.0, 26.0, 33.0, 31.0, 69.0, 91.0, 135.0, 199.0, 289.0, 486.0, 883.0, 1596.0, 3138.0, 6799.0, 16900.0, 118393.0, 3600812.0, 402175.0, 24394.0, 8973.0, 4035.0, 2040.0, 1046.0, 567.0, 362.0, 219.0, 162.0, 87.0, 56.0, 57.0, 31.0, 25.0, 32.0, 20.0, 16.0, 7.0, 11.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-58.46875, -56.78125, -55.09375, -53.40625, -51.71875, -50.03125, -48.34375, -46.65625, -44.96875, -43.28125, -41.59375, -39.90625, -38.21875, -36.53125, -34.84375, -33.15625, -31.46875, -29.78125, -28.09375, -26.40625, -24.71875, -23.03125, -21.34375, -19.65625, -17.96875, -16.28125, -14.59375, -12.90625, -11.21875, -9.53125, -7.84375, -6.15625, -4.46875, -2.78125, -1.09375, 0.59375, 2.28125, 3.96875, 5.65625, 7.34375, 9.03125, 10.71875, 12.40625, 14.09375, 15.78125, 17.46875, 19.15625, 20.84375, 22.53125, 24.21875, 25.90625, 27.59375, 29.28125, 30.96875, 32.65625, 34.34375, 36.03125, 37.71875, 39.40625, 41.09375, 42.78125, 44.46875, 46.15625, 47.84375, 49.53125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 6.0, 5.0, 10.0, 9.0, 10.0, 18.0, 24.0, 32.0, 36.0, 63.0, 114.0, 225.0, 565.0, 1099.0, 946.0, 452.0, 172.0, 80.0, 47.0, 35.0, 24.0, 18.0, 16.0, 13.0, 19.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.38623046875, -31.0849609375, -29.78369140625, -28.482421875, -27.18115234375, -25.8798828125, -24.57861328125, -23.27734375, -21.97607421875, -20.6748046875, -19.37353515625, -18.072265625, -16.77099609375, -15.4697265625, -14.16845703125, -12.8671875, -11.56591796875, -10.2646484375, -8.96337890625, -7.662109375, -6.36083984375, -5.0595703125, -3.75830078125, -2.45703125, -1.15576171875, 0.1455078125, 1.44677734375, 2.748046875, 4.04931640625, 5.3505859375, 6.65185546875, 7.953125, 9.25439453125, 10.5556640625, 11.85693359375, 13.158203125, 14.45947265625, 15.7607421875, 17.06201171875, 18.36328125, 19.66455078125, 20.9658203125, 22.26708984375, 23.568359375, 24.86962890625, 26.1708984375, 27.47216796875, 28.7734375, 30.07470703125, 31.3759765625, 32.67724609375, 33.978515625, 35.27978515625, 36.5810546875, 37.88232421875, 39.18359375, 40.48486328125, 41.7861328125, 43.08740234375, 44.388671875, 45.68994140625, 46.9912109375, 48.29248046875, 49.59375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 13.0, 11.0, 29.0, 35.0, 64.0, 94.0, 162.0, 279.0, 460.0, 969.0, 1746.0, 3484.0, 7797.0, 19178.0, 61691.0, 1551409.0, 2439790.0, 70109.0, 20745.0, 8295.0, 3757.0, 1811.0, 939.0, 567.0, 314.0, 191.0, 106.0, 59.0, 45.0, 29.0, 30.0, 18.0, 9.0, 14.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-79.0, -76.92333984375, -74.8466796875, -72.77001953125, -70.693359375, -68.61669921875, -66.5400390625, -64.46337890625, -62.38671875, -60.31005859375, -58.2333984375, -56.15673828125, -54.080078125, -52.00341796875, -49.9267578125, -47.85009765625, -45.7734375, -43.69677734375, -41.6201171875, -39.54345703125, -37.466796875, -35.39013671875, -33.3134765625, -31.23681640625, -29.16015625, -27.08349609375, -25.0068359375, -22.93017578125, -20.853515625, -18.77685546875, -16.7001953125, -14.62353515625, -12.546875, -10.47021484375, -8.3935546875, -6.31689453125, -4.240234375, -2.16357421875, -0.0869140625, 1.98974609375, 4.06640625, 6.14306640625, 8.2197265625, 10.29638671875, 12.373046875, 14.44970703125, 16.5263671875, 18.60302734375, 20.6796875, 22.75634765625, 24.8330078125, 26.90966796875, 28.986328125, 31.06298828125, 33.1396484375, 35.21630859375, 37.29296875, 39.36962890625, 41.4462890625, 43.52294921875, 45.599609375, 47.67626953125, 49.7529296875, 51.82958984375, 53.90625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 7.0, 12.0, 14.0, 29.0, 23.0, 40.0, 55.0, 101.0, 131.0, 153.0, 143.0, 97.0, 57.0, 39.0, 21.0, 17.0, 15.0, 6.0, 12.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.68331909179688, -90.7453842163086, -85.80744934082031, -80.86951446533203, -75.93157958984375, -70.99364471435547, -66.05570983886719, -61.117774963378906, -56.179840087890625, -51.241905212402344, -46.30397033691406, -41.36603546142578, -36.4281005859375, -31.49016571044922, -26.552230834960938, -21.614295959472656, -16.676361083984375, -11.738426208496094, -6.8004913330078125, -1.8625564575195312, 3.07537841796875, 8.013313293457031, 12.951248168945312, 17.889183044433594, 22.827117919921875, 27.765052795410156, 32.70298767089844, 37.64092254638672, 42.578857421875, 47.51679229736328, 52.45472717285156, 57.392662048339844, 62.330596923828125, 67.2685317993164, 72.20646667480469, 77.14440155029297, 82.08233642578125, 87.02027130126953, 91.95820617675781, 96.8961410522461, 101.83407592773438, 106.77201080322266, 111.70994567871094, 116.64788055419922, 121.5858154296875, 126.52375030517578, 131.46168518066406, 136.39962768554688, 141.33755493164062, 146.27548217773438, 151.2134246826172, 156.1513671875, 161.08929443359375, 166.0272216796875, 170.9651641845703, 175.90310668945312, 180.84103393554688, 185.77896118164062, 190.71690368652344, 195.65484619140625, 200.5927734375, 205.53070068359375, 210.46864318847656, 215.40658569335938, 220.34451293945312]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 6.0, 10.0, 4.0, 13.0, 14.0, 18.0, 15.0, 22.0, 19.0, 25.0, 35.0, 26.0, 29.0, 28.0, 26.0, 27.0, 28.0, 32.0, 30.0, 34.0, 30.0, 26.0, 36.0, 28.0, 37.0, 39.0, 42.0, 29.0, 27.0, 21.0, 27.0, 25.0, 21.0, 23.0, 17.0, 14.0, 11.0, 13.0, 7.0, 18.0, 4.0, 13.0, 8.0, 7.0, 3.0, 1.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.44918060302734, -69.10608673095703, -66.76298522949219, -64.41989135742188, -62.07678985595703, -59.73369598388672, -57.39059829711914, -55.04750061035156, -52.704402923583984, -50.361305236816406, -48.01820755004883, -45.67510986328125, -43.33201599121094, -40.988914489746094, -38.64582061767578, -36.3027229309082, -33.959625244140625, -31.616527557373047, -29.27342987060547, -26.930334091186523, -24.587236404418945, -22.244138717651367, -19.901042938232422, -17.557945251464844, -15.214847564697266, -12.871749877929688, -10.528653144836426, -8.185556411743164, -5.842458724975586, -3.499361038208008, -1.156264305114746, 1.1868324279785156, 3.5299224853515625, 5.873019695281982, 8.216116905212402, 10.559213638305664, 12.902311325073242, 15.24540901184082, 17.588504791259766, 19.931602478027344, 22.274700164794922, 24.6177978515625, 26.960895538330078, 29.303991317749023, 31.6470890045166, 33.99018859863281, 36.333282470703125, 38.6763801574707, 41.01947784423828, 43.36257553100586, 45.70567321777344, 48.048770904541016, 50.391868591308594, 52.734962463378906, 55.078060150146484, 57.42115783691406, 59.76425552368164, 62.10735321044922, 64.45044708251953, 66.79354858398438, 69.13664245605469, 71.47974395751953, 73.82283782958984, 76.16593933105469, 78.509033203125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 4.0, 11.0, 11.0, 15.0, 20.0, 22.0, 18.0, 14.0, 30.0, 32.0, 37.0, 29.0, 40.0, 40.0, 41.0, 52.0, 44.0, 56.0, 32.0, 50.0, 34.0, 38.0, 49.0, 30.0, 32.0, 26.0, 33.0, 19.0, 18.0, 18.0, 14.0, 14.0, 9.0, 7.0, 14.0, 8.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.1015625, -14.6640625, -14.2265625, -13.7890625, -13.3515625, -12.9140625, -12.4765625, -12.0390625, -11.6015625, -11.1640625, -10.7265625, -10.2890625, -9.8515625, -9.4140625, -8.9765625, -8.5390625, -8.1015625, -7.6640625, -7.2265625, -6.7890625, -6.3515625, -5.9140625, -5.4765625, -5.0390625, -4.6015625, -4.1640625, -3.7265625, -3.2890625, -2.8515625, -2.4140625, -1.9765625, -1.5390625, -1.1015625, -0.6640625, -0.2265625, 0.2109375, 0.6484375, 1.0859375, 1.5234375, 1.9609375, 2.3984375, 2.8359375, 3.2734375, 3.7109375, 4.1484375, 4.5859375, 5.0234375, 5.4609375, 5.8984375, 6.3359375, 6.7734375, 7.2109375, 7.6484375, 8.0859375, 8.5234375, 8.9609375, 9.3984375, 9.8359375, 10.2734375, 10.7109375, 11.1484375, 11.5859375, 12.0234375, 12.4609375, 12.8984375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 10.0, 7.0, 11.0, 24.0, 47.0, 64.0, 80.0, 157.0, 187.0, 353.0, 542.0, 802.0, 1300.0, 2014.0, 3027.0, 4632.0, 6996.0, 10469.0, 16438.0, 26657.0, 44942.0, 80533.0, 153109.0, 256905.0, 193934.0, 101840.0, 55475.0, 32057.0, 19737.0, 12626.0, 8317.0, 5343.0, 3391.0, 2303.0, 1480.0, 928.0, 626.0, 429.0, 255.0, 168.0, 115.0, 82.0, 47.0, 31.0, 20.0, 17.0, 8.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5283203125, -1.478515625, -1.4287109375, -1.37890625, -1.3291015625, -1.279296875, -1.2294921875, -1.1796875, -1.1298828125, -1.080078125, -1.0302734375, -0.98046875, -0.9306640625, -0.880859375, -0.8310546875, -0.78125, -0.7314453125, -0.681640625, -0.6318359375, -0.58203125, -0.5322265625, -0.482421875, -0.4326171875, -0.3828125, -0.3330078125, -0.283203125, -0.2333984375, -0.18359375, -0.1337890625, -0.083984375, -0.0341796875, 0.015625, 0.0654296875, 0.115234375, 0.1650390625, 0.21484375, 0.2646484375, 0.314453125, 0.3642578125, 0.4140625, 0.4638671875, 0.513671875, 0.5634765625, 0.61328125, 0.6630859375, 0.712890625, 0.7626953125, 0.8125, 0.8623046875, 0.912109375, 0.9619140625, 1.01171875, 1.0615234375, 1.111328125, 1.1611328125, 1.2109375, 1.2607421875, 1.310546875, 1.3603515625, 1.41015625, 1.4599609375, 1.509765625, 1.5595703125, 1.609375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 7.0, 17.0, 6.0, 16.0, 17.0, 16.0, 27.0, 27.0, 34.0, 22.0, 22.0, 36.0, 32.0, 30.0, 40.0, 36.0, 46.0, 38.0, 1067.0, 52.0, 32.0, 32.0, 36.0, 28.0, 30.0, 39.0, 28.0, 29.0, 23.0, 21.0, 10.0, 28.0, 17.0, 12.0, 13.0, 6.0, 9.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-8.6171875, -8.35107421875, -8.0849609375, -7.81884765625, -7.552734375, -7.28662109375, -7.0205078125, -6.75439453125, -6.48828125, -6.22216796875, -5.9560546875, -5.68994140625, -5.423828125, -5.15771484375, -4.8916015625, -4.62548828125, -4.359375, -4.09326171875, -3.8271484375, -3.56103515625, -3.294921875, -3.02880859375, -2.7626953125, -2.49658203125, -2.23046875, -1.96435546875, -1.6982421875, -1.43212890625, -1.166015625, -0.89990234375, -0.6337890625, -0.36767578125, -0.1015625, 0.16455078125, 0.4306640625, 0.69677734375, 0.962890625, 1.22900390625, 1.4951171875, 1.76123046875, 2.02734375, 2.29345703125, 2.5595703125, 2.82568359375, 3.091796875, 3.35791015625, 3.6240234375, 3.89013671875, 4.15625, 4.42236328125, 4.6884765625, 4.95458984375, 5.220703125, 5.48681640625, 5.7529296875, 6.01904296875, 6.28515625, 6.55126953125, 6.8173828125, 7.08349609375, 7.349609375, 7.61572265625, 7.8818359375, 8.14794921875, 8.4140625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 13.0, 9.0, 21.0, 35.0, 61.0, 95.0, 120.0, 207.0, 333.0, 469.0, 725.0, 1115.0, 1558.0, 2436.0, 3623.0, 5558.0, 8203.0, 12869.0, 19744.0, 30939.0, 49893.0, 83158.0, 143531.0, 1257732.0, 191013.0, 109577.0, 64025.0, 38848.0, 24491.0, 16012.0, 10342.0, 6905.0, 4585.0, 3052.0, 1967.0, 1308.0, 844.0, 589.0, 373.0, 259.0, 153.0, 119.0, 70.0, 49.0, 35.0, 29.0, 12.0, 12.0, 6.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.77880859375, -0.7542800903320312, -0.7297515869140625, -0.7052230834960938, -0.680694580078125, -0.6561660766601562, -0.6316375732421875, -0.6071090698242188, -0.58258056640625, -0.5580520629882812, -0.5335235595703125, -0.5089950561523438, -0.484466552734375, -0.45993804931640625, -0.4354095458984375, -0.41088104248046875, -0.3863525390625, -0.36182403564453125, -0.3372955322265625, -0.31276702880859375, -0.288238525390625, -0.26371002197265625, -0.2391815185546875, -0.21465301513671875, -0.19012451171875, -0.16559600830078125, -0.1410675048828125, -0.11653900146484375, -0.092010498046875, -0.06748199462890625, -0.0429534912109375, -0.01842498779296875, 0.006103515625, 0.03063201904296875, 0.0551605224609375, 0.07968902587890625, 0.104217529296875, 0.12874603271484375, 0.1532745361328125, 0.17780303955078125, 0.20233154296875, 0.22686004638671875, 0.2513885498046875, 0.27591705322265625, 0.300445556640625, 0.32497406005859375, 0.3495025634765625, 0.37403106689453125, 0.3985595703125, 0.42308807373046875, 0.4476165771484375, 0.47214508056640625, 0.496673583984375, 0.5212020874023438, 0.5457305908203125, 0.5702590942382812, 0.59478759765625, 0.6193161010742188, 0.6438446044921875, 0.6683731079101562, 0.692901611328125, 0.7174301147460938, 0.7419586181640625, 0.7664871215820312, 0.791015625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 6.0, 12.0, 18.0, 27.0, 39.0, 60.0, 83.0, 129.0, 183.0, 145.0, 90.0, 58.0, 28.0, 28.0, 14.0, 13.0, 11.0, 8.0, 6.0, 6.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04205322265625, -0.04076671600341797, -0.03948020935058594, -0.038193702697753906, -0.036907196044921875, -0.035620689392089844, -0.03433418273925781, -0.03304767608642578, -0.03176116943359375, -0.03047466278076172, -0.029188156127929688, -0.027901649475097656, -0.026615142822265625, -0.025328636169433594, -0.024042129516601562, -0.02275562286376953, -0.0214691162109375, -0.02018260955810547, -0.018896102905273438, -0.017609596252441406, -0.016323089599609375, -0.015036582946777344, -0.013750076293945312, -0.012463569641113281, -0.01117706298828125, -0.009890556335449219, -0.008604049682617188, -0.007317543029785156, -0.006031036376953125, -0.004744529724121094, -0.0034580230712890625, -0.0021715164184570312, -0.000885009765625, 0.00040149688720703125, 0.0016880035400390625, 0.0029745101928710938, 0.004261016845703125, 0.005547523498535156, 0.0068340301513671875, 0.008120536804199219, 0.00940704345703125, 0.010693550109863281, 0.011980056762695312, 0.013266563415527344, 0.014553070068359375, 0.015839576721191406, 0.017126083374023438, 0.01841259002685547, 0.0196990966796875, 0.02098560333251953, 0.022272109985351562, 0.023558616638183594, 0.024845123291015625, 0.026131629943847656, 0.027418136596679688, 0.02870464324951172, 0.02999114990234375, 0.03127765655517578, 0.03256416320800781, 0.033850669860839844, 0.035137176513671875, 0.036423683166503906, 0.03771018981933594, 0.03899669647216797, 0.040283203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 13.0, 13.0, 21.0, 43.0, 43.0, 97.0, 138.0, 372.0, 1727.0, 68309.0, 969309.0, 7228.0, 650.0, 259.0, 122.0, 72.0, 39.0, 19.0, 19.0, 13.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7869720458984375, -0.760955810546875, -0.7349395751953125, -0.70892333984375, -0.6829071044921875, -0.656890869140625, -0.6308746337890625, -0.6048583984375, -0.5788421630859375, -0.552825927734375, -0.5268096923828125, -0.50079345703125, -0.4747772216796875, -0.448760986328125, -0.4227447509765625, -0.396728515625, -0.3707122802734375, -0.344696044921875, -0.3186798095703125, -0.29266357421875, -0.2666473388671875, -0.240631103515625, -0.2146148681640625, -0.1885986328125, -0.1625823974609375, -0.136566162109375, -0.1105499267578125, -0.08453369140625, -0.0585174560546875, -0.032501220703125, -0.0064849853515625, 0.01953125, 0.0455474853515625, 0.071563720703125, 0.0975799560546875, 0.12359619140625, 0.1496124267578125, 0.175628662109375, 0.2016448974609375, 0.2276611328125, 0.2536773681640625, 0.279693603515625, 0.3057098388671875, 0.33172607421875, 0.3577423095703125, 0.383758544921875, 0.4097747802734375, 0.435791015625, 0.4618072509765625, 0.487823486328125, 0.5138397216796875, 0.53985595703125, 0.5658721923828125, 0.591888427734375, 0.6179046630859375, 0.6439208984375, 0.6699371337890625, 0.695953369140625, 0.7219696044921875, 0.74798583984375, 0.7740020751953125, 0.800018310546875, 0.8260345458984375, 0.85205078125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 26.0, 92.0, 425.0, 315.0, 86.0, 30.0, 17.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12032121419906616, -0.1093047633767128, -0.09828831255435944, -0.08727185428142548, -0.07625540345907211, -0.06523895263671875, -0.05422249436378479, -0.04320604354143143, -0.032189592719078064, -0.02117314003407955, -0.01015668734908104, 0.0008597671985626221, 0.011876218020915985, 0.022892668843269348, 0.03390912711620331, 0.04492557793855667, 0.055942028760910034, 0.0669584795832634, 0.07797493040561676, 0.08899138867855072, 0.10000783950090408, 0.11102429032325745, 0.1220407485961914, 0.13305720686912537, 0.14407365024089813, 0.1550901085138321, 0.16610655188560486, 0.17712301015853882, 0.18813946843147278, 0.19915591180324554, 0.2101723700761795, 0.22118881344795227, 0.23220527172088623, 0.2432217299938202, 0.25423818826675415, 0.2652546167373657, 0.2762710750102997, 0.28728753328323364, 0.2983039915561676, 0.30932044982910156, 0.32033687829971313, 0.3313533365726471, 0.34236979484558105, 0.3533862233161926, 0.3644026815891266, 0.37541913986206055, 0.3864355981349945, 0.39745205640792847, 0.4084685146808624, 0.4194849729537964, 0.43050143122673035, 0.4415178894996643, 0.4525343179702759, 0.46355077624320984, 0.4745672345161438, 0.48558369278907776, 0.4966001510620117, 0.5076165795326233, 0.5186330676078796, 0.5296494960784912, 0.5406659841537476, 0.5516824126243591, 0.5626988410949707, 0.573715329170227, 0.5847317576408386]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 9.0, 8.0, 13.0, 15.0, 10.0, 20.0, 27.0, 20.0, 26.0, 28.0, 19.0, 29.0, 27.0, 32.0, 32.0, 37.0, 27.0, 42.0, 33.0, 39.0, 44.0, 27.0, 38.0, 32.0, 56.0, 37.0, 42.0, 29.0, 30.0, 25.0, 19.0, 19.0, 19.0, 20.0, 16.0, 5.0, 9.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048168838024139404, -0.04663674533367157, -0.045104652643203735, -0.0435725562274456, -0.04204046353697777, -0.040508370846509933, -0.0389762744307518, -0.037444181740283966, -0.03591208904981613, -0.0343799963593483, -0.03284790366888046, -0.03131580725312233, -0.029783714562654495, -0.02825162187218666, -0.026719527319073677, -0.025187432765960693, -0.02365534007549286, -0.022123247385025024, -0.02059115283191204, -0.019059058278799057, -0.017526965588331223, -0.015994872897863388, -0.014462778344750404, -0.012930684722959995, -0.011398591101169586, -0.009866497479379177, -0.008334403857588768, -0.006802310235798359, -0.00527021661400795, -0.0037381229922175407, -0.0022060293704271317, -0.0006739357486367226, 0.0008581578731536865, 0.0023902514949440956, 0.003922345116734505, 0.005454438738524914, 0.006986532360315323, 0.008518625982105732, 0.010050719603896141, 0.01158281322568655, 0.01311490684747696, 0.014647000469267368, 0.016179094091057777, 0.01771118864417076, 0.019243281334638596, 0.02077537402510643, 0.022307468578219414, 0.023839563131332397, 0.025371655821800232, 0.026903748512268066, 0.02843584306538105, 0.029967937618494034, 0.03150003030896187, 0.0330321229994297, 0.034564219415187836, 0.03609631210565567, 0.037628404796123505, 0.03916049748659134, 0.040692590177059174, 0.042224686592817307, 0.04375677928328514, 0.045288871973752975, 0.04682096838951111, 0.04835306107997894, 0.04988515377044678]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 4.0, 12.0, 10.0, 17.0, 19.0, 22.0, 17.0, 14.0, 30.0, 32.0, 38.0, 28.0, 41.0, 40.0, 40.0, 52.0, 45.0, 55.0, 32.0, 50.0, 34.0, 38.0, 49.0, 30.0, 32.0, 26.0, 33.0, 19.0, 18.0, 18.0, 14.0, 14.0, 9.0, 7.0, 14.0, 8.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.09375, -14.6563720703125, -14.218994140625, -13.7816162109375, -13.34423828125, -12.9068603515625, -12.469482421875, -12.0321044921875, -11.5947265625, -11.1573486328125, -10.719970703125, -10.2825927734375, -9.84521484375, -9.4078369140625, -8.970458984375, -8.5330810546875, -8.095703125, -7.6583251953125, -7.220947265625, -6.7835693359375, -6.34619140625, -5.9088134765625, -5.471435546875, -5.0340576171875, -4.5966796875, -4.1593017578125, -3.721923828125, -3.2845458984375, -2.84716796875, -2.4097900390625, -1.972412109375, -1.5350341796875, -1.09765625, -0.6602783203125, -0.222900390625, 0.2144775390625, 0.65185546875, 1.0892333984375, 1.526611328125, 1.9639892578125, 2.4013671875, 2.8387451171875, 3.276123046875, 3.7135009765625, 4.15087890625, 4.5882568359375, 5.025634765625, 5.4630126953125, 5.900390625, 6.3377685546875, 6.775146484375, 7.2125244140625, 7.64990234375, 8.0872802734375, 8.524658203125, 8.9620361328125, 9.3994140625, 9.8367919921875, 10.274169921875, 10.7115478515625, 11.14892578125, 11.5863037109375, 12.023681640625, 12.4610595703125, 12.8984375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 13.0, 14.0, 11.0, 11.0, 20.0, 20.0, 26.0, 36.0, 52.0, 71.0, 146.0, 260.0, 708.0, 1959.0, 7229.0, 29680.0, 142554.0, 573571.0, 230662.0, 46188.0, 10642.0, 2934.0, 878.0, 332.0, 180.0, 85.0, 71.0, 26.0, 37.0, 32.0, 20.0, 15.0, 17.0, 10.0, 4.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4671630859375, -8.160888671875, -7.8546142578125, -7.54833984375, -7.2420654296875, -6.935791015625, -6.6295166015625, -6.3232421875, -6.0169677734375, -5.710693359375, -5.4044189453125, -5.09814453125, -4.7918701171875, -4.485595703125, -4.1793212890625, -3.873046875, -3.5667724609375, -3.260498046875, -2.9542236328125, -2.64794921875, -2.3416748046875, -2.035400390625, -1.7291259765625, -1.4228515625, -1.1165771484375, -0.810302734375, -0.5040283203125, -0.19775390625, 0.1085205078125, 0.414794921875, 0.7210693359375, 1.02734375, 1.3336181640625, 1.639892578125, 1.9461669921875, 2.25244140625, 2.5587158203125, 2.864990234375, 3.1712646484375, 3.4775390625, 3.7838134765625, 4.090087890625, 4.3963623046875, 4.70263671875, 5.0089111328125, 5.315185546875, 5.6214599609375, 5.927734375, 6.2340087890625, 6.540283203125, 6.8465576171875, 7.15283203125, 7.4591064453125, 7.765380859375, 8.0716552734375, 8.3779296875, 8.6842041015625, 8.990478515625, 9.2967529296875, 9.60302734375, 9.9093017578125, 10.215576171875, 10.5218505859375, 10.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 7.0, 9.0, 14.0, 13.0, 19.0, 19.0, 21.0, 25.0, 32.0, 33.0, 40.0, 55.0, 50.0, 62.0, 78.0, 350.0, 1687.0, 85.0, 55.0, 52.0, 43.0, 39.0, 36.0, 18.0, 31.0, 27.0, 26.0, 23.0, 18.0, 12.0, 9.0, 12.0, 6.0, 7.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.71875, -46.318359375, -44.91796875, -43.517578125, -42.1171875, -40.716796875, -39.31640625, -37.916015625, -36.515625, -35.115234375, -33.71484375, -32.314453125, -30.9140625, -29.513671875, -28.11328125, -26.712890625, -25.3125, -23.912109375, -22.51171875, -21.111328125, -19.7109375, -18.310546875, -16.91015625, -15.509765625, -14.109375, -12.708984375, -11.30859375, -9.908203125, -8.5078125, -7.107421875, -5.70703125, -4.306640625, -2.90625, -1.505859375, -0.10546875, 1.294921875, 2.6953125, 4.095703125, 5.49609375, 6.896484375, 8.296875, 9.697265625, 11.09765625, 12.498046875, 13.8984375, 15.298828125, 16.69921875, 18.099609375, 19.5, 20.900390625, 22.30078125, 23.701171875, 25.1015625, 26.501953125, 27.90234375, 29.302734375, 30.703125, 32.103515625, 33.50390625, 34.904296875, 36.3046875, 37.705078125, 39.10546875, 40.505859375, 41.90625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 6.0, 7.0, 11.0, 7.0, 13.0, 14.0, 21.0, 31.0, 34.0, 54.0, 60.0, 75.0, 107.0, 132.0, 191.0, 300.0, 653.0, 3671.0, 3066963.0, 70334.0, 1642.0, 480.0, 236.0, 180.0, 112.0, 84.0, 67.0, 47.0, 37.0, 29.0, 24.0, 17.0, 14.0, 11.0, 6.0, 13.0, 5.0, 7.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.6875, -87.64453125, -84.6015625, -81.55859375, -78.515625, -75.47265625, -72.4296875, -69.38671875, -66.34375, -63.30078125, -60.2578125, -57.21484375, -54.171875, -51.12890625, -48.0859375, -45.04296875, -42.0, -38.95703125, -35.9140625, -32.87109375, -29.828125, -26.78515625, -23.7421875, -20.69921875, -17.65625, -14.61328125, -11.5703125, -8.52734375, -5.484375, -2.44140625, 0.6015625, 3.64453125, 6.6875, 9.73046875, 12.7734375, 15.81640625, 18.859375, 21.90234375, 24.9453125, 27.98828125, 31.03125, 34.07421875, 37.1171875, 40.16015625, 43.203125, 46.24609375, 49.2890625, 52.33203125, 55.375, 58.41796875, 61.4609375, 64.50390625, 67.546875, 70.58984375, 73.6328125, 76.67578125, 79.71875, 82.76171875, 85.8046875, 88.84765625, 91.890625, 94.93359375, 97.9765625, 101.01953125, 104.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 930.0, 60.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-753.763671875, -740.4360961914062, -727.1084594726562, -713.7808837890625, -700.4532470703125, -687.1256713867188, -673.7980346679688, -660.470458984375, -647.142822265625, -633.8152465820312, -620.4876098632812, -607.1600341796875, -593.8323974609375, -580.5048217773438, -567.1771850585938, -553.849609375, -540.5220336914062, -527.1944580078125, -513.8668212890625, -500.5392150878906, -487.21160888671875, -473.884033203125, -460.556396484375, -447.22882080078125, -433.90118408203125, -420.5735778808594, -407.2459716796875, -393.9183654785156, -380.59075927734375, -367.26318359375, -353.935546875, -340.60797119140625, -327.28033447265625, -313.9527282714844, -300.6251220703125, -287.2975158691406, -273.96990966796875, -260.642333984375, -247.31471252441406, -233.98712158203125, -220.65951538085938, -207.3319091796875, -194.00430297851562, -180.67669677734375, -167.34910583496094, -154.02149963378906, -140.6938934326172, -127.36629486083984, -114.03868865966797, -100.7110824584961, -87.38348388671875, -74.05587768554688, -60.728275299072266, -47.400672912597656, -34.07306671142578, -20.745468139648438, -7.4178619384765625, 5.909741401672363, 19.23734474182129, 32.56494903564453, 45.89255142211914, 59.22015380859375, 72.54776000976562, 85.87535858154297, 99.20296478271484]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 11.0, 7.0, 10.0, 6.0, 14.0, 9.0, 15.0, 19.0, 18.0, 22.0, 20.0, 19.0, 27.0, 21.0, 22.0, 19.0, 17.0, 42.0, 29.0, 38.0, 45.0, 42.0, 41.0, 38.0, 43.0, 27.0, 35.0, 42.0, 34.0, 32.0, 24.0, 29.0, 31.0, 20.0, 21.0, 14.0, 25.0, 8.0, 8.0, 8.0, 8.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-97.35313415527344, -93.98736572265625, -90.62159729003906, -87.25582885742188, -83.89006042480469, -80.5242919921875, -77.15852355957031, -73.79275512695312, -70.42698669433594, -67.06121826171875, -63.69544982910156, -60.329681396484375, -56.96391296386719, -53.59814453125, -50.23237228393555, -46.86660385131836, -43.500831604003906, -40.13506317138672, -36.76929473876953, -33.403526306152344, -30.037755966186523, -26.671987533569336, -23.306217193603516, -19.940448760986328, -16.57468032836914, -13.208911895751953, -9.84314250946045, -6.477373123168945, -3.111604690551758, 0.2541637420654297, 3.61993408203125, 6.9857025146484375, 10.351463317871094, 13.717231750488281, 17.08300018310547, 20.44877052307129, 23.814538955688477, 27.180307388305664, 30.546077728271484, 33.91184616088867, 37.27761459350586, 40.64338302612305, 44.009151458740234, 47.37492370605469, 50.740692138671875, 54.10646057128906, 57.47222900390625, 60.83799743652344, 64.20376586914062, 67.56953430175781, 70.935302734375, 74.30107116699219, 77.66683959960938, 81.03260803222656, 84.39837646484375, 87.76414489746094, 91.12991333007812, 94.49568176269531, 97.8614501953125, 101.22721862792969, 104.59298706054688, 107.95875549316406, 111.32452392578125, 114.69029235839844, 118.05606842041016]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 10.0, 14.0, 17.0, 16.0, 21.0, 19.0, 18.0, 34.0, 32.0, 29.0, 44.0, 37.0, 40.0, 45.0, 45.0, 52.0, 36.0, 46.0, 41.0, 43.0, 42.0, 43.0, 31.0, 35.0, 22.0, 19.0, 21.0, 17.0, 16.0, 17.0, 11.0, 7.0, 8.0, 15.0, 9.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.1171875, -14.673828125, -14.23046875, -13.787109375, -13.34375, -12.900390625, -12.45703125, -12.013671875, -11.5703125, -11.126953125, -10.68359375, -10.240234375, -9.796875, -9.353515625, -8.91015625, -8.466796875, -8.0234375, -7.580078125, -7.13671875, -6.693359375, -6.25, -5.806640625, -5.36328125, -4.919921875, -4.4765625, -4.033203125, -3.58984375, -3.146484375, -2.703125, -2.259765625, -1.81640625, -1.373046875, -0.9296875, -0.486328125, -0.04296875, 0.400390625, 0.84375, 1.287109375, 1.73046875, 2.173828125, 2.6171875, 3.060546875, 3.50390625, 3.947265625, 4.390625, 4.833984375, 5.27734375, 5.720703125, 6.1640625, 6.607421875, 7.05078125, 7.494140625, 7.9375, 8.380859375, 8.82421875, 9.267578125, 9.7109375, 10.154296875, 10.59765625, 11.041015625, 11.484375, 11.927734375, 12.37109375, 12.814453125, 13.2578125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 4.0, 12.0, 11.0, 10.0, 19.0, 21.0, 30.0, 38.0, 37.0, 64.0, 79.0, 110.0, 214.0, 527.0, 1316.0, 3713.0, 11272.0, 132950.0, 3935442.0, 91584.0, 10679.0, 3646.0, 1341.0, 533.0, 213.0, 96.0, 63.0, 52.0, 42.0, 32.0, 33.0, 20.0, 17.0, 15.0, 12.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-83.625, -81.33203125, -79.0390625, -76.74609375, -74.453125, -72.16015625, -69.8671875, -67.57421875, -65.28125, -62.98828125, -60.6953125, -58.40234375, -56.109375, -53.81640625, -51.5234375, -49.23046875, -46.9375, -44.64453125, -42.3515625, -40.05859375, -37.765625, -35.47265625, -33.1796875, -30.88671875, -28.59375, -26.30078125, -24.0078125, -21.71484375, -19.421875, -17.12890625, -14.8359375, -12.54296875, -10.25, -7.95703125, -5.6640625, -3.37109375, -1.078125, 1.21484375, 3.5078125, 5.80078125, 8.09375, 10.38671875, 12.6796875, 14.97265625, 17.265625, 19.55859375, 21.8515625, 24.14453125, 26.4375, 28.73046875, 31.0234375, 33.31640625, 35.609375, 37.90234375, 40.1953125, 42.48828125, 44.78125, 47.07421875, 49.3671875, 51.66015625, 53.953125, 56.24609375, 58.5390625, 60.83203125, 63.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 16.0, 25.0, 34.0, 44.0, 50.0, 91.0, 234.0, 558.0, 1073.0, 1000.0, 458.0, 202.0, 73.0, 61.0, 33.0, 22.0, 10.0, 17.0, 13.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.25, -38.94677734375, -37.6435546875, -36.34033203125, -35.037109375, -33.73388671875, -32.4306640625, -31.12744140625, -29.82421875, -28.52099609375, -27.2177734375, -25.91455078125, -24.611328125, -23.30810546875, -22.0048828125, -20.70166015625, -19.3984375, -18.09521484375, -16.7919921875, -15.48876953125, -14.185546875, -12.88232421875, -11.5791015625, -10.27587890625, -8.97265625, -7.66943359375, -6.3662109375, -5.06298828125, -3.759765625, -2.45654296875, -1.1533203125, 0.14990234375, 1.453125, 2.75634765625, 4.0595703125, 5.36279296875, 6.666015625, 7.96923828125, 9.2724609375, 10.57568359375, 11.87890625, 13.18212890625, 14.4853515625, 15.78857421875, 17.091796875, 18.39501953125, 19.6982421875, 21.00146484375, 22.3046875, 23.60791015625, 24.9111328125, 26.21435546875, 27.517578125, 28.82080078125, 30.1240234375, 31.42724609375, 32.73046875, 34.03369140625, 35.3369140625, 36.64013671875, 37.943359375, 39.24658203125, 40.5498046875, 41.85302734375, 43.15625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 12.0, 16.0, 29.0, 40.0, 87.0, 195.0, 450.0, 986.0, 2660.0, 8852.0, 45940.0, 3670186.0, 431922.0, 24201.0, 5456.0, 1834.0, 712.0, 324.0, 170.0, 91.0, 42.0, 16.0, 13.0, 12.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.125, -107.83984375, -104.5546875, -101.26953125, -97.984375, -94.69921875, -91.4140625, -88.12890625, -84.84375, -81.55859375, -78.2734375, -74.98828125, -71.703125, -68.41796875, -65.1328125, -61.84765625, -58.5625, -55.27734375, -51.9921875, -48.70703125, -45.421875, -42.13671875, -38.8515625, -35.56640625, -32.28125, -28.99609375, -25.7109375, -22.42578125, -19.140625, -15.85546875, -12.5703125, -9.28515625, -6.0, -2.71484375, 0.5703125, 3.85546875, 7.140625, 10.42578125, 13.7109375, 16.99609375, 20.28125, 23.56640625, 26.8515625, 30.13671875, 33.421875, 36.70703125, 39.9921875, 43.27734375, 46.5625, 49.84765625, 53.1328125, 56.41796875, 59.703125, 62.98828125, 66.2734375, 69.55859375, 72.84375, 76.12890625, 79.4140625, 82.69921875, 85.984375, 89.26953125, 92.5546875, 95.83984375, 99.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 6.0, 13.0, 11.0, 16.0, 27.0, 20.0, 45.0, 59.0, 89.0, 102.0, 148.0, 131.0, 94.0, 73.0, 43.0, 27.0, 29.0, 13.0, 9.0, 13.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-146.2808074951172, -142.3976287841797, -138.51443481445312, -134.63125610351562, -130.74807739257812, -126.86489868164062, -122.9817123413086, -119.09852600097656, -115.21534729003906, -111.33216857910156, -107.44898223876953, -103.5657958984375, -99.6826171875, -95.7994384765625, -91.91625213623047, -88.03306579589844, -84.14988708496094, -80.26670837402344, -76.3835220336914, -72.50033569335938, -68.61715698242188, -64.73397827148438, -60.850791931152344, -56.96760940551758, -53.08442687988281, -49.20124435424805, -45.31806182861328, -41.434879302978516, -37.55169677734375, -33.668514251708984, -29.78533172607422, -25.902149200439453, -22.018959045410156, -18.13577651977539, -14.252593994140625, -10.36941146850586, -6.486228942871094, -2.603046417236328, 1.2801361083984375, 5.163318634033203, 9.046501159667969, 12.929683685302734, 16.8128662109375, 20.696048736572266, 24.57923126220703, 28.462413787841797, 32.34559631347656, 36.22877883911133, 40.111961364746094, 43.99514389038086, 47.878326416015625, 51.76150894165039, 55.644691467285156, 59.52787399291992, 63.41105651855469, 67.29423522949219, 71.17742156982422, 75.06060791015625, 78.94378662109375, 82.82696533203125, 86.71015167236328, 90.59333801269531, 94.47651672363281, 98.35969543457031, 102.24288177490234]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 7.0, 8.0, 18.0, 26.0, 17.0, 21.0, 22.0, 26.0, 36.0, 23.0, 38.0, 48.0, 40.0, 38.0, 32.0, 34.0, 41.0, 41.0, 44.0, 43.0, 37.0, 40.0, 39.0, 28.0, 30.0, 31.0, 19.0, 21.0, 12.0, 25.0, 19.0, 11.0, 14.0, 10.0, 9.0, 7.0, 4.0, 6.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.97794342041016, -72.29045104980469, -69.60296630859375, -66.91548156738281, -64.22798919677734, -61.54050064086914, -58.85301208496094, -56.165523529052734, -53.47803497314453, -50.79054641723633, -48.103057861328125, -45.41556930541992, -42.72808074951172, -40.040592193603516, -37.35310363769531, -34.66561508178711, -31.978126525878906, -29.290637969970703, -26.6031494140625, -23.915660858154297, -21.228172302246094, -18.54068374633789, -15.853195190429688, -13.165706634521484, -10.478218078613281, -7.790729522705078, -5.103240966796875, -2.415752410888672, 0.27173614501953125, 2.9592247009277344, 5.6467132568359375, 8.33420181274414, 11.021697998046875, 13.709186553955078, 16.39667510986328, 19.084163665771484, 21.771652221679688, 24.45914077758789, 27.146629333496094, 29.834117889404297, 32.5216064453125, 35.2090950012207, 37.896583557128906, 40.58407211303711, 43.27156066894531, 45.959049224853516, 48.64653778076172, 51.33402633666992, 54.021514892578125, 56.70900344848633, 59.39649200439453, 62.083980560302734, 64.77146911621094, 67.45895385742188, 70.14644622802734, 72.83393859863281, 75.52142333984375, 78.20890808105469, 80.89640045166016, 83.58389282226562, 86.27137756347656, 88.9588623046875, 91.64635467529297, 94.33384704589844, 97.02133178710938]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 10.0, 4.0, 12.0, 10.0, 12.0, 21.0, 19.0, 28.0, 31.0, 39.0, 41.0, 37.0, 44.0, 45.0, 46.0, 38.0, 44.0, 53.0, 59.0, 41.0, 45.0, 41.0, 36.0, 31.0, 30.0, 33.0, 32.0, 15.0, 16.0, 13.0, 18.0, 10.0, 11.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.71875, -16.22802734375, -15.7373046875, -15.24658203125, -14.755859375, -14.26513671875, -13.7744140625, -13.28369140625, -12.79296875, -12.30224609375, -11.8115234375, -11.32080078125, -10.830078125, -10.33935546875, -9.8486328125, -9.35791015625, -8.8671875, -8.37646484375, -7.8857421875, -7.39501953125, -6.904296875, -6.41357421875, -5.9228515625, -5.43212890625, -4.94140625, -4.45068359375, -3.9599609375, -3.46923828125, -2.978515625, -2.48779296875, -1.9970703125, -1.50634765625, -1.015625, -0.52490234375, -0.0341796875, 0.45654296875, 0.947265625, 1.43798828125, 1.9287109375, 2.41943359375, 2.91015625, 3.40087890625, 3.8916015625, 4.38232421875, 4.873046875, 5.36376953125, 5.8544921875, 6.34521484375, 6.8359375, 7.32666015625, 7.8173828125, 8.30810546875, 8.798828125, 9.28955078125, 9.7802734375, 10.27099609375, 10.76171875, 11.25244140625, 11.7431640625, 12.23388671875, 12.724609375, 13.21533203125, 13.7060546875, 14.19677734375, 14.6875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 10.0, 20.0, 21.0, 20.0, 36.0, 49.0, 55.0, 72.0, 146.0, 209.0, 292.0, 468.0, 763.0, 1097.0, 1780.0, 2777.0, 4194.0, 6669.0, 10935.0, 17791.0, 29223.0, 48866.0, 84949.0, 155109.0, 248800.0, 185444.0, 102381.0, 58099.0, 33934.0, 20425.0, 12413.0, 7886.0, 5008.0, 3044.0, 2005.0, 1199.0, 814.0, 565.0, 344.0, 243.0, 141.0, 96.0, 40.0, 40.0, 14.0, 22.0, 11.0, 13.0, 7.0, 4.0, 1.0, 5.0, 5.0, 2.0, 7.0, 0.0, 1.0, 2.0], "bins": [-1.57421875, -1.522857666015625, -1.47149658203125, -1.420135498046875, -1.3687744140625, -1.317413330078125, -1.26605224609375, -1.214691162109375, -1.163330078125, -1.111968994140625, -1.06060791015625, -1.009246826171875, -0.9578857421875, -0.906524658203125, -0.85516357421875, -0.803802490234375, -0.75244140625, -0.701080322265625, -0.64971923828125, -0.598358154296875, -0.5469970703125, -0.495635986328125, -0.44427490234375, -0.392913818359375, -0.341552734375, -0.290191650390625, -0.23883056640625, -0.187469482421875, -0.1361083984375, -0.084747314453125, -0.03338623046875, 0.017974853515625, 0.0693359375, 0.120697021484375, 0.17205810546875, 0.223419189453125, 0.2747802734375, 0.326141357421875, 0.37750244140625, 0.428863525390625, 0.480224609375, 0.531585693359375, 0.58294677734375, 0.634307861328125, 0.6856689453125, 0.737030029296875, 0.78839111328125, 0.839752197265625, 0.89111328125, 0.942474365234375, 0.99383544921875, 1.045196533203125, 1.0965576171875, 1.147918701171875, 1.19927978515625, 1.250640869140625, 1.302001953125, 1.353363037109375, 1.40472412109375, 1.456085205078125, 1.5074462890625, 1.558807373046875, 1.61016845703125, 1.661529541015625, 1.712890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 5.0, 4.0, 8.0, 10.0, 12.0, 7.0, 14.0, 17.0, 17.0, 24.0, 22.0, 28.0, 38.0, 20.0, 29.0, 38.0, 44.0, 36.0, 39.0, 34.0, 43.0, 1071.0, 45.0, 39.0, 44.0, 29.0, 32.0, 35.0, 38.0, 32.0, 20.0, 24.0, 20.0, 16.0, 10.0, 17.0, 15.0, 10.0, 10.0, 7.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.78564453125, -7.5087890625, -7.23193359375, -6.955078125, -6.67822265625, -6.4013671875, -6.12451171875, -5.84765625, -5.57080078125, -5.2939453125, -5.01708984375, -4.740234375, -4.46337890625, -4.1865234375, -3.90966796875, -3.6328125, -3.35595703125, -3.0791015625, -2.80224609375, -2.525390625, -2.24853515625, -1.9716796875, -1.69482421875, -1.41796875, -1.14111328125, -0.8642578125, -0.58740234375, -0.310546875, -0.03369140625, 0.2431640625, 0.52001953125, 0.796875, 1.07373046875, 1.3505859375, 1.62744140625, 1.904296875, 2.18115234375, 2.4580078125, 2.73486328125, 3.01171875, 3.28857421875, 3.5654296875, 3.84228515625, 4.119140625, 4.39599609375, 4.6728515625, 4.94970703125, 5.2265625, 5.50341796875, 5.7802734375, 6.05712890625, 6.333984375, 6.61083984375, 6.8876953125, 7.16455078125, 7.44140625, 7.71826171875, 7.9951171875, 8.27197265625, 8.548828125, 8.82568359375, 9.1025390625, 9.37939453125, 9.65625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 12.0, 14.0, 26.0, 41.0, 51.0, 85.0, 171.0, 246.0, 389.0, 612.0, 932.0, 1436.0, 2379.0, 3807.0, 6178.0, 9881.0, 16273.0, 26850.0, 47361.0, 88540.0, 170944.0, 1310818.0, 187683.0, 96220.0, 51404.0, 29115.0, 17288.0, 10674.0, 6416.0, 4214.0, 2703.0, 1580.0, 1011.0, 645.0, 429.0, 241.0, 156.0, 91.0, 79.0, 35.0, 37.0, 22.0, 14.0, 13.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98193359375, -0.9517822265625, -0.921630859375, -0.8914794921875, -0.861328125, -0.8311767578125, -0.801025390625, -0.7708740234375, -0.74072265625, -0.7105712890625, -0.680419921875, -0.6502685546875, -0.6201171875, -0.5899658203125, -0.559814453125, -0.5296630859375, -0.49951171875, -0.4693603515625, -0.439208984375, -0.4090576171875, -0.37890625, -0.3487548828125, -0.318603515625, -0.2884521484375, -0.25830078125, -0.2281494140625, -0.197998046875, -0.1678466796875, -0.1376953125, -0.1075439453125, -0.077392578125, -0.0472412109375, -0.01708984375, 0.0130615234375, 0.043212890625, 0.0733642578125, 0.103515625, 0.1336669921875, 0.163818359375, 0.1939697265625, 0.22412109375, 0.2542724609375, 0.284423828125, 0.3145751953125, 0.3447265625, 0.3748779296875, 0.405029296875, 0.4351806640625, 0.46533203125, 0.4954833984375, 0.525634765625, 0.5557861328125, 0.5859375, 0.6160888671875, 0.646240234375, 0.6763916015625, 0.70654296875, 0.7366943359375, 0.766845703125, 0.7969970703125, 0.8271484375, 0.8572998046875, 0.887451171875, 0.9176025390625, 0.94775390625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 6.0, 17.0, 16.0, 14.0, 19.0, 30.0, 43.0, 57.0, 80.0, 139.0, 160.0, 131.0, 66.0, 49.0, 29.0, 24.0, 16.0, 14.0, 11.0, 16.0, 4.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05169677734375, -0.05014657974243164, -0.04859638214111328, -0.04704618453979492, -0.04549598693847656, -0.0439457893371582, -0.042395591735839844, -0.040845394134521484, -0.039295196533203125, -0.037744998931884766, -0.036194801330566406, -0.03464460372924805, -0.03309440612792969, -0.03154420852661133, -0.02999401092529297, -0.02844381332397461, -0.02689361572265625, -0.02534341812133789, -0.02379322052001953, -0.022243022918701172, -0.020692825317382812, -0.019142627716064453, -0.017592430114746094, -0.016042232513427734, -0.014492034912109375, -0.012941837310791016, -0.011391639709472656, -0.009841442108154297, -0.008291244506835938, -0.006741046905517578, -0.005190849304199219, -0.0036406517028808594, -0.0020904541015625, -0.0005402565002441406, 0.0010099411010742188, 0.002560138702392578, 0.0041103363037109375, 0.005660533905029297, 0.007210731506347656, 0.008760929107666016, 0.010311126708984375, 0.011861324310302734, 0.013411521911621094, 0.014961719512939453, 0.016511917114257812, 0.018062114715576172, 0.01961231231689453, 0.02116250991821289, 0.02271270751953125, 0.02426290512084961, 0.02581310272216797, 0.027363300323486328, 0.028913497924804688, 0.030463695526123047, 0.032013893127441406, 0.033564090728759766, 0.035114288330078125, 0.036664485931396484, 0.038214683532714844, 0.0397648811340332, 0.04131507873535156, 0.04286527633666992, 0.04441547393798828, 0.04596567153930664, 0.047515869140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 11.0, 18.0, 15.0, 33.0, 48.0, 61.0, 123.0, 227.0, 835.0, 11543.0, 984434.0, 48648.0, 1809.0, 313.0, 150.0, 84.0, 55.0, 30.0, 26.0, 21.0, 12.0, 8.0, 9.0, 7.0, 8.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0108642578125, -0.976806640625, -0.9427490234375, -0.90869140625, -0.8746337890625, -0.840576171875, -0.8065185546875, -0.7724609375, -0.7384033203125, -0.704345703125, -0.6702880859375, -0.63623046875, -0.6021728515625, -0.568115234375, -0.5340576171875, -0.5, -0.4659423828125, -0.431884765625, -0.3978271484375, -0.36376953125, -0.3297119140625, -0.295654296875, -0.2615966796875, -0.2275390625, -0.1934814453125, -0.159423828125, -0.1253662109375, -0.09130859375, -0.0572509765625, -0.023193359375, 0.0108642578125, 0.044921875, 0.0789794921875, 0.113037109375, 0.1470947265625, 0.18115234375, 0.2152099609375, 0.249267578125, 0.2833251953125, 0.3173828125, 0.3514404296875, 0.385498046875, 0.4195556640625, 0.45361328125, 0.4876708984375, 0.521728515625, 0.5557861328125, 0.58984375, 0.6239013671875, 0.657958984375, 0.6920166015625, 0.72607421875, 0.7601318359375, 0.794189453125, 0.8282470703125, 0.8623046875, 0.8963623046875, 0.930419921875, 0.9644775390625, 0.99853515625, 1.0325927734375, 1.066650390625, 1.1007080078125, 1.134765625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 13.0, 42.0, 96.0, 476.0, 221.0, 89.0, 39.0, 16.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42249006032943726, -0.4096030294895172, -0.39671602845191956, -0.3838289976119995, -0.37094199657440186, -0.3580549657344818, -0.34516793489456177, -0.3322809338569641, -0.31939390301704407, -0.306506872177124, -0.29361987113952637, -0.2807328402996063, -0.26784583926200867, -0.2549588084220886, -0.24207179248332977, -0.22918477654457092, -0.21629776060581207, -0.20341074466705322, -0.19052372872829437, -0.17763671278953552, -0.16474968194961548, -0.15186266601085663, -0.13897565007209778, -0.12608861923217773, -0.11320161074399948, -0.10031459480524063, -0.08742757141590118, -0.07454055547714233, -0.061653535813093185, -0.04876651614904404, -0.03587950021028519, -0.02299247682094574, -0.01010546088218689, 0.0027815578505396843, 0.015668576583266258, 0.028555594384670258, 0.041442614048719406, 0.054329633712768555, 0.0672166496515274, 0.08010367304086685, 0.0929906889796257, 0.10587770491838455, 0.118764728307724, 0.13165174424648285, 0.1445387601852417, 0.15742579102516174, 0.1703127920627594, 0.18319982290267944, 0.1960868388414383, 0.20897385478019714, 0.221860870718956, 0.23474788665771484, 0.2476349174976349, 0.26052194833755493, 0.2734089493751526, 0.28629598021507263, 0.2991829812526703, 0.31207001209259033, 0.324957013130188, 0.33784404397010803, 0.3507310450077057, 0.36361807584762573, 0.3765050768852234, 0.38939210772514343, 0.4022791385650635]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 5.0, 5.0, 6.0, 16.0, 7.0, 19.0, 15.0, 16.0, 24.0, 12.0, 27.0, 24.0, 30.0, 28.0, 31.0, 34.0, 44.0, 28.0, 38.0, 39.0, 37.0, 36.0, 45.0, 33.0, 36.0, 43.0, 34.0, 34.0, 43.0, 23.0, 20.0, 24.0, 21.0, 24.0, 11.0, 15.0, 8.0, 11.0, 12.0, 3.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.05724400281906128, -0.05544813722372055, -0.05365227162837982, -0.051856402307748795, -0.050060536712408066, -0.04826467111706734, -0.04646880179643631, -0.04467293620109558, -0.04287707060575485, -0.041081205010414124, -0.039285339415073395, -0.03748947009444237, -0.03569360449910164, -0.03389773890376091, -0.03210186958312988, -0.030306003987789154, -0.028510138392448425, -0.026714272797107697, -0.02491840533912182, -0.02312253788113594, -0.021326672285795212, -0.019530806690454483, -0.017734939232468605, -0.015939071774482727, -0.014143206179141998, -0.012347339652478695, -0.010551473125815392, -0.008755606599152088, -0.006959740072488785, -0.005163873545825481, -0.003368007019162178, -0.0015721404924988747, 0.0002237260341644287, 0.002019592560827732, 0.0038154590874910355, 0.005611325614154339, 0.007407192140817642, 0.009203058667480946, 0.010998925194144249, 0.012794791720807552, 0.014590658247470856, 0.016386523842811584, 0.018182391300797462, 0.01997825875878334, 0.02177412435412407, 0.023569989949464798, 0.025365857407450676, 0.027161724865436554, 0.028957590460777283, 0.03075345605611801, 0.03254932165145874, 0.03434519097208977, 0.036141056567430496, 0.037936922162771225, 0.03973279148340225, 0.04152865707874298, 0.04332452267408371, 0.04512038826942444, 0.04691625386476517, 0.048712123185396194, 0.05050798878073692, 0.05230385437607765, 0.05409972369670868, 0.05589558929204941, 0.05769145488739014]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 10.0, 4.0, 12.0, 10.0, 12.0, 21.0, 19.0, 28.0, 33.0, 37.0, 41.0, 38.0, 43.0, 45.0, 46.0, 38.0, 44.0, 54.0, 58.0, 41.0, 45.0, 41.0, 36.0, 30.0, 31.0, 33.0, 32.0, 15.0, 16.0, 13.0, 18.0, 10.0, 11.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.71875, -16.22802734375, -15.7373046875, -15.24658203125, -14.755859375, -14.26513671875, -13.7744140625, -13.28369140625, -12.79296875, -12.30224609375, -11.8115234375, -11.32080078125, -10.830078125, -10.33935546875, -9.8486328125, -9.35791015625, -8.8671875, -8.37646484375, -7.8857421875, -7.39501953125, -6.904296875, -6.41357421875, -5.9228515625, -5.43212890625, -4.94140625, -4.45068359375, -3.9599609375, -3.46923828125, -2.978515625, -2.48779296875, -1.9970703125, -1.50634765625, -1.015625, -0.52490234375, -0.0341796875, 0.45654296875, 0.947265625, 1.43798828125, 1.9287109375, 2.41943359375, 2.91015625, 3.40087890625, 3.8916015625, 4.38232421875, 4.873046875, 5.36376953125, 5.8544921875, 6.34521484375, 6.8359375, 7.32666015625, 7.8173828125, 8.30810546875, 8.798828125, 9.28955078125, 9.7802734375, 10.27099609375, 10.76171875, 11.25244140625, 11.7431640625, 12.23388671875, 12.724609375, 13.21533203125, 13.7060546875, 14.19677734375, 14.6875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 18.0, 20.0, 27.0, 41.0, 57.0, 77.0, 138.0, 199.0, 312.0, 524.0, 797.0, 1228.0, 1913.0, 3359.0, 7987.0, 29222.0, 172196.0, 646635.0, 142970.0, 25304.0, 7222.0, 3160.0, 1811.0, 1157.0, 749.0, 484.0, 314.0, 188.0, 147.0, 84.0, 62.0, 32.0, 35.0, 22.0, 16.0, 8.0, 7.0, 1.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.1304931640625, -10.776611328125, -10.4227294921875, -10.06884765625, -9.7149658203125, -9.361083984375, -9.0072021484375, -8.6533203125, -8.2994384765625, -7.945556640625, -7.5916748046875, -7.23779296875, -6.8839111328125, -6.530029296875, -6.1761474609375, -5.822265625, -5.4683837890625, -5.114501953125, -4.7606201171875, -4.40673828125, -4.0528564453125, -3.698974609375, -3.3450927734375, -2.9912109375, -2.6373291015625, -2.283447265625, -1.9295654296875, -1.57568359375, -1.2218017578125, -0.867919921875, -0.5140380859375, -0.16015625, 0.1937255859375, 0.547607421875, 0.9014892578125, 1.25537109375, 1.6092529296875, 1.963134765625, 2.3170166015625, 2.6708984375, 3.0247802734375, 3.378662109375, 3.7325439453125, 4.08642578125, 4.4403076171875, 4.794189453125, 5.1480712890625, 5.501953125, 5.8558349609375, 6.209716796875, 6.5635986328125, 6.91748046875, 7.2713623046875, 7.625244140625, 7.9791259765625, 8.3330078125, 8.6868896484375, 9.040771484375, 9.3946533203125, 9.74853515625, 10.1024169921875, 10.456298828125, 10.8101806640625, 11.1640625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 4.0, 9.0, 7.0, 13.0, 9.0, 12.0, 21.0, 18.0, 28.0, 22.0, 40.0, 30.0, 38.0, 37.0, 33.0, 45.0, 59.0, 83.0, 1756.0, 268.0, 75.0, 43.0, 39.0, 40.0, 49.0, 38.0, 29.0, 27.0, 25.0, 20.0, 20.0, 19.0, 12.0, 16.0, 11.0, 13.0, 8.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.375, -33.1806640625, -31.986328125, -30.7919921875, -29.59765625, -28.4033203125, -27.208984375, -26.0146484375, -24.8203125, -23.6259765625, -22.431640625, -21.2373046875, -20.04296875, -18.8486328125, -17.654296875, -16.4599609375, -15.265625, -14.0712890625, -12.876953125, -11.6826171875, -10.48828125, -9.2939453125, -8.099609375, -6.9052734375, -5.7109375, -4.5166015625, -3.322265625, -2.1279296875, -0.93359375, 0.2607421875, 1.455078125, 2.6494140625, 3.84375, 5.0380859375, 6.232421875, 7.4267578125, 8.62109375, 9.8154296875, 11.009765625, 12.2041015625, 13.3984375, 14.5927734375, 15.787109375, 16.9814453125, 18.17578125, 19.3701171875, 20.564453125, 21.7587890625, 22.953125, 24.1474609375, 25.341796875, 26.5361328125, 27.73046875, 28.9248046875, 30.119140625, 31.3134765625, 32.5078125, 33.7021484375, 34.896484375, 36.0908203125, 37.28515625, 38.4794921875, 39.673828125, 40.8681640625, 42.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 12.0, 19.0, 22.0, 27.0, 34.0, 42.0, 60.0, 79.0, 87.0, 124.0, 157.0, 223.0, 327.0, 864.0, 9252.0, 3121293.0, 10928.0, 885.0, 320.0, 218.0, 149.0, 140.0, 87.0, 82.0, 57.0, 48.0, 36.0, 22.0, 21.0, 14.0, 10.0, 15.0, 9.0, 11.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.3125, -95.3798828125, -92.447265625, -89.5146484375, -86.58203125, -83.6494140625, -80.716796875, -77.7841796875, -74.8515625, -71.9189453125, -68.986328125, -66.0537109375, -63.12109375, -60.1884765625, -57.255859375, -54.3232421875, -51.390625, -48.4580078125, -45.525390625, -42.5927734375, -39.66015625, -36.7275390625, -33.794921875, -30.8623046875, -27.9296875, -24.9970703125, -22.064453125, -19.1318359375, -16.19921875, -13.2666015625, -10.333984375, -7.4013671875, -4.46875, -1.5361328125, 1.396484375, 4.3291015625, 7.26171875, 10.1943359375, 13.126953125, 16.0595703125, 18.9921875, 21.9248046875, 24.857421875, 27.7900390625, 30.72265625, 33.6552734375, 36.587890625, 39.5205078125, 42.453125, 45.3857421875, 48.318359375, 51.2509765625, 54.18359375, 57.1162109375, 60.048828125, 62.9814453125, 65.9140625, 68.8466796875, 71.779296875, 74.7119140625, 77.64453125, 80.5771484375, 83.509765625, 86.4423828125, 89.375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 23.0, 134.0, 426.0, 329.0, 89.0, 12.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34568214416504, -17.37533950805664, -14.404998779296875, -11.434657096862793, -8.464315414428711, -5.493973731994629, -2.523632049560547, 0.44671058654785156, 3.417051315307617, 6.387392997741699, 9.357734680175781, 12.328076362609863, 15.298418045043945, 18.268760681152344, 21.23910140991211, 24.209444046020508, 27.179784774780273, 30.150127410888672, 33.12046813964844, 36.0908088684082, 39.06114959716797, 42.031494140625, 45.001834869384766, 47.97217559814453, 50.94252014160156, 53.91286087036133, 56.883201599121094, 59.853546142578125, 62.82388687133789, 65.79422760009766, 68.76457214355469, 71.73490905761719, 74.70524597167969, 77.67559051513672, 80.64592742919922, 83.61627197265625, 86.58660888671875, 89.55695343017578, 92.52729797363281, 95.49763488769531, 98.46797943115234, 101.43832397460938, 104.40866088867188, 107.3790054321289, 110.34934997558594, 113.31968688964844, 116.29003143310547, 119.2603759765625, 122.230712890625, 125.20105743408203, 128.17140197753906, 131.14173889160156, 134.11207580566406, 137.08242797851562, 140.05276489257812, 143.02310180664062, 145.99343872070312, 148.96377563476562, 151.9341278076172, 154.9044647216797, 157.8748016357422, 160.84515380859375, 163.81549072265625, 166.78582763671875, 169.7561798095703]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 5.0, 11.0, 7.0, 6.0, 14.0, 15.0, 16.0, 17.0, 35.0, 20.0, 38.0, 22.0, 38.0, 32.0, 42.0, 41.0, 34.0, 50.0, 49.0, 37.0, 56.0, 33.0, 36.0, 44.0, 29.0, 28.0, 35.0, 30.0, 31.0, 26.0, 22.0, 21.0, 12.0, 11.0, 8.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-108.66925811767578, -105.16291809082031, -101.65657043457031, -98.15023040771484, -94.64389038085938, -91.13754272460938, -87.6312026977539, -84.12486267089844, -80.61851501464844, -77.11217498779297, -73.60582733154297, -70.0994873046875, -66.59314727783203, -63.0868034362793, -59.58045959472656, -56.074119567871094, -52.567779541015625, -49.06143569946289, -45.55509567260742, -42.04875183105469, -38.54241180419922, -35.036067962646484, -31.52972412109375, -28.02338218688965, -24.517040252685547, -21.010698318481445, -17.504356384277344, -13.99801254272461, -10.491670608520508, -6.985328674316406, -3.478984832763672, 0.027357101440429688, 3.53369140625, 7.04003381729126, 10.54637622833252, 14.052719116210938, 17.55906105041504, 21.06540298461914, 24.571746826171875, 28.078088760375977, 31.584430694580078, 35.09077453613281, 38.59711456298828, 42.103458404541016, 45.60980224609375, 49.11614227294922, 52.62248611450195, 56.12882995605469, 59.635169982910156, 63.14151382446289, 66.64785766601562, 70.1541976928711, 73.66053771972656, 77.16688537597656, 80.67322540283203, 84.1795654296875, 87.6859130859375, 91.19225311279297, 94.69860076904297, 98.20494079589844, 101.7112808227539, 105.21762084960938, 108.72396850585938, 112.23030853271484, 115.73664855957031]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 8.0, 4.0, 11.0, 11.0, 12.0, 19.0, 18.0, 30.0, 21.0, 40.0, 36.0, 33.0, 49.0, 45.0, 44.0, 45.0, 45.0, 49.0, 58.0, 39.0, 41.0, 44.0, 41.0, 33.0, 39.0, 28.0, 28.0, 20.0, 17.0, 14.0, 10.0, 18.0, 7.0, 14.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.03125, -16.536376953125, -16.04150390625, -15.546630859375, -15.0517578125, -14.556884765625, -14.06201171875, -13.567138671875, -13.072265625, -12.577392578125, -12.08251953125, -11.587646484375, -11.0927734375, -10.597900390625, -10.10302734375, -9.608154296875, -9.11328125, -8.618408203125, -8.12353515625, -7.628662109375, -7.1337890625, -6.638916015625, -6.14404296875, -5.649169921875, -5.154296875, -4.659423828125, -4.16455078125, -3.669677734375, -3.1748046875, -2.679931640625, -2.18505859375, -1.690185546875, -1.1953125, -0.700439453125, -0.20556640625, 0.289306640625, 0.7841796875, 1.279052734375, 1.77392578125, 2.268798828125, 2.763671875, 3.258544921875, 3.75341796875, 4.248291015625, 4.7431640625, 5.238037109375, 5.73291015625, 6.227783203125, 6.72265625, 7.217529296875, 7.71240234375, 8.207275390625, 8.7021484375, 9.197021484375, 9.69189453125, 10.186767578125, 10.681640625, 11.176513671875, 11.67138671875, 12.166259765625, 12.6611328125, 13.156005859375, 13.65087890625, 14.145751953125, 14.640625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 11.0, 20.0, 23.0, 26.0, 32.0, 55.0, 74.0, 92.0, 134.0, 243.0, 332.0, 554.0, 1051.0, 2062.0, 4452.0, 10937.0, 111921.0, 3753620.0, 282946.0, 14641.0, 5390.0, 2503.0, 1255.0, 683.0, 411.0, 256.0, 166.0, 123.0, 69.0, 52.0, 45.0, 32.0, 24.0, 16.0, 8.0, 13.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.375, -62.56689453125, -60.7587890625, -58.95068359375, -57.142578125, -55.33447265625, -53.5263671875, -51.71826171875, -49.91015625, -48.10205078125, -46.2939453125, -44.48583984375, -42.677734375, -40.86962890625, -39.0615234375, -37.25341796875, -35.4453125, -33.63720703125, -31.8291015625, -30.02099609375, -28.212890625, -26.40478515625, -24.5966796875, -22.78857421875, -20.98046875, -19.17236328125, -17.3642578125, -15.55615234375, -13.748046875, -11.93994140625, -10.1318359375, -8.32373046875, -6.515625, -4.70751953125, -2.8994140625, -1.09130859375, 0.716796875, 2.52490234375, 4.3330078125, 6.14111328125, 7.94921875, 9.75732421875, 11.5654296875, 13.37353515625, 15.181640625, 16.98974609375, 18.7978515625, 20.60595703125, 22.4140625, 24.22216796875, 26.0302734375, 27.83837890625, 29.646484375, 31.45458984375, 33.2626953125, 35.07080078125, 36.87890625, 38.68701171875, 40.4951171875, 42.30322265625, 44.111328125, 45.91943359375, 47.7275390625, 49.53564453125, 51.34375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 7.0, 7.0, 2.0, 15.0, 14.0, 15.0, 15.0, 21.0, 27.0, 51.0, 92.0, 157.0, 367.0, 581.0, 893.0, 733.0, 465.0, 243.0, 102.0, 70.0, 39.0, 42.0, 20.0, 12.0, 14.0, 6.0, 9.0, 3.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.267333984375, -27.31591796875, -26.364501953125, -25.4130859375, -24.461669921875, -23.51025390625, -22.558837890625, -21.607421875, -20.656005859375, -19.70458984375, -18.753173828125, -17.8017578125, -16.850341796875, -15.89892578125, -14.947509765625, -13.99609375, -13.044677734375, -12.09326171875, -11.141845703125, -10.1904296875, -9.239013671875, -8.28759765625, -7.336181640625, -6.384765625, -5.433349609375, -4.48193359375, -3.530517578125, -2.5791015625, -1.627685546875, -0.67626953125, 0.275146484375, 1.2265625, 2.177978515625, 3.12939453125, 4.080810546875, 5.0322265625, 5.983642578125, 6.93505859375, 7.886474609375, 8.837890625, 9.789306640625, 10.74072265625, 11.692138671875, 12.6435546875, 13.594970703125, 14.54638671875, 15.497802734375, 16.44921875, 17.400634765625, 18.35205078125, 19.303466796875, 20.2548828125, 21.206298828125, 22.15771484375, 23.109130859375, 24.060546875, 25.011962890625, 25.96337890625, 26.914794921875, 27.8662109375, 28.817626953125, 29.76904296875, 30.720458984375, 31.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 6.0, 6.0, 1.0, 9.0, 9.0, 14.0, 8.0, 21.0, 27.0, 44.0, 86.0, 143.0, 251.0, 543.0, 1259.0, 2961.0, 8229.0, 26313.0, 285671.0, 3774374.0, 70076.0, 15186.0, 5221.0, 2041.0, 837.0, 415.0, 198.0, 102.0, 62.0, 44.0, 28.0, 22.0, 15.0, 14.0, 10.0, 2.0, 4.0, 8.0, 8.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.625, -79.1728515625, -76.720703125, -74.2685546875, -71.81640625, -69.3642578125, -66.912109375, -64.4599609375, -62.0078125, -59.5556640625, -57.103515625, -54.6513671875, -52.19921875, -49.7470703125, -47.294921875, -44.8427734375, -42.390625, -39.9384765625, -37.486328125, -35.0341796875, -32.58203125, -30.1298828125, -27.677734375, -25.2255859375, -22.7734375, -20.3212890625, -17.869140625, -15.4169921875, -12.96484375, -10.5126953125, -8.060546875, -5.6083984375, -3.15625, -0.7041015625, 1.748046875, 4.2001953125, 6.65234375, 9.1044921875, 11.556640625, 14.0087890625, 16.4609375, 18.9130859375, 21.365234375, 23.8173828125, 26.26953125, 28.7216796875, 31.173828125, 33.6259765625, 36.078125, 38.5302734375, 40.982421875, 43.4345703125, 45.88671875, 48.3388671875, 50.791015625, 53.2431640625, 55.6953125, 58.1474609375, 60.599609375, 63.0517578125, 65.50390625, 67.9560546875, 70.408203125, 72.8603515625, 75.3125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 21.0, 36.0, 60.0, 147.0, 274.0, 238.0, 100.0, 46.0, 30.0, 19.0, 11.0, 9.0, 3.0, 1.0, 2.0], "bins": [-413.81341552734375, -406.13128662109375, -398.44915771484375, -390.76702880859375, -383.08489990234375, -375.40277099609375, -367.72064208984375, -360.03851318359375, -352.35638427734375, -344.67425537109375, -336.99212646484375, -329.30999755859375, -321.62786865234375, -313.94573974609375, -306.26361083984375, -298.58148193359375, -290.8993835449219, -283.2172546386719, -275.5351257324219, -267.8529968261719, -260.1708679199219, -252.48873901367188, -244.80661010742188, -237.12449645996094, -229.44235229492188, -221.76022338867188, -214.07809448242188, -206.39596557617188, -198.71383666992188, -191.03170776367188, -183.34957885742188, -175.66746520996094, -167.98533630371094, -160.30320739746094, -152.62107849121094, -144.93894958496094, -137.25682067871094, -129.57470703125, -121.89257049560547, -114.21044921875, -106.5283203125, -98.84619140625, -91.1640625, -83.48193359375, -75.79981231689453, -68.11768341064453, -60.43555450439453, -52.7534294128418, -45.07129669189453, -37.38916778564453, -29.707042694091797, -22.024913787841797, -14.34278678894043, -6.6606597900390625, 1.0214691162109375, 8.703594207763672, 16.385723114013672, 24.06785011291504, 31.749977111816406, 39.432106018066406, 47.114234924316406, 54.79636001586914, 62.47848892211914, 70.16061401367188, 77.84274291992188]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 13.0, 7.0, 7.0, 11.0, 6.0, 6.0, 19.0, 19.0, 21.0, 28.0, 23.0, 30.0, 33.0, 37.0, 39.0, 41.0, 40.0, 47.0, 34.0, 43.0, 36.0, 38.0, 30.0, 34.0, 31.0, 34.0, 29.0, 39.0, 26.0, 21.0, 20.0, 19.0, 25.0, 17.0, 22.0, 10.0, 10.0, 7.0, 5.0, 11.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-72.63909912109375, -70.26516723632812, -67.8912353515625, -65.51730346679688, -63.143367767333984, -60.76943588256836, -58.39550018310547, -56.021568298339844, -53.64763641357422, -51.273704528808594, -48.89977264404297, -46.52583694458008, -44.15190505981445, -41.77797317504883, -39.40403747558594, -37.03010559082031, -34.65617370605469, -32.28224182128906, -29.908308029174805, -27.534374237060547, -25.160442352294922, -22.786510467529297, -20.41257667541504, -18.03864288330078, -15.664710998535156, -13.290778160095215, -10.916845321655273, -8.542912483215332, -6.168979644775391, -3.795046806335449, -1.4211139678955078, 0.95281982421875, 3.326751708984375, 5.700684547424316, 8.074617385864258, 10.4485502243042, 12.82248306274414, 15.196415901184082, 17.570348739624023, 19.94428253173828, 22.318214416503906, 24.69214630126953, 27.06608009338379, 29.440013885498047, 31.813945770263672, 34.1878776550293, 36.56181335449219, 38.93574523925781, 41.30967712402344, 43.68360900878906, 46.05754089355469, 48.43147659301758, 50.8054084777832, 53.17934036254883, 55.55327606201172, 57.927207946777344, 60.30113983154297, 62.675071716308594, 65.04900360107422, 67.42293548583984, 69.796875, 72.17080688476562, 74.54473876953125, 76.91867065429688, 79.2926025390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 6.0, 5.0, 8.0, 12.0, 7.0, 15.0, 21.0, 28.0, 32.0, 33.0, 33.0, 32.0, 36.0, 48.0, 38.0, 48.0, 46.0, 41.0, 41.0, 47.0, 39.0, 52.0, 45.0, 46.0, 29.0, 28.0, 35.0, 22.0, 19.0, 22.0, 16.0, 22.0, 15.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.776123046875, -16.28662109375, -15.797119140625, -15.3076171875, -14.818115234375, -14.32861328125, -13.839111328125, -13.349609375, -12.860107421875, -12.37060546875, -11.881103515625, -11.3916015625, -10.902099609375, -10.41259765625, -9.923095703125, -9.43359375, -8.944091796875, -8.45458984375, -7.965087890625, -7.4755859375, -6.986083984375, -6.49658203125, -6.007080078125, -5.517578125, -5.028076171875, -4.53857421875, -4.049072265625, -3.5595703125, -3.070068359375, -2.58056640625, -2.091064453125, -1.6015625, -1.112060546875, -0.62255859375, -0.133056640625, 0.3564453125, 0.845947265625, 1.33544921875, 1.824951171875, 2.314453125, 2.803955078125, 3.29345703125, 3.782958984375, 4.2724609375, 4.761962890625, 5.25146484375, 5.740966796875, 6.23046875, 6.719970703125, 7.20947265625, 7.698974609375, 8.1884765625, 8.677978515625, 9.16748046875, 9.656982421875, 10.146484375, 10.635986328125, 11.12548828125, 11.614990234375, 12.1044921875, 12.593994140625, 13.08349609375, 13.572998046875, 14.0625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 11.0, 15.0, 29.0, 20.0, 34.0, 55.0, 84.0, 115.0, 212.0, 363.0, 599.0, 1031.0, 1705.0, 2989.0, 5123.0, 8803.0, 15294.0, 26289.0, 46211.0, 85184.0, 165906.0, 268557.0, 194419.0, 99739.0, 53834.0, 30074.0, 17503.0, 10105.0, 5849.0, 3417.0, 2015.0, 1198.0, 673.0, 424.0, 255.0, 162.0, 90.0, 57.0, 39.0, 19.0, 16.0, 11.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5732421875, -1.518280029296875, -1.46331787109375, -1.408355712890625, -1.3533935546875, -1.298431396484375, -1.24346923828125, -1.188507080078125, -1.133544921875, -1.078582763671875, -1.02362060546875, -0.968658447265625, -0.9136962890625, -0.858734130859375, -0.80377197265625, -0.748809814453125, -0.69384765625, -0.638885498046875, -0.58392333984375, -0.528961181640625, -0.4739990234375, -0.419036865234375, -0.36407470703125, -0.309112548828125, -0.254150390625, -0.199188232421875, -0.14422607421875, -0.089263916015625, -0.0343017578125, 0.020660400390625, 0.07562255859375, 0.130584716796875, 0.185546875, 0.240509033203125, 0.29547119140625, 0.350433349609375, 0.4053955078125, 0.460357666015625, 0.51531982421875, 0.570281982421875, 0.625244140625, 0.680206298828125, 0.73516845703125, 0.790130615234375, 0.8450927734375, 0.900054931640625, 0.95501708984375, 1.009979248046875, 1.06494140625, 1.119903564453125, 1.17486572265625, 1.229827880859375, 1.2847900390625, 1.339752197265625, 1.39471435546875, 1.449676513671875, 1.504638671875, 1.559600830078125, 1.61456298828125, 1.669525146484375, 1.7244873046875, 1.779449462890625, 1.83441162109375, 1.889373779296875, 1.9443359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 3.0, 7.0, 11.0, 4.0, 8.0, 9.0, 11.0, 13.0, 23.0, 17.0, 20.0, 23.0, 34.0, 43.0, 30.0, 26.0, 30.0, 32.0, 28.0, 42.0, 41.0, 1056.0, 36.0, 32.0, 30.0, 36.0, 35.0, 26.0, 40.0, 22.0, 32.0, 23.0, 23.0, 29.0, 23.0, 12.0, 22.0, 18.0, 13.0, 7.0, 10.0, 6.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0], "bins": [-8.75, -8.50531005859375, -8.2606201171875, -8.01593017578125, -7.771240234375, -7.52655029296875, -7.2818603515625, -7.03717041015625, -6.79248046875, -6.54779052734375, -6.3031005859375, -6.05841064453125, -5.813720703125, -5.56903076171875, -5.3243408203125, -5.07965087890625, -4.8349609375, -4.59027099609375, -4.3455810546875, -4.10089111328125, -3.856201171875, -3.61151123046875, -3.3668212890625, -3.12213134765625, -2.87744140625, -2.63275146484375, -2.3880615234375, -2.14337158203125, -1.898681640625, -1.65399169921875, -1.4093017578125, -1.16461181640625, -0.919921875, -0.67523193359375, -0.4305419921875, -0.18585205078125, 0.058837890625, 0.30352783203125, 0.5482177734375, 0.79290771484375, 1.03759765625, 1.28228759765625, 1.5269775390625, 1.77166748046875, 2.016357421875, 2.26104736328125, 2.5057373046875, 2.75042724609375, 2.9951171875, 3.23980712890625, 3.4844970703125, 3.72918701171875, 3.973876953125, 4.21856689453125, 4.4632568359375, 4.70794677734375, 4.95263671875, 5.19732666015625, 5.4420166015625, 5.68670654296875, 5.931396484375, 6.17608642578125, 6.4207763671875, 6.66546630859375, 6.91015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 13.0, 17.0, 29.0, 32.0, 67.0, 100.0, 148.0, 239.0, 378.0, 567.0, 851.0, 1315.0, 1965.0, 3017.0, 4505.0, 6672.0, 10281.0, 15328.0, 24063.0, 38290.0, 63832.0, 108523.0, 182786.0, 1256414.0, 148022.0, 87460.0, 51897.0, 31899.0, 20022.0, 12958.0, 8563.0, 5598.0, 3839.0, 2485.0, 1710.0, 1146.0, 721.0, 464.0, 322.0, 221.0, 118.0, 81.0, 64.0, 39.0, 20.0, 15.0, 8.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.83154296875, -0.8065719604492188, -0.7816009521484375, -0.7566299438476562, -0.731658935546875, -0.7066879272460938, -0.6817169189453125, -0.6567459106445312, -0.63177490234375, -0.6068038940429688, -0.5818328857421875, -0.5568618774414062, -0.531890869140625, -0.5069198608398438, -0.4819488525390625, -0.45697784423828125, -0.4320068359375, -0.40703582763671875, -0.3820648193359375, -0.35709381103515625, -0.332122802734375, -0.30715179443359375, -0.2821807861328125, -0.25720977783203125, -0.23223876953125, -0.20726776123046875, -0.1822967529296875, -0.15732574462890625, -0.132354736328125, -0.10738372802734375, -0.0824127197265625, -0.05744171142578125, -0.032470703125, -0.00749969482421875, 0.0174713134765625, 0.04244232177734375, 0.067413330078125, 0.09238433837890625, 0.1173553466796875, 0.14232635498046875, 0.16729736328125, 0.19226837158203125, 0.2172393798828125, 0.24221038818359375, 0.267181396484375, 0.29215240478515625, 0.3171234130859375, 0.34209442138671875, 0.3670654296875, 0.39203643798828125, 0.4170074462890625, 0.44197845458984375, 0.466949462890625, 0.49192047119140625, 0.5168914794921875, 0.5418624877929688, 0.56683349609375, 0.5918045043945312, 0.6167755126953125, 0.6417465209960938, 0.666717529296875, 0.6916885375976562, 0.7166595458984375, 0.7416305541992188, 0.7666015625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 1.0, 6.0, 10.0, 14.0, 9.0, 22.0, 14.0, 29.0, 31.0, 46.0, 53.0, 86.0, 135.0, 152.0, 117.0, 67.0, 41.0, 38.0, 32.0, 19.0, 14.0, 10.0, 9.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0419921875, -0.04059648513793945, -0.039200782775878906, -0.03780508041381836, -0.03640937805175781, -0.035013675689697266, -0.03361797332763672, -0.03222227096557617, -0.030826568603515625, -0.029430866241455078, -0.02803516387939453, -0.026639461517333984, -0.025243759155273438, -0.02384805679321289, -0.022452354431152344, -0.021056652069091797, -0.01966094970703125, -0.018265247344970703, -0.016869544982910156, -0.01547384262084961, -0.014078140258789062, -0.012682437896728516, -0.011286735534667969, -0.009891033172607422, -0.008495330810546875, -0.007099628448486328, -0.005703926086425781, -0.004308223724365234, -0.0029125213623046875, -0.0015168190002441406, -0.00012111663818359375, 0.0012745857238769531, 0.0026702880859375, 0.004065990447998047, 0.005461692810058594, 0.006857395172119141, 0.008253097534179688, 0.009648799896240234, 0.011044502258300781, 0.012440204620361328, 0.013835906982421875, 0.015231609344482422, 0.01662731170654297, 0.018023014068603516, 0.019418716430664062, 0.02081441879272461, 0.022210121154785156, 0.023605823516845703, 0.02500152587890625, 0.026397228240966797, 0.027792930603027344, 0.02918863296508789, 0.030584335327148438, 0.031980037689208984, 0.03337574005126953, 0.03477144241333008, 0.036167144775390625, 0.03756284713745117, 0.03895854949951172, 0.040354251861572266, 0.04174995422363281, 0.04314565658569336, 0.044541358947753906, 0.04593706130981445, 0.047332763671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 10.0, 8.0, 7.0, 7.0, 17.0, 18.0, 20.0, 19.0, 47.0, 67.0, 117.0, 284.0, 1967.0, 785502.0, 258488.0, 1393.0, 280.0, 103.0, 59.0, 39.0, 26.0, 24.0, 13.0, 15.0, 11.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.0842742919921875, -1.051361083984375, -1.0184478759765625, -0.98553466796875, -0.9526214599609375, -0.919708251953125, -0.8867950439453125, -0.8538818359375, -0.8209686279296875, -0.788055419921875, -0.7551422119140625, -0.72222900390625, -0.6893157958984375, -0.656402587890625, -0.6234893798828125, -0.590576171875, -0.5576629638671875, -0.524749755859375, -0.4918365478515625, -0.45892333984375, -0.4260101318359375, -0.393096923828125, -0.3601837158203125, -0.3272705078125, -0.2943572998046875, -0.261444091796875, -0.2285308837890625, -0.19561767578125, -0.1627044677734375, -0.129791259765625, -0.0968780517578125, -0.06396484375, -0.0310516357421875, 0.001861572265625, 0.0347747802734375, 0.06768798828125, 0.1006011962890625, 0.133514404296875, 0.1664276123046875, 0.1993408203125, 0.2322540283203125, 0.265167236328125, 0.2980804443359375, 0.33099365234375, 0.3639068603515625, 0.396820068359375, 0.4297332763671875, 0.462646484375, 0.4955596923828125, 0.528472900390625, 0.5613861083984375, 0.59429931640625, 0.6272125244140625, 0.660125732421875, 0.6930389404296875, 0.7259521484375, 0.7588653564453125, 0.791778564453125, 0.8246917724609375, 0.85760498046875, 0.8905181884765625, 0.923431396484375, 0.9563446044921875, 0.9892578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 13.0, 41.0, 70.0, 196.0, 383.0, 168.0, 63.0, 25.0, 23.0, 8.0, 2.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07136602699756622, -0.0644640251994133, -0.05756201595067978, -0.050660014152526855, -0.04375800862908363, -0.03685600310564041, -0.029954001307487488, -0.023051995784044266, -0.016149990260601044, -0.009247985668480396, -0.002345981076359749, 0.004556022584438324, 0.011458028107881546, 0.018360033631324768, 0.02526203542947769, 0.032164040952920914, 0.039066046476364136, 0.04596805199980736, 0.05287005752325058, 0.0597720593214035, 0.06667406857013702, 0.07357607036828995, 0.08047807216644287, 0.08738008141517639, 0.09428208321332932, 0.10118408501148224, 0.10808609426021576, 0.11498809605836868, 0.1218900978565216, 0.12879210710525513, 0.13569411635398865, 0.14259611070156097, 0.1494981050491333, 0.15640011429786682, 0.16330210864543915, 0.17020411789417267, 0.1771061271429062, 0.18400812149047852, 0.19091013073921204, 0.19781213998794556, 0.20471414923667908, 0.2116161584854126, 0.21851815283298492, 0.22542016208171844, 0.23232217133045197, 0.2392241656780243, 0.2461261749267578, 0.25302818417549133, 0.25993019342422485, 0.2668322026729584, 0.2737342119216919, 0.280636191368103, 0.28753820061683655, 0.29444020986557007, 0.3013422191143036, 0.3082442283630371, 0.31514620780944824, 0.32204821705818176, 0.3289502263069153, 0.3358522057533264, 0.34275421500205994, 0.34965622425079346, 0.356558233499527, 0.3634602427482605, 0.370362251996994]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 25.0, 16.0, 23.0, 33.0, 19.0, 27.0, 23.0, 26.0, 50.0, 36.0, 29.0, 52.0, 37.0, 52.0, 32.0, 48.0, 49.0, 34.0, 46.0, 47.0, 31.0, 39.0, 35.0, 23.0, 26.0, 29.0, 26.0, 11.0, 7.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06251299381256104, -0.060667648911476135, -0.05882230028510094, -0.05697695165872574, -0.05513160675764084, -0.05328626185655594, -0.05144091323018074, -0.04959556460380554, -0.04775021970272064, -0.04590487480163574, -0.044059526175260544, -0.042214177548885345, -0.040368832647800446, -0.038523487746715546, -0.03667813912034035, -0.03483279049396515, -0.03298744559288025, -0.0311420988291502, -0.02929675206542015, -0.0274514053016901, -0.025606058537960052, -0.023760711774230003, -0.021915365010499954, -0.020070018246769905, -0.018224671483039856, -0.016379324719309807, -0.014533977955579758, -0.012688631191849709, -0.01084328442811966, -0.00899793766438961, -0.007152590900659561, -0.005307244136929512, -0.003461897373199463, -0.0016165506094694138, 0.00022879615426063538, 0.0020741429179906845, 0.003919489681720734, 0.005764836445450783, 0.007610183209180832, 0.009455529972910881, 0.01130087673664093, 0.01314622350037098, 0.014991570264101028, 0.016836917027831078, 0.018682263791561127, 0.020527610555291176, 0.022372957319021225, 0.024218304082751274, 0.026063650846481323, 0.027908997610211372, 0.02975434437394142, 0.03159969300031662, 0.03344503790140152, 0.03529038280248642, 0.03713573142886162, 0.038981080055236816, 0.040826424956321716, 0.042671769857406616, 0.044517118483781815, 0.04636246711015701, 0.04820781201124191, 0.05005315691232681, 0.05189850553870201, 0.05374385416507721, 0.05558919906616211]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 6.0, 5.0, 8.0, 12.0, 7.0, 16.0, 19.0, 29.0, 32.0, 33.0, 33.0, 32.0, 36.0, 48.0, 38.0, 48.0, 46.0, 40.0, 42.0, 47.0, 39.0, 53.0, 44.0, 46.0, 29.0, 28.0, 34.0, 23.0, 20.0, 21.0, 16.0, 22.0, 15.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.776123046875, -16.28662109375, -15.797119140625, -15.3076171875, -14.818115234375, -14.32861328125, -13.839111328125, -13.349609375, -12.860107421875, -12.37060546875, -11.881103515625, -11.3916015625, -10.902099609375, -10.41259765625, -9.923095703125, -9.43359375, -8.944091796875, -8.45458984375, -7.965087890625, -7.4755859375, -6.986083984375, -6.49658203125, -6.007080078125, -5.517578125, -5.028076171875, -4.53857421875, -4.049072265625, -3.5595703125, -3.070068359375, -2.58056640625, -2.091064453125, -1.6015625, -1.112060546875, -0.62255859375, -0.133056640625, 0.3564453125, 0.845947265625, 1.33544921875, 1.824951171875, 2.314453125, 2.803955078125, 3.29345703125, 3.782958984375, 4.2724609375, 4.761962890625, 5.25146484375, 5.740966796875, 6.23046875, 6.719970703125, 7.20947265625, 7.698974609375, 8.1884765625, 8.677978515625, 9.16748046875, 9.656982421875, 10.146484375, 10.635986328125, 11.12548828125, 11.614990234375, 12.1044921875, 12.593994140625, 13.08349609375, 13.572998046875, 14.0625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 8.0, 6.0, 10.0, 14.0, 11.0, 18.0, 32.0, 47.0, 65.0, 78.0, 124.0, 159.0, 309.0, 567.0, 1421.0, 4979.0, 24291.0, 222755.0, 709317.0, 68524.0, 11145.0, 2647.0, 915.0, 422.0, 212.0, 145.0, 100.0, 52.0, 40.0, 33.0, 25.0, 27.0, 18.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-16.078125, -15.6221923828125, -15.166259765625, -14.7103271484375, -14.25439453125, -13.7984619140625, -13.342529296875, -12.8865966796875, -12.4306640625, -11.9747314453125, -11.518798828125, -11.0628662109375, -10.60693359375, -10.1510009765625, -9.695068359375, -9.2391357421875, -8.783203125, -8.3272705078125, -7.871337890625, -7.4154052734375, -6.95947265625, -6.5035400390625, -6.047607421875, -5.5916748046875, -5.1357421875, -4.6798095703125, -4.223876953125, -3.7679443359375, -3.31201171875, -2.8560791015625, -2.400146484375, -1.9442138671875, -1.48828125, -1.0323486328125, -0.576416015625, -0.1204833984375, 0.33544921875, 0.7913818359375, 1.247314453125, 1.7032470703125, 2.1591796875, 2.6151123046875, 3.071044921875, 3.5269775390625, 3.98291015625, 4.4388427734375, 4.894775390625, 5.3507080078125, 5.806640625, 6.2625732421875, 6.718505859375, 7.1744384765625, 7.63037109375, 8.0863037109375, 8.542236328125, 8.9981689453125, 9.4541015625, 9.9100341796875, 10.365966796875, 10.8218994140625, 11.27783203125, 11.7337646484375, 12.189697265625, 12.6456298828125, 13.1015625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 3.0, 12.0, 12.0, 16.0, 12.0, 10.0, 18.0, 30.0, 23.0, 29.0, 26.0, 31.0, 27.0, 36.0, 41.0, 33.0, 41.0, 50.0, 192.0, 1886.0, 81.0, 34.0, 43.0, 46.0, 28.0, 32.0, 40.0, 28.0, 19.0, 18.0, 20.0, 13.0, 19.0, 16.0, 13.0, 13.0, 12.0, 6.0, 4.0, 5.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.59375, -34.45654296875, -33.3193359375, -32.18212890625, -31.044921875, -29.90771484375, -28.7705078125, -27.63330078125, -26.49609375, -25.35888671875, -24.2216796875, -23.08447265625, -21.947265625, -20.81005859375, -19.6728515625, -18.53564453125, -17.3984375, -16.26123046875, -15.1240234375, -13.98681640625, -12.849609375, -11.71240234375, -10.5751953125, -9.43798828125, -8.30078125, -7.16357421875, -6.0263671875, -4.88916015625, -3.751953125, -2.61474609375, -1.4775390625, -0.34033203125, 0.796875, 1.93408203125, 3.0712890625, 4.20849609375, 5.345703125, 6.48291015625, 7.6201171875, 8.75732421875, 9.89453125, 11.03173828125, 12.1689453125, 13.30615234375, 14.443359375, 15.58056640625, 16.7177734375, 17.85498046875, 18.9921875, 20.12939453125, 21.2666015625, 22.40380859375, 23.541015625, 24.67822265625, 25.8154296875, 26.95263671875, 28.08984375, 29.22705078125, 30.3642578125, 31.50146484375, 32.638671875, 33.77587890625, 34.9130859375, 36.05029296875, 37.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 7.0, 5.0, 4.0, 14.0, 16.0, 14.0, 18.0, 23.0, 19.0, 30.0, 42.0, 55.0, 79.0, 102.0, 110.0, 140.0, 214.0, 316.0, 693.0, 3998.0, 3116559.0, 20711.0, 1087.0, 398.0, 243.0, 173.0, 125.0, 104.0, 89.0, 55.0, 53.0, 36.0, 37.0, 24.0, 20.0, 21.0, 12.0, 18.0, 10.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-78.25, -75.85546875, -73.4609375, -71.06640625, -68.671875, -66.27734375, -63.8828125, -61.48828125, -59.09375, -56.69921875, -54.3046875, -51.91015625, -49.515625, -47.12109375, -44.7265625, -42.33203125, -39.9375, -37.54296875, -35.1484375, -32.75390625, -30.359375, -27.96484375, -25.5703125, -23.17578125, -20.78125, -18.38671875, -15.9921875, -13.59765625, -11.203125, -8.80859375, -6.4140625, -4.01953125, -1.625, 0.76953125, 3.1640625, 5.55859375, 7.953125, 10.34765625, 12.7421875, 15.13671875, 17.53125, 19.92578125, 22.3203125, 24.71484375, 27.109375, 29.50390625, 31.8984375, 34.29296875, 36.6875, 39.08203125, 41.4765625, 43.87109375, 46.265625, 48.66015625, 51.0546875, 53.44921875, 55.84375, 58.23828125, 60.6328125, 63.02734375, 65.421875, 67.81640625, 70.2109375, 72.60546875, 75.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [7.0, 51.0, 376.0, 502.0, 83.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.273372650146484, -6.994553565979004, -3.7157340049743652, -0.43691444396972656, 2.841904640197754, 6.120723724365234, 9.399543762207031, 12.678361892700195, 15.957181930541992, 19.23600196838379, 22.514820098876953, 25.79364013671875, 29.072460174560547, 32.351280212402344, 35.630096435546875, 38.90891647338867, 42.18773651123047, 45.466556549072266, 48.74537658691406, 52.024192810058594, 55.30301284790039, 58.58183288574219, 61.860652923583984, 65.13947296142578, 68.41828918457031, 71.69710540771484, 74.9759292602539, 78.25474548339844, 81.5335693359375, 84.81238555908203, 88.09120178222656, 91.37002563476562, 94.64884185791016, 97.92765808105469, 101.20648193359375, 104.48529815673828, 107.76412200927734, 111.04293823242188, 114.32176208496094, 117.60057830810547, 120.87939453125, 124.15821075439453, 127.4370346069336, 130.71585083007812, 133.9946746826172, 137.27349853515625, 140.55230712890625, 143.8311309814453, 147.10995483398438, 150.38877868652344, 153.66758728027344, 156.9464111328125, 160.22523498535156, 163.50405883789062, 166.78286743164062, 170.0616912841797, 173.3404998779297, 176.61932373046875, 179.89813232421875, 183.1769561767578, 186.45578002929688, 189.73458862304688, 193.01341247558594, 196.292236328125, 199.57106018066406]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 6.0, 4.0, 11.0, 17.0, 15.0, 21.0, 15.0, 28.0, 23.0, 28.0, 33.0, 34.0, 43.0, 37.0, 31.0, 46.0, 42.0, 59.0, 45.0, 35.0, 39.0, 38.0, 40.0, 39.0, 48.0, 35.0, 27.0, 22.0, 19.0, 21.0, 16.0, 13.0, 11.0, 9.0, 7.0, 10.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-119.44609832763672, -115.95172119140625, -112.45734405517578, -108.96296691894531, -105.46858978271484, -101.97421264648438, -98.47984313964844, -94.98545837402344, -91.4910888671875, -87.99671173095703, -84.50233459472656, -81.0079574584961, -77.51358032226562, -74.01920318603516, -70.52482604980469, -67.03045654296875, -63.53607177734375, -60.04169464111328, -56.54731750488281, -53.052940368652344, -49.558563232421875, -46.064186096191406, -42.5698127746582, -39.075435638427734, -35.581058502197266, -32.0866813659668, -28.592304229736328, -25.097929000854492, -21.603551864624023, -18.109174728393555, -14.614799499511719, -11.12042236328125, -7.6260528564453125, -4.131676197052002, -0.6372995376586914, 2.857076644897461, 6.35145378112793, 9.845830917358398, 13.340206146240234, 16.834583282470703, 20.328960418701172, 23.82333755493164, 27.31771469116211, 30.812089920043945, 34.30646514892578, 37.80084228515625, 41.29521942138672, 44.78959655761719, 48.283973693847656, 51.778350830078125, 55.272727966308594, 58.76710510253906, 62.26148223876953, 65.755859375, 69.25022888183594, 72.74461364746094, 76.23898315429688, 79.73336029052734, 83.22773742675781, 86.72211456298828, 90.21649169921875, 93.71086883544922, 97.20524597167969, 100.69961547851562, 104.19400024414062]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 13.0, 7.0, 17.0, 24.0, 24.0, 33.0, 36.0, 35.0, 31.0, 35.0, 46.0, 43.0, 40.0, 47.0, 35.0, 53.0, 40.0, 48.0, 45.0, 48.0, 39.0, 28.0, 29.0, 31.0, 26.0, 21.0, 18.0, 19.0, 18.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.078125, -16.59130859375, -16.1044921875, -15.61767578125, -15.130859375, -14.64404296875, -14.1572265625, -13.67041015625, -13.18359375, -12.69677734375, -12.2099609375, -11.72314453125, -11.236328125, -10.74951171875, -10.2626953125, -9.77587890625, -9.2890625, -8.80224609375, -8.3154296875, -7.82861328125, -7.341796875, -6.85498046875, -6.3681640625, -5.88134765625, -5.39453125, -4.90771484375, -4.4208984375, -3.93408203125, -3.447265625, -2.96044921875, -2.4736328125, -1.98681640625, -1.5, -1.01318359375, -0.5263671875, -0.03955078125, 0.447265625, 0.93408203125, 1.4208984375, 1.90771484375, 2.39453125, 2.88134765625, 3.3681640625, 3.85498046875, 4.341796875, 4.82861328125, 5.3154296875, 5.80224609375, 6.2890625, 6.77587890625, 7.2626953125, 7.74951171875, 8.236328125, 8.72314453125, 9.2099609375, 9.69677734375, 10.18359375, 10.67041015625, 11.1572265625, 11.64404296875, 12.130859375, 12.61767578125, 13.1044921875, 13.59130859375, 14.078125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 10.0, 16.0, 29.0, 33.0, 37.0, 74.0, 101.0, 123.0, 165.0, 253.0, 356.0, 524.0, 781.0, 1157.0, 1786.0, 3200.0, 5471.0, 10970.0, 61006.0, 1049730.0, 2836047.0, 187401.0, 17036.0, 7198.0, 3879.0, 2288.0, 1437.0, 964.0, 620.0, 429.0, 330.0, 208.0, 159.0, 117.0, 93.0, 73.0, 46.0, 41.0, 28.0, 19.0, 11.0, 10.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0], "bins": [-38.78125, -37.710205078125, -36.63916015625, -35.568115234375, -34.4970703125, -33.426025390625, -32.35498046875, -31.283935546875, -30.212890625, -29.141845703125, -28.07080078125, -26.999755859375, -25.9287109375, -24.857666015625, -23.78662109375, -22.715576171875, -21.64453125, -20.573486328125, -19.50244140625, -18.431396484375, -17.3603515625, -16.289306640625, -15.21826171875, -14.147216796875, -13.076171875, -12.005126953125, -10.93408203125, -9.863037109375, -8.7919921875, -7.720947265625, -6.64990234375, -5.578857421875, -4.5078125, -3.436767578125, -2.36572265625, -1.294677734375, -0.2236328125, 0.847412109375, 1.91845703125, 2.989501953125, 4.060546875, 5.131591796875, 6.20263671875, 7.273681640625, 8.3447265625, 9.415771484375, 10.48681640625, 11.557861328125, 12.62890625, 13.699951171875, 14.77099609375, 15.842041015625, 16.9130859375, 17.984130859375, 19.05517578125, 20.126220703125, 21.197265625, 22.268310546875, 23.33935546875, 24.410400390625, 25.4814453125, 26.552490234375, 27.62353515625, 28.694580078125, 29.765625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 11.0, 7.0, 15.0, 15.0, 17.0, 25.0, 37.0, 62.0, 104.0, 183.0, 369.0, 599.0, 949.0, 660.0, 412.0, 234.0, 115.0, 62.0, 42.0, 26.0, 27.0, 16.0, 13.0, 11.0, 8.0, 7.0, 4.0, 3.0, 4.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.40625, -28.503662109375, -27.60107421875, -26.698486328125, -25.7958984375, -24.893310546875, -23.99072265625, -23.088134765625, -22.185546875, -21.282958984375, -20.38037109375, -19.477783203125, -18.5751953125, -17.672607421875, -16.77001953125, -15.867431640625, -14.96484375, -14.062255859375, -13.15966796875, -12.257080078125, -11.3544921875, -10.451904296875, -9.54931640625, -8.646728515625, -7.744140625, -6.841552734375, -5.93896484375, -5.036376953125, -4.1337890625, -3.231201171875, -2.32861328125, -1.426025390625, -0.5234375, 0.379150390625, 1.28173828125, 2.184326171875, 3.0869140625, 3.989501953125, 4.89208984375, 5.794677734375, 6.697265625, 7.599853515625, 8.50244140625, 9.405029296875, 10.3076171875, 11.210205078125, 12.11279296875, 13.015380859375, 13.91796875, 14.820556640625, 15.72314453125, 16.625732421875, 17.5283203125, 18.430908203125, 19.33349609375, 20.236083984375, 21.138671875, 22.041259765625, 22.94384765625, 23.846435546875, 24.7490234375, 25.651611328125, 26.55419921875, 27.456787109375, 28.359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 6.0, 6.0, 13.0, 18.0, 22.0, 28.0, 40.0, 48.0, 98.0, 198.0, 511.0, 1429.0, 5719.0, 35389.0, 3839211.0, 291125.0, 15584.0, 3169.0, 890.0, 361.0, 175.0, 71.0, 44.0, 33.0, 14.0, 21.0, 13.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.5, -102.07421875, -98.6484375, -95.22265625, -91.796875, -88.37109375, -84.9453125, -81.51953125, -78.09375, -74.66796875, -71.2421875, -67.81640625, -64.390625, -60.96484375, -57.5390625, -54.11328125, -50.6875, -47.26171875, -43.8359375, -40.41015625, -36.984375, -33.55859375, -30.1328125, -26.70703125, -23.28125, -19.85546875, -16.4296875, -13.00390625, -9.578125, -6.15234375, -2.7265625, 0.69921875, 4.125, 7.55078125, 10.9765625, 14.40234375, 17.828125, 21.25390625, 24.6796875, 28.10546875, 31.53125, 34.95703125, 38.3828125, 41.80859375, 45.234375, 48.66015625, 52.0859375, 55.51171875, 58.9375, 62.36328125, 65.7890625, 69.21484375, 72.640625, 76.06640625, 79.4921875, 82.91796875, 86.34375, 89.76953125, 93.1953125, 96.62109375, 100.046875, 103.47265625, 106.8984375, 110.32421875, 113.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 27.0, 50.0, 103.0, 242.0, 304.0, 159.0, 50.0, 25.0, 20.0, 6.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.51565551757812, -179.0924835205078, -171.6693115234375, -164.2461395263672, -156.82296752929688, -149.3997802734375, -141.9766082763672, -134.55343627929688, -127.13026428222656, -119.70709228515625, -112.28392028808594, -104.8607406616211, -97.43756866455078, -90.01439666748047, -82.59121704101562, -75.16804504394531, -67.744873046875, -60.32170104980469, -52.89852523803711, -45.47534942626953, -38.05217742919922, -30.629005432128906, -23.205829620361328, -15.78265380859375, -8.359481811523438, -0.9363079071044922, 6.486865997314453, 13.910039901733398, 21.333213806152344, 28.756385803222656, 36.179561614990234, 43.60273742675781, 51.025909423828125, 58.44908142089844, 65.87225341796875, 73.2954330444336, 80.7186050415039, 88.14177703857422, 95.56495666503906, 102.98812866210938, 110.41130065917969, 117.83447265625, 125.25764465332031, 132.68081665039062, 140.10400390625, 147.52716064453125, 154.95034790039062, 162.37351989746094, 169.79669189453125, 177.21986389160156, 184.64303588867188, 192.0662078857422, 199.4893798828125, 206.91256713867188, 214.3357391357422, 221.7589111328125, 229.1820831298828, 236.60525512695312, 244.02842712402344, 251.45159912109375, 258.8747863769531, 266.2979431152344, 273.72113037109375, 281.144287109375, 288.5674743652344]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 2.0, 3.0, 12.0, 8.0, 4.0, 13.0, 12.0, 17.0, 21.0, 18.0, 19.0, 27.0, 24.0, 22.0, 28.0, 36.0, 39.0, 41.0, 34.0, 43.0, 39.0, 31.0, 45.0, 50.0, 37.0, 29.0, 38.0, 32.0, 31.0, 32.0, 23.0, 27.0, 26.0, 16.0, 26.0, 21.0, 15.0, 9.0, 5.0, 12.0, 7.0, 8.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.77050018310547, -64.57345581054688, -62.37641906738281, -60.179378509521484, -57.982337951660156, -55.78529739379883, -53.5882568359375, -51.39121627807617, -49.194175720214844, -46.997135162353516, -44.80009460449219, -42.60305404663086, -40.40601348876953, -38.2089729309082, -36.011932373046875, -33.81489181518555, -31.61785125732422, -29.42081069946289, -27.223770141601562, -25.026729583740234, -22.829689025878906, -20.632648468017578, -18.43560791015625, -16.238567352294922, -14.041526794433594, -11.844486236572266, -9.647445678710938, -7.450405120849609, -5.253364562988281, -3.056324005126953, -0.859283447265625, 1.3377571105957031, 3.5348052978515625, 5.731845855712891, 7.928886413574219, 10.125926971435547, 12.322967529296875, 14.520008087158203, 16.71704864501953, 18.91408920288086, 21.111129760742188, 23.308170318603516, 25.505210876464844, 27.702251434326172, 29.8992919921875, 32.09633255004883, 34.293373107910156, 36.490413665771484, 38.68745422363281, 40.88449478149414, 43.08153533935547, 45.2785758972168, 47.475616455078125, 49.67265701293945, 51.86969757080078, 54.06673812866211, 56.26377868652344, 58.460819244384766, 60.657859802246094, 62.85490036010742, 65.05194091796875, 67.24897766113281, 69.4460220336914, 71.64306640625, 73.84010314941406]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 2.0, 13.0, 17.0, 16.0, 21.0, 21.0, 14.0, 30.0, 30.0, 36.0, 25.0, 42.0, 40.0, 39.0, 46.0, 41.0, 44.0, 33.0, 41.0, 47.0, 37.0, 35.0, 44.0, 37.0, 28.0, 29.0, 23.0, 26.0, 21.0, 14.0, 23.0, 16.0, 6.0, 12.0, 5.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-15.5078125, -15.05712890625, -14.6064453125, -14.15576171875, -13.705078125, -13.25439453125, -12.8037109375, -12.35302734375, -11.90234375, -11.45166015625, -11.0009765625, -10.55029296875, -10.099609375, -9.64892578125, -9.1982421875, -8.74755859375, -8.296875, -7.84619140625, -7.3955078125, -6.94482421875, -6.494140625, -6.04345703125, -5.5927734375, -5.14208984375, -4.69140625, -4.24072265625, -3.7900390625, -3.33935546875, -2.888671875, -2.43798828125, -1.9873046875, -1.53662109375, -1.0859375, -0.63525390625, -0.1845703125, 0.26611328125, 0.716796875, 1.16748046875, 1.6181640625, 2.06884765625, 2.51953125, 2.97021484375, 3.4208984375, 3.87158203125, 4.322265625, 4.77294921875, 5.2236328125, 5.67431640625, 6.125, 6.57568359375, 7.0263671875, 7.47705078125, 7.927734375, 8.37841796875, 8.8291015625, 9.27978515625, 9.73046875, 10.18115234375, 10.6318359375, 11.08251953125, 11.533203125, 11.98388671875, 12.4345703125, 12.88525390625, 13.3359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 21.0, 60.0, 67.0, 112.0, 179.0, 267.0, 424.0, 672.0, 1006.0, 1576.0, 2409.0, 4022.0, 6631.0, 10590.0, 17131.0, 28886.0, 48958.0, 87852.0, 160691.0, 245979.0, 187165.0, 102853.0, 56345.0, 32985.0, 19904.0, 12085.0, 7445.0, 4542.0, 2870.0, 1717.0, 1092.0, 694.0, 443.0, 259.0, 201.0, 126.0, 101.0, 52.0, 45.0, 16.0, 16.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.6201171875, -1.573333740234375, -1.52655029296875, -1.479766845703125, -1.4329833984375, -1.386199951171875, -1.33941650390625, -1.292633056640625, -1.245849609375, -1.199066162109375, -1.15228271484375, -1.105499267578125, -1.0587158203125, -1.011932373046875, -0.96514892578125, -0.918365478515625, -0.87158203125, -0.824798583984375, -0.77801513671875, -0.731231689453125, -0.6844482421875, -0.637664794921875, -0.59088134765625, -0.544097900390625, -0.497314453125, -0.450531005859375, -0.40374755859375, -0.356964111328125, -0.3101806640625, -0.263397216796875, -0.21661376953125, -0.169830322265625, -0.123046875, -0.076263427734375, -0.02947998046875, 0.017303466796875, 0.0640869140625, 0.110870361328125, 0.15765380859375, 0.204437255859375, 0.251220703125, 0.298004150390625, 0.34478759765625, 0.391571044921875, 0.4383544921875, 0.485137939453125, 0.53192138671875, 0.578704833984375, 0.62548828125, 0.672271728515625, 0.71905517578125, 0.765838623046875, 0.8126220703125, 0.859405517578125, 0.90618896484375, 0.952972412109375, 0.999755859375, 1.046539306640625, 1.09332275390625, 1.140106201171875, 1.1868896484375, 1.233673095703125, 1.28045654296875, 1.327239990234375, 1.3740234375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 6.0, 6.0, 10.0, 5.0, 8.0, 13.0, 17.0, 20.0, 18.0, 27.0, 19.0, 24.0, 26.0, 26.0, 35.0, 33.0, 27.0, 30.0, 54.0, 41.0, 45.0, 1061.0, 38.0, 35.0, 44.0, 44.0, 42.0, 37.0, 34.0, 25.0, 19.0, 21.0, 23.0, 18.0, 18.0, 14.0, 16.0, 9.0, 14.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.4609375, -9.17529296875, -8.8896484375, -8.60400390625, -8.318359375, -8.03271484375, -7.7470703125, -7.46142578125, -7.17578125, -6.89013671875, -6.6044921875, -6.31884765625, -6.033203125, -5.74755859375, -5.4619140625, -5.17626953125, -4.890625, -4.60498046875, -4.3193359375, -4.03369140625, -3.748046875, -3.46240234375, -3.1767578125, -2.89111328125, -2.60546875, -2.31982421875, -2.0341796875, -1.74853515625, -1.462890625, -1.17724609375, -0.8916015625, -0.60595703125, -0.3203125, -0.03466796875, 0.2509765625, 0.53662109375, 0.822265625, 1.10791015625, 1.3935546875, 1.67919921875, 1.96484375, 2.25048828125, 2.5361328125, 2.82177734375, 3.107421875, 3.39306640625, 3.6787109375, 3.96435546875, 4.25, 4.53564453125, 4.8212890625, 5.10693359375, 5.392578125, 5.67822265625, 5.9638671875, 6.24951171875, 6.53515625, 6.82080078125, 7.1064453125, 7.39208984375, 7.677734375, 7.96337890625, 8.2490234375, 8.53466796875, 8.8203125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 11.0, 10.0, 16.0, 35.0, 64.0, 71.0, 101.0, 141.0, 248.0, 395.0, 579.0, 884.0, 1398.0, 2110.0, 3416.0, 5117.0, 8038.0, 12141.0, 19383.0, 31642.0, 53554.0, 94284.0, 170547.0, 1291756.0, 169470.0, 93207.0, 53342.0, 31380.0, 19408.0, 11856.0, 7876.0, 5095.0, 3377.0, 2169.0, 1393.0, 942.0, 619.0, 378.0, 227.0, 141.0, 100.0, 79.0, 46.0, 30.0, 29.0, 12.0, 9.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.88232421875, -0.85430908203125, -0.8262939453125, -0.79827880859375, -0.770263671875, -0.74224853515625, -0.7142333984375, -0.68621826171875, -0.658203125, -0.63018798828125, -0.6021728515625, -0.57415771484375, -0.546142578125, -0.51812744140625, -0.4901123046875, -0.46209716796875, -0.43408203125, -0.40606689453125, -0.3780517578125, -0.35003662109375, -0.322021484375, -0.29400634765625, -0.2659912109375, -0.23797607421875, -0.2099609375, -0.18194580078125, -0.1539306640625, -0.12591552734375, -0.097900390625, -0.06988525390625, -0.0418701171875, -0.01385498046875, 0.01416015625, 0.04217529296875, 0.0701904296875, 0.09820556640625, 0.126220703125, 0.15423583984375, 0.1822509765625, 0.21026611328125, 0.23828125, 0.26629638671875, 0.2943115234375, 0.32232666015625, 0.350341796875, 0.37835693359375, 0.4063720703125, 0.43438720703125, 0.46240234375, 0.49041748046875, 0.5184326171875, 0.54644775390625, 0.574462890625, 0.60247802734375, 0.6304931640625, 0.65850830078125, 0.6865234375, 0.71453857421875, 0.7425537109375, 0.77056884765625, 0.798583984375, 0.82659912109375, 0.8546142578125, 0.88262939453125, 0.91064453125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 37.0, 36.0, 64.0, 99.0, 126.0, 148.0, 149.0, 112.0, 75.0, 58.0, 29.0, 21.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0391845703125, -0.03802061080932617, -0.036856651306152344, -0.035692691802978516, -0.03452873229980469, -0.03336477279663086, -0.03220081329345703, -0.031036853790283203, -0.029872894287109375, -0.028708934783935547, -0.02754497528076172, -0.02638101577758789, -0.025217056274414062, -0.024053096771240234, -0.022889137268066406, -0.021725177764892578, -0.02056121826171875, -0.019397258758544922, -0.018233299255371094, -0.017069339752197266, -0.015905380249023438, -0.01474142074584961, -0.013577461242675781, -0.012413501739501953, -0.011249542236328125, -0.010085582733154297, -0.008921623229980469, -0.007757663726806641, -0.0065937042236328125, -0.005429744720458984, -0.004265785217285156, -0.003101825714111328, -0.0019378662109375, -0.0007739067077636719, 0.00039005279541015625, 0.0015540122985839844, 0.0027179718017578125, 0.0038819313049316406, 0.005045890808105469, 0.006209850311279297, 0.007373809814453125, 0.008537769317626953, 0.009701728820800781, 0.01086568832397461, 0.012029647827148438, 0.013193607330322266, 0.014357566833496094, 0.015521526336669922, 0.01668548583984375, 0.017849445343017578, 0.019013404846191406, 0.020177364349365234, 0.021341323852539062, 0.02250528335571289, 0.02366924285888672, 0.024833202362060547, 0.025997161865234375, 0.027161121368408203, 0.02832508087158203, 0.02948904037475586, 0.030652999877929688, 0.031816959381103516, 0.032980918884277344, 0.03414487838745117, 0.035308837890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 8.0, 11.0, 16.0, 38.0, 80.0, 160.0, 359.0, 4417.0, 1037842.0, 4938.0, 356.0, 151.0, 70.0, 46.0, 10.0, 16.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.7405319213867188, -0.7154388427734375, -0.6903457641601562, -0.665252685546875, -0.6401596069335938, -0.6150665283203125, -0.5899734497070312, -0.56488037109375, -0.5397872924804688, -0.5146942138671875, -0.48960113525390625, -0.464508056640625, -0.43941497802734375, -0.4143218994140625, -0.38922882080078125, -0.3641357421875, -0.33904266357421875, -0.3139495849609375, -0.28885650634765625, -0.263763427734375, -0.23867034912109375, -0.2135772705078125, -0.18848419189453125, -0.16339111328125, -0.13829803466796875, -0.1132049560546875, -0.08811187744140625, -0.063018798828125, -0.03792572021484375, -0.0128326416015625, 0.01226043701171875, 0.037353515625, 0.06244659423828125, 0.0875396728515625, 0.11263275146484375, 0.137725830078125, 0.16281890869140625, 0.1879119873046875, 0.21300506591796875, 0.23809814453125, 0.26319122314453125, 0.2882843017578125, 0.31337738037109375, 0.338470458984375, 0.36356353759765625, 0.3886566162109375, 0.41374969482421875, 0.4388427734375, 0.46393585205078125, 0.4890289306640625, 0.5141220092773438, 0.539215087890625, 0.5643081665039062, 0.5894012451171875, 0.6144943237304688, 0.63958740234375, 0.6646804809570312, 0.6897735595703125, 0.7148666381835938, 0.739959716796875, 0.7650527954101562, 0.7901458740234375, 0.8152389526367188, 0.84033203125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 35.0, 146.0, 600.0, 165.0, 39.0, 17.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025875117629766464, -0.02000894397497177, -0.014142771251499653, -0.008276598528027534, -0.0024104248732328415, 0.0034557487815618515, 0.009321920573711395, 0.015188094228506088, 0.02105426788330078, 0.026920441538095474, 0.03278661519289017, 0.03865278512239456, 0.04451896250247955, 0.05038513243198395, 0.05625130608677864, 0.062117479741573334, 0.06798365712165833, 0.07384982705116272, 0.07971600443124771, 0.0855821743607521, 0.0914483517408371, 0.09731452167034149, 0.10318069159984589, 0.10904686897993088, 0.11491303890943527, 0.12077920883893967, 0.12664538621902466, 0.13251155614852905, 0.13837772607803345, 0.14424391090869904, 0.15011008083820343, 0.15597625076770782, 0.16184242069721222, 0.1677085906267166, 0.173574760556221, 0.1794409453868866, 0.185307115316391, 0.19117328524589539, 0.19703945517539978, 0.20290562510490417, 0.20877180993556976, 0.21463797986507416, 0.22050414979457855, 0.22637033462524414, 0.23223650455474854, 0.23810267448425293, 0.24396884441375732, 0.24983501434326172, 0.2557011842727661, 0.2615673542022705, 0.2674335241317749, 0.2732996940612793, 0.2791658639907837, 0.2850320637226105, 0.29089823365211487, 0.29676440358161926, 0.30263057351112366, 0.30849674344062805, 0.31436291337013245, 0.32022908329963684, 0.32609525322914124, 0.331961452960968, 0.3378276228904724, 0.3436937928199768, 0.3495599627494812]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 9.0, 8.0, 11.0, 14.0, 11.0, 13.0, 13.0, 14.0, 21.0, 15.0, 23.0, 24.0, 26.0, 28.0, 26.0, 32.0, 30.0, 31.0, 36.0, 29.0, 34.0, 31.0, 41.0, 48.0, 31.0, 42.0, 43.0, 26.0, 31.0, 34.0, 32.0, 29.0, 22.0, 21.0, 19.0, 15.0, 18.0, 16.0, 14.0, 6.0, 5.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.030151307582855225, -0.02926386147737503, -0.028376417234539986, -0.02748897299170494, -0.026601526886224747, -0.025714080780744553, -0.024826636537909508, -0.023939192295074463, -0.02305174618959427, -0.022164300084114075, -0.02127685584127903, -0.020389411598443985, -0.01950196549296379, -0.018614519387483597, -0.017727075144648552, -0.016839630901813507, -0.015952184796333313, -0.015064739622175694, -0.014177294448018074, -0.013289849273860455, -0.012402404099702835, -0.011514958925545216, -0.010627513751387596, -0.009740068577229977, -0.008852623403072357, -0.007965178228914738, -0.007077733054757118, -0.006190287880599499, -0.005302842706441879, -0.00441539753228426, -0.0035279523581266403, -0.002640507183969021, -0.0017530620098114014, -0.0008656168356537819, 2.1828338503837585e-05, 0.0009092735126614571, 0.0017967186868190765, 0.002684163860976696, 0.0035716090351343155, 0.004459054209291935, 0.0053464993834495544, 0.006233944557607174, 0.007121389731764793, 0.008008834905922413, 0.008896280080080032, 0.009783725254237652, 0.010671170428395271, 0.01155861560255289, 0.01244606077671051, 0.01333350595086813, 0.01422095112502575, 0.015108396299183369, 0.015995841473340988, 0.016883287578821182, 0.017770731821656227, 0.018658176064491272, 0.019545622169971466, 0.02043306827545166, 0.021320512518286705, 0.02220795676112175, 0.023095402866601944, 0.023982848972082138, 0.024870293214917183, 0.025757737457752228, 0.026645183563232422]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 2.0, 13.0, 17.0, 16.0, 21.0, 21.0, 14.0, 30.0, 30.0, 36.0, 25.0, 42.0, 40.0, 39.0, 46.0, 41.0, 44.0, 33.0, 41.0, 47.0, 37.0, 35.0, 44.0, 37.0, 28.0, 29.0, 24.0, 25.0, 21.0, 14.0, 23.0, 16.0, 6.0, 12.0, 5.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-15.5078125, -15.05712890625, -14.6064453125, -14.15576171875, -13.705078125, -13.25439453125, -12.8037109375, -12.35302734375, -11.90234375, -11.45166015625, -11.0009765625, -10.55029296875, -10.099609375, -9.64892578125, -9.1982421875, -8.74755859375, -8.296875, -7.84619140625, -7.3955078125, -6.94482421875, -6.494140625, -6.04345703125, -5.5927734375, -5.14208984375, -4.69140625, -4.24072265625, -3.7900390625, -3.33935546875, -2.888671875, -2.43798828125, -1.9873046875, -1.53662109375, -1.0859375, -0.63525390625, -0.1845703125, 0.26611328125, 0.716796875, 1.16748046875, 1.6181640625, 2.06884765625, 2.51953125, 2.97021484375, 3.4208984375, 3.87158203125, 4.322265625, 4.77294921875, 5.2236328125, 5.67431640625, 6.125, 6.57568359375, 7.0263671875, 7.47705078125, 7.927734375, 8.37841796875, 8.8291015625, 9.27978515625, 9.73046875, 10.18115234375, 10.6318359375, 11.08251953125, 11.533203125, 11.98388671875, 12.4345703125, 12.88525390625, 13.3359375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 9.0, 10.0, 15.0, 21.0, 30.0, 38.0, 52.0, 107.0, 120.0, 186.0, 253.0, 380.0, 657.0, 1056.0, 1894.0, 3259.0, 6343.0, 13059.0, 29137.0, 70294.0, 188489.0, 418975.0, 187956.0, 69596.0, 29076.0, 13193.0, 6322.0, 3240.0, 1843.0, 1067.0, 617.0, 395.0, 275.0, 164.0, 118.0, 92.0, 57.0, 40.0, 35.0, 23.0, 16.0, 13.0, 8.0, 7.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0], "bins": [-6.91796875, -6.72308349609375, -6.5281982421875, -6.33331298828125, -6.138427734375, -5.94354248046875, -5.7486572265625, -5.55377197265625, -5.35888671875, -5.16400146484375, -4.9691162109375, -4.77423095703125, -4.579345703125, -4.38446044921875, -4.1895751953125, -3.99468994140625, -3.7998046875, -3.60491943359375, -3.4100341796875, -3.21514892578125, -3.020263671875, -2.82537841796875, -2.6304931640625, -2.43560791015625, -2.24072265625, -2.04583740234375, -1.8509521484375, -1.65606689453125, -1.461181640625, -1.26629638671875, -1.0714111328125, -0.87652587890625, -0.681640625, -0.48675537109375, -0.2918701171875, -0.09698486328125, 0.097900390625, 0.29278564453125, 0.4876708984375, 0.68255615234375, 0.87744140625, 1.07232666015625, 1.2672119140625, 1.46209716796875, 1.656982421875, 1.85186767578125, 2.0467529296875, 2.24163818359375, 2.4365234375, 2.63140869140625, 2.8262939453125, 3.02117919921875, 3.216064453125, 3.41094970703125, 3.6058349609375, 3.80072021484375, 3.99560546875, 4.19049072265625, 4.3853759765625, 4.58026123046875, 4.775146484375, 4.97003173828125, 5.1649169921875, 5.35980224609375, 5.5546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 12.0, 19.0, 15.0, 27.0, 32.0, 30.0, 34.0, 45.0, 39.0, 38.0, 42.0, 60.0, 105.0, 1847.0, 188.0, 73.0, 58.0, 38.0, 43.0, 42.0, 39.0, 24.0, 29.0, 19.0, 23.0, 19.0, 11.0, 14.0, 8.0, 13.0, 3.0, 7.0, 7.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.625, -48.2705078125, -46.916015625, -45.5615234375, -44.20703125, -42.8525390625, -41.498046875, -40.1435546875, -38.7890625, -37.4345703125, -36.080078125, -34.7255859375, -33.37109375, -32.0166015625, -30.662109375, -29.3076171875, -27.953125, -26.5986328125, -25.244140625, -23.8896484375, -22.53515625, -21.1806640625, -19.826171875, -18.4716796875, -17.1171875, -15.7626953125, -14.408203125, -13.0537109375, -11.69921875, -10.3447265625, -8.990234375, -7.6357421875, -6.28125, -4.9267578125, -3.572265625, -2.2177734375, -0.86328125, 0.4912109375, 1.845703125, 3.2001953125, 4.5546875, 5.9091796875, 7.263671875, 8.6181640625, 9.97265625, 11.3271484375, 12.681640625, 14.0361328125, 15.390625, 16.7451171875, 18.099609375, 19.4541015625, 20.80859375, 22.1630859375, 23.517578125, 24.8720703125, 26.2265625, 27.5810546875, 28.935546875, 30.2900390625, 31.64453125, 32.9990234375, 34.353515625, 35.7080078125, 37.0625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 4.0, 8.0, 13.0, 13.0, 21.0, 27.0, 30.0, 40.0, 57.0, 68.0, 89.0, 121.0, 158.0, 252.0, 421.0, 1104.0, 18260.0, 3117897.0, 5152.0, 782.0, 354.0, 218.0, 152.0, 114.0, 85.0, 57.0, 43.0, 44.0, 19.0, 21.0, 16.0, 12.0, 8.0, 6.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-87.9375, -84.7236328125, -81.509765625, -78.2958984375, -75.08203125, -71.8681640625, -68.654296875, -65.4404296875, -62.2265625, -59.0126953125, -55.798828125, -52.5849609375, -49.37109375, -46.1572265625, -42.943359375, -39.7294921875, -36.515625, -33.3017578125, -30.087890625, -26.8740234375, -23.66015625, -20.4462890625, -17.232421875, -14.0185546875, -10.8046875, -7.5908203125, -4.376953125, -1.1630859375, 2.05078125, 5.2646484375, 8.478515625, 11.6923828125, 14.90625, 18.1201171875, 21.333984375, 24.5478515625, 27.76171875, 30.9755859375, 34.189453125, 37.4033203125, 40.6171875, 43.8310546875, 47.044921875, 50.2587890625, 53.47265625, 56.6865234375, 59.900390625, 63.1142578125, 66.328125, 69.5419921875, 72.755859375, 75.9697265625, 79.18359375, 82.3974609375, 85.611328125, 88.8251953125, 92.0390625, 95.2529296875, 98.466796875, 101.6806640625, 104.89453125, 108.1083984375, 111.322265625, 114.5361328125, 117.75]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 7.0, 132.0, 604.0, 255.0, 15.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84003829956055, -27.916202545166016, -22.99236488342285, -18.068527221679688, -13.144691467285156, -8.220855712890625, -3.297018051147461, 1.6268196105957031, 6.550655364990234, 11.474492073059082, 16.39832878112793, 21.322166442871094, 26.246002197265625, 31.169837951660156, 36.09367370605469, 41.017513275146484, 45.941349029541016, 50.86518478393555, 55.789024353027344, 60.712860107421875, 65.6366958618164, 70.56053161621094, 75.48436737060547, 80.408203125, 85.33204650878906, 90.2558822631836, 95.17971801757812, 100.10355377197266, 105.02738952636719, 109.95123291015625, 114.87506866455078, 119.79890441894531, 124.72274780273438, 129.64659118652344, 134.57041931152344, 139.4942626953125, 144.4180908203125, 149.34193420410156, 154.26576232910156, 159.18960571289062, 164.11343383789062, 169.0372772216797, 173.9611053466797, 178.88494873046875, 183.80877685546875, 188.7326202392578, 193.6564483642578, 198.58029174804688, 203.50413513183594, 208.427978515625, 213.351806640625, 218.27565002441406, 223.19947814941406, 228.12332153320312, 233.04714965820312, 237.9709930419922, 242.89483642578125, 247.8186798095703, 252.7425079345703, 257.6663513183594, 262.5901794433594, 267.5140075683594, 272.4378662109375, 277.3616943359375, 282.2855224609375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 2.0, 6.0, 12.0, 5.0, 12.0, 14.0, 25.0, 21.0, 21.0, 26.0, 30.0, 21.0, 37.0, 32.0, 30.0, 28.0, 42.0, 36.0, 42.0, 42.0, 42.0, 56.0, 40.0, 32.0, 47.0, 28.0, 32.0, 32.0, 33.0, 24.0, 20.0, 22.0, 17.0, 13.0, 10.0, 18.0, 10.0, 9.0, 6.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.08296203613281, -110.76636505126953, -107.44976043701172, -104.13316345214844, -100.81655883789062, -97.49996185302734, -94.18336486816406, -90.86676025390625, -87.55016326904297, -84.23356628417969, -80.91696166992188, -77.6003646850586, -74.28376770019531, -70.9671630859375, -67.65056610107422, -64.33396911621094, -61.017364501953125, -57.70076370239258, -54.38416290283203, -51.06756591796875, -47.7509651184082, -44.434364318847656, -41.117767333984375, -37.80116653442383, -34.48456573486328, -31.167964935302734, -27.85136604309082, -24.534767150878906, -21.21816635131836, -17.901565551757812, -14.584966659545898, -11.268367767333984, -7.9517669677734375, -4.635167121887207, -1.3185672760009766, 1.998032569885254, 5.314632415771484, 8.631233215332031, 11.947832107543945, 15.26443099975586, 18.581031799316406, 21.897632598876953, 25.214231491088867, 28.53083038330078, 31.847431182861328, 35.164031982421875, 38.480628967285156, 41.7972297668457, 45.11383056640625, 48.4304313659668, 51.747032165527344, 55.063629150390625, 58.38022994995117, 61.69683074951172, 65.013427734375, 68.33003234863281, 71.6466293334961, 74.96322631835938, 78.27983093261719, 81.59642791748047, 84.91302490234375, 88.22962951660156, 91.54622650146484, 94.86282348632812, 98.17942810058594]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 12.0, 25.0, 17.0, 15.0, 34.0, 25.0, 34.0, 25.0, 39.0, 45.0, 45.0, 37.0, 46.0, 43.0, 35.0, 43.0, 33.0, 36.0, 41.0, 41.0, 39.0, 33.0, 30.0, 30.0, 17.0, 26.0, 12.0, 19.0, 18.0, 6.0, 15.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0], "bins": [-15.6796875, -15.227783203125, -14.77587890625, -14.323974609375, -13.8720703125, -13.420166015625, -12.96826171875, -12.516357421875, -12.064453125, -11.612548828125, -11.16064453125, -10.708740234375, -10.2568359375, -9.804931640625, -9.35302734375, -8.901123046875, -8.44921875, -7.997314453125, -7.54541015625, -7.093505859375, -6.6416015625, -6.189697265625, -5.73779296875, -5.285888671875, -4.833984375, -4.382080078125, -3.93017578125, -3.478271484375, -3.0263671875, -2.574462890625, -2.12255859375, -1.670654296875, -1.21875, -0.766845703125, -0.31494140625, 0.136962890625, 0.5888671875, 1.040771484375, 1.49267578125, 1.944580078125, 2.396484375, 2.848388671875, 3.30029296875, 3.752197265625, 4.2041015625, 4.656005859375, 5.10791015625, 5.559814453125, 6.01171875, 6.463623046875, 6.91552734375, 7.367431640625, 7.8193359375, 8.271240234375, 8.72314453125, 9.175048828125, 9.626953125, 10.078857421875, 10.53076171875, 10.982666015625, 11.4345703125, 11.886474609375, 12.33837890625, 12.790283203125, 13.2421875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 9.0, 6.0, 11.0, 15.0, 23.0, 37.0, 47.0, 75.0, 84.0, 122.0, 193.0, 268.0, 400.0, 595.0, 911.0, 1514.0, 3256.0, 8152.0, 54044.0, 2263617.0, 1811089.0, 34622.0, 7438.0, 3292.0, 1586.0, 925.0, 570.0, 379.0, 270.0, 185.0, 142.0, 101.0, 81.0, 63.0, 24.0, 39.0, 30.0, 21.0, 14.0, 9.0, 7.0, 4.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0], "bins": [-50.65625, -49.20751953125, -47.7587890625, -46.31005859375, -44.861328125, -43.41259765625, -41.9638671875, -40.51513671875, -39.06640625, -37.61767578125, -36.1689453125, -34.72021484375, -33.271484375, -31.82275390625, -30.3740234375, -28.92529296875, -27.4765625, -26.02783203125, -24.5791015625, -23.13037109375, -21.681640625, -20.23291015625, -18.7841796875, -17.33544921875, -15.88671875, -14.43798828125, -12.9892578125, -11.54052734375, -10.091796875, -8.64306640625, -7.1943359375, -5.74560546875, -4.296875, -2.84814453125, -1.3994140625, 0.04931640625, 1.498046875, 2.94677734375, 4.3955078125, 5.84423828125, 7.29296875, 8.74169921875, 10.1904296875, 11.63916015625, 13.087890625, 14.53662109375, 15.9853515625, 17.43408203125, 18.8828125, 20.33154296875, 21.7802734375, 23.22900390625, 24.677734375, 26.12646484375, 27.5751953125, 29.02392578125, 30.47265625, 31.92138671875, 33.3701171875, 34.81884765625, 36.267578125, 37.71630859375, 39.1650390625, 40.61376953125, 42.0625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 4.0, 10.0, 6.0, 15.0, 17.0, 18.0, 19.0, 43.0, 61.0, 117.0, 242.0, 481.0, 880.0, 983.0, 579.0, 239.0, 133.0, 63.0, 38.0, 26.0, 15.0, 19.0, 14.0, 12.0, 7.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.8125, -37.79296875, -36.7734375, -35.75390625, -34.734375, -33.71484375, -32.6953125, -31.67578125, -30.65625, -29.63671875, -28.6171875, -27.59765625, -26.578125, -25.55859375, -24.5390625, -23.51953125, -22.5, -21.48046875, -20.4609375, -19.44140625, -18.421875, -17.40234375, -16.3828125, -15.36328125, -14.34375, -13.32421875, -12.3046875, -11.28515625, -10.265625, -9.24609375, -8.2265625, -7.20703125, -6.1875, -5.16796875, -4.1484375, -3.12890625, -2.109375, -1.08984375, -0.0703125, 0.94921875, 1.96875, 2.98828125, 4.0078125, 5.02734375, 6.046875, 7.06640625, 8.0859375, 9.10546875, 10.125, 11.14453125, 12.1640625, 13.18359375, 14.203125, 15.22265625, 16.2421875, 17.26171875, 18.28125, 19.30078125, 20.3203125, 21.33984375, 22.359375, 23.37890625, 24.3984375, 25.41796875, 26.4375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 12.0, 25.0, 21.0, 33.0, 64.0, 86.0, 198.0, 514.0, 1657.0, 8029.0, 83561.0, 4046108.0, 46147.0, 5669.0, 1288.0, 417.0, 179.0, 78.0, 52.0, 38.0, 26.0, 10.0, 10.0, 9.0, 8.0, 11.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.6875, -99.7607421875, -95.833984375, -91.9072265625, -87.98046875, -84.0537109375, -80.126953125, -76.2001953125, -72.2734375, -68.3466796875, -64.419921875, -60.4931640625, -56.56640625, -52.6396484375, -48.712890625, -44.7861328125, -40.859375, -36.9326171875, -33.005859375, -29.0791015625, -25.15234375, -21.2255859375, -17.298828125, -13.3720703125, -9.4453125, -5.5185546875, -1.591796875, 2.3349609375, 6.26171875, 10.1884765625, 14.115234375, 18.0419921875, 21.96875, 25.8955078125, 29.822265625, 33.7490234375, 37.67578125, 41.6025390625, 45.529296875, 49.4560546875, 53.3828125, 57.3095703125, 61.236328125, 65.1630859375, 69.08984375, 73.0166015625, 76.943359375, 80.8701171875, 84.796875, 88.7236328125, 92.650390625, 96.5771484375, 100.50390625, 104.4306640625, 108.357421875, 112.2841796875, 116.2109375, 120.1376953125, 124.064453125, 127.9912109375, 131.91796875, 135.8447265625, 139.771484375, 143.6982421875, 147.625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 5.0, 16.0, 27.0, 46.0, 84.0, 190.0, 259.0, 182.0, 91.0, 43.0, 25.0, 7.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.24630737304688, -155.5892333984375, -149.93214416503906, -144.2750701904297, -138.6179962158203, -132.96090698242188, -127.3038330078125, -121.64675903320312, -115.98967742919922, -110.33259582519531, -104.67552185058594, -99.01844024658203, -93.36135864257812, -87.70428466796875, -82.04720306396484, -76.39012145996094, -70.73304748535156, -65.07596588134766, -59.41889190673828, -53.761810302734375, -48.104732513427734, -42.447654724121094, -36.79057312011719, -31.133495330810547, -25.476417541503906, -19.819339752197266, -14.162260055541992, -8.505180358886719, -2.848102569580078, 2.8089752197265625, 8.466056823730469, 14.12313461303711, 19.780227661132812, 25.437305450439453, 31.094385147094727, 36.75146484375, 42.40854263305664, 48.06562042236328, 53.72270202636719, 59.37977981567383, 65.03685760498047, 70.69393920898438, 76.35101318359375, 82.00809478759766, 87.66517639160156, 93.32225036621094, 98.97933197021484, 104.63641357421875, 110.29348754882812, 115.95056915283203, 121.6076431274414, 127.26472473144531, 132.9217987060547, 138.57888793945312, 144.2359619140625, 149.89303588867188, 155.55010986328125, 161.20718383789062, 166.86427307128906, 172.52134704589844, 178.1784210205078, 183.83551025390625, 189.49258422851562, 195.149658203125, 200.80674743652344]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 0.0, 4.0, 8.0, 13.0, 8.0, 21.0, 10.0, 13.0, 10.0, 16.0, 22.0, 19.0, 35.0, 25.0, 25.0, 39.0, 30.0, 28.0, 41.0, 39.0, 40.0, 31.0, 40.0, 40.0, 24.0, 47.0, 40.0, 32.0, 36.0, 25.0, 29.0, 27.0, 15.0, 25.0, 22.0, 18.0, 9.0, 16.0, 10.0, 9.0, 10.0, 7.0, 9.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-61.555450439453125, -59.51859664916992, -57.481746673583984, -55.44489288330078, -53.408042907714844, -51.37118911743164, -49.33433532714844, -47.2974853515625, -45.2606315612793, -43.223777770996094, -41.186927795410156, -39.15007400512695, -37.11322021484375, -35.07637023925781, -33.03951644897461, -31.00266456604004, -28.96581268310547, -26.9289608001709, -24.892108917236328, -22.855255126953125, -20.818403244018555, -18.781551361083984, -16.74469757080078, -14.707845687866211, -12.67099380493164, -10.63414192199707, -8.597289085388184, -6.560436725616455, -4.523584365844727, -2.4867324829101562, -0.44987964630126953, 1.5869731903076172, 3.6238250732421875, 5.660677433013916, 7.6975297927856445, 9.734382629394531, 11.771234512329102, 13.808086395263672, 15.844939231872559, 17.881792068481445, 19.918643951416016, 21.955495834350586, 23.992347717285156, 26.02920150756836, 28.06605339050293, 30.1029052734375, 32.1397590637207, 34.176612854003906, 36.213462829589844, 38.25031661987305, 40.287166595458984, 42.32402038574219, 44.360870361328125, 46.39772415161133, 48.43457794189453, 50.47142791748047, 52.50828170776367, 54.545135498046875, 56.58198547363281, 58.618839263916016, 60.65569305419922, 62.692543029785156, 64.7293930053711, 66.76625061035156, 68.8031005859375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 21.0, 30.0, 16.0, 27.0, 28.0, 37.0, 24.0, 16.0, 45.0, 46.0, 34.0, 51.0, 35.0, 48.0, 38.0, 33.0, 40.0, 34.0, 27.0, 34.0, 27.0, 40.0, 28.0, 28.0, 18.0, 24.0, 19.0, 13.0, 16.0, 14.0, 8.0, 11.0, 7.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3431396484375, -12.912841796875, -12.4825439453125, -12.05224609375, -11.6219482421875, -11.191650390625, -10.7613525390625, -10.3310546875, -9.9007568359375, -9.470458984375, -9.0401611328125, -8.60986328125, -8.1795654296875, -7.749267578125, -7.3189697265625, -6.888671875, -6.4583740234375, -6.028076171875, -5.5977783203125, -5.16748046875, -4.7371826171875, -4.306884765625, -3.8765869140625, -3.4462890625, -3.0159912109375, -2.585693359375, -2.1553955078125, -1.72509765625, -1.2947998046875, -0.864501953125, -0.4342041015625, -0.00390625, 0.4263916015625, 0.856689453125, 1.2869873046875, 1.71728515625, 2.1475830078125, 2.577880859375, 3.0081787109375, 3.4384765625, 3.8687744140625, 4.299072265625, 4.7293701171875, 5.15966796875, 5.5899658203125, 6.020263671875, 6.4505615234375, 6.880859375, 7.3111572265625, 7.741455078125, 8.1717529296875, 8.60205078125, 9.0323486328125, 9.462646484375, 9.8929443359375, 10.3232421875, 10.7535400390625, 11.183837890625, 11.6141357421875, 12.04443359375, 12.4747314453125, 12.905029296875, 13.3353271484375, 13.765625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 11.0, 17.0, 42.0, 49.0, 78.0, 117.0, 138.0, 246.0, 358.0, 631.0, 940.0, 1439.0, 2209.0, 3396.0, 5431.0, 8680.0, 13729.0, 21931.0, 35402.0, 58075.0, 100568.0, 177974.0, 237592.0, 155526.0, 87870.0, 51425.0, 31761.0, 19473.0, 12170.0, 7757.0, 5011.0, 3120.0, 1905.0, 1218.0, 762.0, 507.0, 340.0, 219.0, 147.0, 95.0, 66.0, 44.0, 22.0, 20.0, 6.0, 6.0, 9.0, 6.0, 8.0, 1.0, 0.0, 2.0], "bins": [-1.53125, -1.4867095947265625, -1.442169189453125, -1.3976287841796875, -1.35308837890625, -1.3085479736328125, -1.264007568359375, -1.2194671630859375, -1.1749267578125, -1.1303863525390625, -1.085845947265625, -1.0413055419921875, -0.99676513671875, -0.9522247314453125, -0.907684326171875, -0.8631439208984375, -0.818603515625, -0.7740631103515625, -0.729522705078125, -0.6849822998046875, -0.64044189453125, -0.5959014892578125, -0.551361083984375, -0.5068206787109375, -0.4622802734375, -0.4177398681640625, -0.373199462890625, -0.3286590576171875, -0.28411865234375, -0.2395782470703125, -0.195037841796875, -0.1504974365234375, -0.10595703125, -0.0614166259765625, -0.016876220703125, 0.0276641845703125, 0.07220458984375, 0.1167449951171875, 0.161285400390625, 0.2058258056640625, 0.2503662109375, 0.2949066162109375, 0.339447021484375, 0.3839874267578125, 0.42852783203125, 0.4730682373046875, 0.517608642578125, 0.5621490478515625, 0.606689453125, 0.6512298583984375, 0.695770263671875, 0.7403106689453125, 0.78485107421875, 0.8293914794921875, 0.873931884765625, 0.9184722900390625, 0.9630126953125, 1.0075531005859375, 1.052093505859375, 1.0966339111328125, 1.14117431640625, 1.1857147216796875, 1.230255126953125, 1.2747955322265625, 1.3193359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 24.0, 18.0, 11.0, 14.0, 19.0, 29.0, 20.0, 31.0, 29.0, 29.0, 29.0, 39.0, 39.0, 45.0, 38.0, 38.0, 1062.0, 37.0, 50.0, 43.0, 32.0, 36.0, 38.0, 30.0, 36.0, 25.0, 27.0, 14.0, 14.0, 25.0, 9.0, 17.0, 13.0, 8.0, 10.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.0994873046875, -7.823974609375, -7.5484619140625, -7.27294921875, -6.9974365234375, -6.721923828125, -6.4464111328125, -6.1708984375, -5.8953857421875, -5.619873046875, -5.3443603515625, -5.06884765625, -4.7933349609375, -4.517822265625, -4.2423095703125, -3.966796875, -3.6912841796875, -3.415771484375, -3.1402587890625, -2.86474609375, -2.5892333984375, -2.313720703125, -2.0382080078125, -1.7626953125, -1.4871826171875, -1.211669921875, -0.9361572265625, -0.66064453125, -0.3851318359375, -0.109619140625, 0.1658935546875, 0.44140625, 0.7169189453125, 0.992431640625, 1.2679443359375, 1.54345703125, 1.8189697265625, 2.094482421875, 2.3699951171875, 2.6455078125, 2.9210205078125, 3.196533203125, 3.4720458984375, 3.74755859375, 4.0230712890625, 4.298583984375, 4.5740966796875, 4.849609375, 5.1251220703125, 5.400634765625, 5.6761474609375, 5.95166015625, 6.2271728515625, 6.502685546875, 6.7781982421875, 7.0537109375, 7.3292236328125, 7.604736328125, 7.8802490234375, 8.15576171875, 8.4312744140625, 8.706787109375, 8.9822998046875, 9.2578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 13.0, 20.0, 28.0, 32.0, 93.0, 116.0, 167.0, 261.0, 401.0, 562.0, 888.0, 1375.0, 2069.0, 3192.0, 4884.0, 7660.0, 12195.0, 19286.0, 31544.0, 54478.0, 95248.0, 172042.0, 1285713.0, 170968.0, 95191.0, 53792.0, 31456.0, 19506.0, 11935.0, 7802.0, 4970.0, 3230.0, 2021.0, 1421.0, 867.0, 560.0, 355.0, 258.0, 202.0, 107.0, 75.0, 54.0, 21.0, 8.0, 16.0, 20.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.90087890625, -0.8739852905273438, -0.8470916748046875, -0.8201980590820312, -0.793304443359375, -0.7664108276367188, -0.7395172119140625, -0.7126235961914062, -0.68572998046875, -0.6588363647460938, -0.6319427490234375, -0.6050491333007812, -0.578155517578125, -0.5512619018554688, -0.5243682861328125, -0.49747467041015625, -0.4705810546875, -0.44368743896484375, -0.4167938232421875, -0.38990020751953125, -0.363006591796875, -0.33611297607421875, -0.3092193603515625, -0.28232574462890625, -0.25543212890625, -0.22853851318359375, -0.2016448974609375, -0.17475128173828125, -0.147857666015625, -0.12096405029296875, -0.0940704345703125, -0.06717681884765625, -0.040283203125, -0.01338958740234375, 0.0135040283203125, 0.04039764404296875, 0.067291259765625, 0.09418487548828125, 0.1210784912109375, 0.14797210693359375, 0.17486572265625, 0.20175933837890625, 0.2286529541015625, 0.25554656982421875, 0.282440185546875, 0.30933380126953125, 0.3362274169921875, 0.36312103271484375, 0.3900146484375, 0.41690826416015625, 0.4438018798828125, 0.47069549560546875, 0.497589111328125, 0.5244827270507812, 0.5513763427734375, 0.5782699584960938, 0.60516357421875, 0.6320571899414062, 0.6589508056640625, 0.6858444213867188, 0.712738037109375, 0.7396316528320312, 0.7665252685546875, 0.7934188842773438, 0.8203125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 6.0, 4.0, 13.0, 4.0, 14.0, 15.0, 24.0, 20.0, 24.0, 24.0, 30.0, 30.0, 30.0, 52.0, 68.0, 77.0, 92.0, 78.0, 60.0, 45.0, 36.0, 32.0, 39.0, 25.0, 25.0, 17.0, 18.0, 13.0, 10.0, 9.0, 10.0, 6.0, 5.0, 2.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0145721435546875, -0.01407313346862793, -0.01357412338256836, -0.013075113296508789, -0.012576103210449219, -0.012077093124389648, -0.011578083038330078, -0.011079072952270508, -0.010580062866210938, -0.010081052780151367, -0.009582042694091797, -0.009083032608032227, -0.008584022521972656, -0.008085012435913086, -0.007586002349853516, -0.007086992263793945, -0.006587982177734375, -0.006088972091674805, -0.005589962005615234, -0.005090951919555664, -0.004591941833496094, -0.0040929317474365234, -0.003593921661376953, -0.003094911575317383, -0.0025959014892578125, -0.002096891403198242, -0.0015978813171386719, -0.0010988712310791016, -0.0005998611450195312, -0.00010085105895996094, 0.0003981590270996094, 0.0008971691131591797, 0.00139617919921875, 0.0018951892852783203, 0.0023941993713378906, 0.002893209457397461, 0.0033922195434570312, 0.0038912296295166016, 0.004390239715576172, 0.004889249801635742, 0.0053882598876953125, 0.005887269973754883, 0.006386280059814453, 0.0068852901458740234, 0.007384300231933594, 0.007883310317993164, 0.008382320404052734, 0.008881330490112305, 0.009380340576171875, 0.009879350662231445, 0.010378360748291016, 0.010877370834350586, 0.011376380920410156, 0.011875391006469727, 0.012374401092529297, 0.012873411178588867, 0.013372421264648438, 0.013871431350708008, 0.014370441436767578, 0.014869451522827148, 0.015368461608886719, 0.01586747169494629, 0.01636648178100586, 0.01686549186706543, 0.017364501953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 9.0, 7.0, 9.0, 7.0, 13.0, 14.0, 14.0, 22.0, 15.0, 15.0, 30.0, 44.0, 64.0, 72.0, 95.0, 186.0, 283.0, 1037.0, 19707.0, 991344.0, 33322.0, 1336.0, 304.0, 155.0, 109.0, 75.0, 50.0, 39.0, 36.0, 30.0, 18.0, 24.0, 10.0, 5.0, 12.0, 7.0, 5.0, 11.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.34716796875, -0.336822509765625, -0.32647705078125, -0.316131591796875, -0.3057861328125, -0.295440673828125, -0.28509521484375, -0.274749755859375, -0.264404296875, -0.254058837890625, -0.24371337890625, -0.233367919921875, -0.2230224609375, -0.212677001953125, -0.20233154296875, -0.191986083984375, -0.181640625, -0.171295166015625, -0.16094970703125, -0.150604248046875, -0.1402587890625, -0.129913330078125, -0.11956787109375, -0.109222412109375, -0.098876953125, -0.088531494140625, -0.07818603515625, -0.067840576171875, -0.0574951171875, -0.047149658203125, -0.03680419921875, -0.026458740234375, -0.01611328125, -0.005767822265625, 0.00457763671875, 0.014923095703125, 0.0252685546875, 0.035614013671875, 0.04595947265625, 0.056304931640625, 0.066650390625, 0.076995849609375, 0.08734130859375, 0.097686767578125, 0.1080322265625, 0.118377685546875, 0.12872314453125, 0.139068603515625, 0.1494140625, 0.159759521484375, 0.17010498046875, 0.180450439453125, 0.1907958984375, 0.201141357421875, 0.21148681640625, 0.221832275390625, 0.232177734375, 0.242523193359375, 0.25286865234375, 0.263214111328125, 0.2735595703125, 0.283905029296875, 0.29425048828125, 0.304595947265625, 0.31494140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 20.0, 130.0, 664.0, 146.0, 44.0, 9.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04348637908697128, -0.037645310163497925, -0.031804244965314865, -0.025963177904486656, -0.020122110843658447, -0.014281043782830238, -0.00843997672200203, -0.0025989115238189697, 0.0032421573996543884, 0.009083224460482597, 0.014924291521310806, 0.020765358582139015, 0.026606425642967224, 0.03244749456644058, 0.03828855976462364, 0.0441296249628067, 0.04997069388628006, 0.05581176280975342, 0.06165282800793648, 0.06749389320611954, 0.0733349621295929, 0.07917603105306625, 0.08501709997653961, 0.09085816144943237, 0.09669923037290573, 0.10254029929637909, 0.10838136076927185, 0.11422242969274521, 0.12006349861621857, 0.12590456008911133, 0.13174563646316528, 0.13758669793605804, 0.1434277594089508, 0.14926882088184357, 0.15510989725589752, 0.16095095872879028, 0.16679203510284424, 0.172633096575737, 0.17847415804862976, 0.18431523442268372, 0.19015629589557648, 0.19599735736846924, 0.2018384337425232, 0.20767949521541595, 0.21352055668830872, 0.21936163306236267, 0.22520269453525543, 0.2310437560081482, 0.23688483238220215, 0.2427258938550949, 0.24856697022914886, 0.2544080317020416, 0.2602491080760956, 0.26609015464782715, 0.2719312310218811, 0.27777230739593506, 0.283613383769989, 0.28945446014404297, 0.29529550671577454, 0.3011365830898285, 0.30697765946388245, 0.312818706035614, 0.31865978240966797, 0.3245008587837219, 0.3303419053554535]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 7.0, 9.0, 10.0, 10.0, 13.0, 18.0, 18.0, 26.0, 31.0, 24.0, 24.0, 32.0, 33.0, 28.0, 33.0, 43.0, 44.0, 49.0, 39.0, 46.0, 43.0, 51.0, 43.0, 36.0, 33.0, 38.0, 27.0, 25.0, 22.0, 29.0, 21.0, 20.0, 16.0, 8.0, 11.0, 8.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02180624008178711, -0.021124038845300674, -0.02044183947145939, -0.019759640097618103, -0.019077438861131668, -0.018395237624645233, -0.017713038250803947, -0.017030838876962662, -0.016348637640476227, -0.015666436403989792, -0.014984237030148506, -0.014302036724984646, -0.013619836419820786, -0.012937636114656925, -0.012255435809493065, -0.011573235504329205, -0.010891035199165344, -0.010208834894001484, -0.009526634588837624, -0.008844434283673763, -0.008162233978509903, -0.007480033673346043, -0.006797833368182182, -0.006115633063018322, -0.005433432757854462, -0.004751232452690601, -0.004069032147526741, -0.0033868318423628807, -0.0027046315371990204, -0.00202243123203516, -0.0013402309268712997, -0.0006580306217074394, 2.41696834564209e-05, 0.0007063699886202812, 0.0013885702937841415, 0.002070770598948002, 0.002752970904111862, 0.0034351712092757225, 0.004117371514439583, 0.004799571819603443, 0.0054817721247673035, 0.006163972429931164, 0.006846172735095024, 0.007528373040258884, 0.008210573345422745, 0.008892773650586605, 0.009574973955750465, 0.010257174260914326, 0.010939374566078186, 0.011621574871242046, 0.012303775176405907, 0.012985975481569767, 0.013668175786733627, 0.014350376091897488, 0.015032576397061348, 0.015714775770902634, 0.01639697700738907, 0.017079178243875504, 0.01776137761771679, 0.018443576991558075, 0.01912577822804451, 0.019807979464530945, 0.02049017883837223, 0.021172378212213516, 0.02185457944869995]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 21.0, 30.0, 16.0, 27.0, 28.0, 37.0, 24.0, 16.0, 44.0, 47.0, 34.0, 51.0, 35.0, 48.0, 38.0, 33.0, 40.0, 34.0, 27.0, 35.0, 25.0, 41.0, 28.0, 28.0, 18.0, 24.0, 19.0, 13.0, 16.0, 14.0, 8.0, 11.0, 7.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3431396484375, -12.912841796875, -12.4825439453125, -12.05224609375, -11.6219482421875, -11.191650390625, -10.7613525390625, -10.3310546875, -9.9007568359375, -9.470458984375, -9.0401611328125, -8.60986328125, -8.1795654296875, -7.749267578125, -7.3189697265625, -6.888671875, -6.4583740234375, -6.028076171875, -5.5977783203125, -5.16748046875, -4.7371826171875, -4.306884765625, -3.8765869140625, -3.4462890625, -3.0159912109375, -2.585693359375, -2.1553955078125, -1.72509765625, -1.2947998046875, -0.864501953125, -0.4342041015625, -0.00390625, 0.4263916015625, 0.856689453125, 1.2869873046875, 1.71728515625, 2.1475830078125, 2.577880859375, 3.0081787109375, 3.4384765625, 3.8687744140625, 4.299072265625, 4.7293701171875, 5.15966796875, 5.5899658203125, 6.020263671875, 6.4505615234375, 6.880859375, 7.3111572265625, 7.741455078125, 8.1717529296875, 8.60205078125, 9.0323486328125, 9.462646484375, 9.8929443359375, 10.3232421875, 10.7535400390625, 11.183837890625, 11.6141357421875, 12.04443359375, 12.4747314453125, 12.905029296875, 13.3353271484375, 13.765625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 15.0, 14.0, 20.0, 21.0, 48.0, 41.0, 71.0, 91.0, 106.0, 186.0, 263.0, 355.0, 528.0, 777.0, 1205.0, 2070.0, 3838.0, 9849.0, 44511.0, 345375.0, 549715.0, 65372.0, 12964.0, 4767.0, 2388.0, 1328.0, 897.0, 503.0, 342.0, 229.0, 163.0, 120.0, 92.0, 67.0, 53.0, 45.0, 24.0, 25.0, 20.0, 11.0, 9.0, 8.0, 9.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-16.96875, -16.47119140625, -15.9736328125, -15.47607421875, -14.978515625, -14.48095703125, -13.9833984375, -13.48583984375, -12.98828125, -12.49072265625, -11.9931640625, -11.49560546875, -10.998046875, -10.50048828125, -10.0029296875, -9.50537109375, -9.0078125, -8.51025390625, -8.0126953125, -7.51513671875, -7.017578125, -6.52001953125, -6.0224609375, -5.52490234375, -5.02734375, -4.52978515625, -4.0322265625, -3.53466796875, -3.037109375, -2.53955078125, -2.0419921875, -1.54443359375, -1.046875, -0.54931640625, -0.0517578125, 0.44580078125, 0.943359375, 1.44091796875, 1.9384765625, 2.43603515625, 2.93359375, 3.43115234375, 3.9287109375, 4.42626953125, 4.923828125, 5.42138671875, 5.9189453125, 6.41650390625, 6.9140625, 7.41162109375, 7.9091796875, 8.40673828125, 8.904296875, 9.40185546875, 9.8994140625, 10.39697265625, 10.89453125, 11.39208984375, 11.8896484375, 12.38720703125, 12.884765625, 13.38232421875, 13.8798828125, 14.37744140625, 14.875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 8.0, 8.0, 9.0, 12.0, 17.0, 18.0, 18.0, 17.0, 23.0, 11.0, 22.0, 42.0, 34.0, 41.0, 52.0, 42.0, 78.0, 108.0, 1855.0, 146.0, 52.0, 72.0, 36.0, 42.0, 33.0, 36.0, 29.0, 30.0, 21.0, 29.0, 23.0, 14.0, 17.0, 8.0, 10.0, 4.0, 5.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.6875, -35.52685546875, -34.3662109375, -33.20556640625, -32.044921875, -30.88427734375, -29.7236328125, -28.56298828125, -27.40234375, -26.24169921875, -25.0810546875, -23.92041015625, -22.759765625, -21.59912109375, -20.4384765625, -19.27783203125, -18.1171875, -16.95654296875, -15.7958984375, -14.63525390625, -13.474609375, -12.31396484375, -11.1533203125, -9.99267578125, -8.83203125, -7.67138671875, -6.5107421875, -5.35009765625, -4.189453125, -3.02880859375, -1.8681640625, -0.70751953125, 0.453125, 1.61376953125, 2.7744140625, 3.93505859375, 5.095703125, 6.25634765625, 7.4169921875, 8.57763671875, 9.73828125, 10.89892578125, 12.0595703125, 13.22021484375, 14.380859375, 15.54150390625, 16.7021484375, 17.86279296875, 19.0234375, 20.18408203125, 21.3447265625, 22.50537109375, 23.666015625, 24.82666015625, 25.9873046875, 27.14794921875, 28.30859375, 29.46923828125, 30.6298828125, 31.79052734375, 32.951171875, 34.11181640625, 35.2724609375, 36.43310546875, 37.59375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 5.0, 17.0, 19.0, 36.0, 78.0, 137.0, 335.0, 728.0, 9750.0, 3129398.0, 4076.0, 593.0, 256.0, 110.0, 64.0, 44.0, 22.0, 13.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.25, -164.25390625, -158.2578125, -152.26171875, -146.265625, -140.26953125, -134.2734375, -128.27734375, -122.28125, -116.28515625, -110.2890625, -104.29296875, -98.296875, -92.30078125, -86.3046875, -80.30859375, -74.3125, -68.31640625, -62.3203125, -56.32421875, -50.328125, -44.33203125, -38.3359375, -32.33984375, -26.34375, -20.34765625, -14.3515625, -8.35546875, -2.359375, 3.63671875, 9.6328125, 15.62890625, 21.625, 27.62109375, 33.6171875, 39.61328125, 45.609375, 51.60546875, 57.6015625, 63.59765625, 69.59375, 75.58984375, 81.5859375, 87.58203125, 93.578125, 99.57421875, 105.5703125, 111.56640625, 117.5625, 123.55859375, 129.5546875, 135.55078125, 141.546875, 147.54296875, 153.5390625, 159.53515625, 165.53125, 171.52734375, 177.5234375, 183.51953125, 189.515625, 195.51171875, 201.5078125, 207.50390625, 213.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 30.0, 265.0, 542.0, 146.0, 20.0, 7.0], "bins": [-374.1932678222656, -367.989501953125, -361.7857666015625, -355.5820007324219, -349.3782653808594, -343.17449951171875, -336.9707336425781, -330.7669982910156, -324.563232421875, -318.3594665527344, -312.1557312011719, -305.95196533203125, -299.74822998046875, -293.5444641113281, -287.3406982421875, -281.136962890625, -274.9331970214844, -268.72943115234375, -262.52569580078125, -256.3219299316406, -250.11817932128906, -243.9144287109375, -237.71067810058594, -231.50692749023438, -225.3031768798828, -219.09942626953125, -212.8956756591797, -206.69190979003906, -200.4881591796875, -194.28440856933594, -188.08065795898438, -181.87689208984375, -175.6731414794922, -169.46939086914062, -163.26564025878906, -157.06187438964844, -150.85812377929688, -144.6543731689453, -138.45062255859375, -132.24685668945312, -126.0431137084961, -119.83936309814453, -113.63560485839844, -107.43185424804688, -101.22809600830078, -95.02434539794922, -88.82058715820312, -82.61683654785156, -76.41307830810547, -70.2093276977539, -64.00556945800781, -57.80181884765625, -51.598060607910156, -45.394309997558594, -39.190555572509766, -32.98680114746094, -26.783048629760742, -20.579294204711914, -14.375540733337402, -8.17178726196289, -1.9680328369140625, 4.235721588134766, 10.439474105834961, 16.64322853088379, 22.846982955932617]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 14.0, 20.0, 11.0, 18.0, 18.0, 16.0, 18.0, 28.0, 26.0, 37.0, 29.0, 37.0, 55.0, 38.0, 33.0, 40.0, 65.0, 44.0, 36.0, 30.0, 37.0, 30.0, 33.0, 35.0, 33.0, 34.0, 21.0, 24.0, 20.0, 21.0, 14.0, 14.0, 15.0, 9.0, 7.0, 8.0, 7.0, 2.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.68331146240234, -103.46924591064453, -100.25518035888672, -97.0411148071289, -93.8270492553711, -90.61298370361328, -87.39892578125, -84.18486022949219, -80.97079467773438, -77.75672912597656, -74.54266357421875, -71.32859802246094, -68.11453247070312, -64.90046691894531, -61.686405181884766, -58.47233963012695, -55.258270263671875, -52.04420471191406, -48.83013916015625, -45.61607360839844, -42.402008056640625, -39.18794250488281, -35.973880767822266, -32.75981521606445, -29.54574966430664, -26.331684112548828, -23.117618560791016, -19.903554916381836, -16.689489364624023, -13.475423812866211, -10.261360168457031, -7.047294616699219, -3.8332366943359375, -0.6191716194152832, 2.594893455505371, 5.808958053588867, 9.02302360534668, 12.237089157104492, 15.451152801513672, 18.665218353271484, 21.879283905029297, 25.09334945678711, 28.307415008544922, 31.5214786529541, 34.73554229736328, 37.949607849121094, 41.163673400878906, 44.37773895263672, 47.59180450439453, 50.805870056152344, 54.019935607910156, 57.23400115966797, 60.44806671142578, 63.662132263183594, 66.87619018554688, 70.09025573730469, 73.3043212890625, 76.51838684082031, 79.73245239257812, 82.94651794433594, 86.16058349609375, 89.37464904785156, 92.58871459960938, 95.80278015136719, 99.016845703125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 19.0, 19.0, 21.0, 25.0, 31.0, 14.0, 34.0, 37.0, 30.0, 33.0, 37.0, 41.0, 55.0, 37.0, 26.0, 45.0, 35.0, 54.0, 35.0, 40.0, 35.0, 25.0, 30.0, 23.0, 27.0, 26.0, 26.0, 16.0, 19.0, 15.0, 9.0, 11.0, 14.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.7265625, -14.269287109375, -13.81201171875, -13.354736328125, -12.8974609375, -12.440185546875, -11.98291015625, -11.525634765625, -11.068359375, -10.611083984375, -10.15380859375, -9.696533203125, -9.2392578125, -8.781982421875, -8.32470703125, -7.867431640625, -7.41015625, -6.952880859375, -6.49560546875, -6.038330078125, -5.5810546875, -5.123779296875, -4.66650390625, -4.209228515625, -3.751953125, -3.294677734375, -2.83740234375, -2.380126953125, -1.9228515625, -1.465576171875, -1.00830078125, -0.551025390625, -0.09375, 0.363525390625, 0.82080078125, 1.278076171875, 1.7353515625, 2.192626953125, 2.64990234375, 3.107177734375, 3.564453125, 4.021728515625, 4.47900390625, 4.936279296875, 5.3935546875, 5.850830078125, 6.30810546875, 6.765380859375, 7.22265625, 7.679931640625, 8.13720703125, 8.594482421875, 9.0517578125, 9.509033203125, 9.96630859375, 10.423583984375, 10.880859375, 11.338134765625, 11.79541015625, 12.252685546875, 12.7099609375, 13.167236328125, 13.62451171875, 14.081787109375, 14.5390625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 11.0, 20.0, 25.0, 27.0, 39.0, 48.0, 79.0, 140.0, 253.0, 481.0, 882.0, 1786.0, 3367.0, 7261.0, 39342.0, 2579382.0, 1524498.0, 23037.0, 6514.0, 3038.0, 1714.0, 948.0, 520.0, 311.0, 184.0, 115.0, 77.0, 36.0, 33.0, 18.0, 17.0, 17.0, 8.0, 8.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.5, -52.84521484375, -51.1904296875, -49.53564453125, -47.880859375, -46.22607421875, -44.5712890625, -42.91650390625, -41.26171875, -39.60693359375, -37.9521484375, -36.29736328125, -34.642578125, -32.98779296875, -31.3330078125, -29.67822265625, -28.0234375, -26.36865234375, -24.7138671875, -23.05908203125, -21.404296875, -19.74951171875, -18.0947265625, -16.43994140625, -14.78515625, -13.13037109375, -11.4755859375, -9.82080078125, -8.166015625, -6.51123046875, -4.8564453125, -3.20166015625, -1.546875, 0.10791015625, 1.7626953125, 3.41748046875, 5.072265625, 6.72705078125, 8.3818359375, 10.03662109375, 11.69140625, 13.34619140625, 15.0009765625, 16.65576171875, 18.310546875, 19.96533203125, 21.6201171875, 23.27490234375, 24.9296875, 26.58447265625, 28.2392578125, 29.89404296875, 31.548828125, 33.20361328125, 34.8583984375, 36.51318359375, 38.16796875, 39.82275390625, 41.4775390625, 43.13232421875, 44.787109375, 46.44189453125, 48.0966796875, 49.75146484375, 51.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 8.0, 8.0, 9.0, 9.0, 16.0, 18.0, 24.0, 39.0, 65.0, 124.0, 218.0, 484.0, 783.0, 947.0, 626.0, 305.0, 145.0, 79.0, 35.0, 27.0, 17.0, 20.0, 10.0, 6.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.6396484375, -30.685546875, -29.7314453125, -28.77734375, -27.8232421875, -26.869140625, -25.9150390625, -24.9609375, -24.0068359375, -23.052734375, -22.0986328125, -21.14453125, -20.1904296875, -19.236328125, -18.2822265625, -17.328125, -16.3740234375, -15.419921875, -14.4658203125, -13.51171875, -12.5576171875, -11.603515625, -10.6494140625, -9.6953125, -8.7412109375, -7.787109375, -6.8330078125, -5.87890625, -4.9248046875, -3.970703125, -3.0166015625, -2.0625, -1.1083984375, -0.154296875, 0.7998046875, 1.75390625, 2.7080078125, 3.662109375, 4.6162109375, 5.5703125, 6.5244140625, 7.478515625, 8.4326171875, 9.38671875, 10.3408203125, 11.294921875, 12.2490234375, 13.203125, 14.1572265625, 15.111328125, 16.0654296875, 17.01953125, 17.9736328125, 18.927734375, 19.8818359375, 20.8359375, 21.7900390625, 22.744140625, 23.6982421875, 24.65234375, 25.6064453125, 26.560546875, 27.5146484375, 28.46875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 2.0, 8.0, 3.0, 7.0, 11.0, 14.0, 16.0, 35.0, 58.0, 84.0, 190.0, 422.0, 1450.0, 6925.0, 64026.0, 4069577.0, 43877.0, 5578.0, 1191.0, 379.0, 162.0, 77.0, 57.0, 38.0, 21.0, 14.0, 9.0, 7.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.4375, -121.1767578125, -116.916015625, -112.6552734375, -108.39453125, -104.1337890625, -99.873046875, -95.6123046875, -91.3515625, -87.0908203125, -82.830078125, -78.5693359375, -74.30859375, -70.0478515625, -65.787109375, -61.5263671875, -57.265625, -53.0048828125, -48.744140625, -44.4833984375, -40.22265625, -35.9619140625, -31.701171875, -27.4404296875, -23.1796875, -18.9189453125, -14.658203125, -10.3974609375, -6.13671875, -1.8759765625, 2.384765625, 6.6455078125, 10.90625, 15.1669921875, 19.427734375, 23.6884765625, 27.94921875, 32.2099609375, 36.470703125, 40.7314453125, 44.9921875, 49.2529296875, 53.513671875, 57.7744140625, 62.03515625, 66.2958984375, 70.556640625, 74.8173828125, 79.078125, 83.3388671875, 87.599609375, 91.8603515625, 96.12109375, 100.3818359375, 104.642578125, 108.9033203125, 113.1640625, 117.4248046875, 121.685546875, 125.9462890625, 130.20703125, 134.4677734375, 138.728515625, 142.9892578125, 147.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 3.0, 11.0, 9.0, 14.0, 16.0, 31.0, 36.0, 44.0, 75.0, 121.0, 120.0, 141.0, 98.0, 74.0, 55.0, 33.0, 26.0, 23.0, 14.0, 14.0, 10.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-116.70932006835938, -113.93148803710938, -111.15364837646484, -108.37581634521484, -105.59797668457031, -102.82014465332031, -100.04231262207031, -97.26447296142578, -94.48663330078125, -91.70880126953125, -88.93096160888672, -86.15312957763672, -83.37528991699219, -80.59745788574219, -77.81962585449219, -75.04178619384766, -72.26395416259766, -69.48612213134766, -66.70828247070312, -63.930450439453125, -61.152610778808594, -58.374778747558594, -55.59694290161133, -52.81910705566406, -50.0412712097168, -47.26343536376953, -44.485599517822266, -41.707763671875, -38.929931640625, -36.15209197998047, -33.37425994873047, -30.596424102783203, -27.818580627441406, -25.04074478149414, -22.262908935546875, -19.485074996948242, -16.707239151000977, -13.929403305053711, -11.151569366455078, -8.373733520507812, -5.595897674560547, -2.8180623054504395, -0.04022693634033203, 2.737607955932617, 5.515443801879883, 8.293279647827148, 11.071113586425781, 13.848949432373047, 16.626785278320312, 19.404621124267578, 22.182456970214844, 24.960290908813477, 27.738126754760742, 30.515962600708008, 33.29379653930664, 36.071632385253906, 38.84946823120117, 41.62730407714844, 44.4051399230957, 47.18297576904297, 49.96080780029297, 52.7386474609375, 55.5164794921875, 58.294315338134766, 61.07215118408203]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 13.0, 13.0, 11.0, 14.0, 21.0, 15.0, 25.0, 27.0, 29.0, 28.0, 29.0, 28.0, 19.0, 37.0, 31.0, 34.0, 36.0, 47.0, 53.0, 43.0, 44.0, 39.0, 30.0, 19.0, 29.0, 24.0, 39.0, 20.0, 27.0, 26.0, 17.0, 20.0, 10.0, 14.0, 13.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-63.53112030029297, -61.490440368652344, -59.44975662231445, -57.40907669067383, -55.36839294433594, -53.32771301269531, -51.28703308105469, -49.24635314941406, -47.20566940307617, -45.16498947143555, -43.124305725097656, -41.08362579345703, -39.042945861816406, -37.002262115478516, -34.96158218383789, -32.9208984375, -30.880218505859375, -28.839536666870117, -26.79885482788086, -24.758174896240234, -22.717493057250977, -20.67681121826172, -18.636131286621094, -16.595449447631836, -14.554767608642578, -12.51408576965332, -10.473404884338379, -8.432723999023438, -6.39204216003418, -4.351360321044922, -2.3106794357299805, -0.26999855041503906, 1.7706756591796875, 3.811357021331787, 5.852038383483887, 7.892719745635986, 9.933401107788086, 11.974082946777344, 14.014763832092285, 16.055444717407227, 18.096126556396484, 20.136808395385742, 22.177490234375, 24.218170166015625, 26.258852005004883, 28.29953384399414, 30.340213775634766, 32.380897521972656, 34.42157745361328, 36.462257385253906, 38.5029411315918, 40.54362106323242, 42.58430480957031, 44.62498474121094, 46.66566467285156, 48.70634460449219, 50.74702835083008, 52.7877082824707, 54.828392028808594, 56.86907196044922, 58.909751892089844, 60.950435638427734, 62.99111557006836, 65.03179931640625, 67.07247924804688]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 6.0, 9.0, 10.0, 7.0, 17.0, 13.0, 15.0, 30.0, 21.0, 20.0, 23.0, 42.0, 30.0, 30.0, 36.0, 40.0, 31.0, 46.0, 44.0, 54.0, 26.0, 38.0, 41.0, 44.0, 22.0, 28.0, 33.0, 22.0, 25.0, 34.0, 25.0, 16.0, 23.0, 15.0, 10.0, 19.0, 11.0, 5.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.0078125, -13.567138671875, -13.12646484375, -12.685791015625, -12.2451171875, -11.804443359375, -11.36376953125, -10.923095703125, -10.482421875, -10.041748046875, -9.60107421875, -9.160400390625, -8.7197265625, -8.279052734375, -7.83837890625, -7.397705078125, -6.95703125, -6.516357421875, -6.07568359375, -5.635009765625, -5.1943359375, -4.753662109375, -4.31298828125, -3.872314453125, -3.431640625, -2.990966796875, -2.55029296875, -2.109619140625, -1.6689453125, -1.228271484375, -0.78759765625, -0.346923828125, 0.09375, 0.534423828125, 0.97509765625, 1.415771484375, 1.8564453125, 2.297119140625, 2.73779296875, 3.178466796875, 3.619140625, 4.059814453125, 4.50048828125, 4.941162109375, 5.3818359375, 5.822509765625, 6.26318359375, 6.703857421875, 7.14453125, 7.585205078125, 8.02587890625, 8.466552734375, 8.9072265625, 9.347900390625, 9.78857421875, 10.229248046875, 10.669921875, 11.110595703125, 11.55126953125, 11.991943359375, 12.4326171875, 12.873291015625, 13.31396484375, 13.754638671875, 14.1953125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 5.0, 14.0, 25.0, 39.0, 79.0, 69.0, 142.0, 186.0, 292.0, 491.0, 786.0, 1312.0, 2064.0, 3266.0, 5161.0, 8408.0, 13775.0, 22336.0, 38546.0, 68898.0, 127093.0, 230479.0, 231079.0, 127808.0, 68982.0, 38884.0, 22626.0, 13638.0, 8588.0, 5125.0, 3149.0, 1926.0, 1240.0, 729.0, 452.0, 279.0, 198.0, 135.0, 72.0, 61.0, 32.0, 37.0, 15.0, 11.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.639678955078125, -1.58502197265625, -1.530364990234375, -1.4757080078125, -1.421051025390625, -1.36639404296875, -1.311737060546875, -1.257080078125, -1.202423095703125, -1.14776611328125, -1.093109130859375, -1.0384521484375, -0.983795166015625, -0.92913818359375, -0.874481201171875, -0.81982421875, -0.765167236328125, -0.71051025390625, -0.655853271484375, -0.6011962890625, -0.546539306640625, -0.49188232421875, -0.437225341796875, -0.382568359375, -0.327911376953125, -0.27325439453125, -0.218597412109375, -0.1639404296875, -0.109283447265625, -0.05462646484375, 3.0517578125e-05, 0.0546875, 0.109344482421875, 0.16400146484375, 0.218658447265625, 0.2733154296875, 0.327972412109375, 0.38262939453125, 0.437286376953125, 0.491943359375, 0.546600341796875, 0.60125732421875, 0.655914306640625, 0.7105712890625, 0.765228271484375, 0.81988525390625, 0.874542236328125, 0.92919921875, 0.983856201171875, 1.03851318359375, 1.093170166015625, 1.1478271484375, 1.202484130859375, 1.25714111328125, 1.311798095703125, 1.366455078125, 1.421112060546875, 1.47576904296875, 1.530426025390625, 1.5850830078125, 1.639739990234375, 1.69439697265625, 1.749053955078125, 1.8037109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 24.0, 20.0, 18.0, 29.0, 34.0, 32.0, 36.0, 28.0, 47.0, 50.0, 41.0, 42.0, 55.0, 1077.0, 46.0, 57.0, 38.0, 40.0, 38.0, 43.0, 40.0, 22.0, 20.0, 23.0, 21.0, 14.0, 11.0, 10.0, 12.0, 8.0, 10.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.7578125, -12.40869140625, -12.0595703125, -11.71044921875, -11.361328125, -11.01220703125, -10.6630859375, -10.31396484375, -9.96484375, -9.61572265625, -9.2666015625, -8.91748046875, -8.568359375, -8.21923828125, -7.8701171875, -7.52099609375, -7.171875, -6.82275390625, -6.4736328125, -6.12451171875, -5.775390625, -5.42626953125, -5.0771484375, -4.72802734375, -4.37890625, -4.02978515625, -3.6806640625, -3.33154296875, -2.982421875, -2.63330078125, -2.2841796875, -1.93505859375, -1.5859375, -1.23681640625, -0.8876953125, -0.53857421875, -0.189453125, 0.15966796875, 0.5087890625, 0.85791015625, 1.20703125, 1.55615234375, 1.9052734375, 2.25439453125, 2.603515625, 2.95263671875, 3.3017578125, 3.65087890625, 4.0, 4.34912109375, 4.6982421875, 5.04736328125, 5.396484375, 5.74560546875, 6.0947265625, 6.44384765625, 6.79296875, 7.14208984375, 7.4912109375, 7.84033203125, 8.189453125, 8.53857421875, 8.8876953125, 9.23681640625, 9.5859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 10.0, 16.0, 21.0, 28.0, 42.0, 65.0, 95.0, 192.0, 326.0, 551.0, 973.0, 1722.0, 3121.0, 5675.0, 10432.0, 19693.0, 39379.0, 81452.0, 179045.0, 1363997.0, 204800.0, 92700.0, 44281.0, 22203.0, 11837.0, 6463.0, 3571.0, 1865.0, 1069.0, 596.0, 351.0, 210.0, 94.0, 72.0, 45.0, 43.0, 29.0, 21.0, 11.0, 6.0, 6.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.151611328125, -1.10986328125, -1.068115234375, -1.0263671875, -0.984619140625, -0.94287109375, -0.901123046875, -0.859375, -0.817626953125, -0.77587890625, -0.734130859375, -0.6923828125, -0.650634765625, -0.60888671875, -0.567138671875, -0.525390625, -0.483642578125, -0.44189453125, -0.400146484375, -0.3583984375, -0.316650390625, -0.27490234375, -0.233154296875, -0.19140625, -0.149658203125, -0.10791015625, -0.066162109375, -0.0244140625, 0.017333984375, 0.05908203125, 0.100830078125, 0.142578125, 0.184326171875, 0.22607421875, 0.267822265625, 0.3095703125, 0.351318359375, 0.39306640625, 0.434814453125, 0.4765625, 0.518310546875, 0.56005859375, 0.601806640625, 0.6435546875, 0.685302734375, 0.72705078125, 0.768798828125, 0.810546875, 0.852294921875, 0.89404296875, 0.935791015625, 0.9775390625, 1.019287109375, 1.06103515625, 1.102783203125, 1.14453125, 1.186279296875, 1.22802734375, 1.269775390625, 1.3115234375, 1.353271484375, 1.39501953125, 1.436767578125, 1.478515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 1.0, 6.0, 4.0, 5.0, 11.0, 6.0, 12.0, 23.0, 27.0, 41.0, 38.0, 34.0, 58.0, 72.0, 55.0, 114.0, 98.0, 81.0, 44.0, 40.0, 40.0, 36.0, 31.0, 25.0, 17.0, 12.0, 13.0, 9.0, 7.0, 10.0, 3.0, 6.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07080078125, -0.06871604919433594, -0.06663131713867188, -0.06454658508300781, -0.06246185302734375, -0.06037712097167969, -0.058292388916015625, -0.05620765686035156, -0.0541229248046875, -0.05203819274902344, -0.049953460693359375, -0.04786872863769531, -0.04578399658203125, -0.04369926452636719, -0.041614532470703125, -0.03952980041503906, -0.037445068359375, -0.03536033630371094, -0.033275604248046875, -0.031190872192382812, -0.02910614013671875, -0.027021408081054688, -0.024936676025390625, -0.022851943969726562, -0.0207672119140625, -0.018682479858398438, -0.016597747802734375, -0.014513015747070312, -0.01242828369140625, -0.010343551635742188, -0.008258819580078125, -0.0061740875244140625, -0.00408935546875, -0.0020046234130859375, 8.0108642578125e-05, 0.0021648406982421875, 0.00424957275390625, 0.0063343048095703125, 0.008419036865234375, 0.010503768920898438, 0.0125885009765625, 0.014673233032226562, 0.016757965087890625, 0.018842697143554688, 0.02092742919921875, 0.023012161254882812, 0.025096893310546875, 0.027181625366210938, 0.029266357421875, 0.03135108947753906, 0.033435821533203125, 0.03552055358886719, 0.03760528564453125, 0.03969001770019531, 0.041774749755859375, 0.04385948181152344, 0.0459442138671875, 0.04802894592285156, 0.050113677978515625, 0.05219841003417969, 0.05428314208984375, 0.05636787414550781, 0.058452606201171875, 0.06053733825683594, 0.0626220703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 8.0, 14.0, 10.0, 17.0, 24.0, 22.0, 38.0, 56.0, 72.0, 98.0, 136.0, 256.0, 950.0, 21276.0, 1004926.0, 18970.0, 836.0, 280.0, 154.0, 99.0, 72.0, 60.0, 30.0, 35.0, 20.0, 12.0, 15.0, 7.0, 8.0, 8.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3105316162109375, -1.267547607421875, -1.2245635986328125, -1.18157958984375, -1.1385955810546875, -1.095611572265625, -1.0526275634765625, -1.0096435546875, -0.9666595458984375, -0.923675537109375, -0.8806915283203125, -0.83770751953125, -0.7947235107421875, -0.751739501953125, -0.7087554931640625, -0.665771484375, -0.6227874755859375, -0.579803466796875, -0.5368194580078125, -0.49383544921875, -0.4508514404296875, -0.407867431640625, -0.3648834228515625, -0.3218994140625, -0.2789154052734375, -0.235931396484375, -0.1929473876953125, -0.14996337890625, -0.1069793701171875, -0.063995361328125, -0.0210113525390625, 0.02197265625, 0.0649566650390625, 0.107940673828125, 0.1509246826171875, 0.19390869140625, 0.2368927001953125, 0.279876708984375, 0.3228607177734375, 0.3658447265625, 0.4088287353515625, 0.451812744140625, 0.4947967529296875, 0.53778076171875, 0.5807647705078125, 0.623748779296875, 0.6667327880859375, 0.709716796875, 0.7527008056640625, 0.795684814453125, 0.8386688232421875, 0.88165283203125, 0.9246368408203125, 0.967620849609375, 1.0106048583984375, 1.0535888671875, 1.0965728759765625, 1.139556884765625, 1.1825408935546875, 1.22552490234375, 1.2685089111328125, 1.311492919921875, 1.3544769287109375, 1.3974609375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 17.0, 89.0, 729.0, 153.0, 25.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4743356704711914, -1.4370964765548706, -1.3998572826385498, -1.362618088722229, -1.3253788948059082, -1.288139820098877, -1.2509005069732666, -1.2136614322662354, -1.1764222383499146, -1.1391830444335938, -1.101943850517273, -1.0647046566009521, -1.0274654626846313, -0.9902263283729553, -0.9529871344566345, -0.9157480001449585, -0.8785087466239929, -0.8412695527076721, -0.8040303587913513, -0.7667912244796753, -0.7295520305633545, -0.6923128366470337, -0.6550736427307129, -0.6178344488143921, -0.5805952548980713, -0.5433560609817505, -0.5061168670654297, -0.4688777029514313, -0.43163853883743286, -0.39439934492111206, -0.35716015100479126, -0.31992098689079285, -0.2826818823814392, -0.2454427033662796, -0.20820352435112, -0.1709643304347992, -0.1337251514196396, -0.09648597240447998, -0.05924677848815918, -0.022007614374160767, 0.015231579542160034, 0.05247076228260994, 0.08970994502305984, 0.12694913148880005, 0.16418831050395966, 0.20142748951911926, 0.23866668343544006, 0.2759058475494385, 0.3131450414657593, 0.3503842353820801, 0.3876233994960785, 0.4248625934123993, 0.4621017575263977, 0.4993409514427185, 0.5365801453590393, 0.5738192796707153, 0.6110584735870361, 0.6482976675033569, 0.6855368614196777, 0.7227760553359985, 0.7600151896476746, 0.7972543835639954, 0.8344935774803162, 0.8717327117919922, 0.9089719653129578]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 8.0, 6.0, 7.0, 5.0, 7.0, 15.0, 12.0, 25.0, 17.0, 18.0, 19.0, 40.0, 32.0, 33.0, 45.0, 44.0, 39.0, 49.0, 33.0, 48.0, 45.0, 49.0, 40.0, 43.0, 38.0, 40.0, 33.0, 26.0, 29.0, 34.0, 23.0, 24.0, 19.0, 16.0, 9.0, 11.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1353248953819275, -0.1309289038181305, -0.1265329122543335, -0.1221369281411171, -0.1177409365773201, -0.1133449450135231, -0.1089489609003067, -0.1045529693365097, -0.10015697777271271, -0.09576098620891571, -0.09136499464511871, -0.08696901053190231, -0.08257301896810532, -0.07817702740430832, -0.07378104329109192, -0.06938505172729492, -0.06498906016349792, -0.06059306859970093, -0.05619708076119423, -0.05180109292268753, -0.04740510135889053, -0.043009109795093536, -0.03861312195658684, -0.03421713411808014, -0.029821142554283142, -0.025425152853131294, -0.021029163151979446, -0.0166331734508276, -0.01223718374967575, -0.007841194048523903, -0.003445204347372055, 0.0009507853537797928, 0.005346775054931641, 0.009742764756083488, 0.014138754457235336, 0.018534744158387184, 0.022930733859539032, 0.02732672356069088, 0.03172271326184273, 0.036118701100349426, 0.04051469266414642, 0.04491068422794342, 0.04930667206645012, 0.05370265990495682, 0.058098651468753815, 0.06249464303255081, 0.06689062714576721, 0.07128661870956421, 0.0756826102733612, 0.0800786018371582, 0.0844745934009552, 0.0888705775141716, 0.0932665690779686, 0.0976625606417656, 0.102058544754982, 0.10645453631877899, 0.11085052788257599, 0.11524651944637299, 0.11964251101016998, 0.12403849512338638, 0.12843447923660278, 0.13283047080039978, 0.13722646236419678, 0.14162245392799377, 0.14601844549179077]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 7.0, 8.0, 10.0, 7.0, 17.0, 13.0, 15.0, 30.0, 21.0, 20.0, 23.0, 40.0, 32.0, 31.0, 35.0, 40.0, 31.0, 45.0, 44.0, 56.0, 25.0, 36.0, 40.0, 47.0, 21.0, 29.0, 33.0, 22.0, 25.0, 34.0, 25.0, 16.0, 23.0, 15.0, 10.0, 19.0, 11.0, 5.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.0078125, -13.5672607421875, -13.126708984375, -12.6861572265625, -12.24560546875, -11.8050537109375, -11.364501953125, -10.9239501953125, -10.4833984375, -10.0428466796875, -9.602294921875, -9.1617431640625, -8.72119140625, -8.2806396484375, -7.840087890625, -7.3995361328125, -6.958984375, -6.5184326171875, -6.077880859375, -5.6373291015625, -5.19677734375, -4.7562255859375, -4.315673828125, -3.8751220703125, -3.4345703125, -2.9940185546875, -2.553466796875, -2.1129150390625, -1.67236328125, -1.2318115234375, -0.791259765625, -0.3507080078125, 0.08984375, 0.5303955078125, 0.970947265625, 1.4114990234375, 1.85205078125, 2.2926025390625, 2.733154296875, 3.1737060546875, 3.6142578125, 4.0548095703125, 4.495361328125, 4.9359130859375, 5.37646484375, 5.8170166015625, 6.257568359375, 6.6981201171875, 7.138671875, 7.5792236328125, 8.019775390625, 8.4603271484375, 8.90087890625, 9.3414306640625, 9.781982421875, 10.2225341796875, 10.6630859375, 11.1036376953125, 11.544189453125, 11.9847412109375, 12.42529296875, 12.8658447265625, 13.306396484375, 13.7469482421875, 14.1875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 10.0, 14.0, 15.0, 27.0, 29.0, 37.0, 62.0, 55.0, 94.0, 112.0, 181.0, 249.0, 434.0, 707.0, 1264.0, 2504.0, 6432.0, 35287.0, 762145.0, 214454.0, 15709.0, 4246.0, 1875.0, 943.0, 514.0, 362.0, 211.0, 133.0, 112.0, 78.0, 47.0, 42.0, 29.0, 24.0, 27.0, 18.0, 7.0, 8.0, 9.0, 6.0, 10.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-23.96875, -23.215087890625, -22.46142578125, -21.707763671875, -20.9541015625, -20.200439453125, -19.44677734375, -18.693115234375, -17.939453125, -17.185791015625, -16.43212890625, -15.678466796875, -14.9248046875, -14.171142578125, -13.41748046875, -12.663818359375, -11.91015625, -11.156494140625, -10.40283203125, -9.649169921875, -8.8955078125, -8.141845703125, -7.38818359375, -6.634521484375, -5.880859375, -5.127197265625, -4.37353515625, -3.619873046875, -2.8662109375, -2.112548828125, -1.35888671875, -0.605224609375, 0.1484375, 0.902099609375, 1.65576171875, 2.409423828125, 3.1630859375, 3.916748046875, 4.67041015625, 5.424072265625, 6.177734375, 6.931396484375, 7.68505859375, 8.438720703125, 9.1923828125, 9.946044921875, 10.69970703125, 11.453369140625, 12.20703125, 12.960693359375, 13.71435546875, 14.468017578125, 15.2216796875, 15.975341796875, 16.72900390625, 17.482666015625, 18.236328125, 18.989990234375, 19.74365234375, 20.497314453125, 21.2509765625, 22.004638671875, 22.75830078125, 23.511962890625, 24.265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 11.0, 6.0, 9.0, 14.0, 17.0, 14.0, 23.0, 22.0, 22.0, 26.0, 28.0, 44.0, 41.0, 42.0, 54.0, 50.0, 80.0, 182.0, 1830.0, 93.0, 50.0, 50.0, 45.0, 40.0, 29.0, 30.0, 27.0, 21.0, 22.0, 19.0, 13.0, 15.0, 18.0, 8.0, 8.0, 8.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.81640625, -30.6015625, -29.38671875, -28.171875, -26.95703125, -25.7421875, -24.52734375, -23.3125, -22.09765625, -20.8828125, -19.66796875, -18.453125, -17.23828125, -16.0234375, -14.80859375, -13.59375, -12.37890625, -11.1640625, -9.94921875, -8.734375, -7.51953125, -6.3046875, -5.08984375, -3.875, -2.66015625, -1.4453125, -0.23046875, 0.984375, 2.19921875, 3.4140625, 4.62890625, 5.84375, 7.05859375, 8.2734375, 9.48828125, 10.703125, 11.91796875, 13.1328125, 14.34765625, 15.5625, 16.77734375, 17.9921875, 19.20703125, 20.421875, 21.63671875, 22.8515625, 24.06640625, 25.28125, 26.49609375, 27.7109375, 28.92578125, 30.140625, 31.35546875, 32.5703125, 33.78515625, 35.0, 36.21484375, 37.4296875, 38.64453125, 39.859375, 41.07421875, 42.2890625, 43.50390625, 44.71875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 10.0, 8.0, 6.0, 16.0, 16.0, 14.0, 21.0, 19.0, 26.0, 26.0, 49.0, 50.0, 94.0, 132.0, 203.0, 451.0, 2084.0, 2880214.0, 259496.0, 1598.0, 421.0, 222.0, 117.0, 87.0, 68.0, 41.0, 33.0, 21.0, 27.0, 22.0, 18.0, 16.0, 17.0, 9.0, 4.0, 9.0, 8.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0], "bins": [-130.625, -127.0888671875, -123.552734375, -120.0166015625, -116.48046875, -112.9443359375, -109.408203125, -105.8720703125, -102.3359375, -98.7998046875, -95.263671875, -91.7275390625, -88.19140625, -84.6552734375, -81.119140625, -77.5830078125, -74.046875, -70.5107421875, -66.974609375, -63.4384765625, -59.90234375, -56.3662109375, -52.830078125, -49.2939453125, -45.7578125, -42.2216796875, -38.685546875, -35.1494140625, -31.61328125, -28.0771484375, -24.541015625, -21.0048828125, -17.46875, -13.9326171875, -10.396484375, -6.8603515625, -3.32421875, 0.2119140625, 3.748046875, 7.2841796875, 10.8203125, 14.3564453125, 17.892578125, 21.4287109375, 24.96484375, 28.5009765625, 32.037109375, 35.5732421875, 39.109375, 42.6455078125, 46.181640625, 49.7177734375, 53.25390625, 56.7900390625, 60.326171875, 63.8623046875, 67.3984375, 70.9345703125, 74.470703125, 78.0068359375, 81.54296875, 85.0791015625, 88.615234375, 92.1513671875, 95.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 81.0, 542.0, 359.0, 31.0], "bins": [-239.0032501220703, -235.13783264160156, -231.2724151611328, -227.40699768066406, -223.54159545898438, -219.67617797851562, -215.81076049804688, -211.94534301757812, -208.07992553710938, -204.21450805664062, -200.34909057617188, -196.48367309570312, -192.61825561523438, -188.7528533935547, -184.88743591308594, -181.0220184326172, -177.15660095214844, -173.2911834716797, -169.42576599121094, -165.5603485107422, -161.6949462890625, -157.82952880859375, -153.964111328125, -150.09869384765625, -146.2332763671875, -142.36785888671875, -138.50244140625, -134.63702392578125, -130.7716064453125, -126.90619659423828, -123.04078674316406, -119.17536926269531, -115.30994415283203, -111.44452667236328, -107.57911682128906, -103.71369934082031, -99.84828186035156, -95.98286437988281, -92.11744689941406, -88.25203704833984, -84.3866195678711, -80.52120208740234, -76.65579223632812, -72.79037475585938, -68.92495727539062, -65.05953979492188, -61.19412612915039, -57.328712463378906, -53.463294982910156, -49.597877502441406, -45.73246383666992, -41.86705017089844, -38.00163269042969, -34.13621520996094, -30.270801544189453, -26.405385971069336, -22.53997039794922, -18.6745548248291, -14.809139251708984, -10.943723678588867, -7.07830810546875, -3.212892532348633, 0.6525230407714844, 4.517938613891602, 8.383353233337402]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 11.0, 10.0, 9.0, 18.0, 17.0, 20.0, 17.0, 20.0, 28.0, 39.0, 22.0, 33.0, 37.0, 45.0, 41.0, 44.0, 44.0, 40.0, 45.0, 42.0, 47.0, 37.0, 45.0, 32.0, 32.0, 38.0, 37.0, 15.0, 19.0, 14.0, 14.0, 17.0, 14.0, 10.0, 8.0, 12.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-117.60169219970703, -114.11853790283203, -110.63538360595703, -107.15222930908203, -103.66907501220703, -100.18592071533203, -96.7027587890625, -93.2196044921875, -89.7364501953125, -86.2532958984375, -82.7701416015625, -79.2869873046875, -75.8038330078125, -72.3206787109375, -68.8375244140625, -65.3543701171875, -61.8712158203125, -58.3880615234375, -54.9049072265625, -51.4217529296875, -47.9385986328125, -44.4554443359375, -40.972286224365234, -37.489131927490234, -34.005977630615234, -30.522823333740234, -27.039669036865234, -23.5565128326416, -20.0733585357666, -16.5902042388916, -13.107048034667969, -9.623893737792969, -6.1407318115234375, -2.6575770378112793, 0.8255777359008789, 4.308732986450195, 7.791887283325195, 11.275041580200195, 14.758197784423828, 18.241352081298828, 21.724506378173828, 25.207660675048828, 28.690814971923828, 32.173973083496094, 35.657127380371094, 39.140281677246094, 42.623435974121094, 46.106590270996094, 49.589744567871094, 53.072898864746094, 56.556053161621094, 60.039207458496094, 63.522361755371094, 67.0055160522461, 70.48867797851562, 73.97183227539062, 77.45498657226562, 80.93814086914062, 84.42129516601562, 87.90444946289062, 91.38760375976562, 94.87075805664062, 98.35391235351562, 101.83706665039062, 105.32022094726562]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 7.0, 9.0, 8.0, 12.0, 15.0, 16.0, 19.0, 28.0, 14.0, 25.0, 25.0, 36.0, 26.0, 37.0, 40.0, 32.0, 37.0, 42.0, 42.0, 36.0, 42.0, 37.0, 38.0, 42.0, 25.0, 31.0, 23.0, 24.0, 28.0, 25.0, 22.0, 27.0, 16.0, 13.0, 18.0, 14.0, 9.0, 15.0, 5.0, 2.0, 5.0, 4.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-13.7265625, -13.29345703125, -12.8603515625, -12.42724609375, -11.994140625, -11.56103515625, -11.1279296875, -10.69482421875, -10.26171875, -9.82861328125, -9.3955078125, -8.96240234375, -8.529296875, -8.09619140625, -7.6630859375, -7.22998046875, -6.796875, -6.36376953125, -5.9306640625, -5.49755859375, -5.064453125, -4.63134765625, -4.1982421875, -3.76513671875, -3.33203125, -2.89892578125, -2.4658203125, -2.03271484375, -1.599609375, -1.16650390625, -0.7333984375, -0.30029296875, 0.1328125, 0.56591796875, 0.9990234375, 1.43212890625, 1.865234375, 2.29833984375, 2.7314453125, 3.16455078125, 3.59765625, 4.03076171875, 4.4638671875, 4.89697265625, 5.330078125, 5.76318359375, 6.1962890625, 6.62939453125, 7.0625, 7.49560546875, 7.9287109375, 8.36181640625, 8.794921875, 9.22802734375, 9.6611328125, 10.09423828125, 10.52734375, 10.96044921875, 11.3935546875, 11.82666015625, 12.259765625, 12.69287109375, 13.1259765625, 13.55908203125, 13.9921875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 9.0, 8.0, 5.0, 18.0, 28.0, 21.0, 40.0, 55.0, 72.0, 121.0, 129.0, 207.0, 330.0, 495.0, 758.0, 1164.0, 1899.0, 3121.0, 5497.0, 9304.0, 26234.0, 234277.0, 2488211.0, 1296852.0, 90545.0, 14695.0, 7375.0, 4566.0, 2765.0, 1720.0, 1186.0, 805.0, 498.0, 339.0, 245.0, 175.0, 148.0, 96.0, 71.0, 51.0, 34.0, 38.0, 16.0, 19.0, 7.0, 15.0, 4.0, 6.0, 4.0, 2.0, 4.0, 9.0], "bins": [-34.15625, -33.17578125, -32.1953125, -31.21484375, -30.234375, -29.25390625, -28.2734375, -27.29296875, -26.3125, -25.33203125, -24.3515625, -23.37109375, -22.390625, -21.41015625, -20.4296875, -19.44921875, -18.46875, -17.48828125, -16.5078125, -15.52734375, -14.546875, -13.56640625, -12.5859375, -11.60546875, -10.625, -9.64453125, -8.6640625, -7.68359375, -6.703125, -5.72265625, -4.7421875, -3.76171875, -2.78125, -1.80078125, -0.8203125, 0.16015625, 1.140625, 2.12109375, 3.1015625, 4.08203125, 5.0625, 6.04296875, 7.0234375, 8.00390625, 8.984375, 9.96484375, 10.9453125, 11.92578125, 12.90625, 13.88671875, 14.8671875, 15.84765625, 16.828125, 17.80859375, 18.7890625, 19.76953125, 20.75, 21.73046875, 22.7109375, 23.69140625, 24.671875, 25.65234375, 26.6328125, 27.61328125, 28.59375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 10.0, 9.0, 13.0, 21.0, 18.0, 37.0, 56.0, 101.0, 203.0, 516.0, 1003.0, 1045.0, 544.0, 242.0, 102.0, 58.0, 20.0, 20.0, 19.0, 11.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.28125, -38.94091796875, -37.6005859375, -36.26025390625, -34.919921875, -33.57958984375, -32.2392578125, -30.89892578125, -29.55859375, -28.21826171875, -26.8779296875, -25.53759765625, -24.197265625, -22.85693359375, -21.5166015625, -20.17626953125, -18.8359375, -17.49560546875, -16.1552734375, -14.81494140625, -13.474609375, -12.13427734375, -10.7939453125, -9.45361328125, -8.11328125, -6.77294921875, -5.4326171875, -4.09228515625, -2.751953125, -1.41162109375, -0.0712890625, 1.26904296875, 2.609375, 3.94970703125, 5.2900390625, 6.63037109375, 7.970703125, 9.31103515625, 10.6513671875, 11.99169921875, 13.33203125, 14.67236328125, 16.0126953125, 17.35302734375, 18.693359375, 20.03369140625, 21.3740234375, 22.71435546875, 24.0546875, 25.39501953125, 26.7353515625, 28.07568359375, 29.416015625, 30.75634765625, 32.0966796875, 33.43701171875, 34.77734375, 36.11767578125, 37.4580078125, 38.79833984375, 40.138671875, 41.47900390625, 42.8193359375, 44.15966796875, 45.5]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 17.0, 39.0, 91.0, 161.0, 355.0, 881.0, 2906.0, 18016.0, 3249942.0, 904265.0, 13719.0, 2437.0, 773.0, 309.0, 149.0, 71.0, 47.0, 32.0, 10.0, 13.0, 8.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.25, -135.9921875, -131.734375, -127.4765625, -123.21875, -118.9609375, -114.703125, -110.4453125, -106.1875, -101.9296875, -97.671875, -93.4140625, -89.15625, -84.8984375, -80.640625, -76.3828125, -72.125, -67.8671875, -63.609375, -59.3515625, -55.09375, -50.8359375, -46.578125, -42.3203125, -38.0625, -33.8046875, -29.546875, -25.2890625, -21.03125, -16.7734375, -12.515625, -8.2578125, -4.0, 0.2578125, 4.515625, 8.7734375, 13.03125, 17.2890625, 21.546875, 25.8046875, 30.0625, 34.3203125, 38.578125, 42.8359375, 47.09375, 51.3515625, 55.609375, 59.8671875, 64.125, 68.3828125, 72.640625, 76.8984375, 81.15625, 85.4140625, 89.671875, 93.9296875, 98.1875, 102.4453125, 106.703125, 110.9609375, 115.21875, 119.4765625, 123.734375, 127.9921875, 132.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 17.0, 134.0, 651.0, 177.0, 31.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1150.5255126953125, -1130.531982421875, -1110.5384521484375, -1090.544921875, -1070.551513671875, -1050.5579833984375, -1030.564453125, -1010.5709228515625, -990.577392578125, -970.5838623046875, -950.59033203125, -930.5968627929688, -910.6033325195312, -890.6098022460938, -870.6163330078125, -850.622802734375, -830.6292724609375, -810.6357421875, -790.6422119140625, -770.6487426757812, -750.6552124023438, -730.6616821289062, -710.668212890625, -690.6746826171875, -670.68115234375, -650.6876220703125, -630.694091796875, -610.7006225585938, -590.7070922851562, -570.7135620117188, -550.7200927734375, -530.7265625, -510.7330322265625, -490.739501953125, -470.7460021972656, -450.75250244140625, -430.75897216796875, -410.76544189453125, -390.7719421386719, -370.7784423828125, -350.784912109375, -330.7913818359375, -310.7978820800781, -290.80438232421875, -270.81085205078125, -250.8173370361328, -230.82382202148438, -210.83030700683594, -190.83680725097656, -170.84329223632812, -150.8497772216797, -130.85626220703125, -110.86274719238281, -90.86923217773438, -70.87571716308594, -50.8822021484375, -30.888687133789062, -10.895172119140625, 9.098342895507812, 29.09185791015625, 49.08537292480469, 69.07888793945312, 89.07240295410156, 109.06591796875, 129.05943298339844]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 6.0, 2.0, 12.0, 12.0, 17.0, 15.0, 15.0, 19.0, 35.0, 21.0, 32.0, 28.0, 28.0, 40.0, 27.0, 42.0, 35.0, 56.0, 39.0, 41.0, 37.0, 52.0, 33.0, 36.0, 40.0, 23.0, 30.0, 24.0, 36.0, 26.0, 19.0, 10.0, 27.0, 17.0, 12.0, 9.0, 5.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.24681091308594, -72.58232116699219, -69.91783142089844, -67.25334930419922, -64.58885955810547, -61.92436981201172, -59.25988006591797, -56.595394134521484, -53.930908203125, -51.26641845703125, -48.601932525634766, -45.937442779541016, -43.27295684814453, -40.60846710205078, -37.94397735595703, -35.27949142456055, -32.6150016784668, -29.95051383972168, -27.286026000976562, -24.621536254882812, -21.957050323486328, -19.292560577392578, -16.62807273864746, -13.963584899902344, -11.299097061157227, -8.63460922241211, -5.970120906829834, -3.3056325912475586, -0.6411447525024414, 2.023343086242676, 4.687831878662109, 7.352319717407227, 10.016807556152344, 12.681295394897461, 15.345783233642578, 18.010272979736328, 20.674758911132812, 23.339248657226562, 26.00373649597168, 28.668224334716797, 31.332712173461914, 33.99720001220703, 36.66168975830078, 39.326175689697266, 41.990665435791016, 44.6551513671875, 47.31964111328125, 49.984130859375, 52.648616790771484, 55.313106536865234, 57.97759246826172, 60.64208221435547, 63.30656814575195, 65.97105407714844, 68.63554382324219, 71.30003356933594, 73.96452331542969, 76.62901306152344, 79.29350280761719, 81.9579849243164, 84.62247467041016, 87.2869644165039, 89.95145416259766, 92.61593627929688, 95.28042602539062]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 12.0, 14.0, 11.0, 15.0, 14.0, 17.0, 20.0, 22.0, 34.0, 36.0, 36.0, 32.0, 33.0, 37.0, 35.0, 34.0, 40.0, 43.0, 34.0, 40.0, 46.0, 31.0, 34.0, 39.0, 30.0, 27.0, 29.0, 22.0, 21.0, 17.0, 15.0, 22.0, 13.0, 8.0, 11.0, 10.0, 11.0, 8.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.53125, -13.0953369140625, -12.659423828125, -12.2235107421875, -11.78759765625, -11.3516845703125, -10.915771484375, -10.4798583984375, -10.0439453125, -9.6080322265625, -9.172119140625, -8.7362060546875, -8.30029296875, -7.8643798828125, -7.428466796875, -6.9925537109375, -6.556640625, -6.1207275390625, -5.684814453125, -5.2489013671875, -4.81298828125, -4.3770751953125, -3.941162109375, -3.5052490234375, -3.0693359375, -2.6334228515625, -2.197509765625, -1.7615966796875, -1.32568359375, -0.8897705078125, -0.453857421875, -0.0179443359375, 0.41796875, 0.8538818359375, 1.289794921875, 1.7257080078125, 2.16162109375, 2.5975341796875, 3.033447265625, 3.4693603515625, 3.9052734375, 4.3411865234375, 4.777099609375, 5.2130126953125, 5.64892578125, 6.0848388671875, 6.520751953125, 6.9566650390625, 7.392578125, 7.8284912109375, 8.264404296875, 8.7003173828125, 9.13623046875, 9.5721435546875, 10.008056640625, 10.4439697265625, 10.8798828125, 11.3157958984375, 11.751708984375, 12.1876220703125, 12.62353515625, 13.0594482421875, 13.495361328125, 13.9312744140625, 14.3671875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 17.0, 23.0, 31.0, 49.0, 52.0, 80.0, 106.0, 158.0, 225.0, 329.0, 523.0, 804.0, 1201.0, 1852.0, 2654.0, 4044.0, 6028.0, 9039.0, 14282.0, 22323.0, 35359.0, 57702.0, 99588.0, 172832.0, 225357.0, 158613.0, 90612.0, 52813.0, 32557.0, 20423.0, 13487.0, 8526.0, 5690.0, 3761.0, 2375.0, 1632.0, 1067.0, 707.0, 518.0, 338.0, 218.0, 200.0, 118.0, 85.0, 52.0, 28.0, 16.0, 20.0, 7.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 3.0], "bins": [-1.412109375, -1.3685455322265625, -1.324981689453125, -1.2814178466796875, -1.23785400390625, -1.1942901611328125, -1.150726318359375, -1.1071624755859375, -1.0635986328125, -1.0200347900390625, -0.976470947265625, -0.9329071044921875, -0.88934326171875, -0.8457794189453125, -0.802215576171875, -0.7586517333984375, -0.715087890625, -0.6715240478515625, -0.627960205078125, -0.5843963623046875, -0.54083251953125, -0.4972686767578125, -0.453704833984375, -0.4101409912109375, -0.3665771484375, -0.3230133056640625, -0.279449462890625, -0.2358856201171875, -0.19232177734375, -0.1487579345703125, -0.105194091796875, -0.0616302490234375, -0.01806640625, 0.0254974365234375, 0.069061279296875, 0.1126251220703125, 0.15618896484375, 0.1997528076171875, 0.243316650390625, 0.2868804931640625, 0.3304443359375, 0.3740081787109375, 0.417572021484375, 0.4611358642578125, 0.50469970703125, 0.5482635498046875, 0.591827392578125, 0.6353912353515625, 0.678955078125, 0.7225189208984375, 0.766082763671875, 0.8096466064453125, 0.85321044921875, 0.8967742919921875, 0.940338134765625, 0.9839019775390625, 1.0274658203125, 1.0710296630859375, 1.114593505859375, 1.1581573486328125, 1.20172119140625, 1.2452850341796875, 1.288848876953125, 1.3324127197265625, 1.3759765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 6.0, 8.0, 7.0, 6.0, 13.0, 18.0, 19.0, 12.0, 18.0, 28.0, 27.0, 23.0, 32.0, 35.0, 40.0, 35.0, 31.0, 44.0, 37.0, 37.0, 1064.0, 51.0, 35.0, 24.0, 28.0, 29.0, 34.0, 34.0, 32.0, 32.0, 24.0, 27.0, 16.0, 17.0, 22.0, 14.0, 10.0, 5.0, 3.0, 8.0, 10.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.8046875, -9.519775390625, -9.23486328125, -8.949951171875, -8.6650390625, -8.380126953125, -8.09521484375, -7.810302734375, -7.525390625, -7.240478515625, -6.95556640625, -6.670654296875, -6.3857421875, -6.100830078125, -5.81591796875, -5.531005859375, -5.24609375, -4.961181640625, -4.67626953125, -4.391357421875, -4.1064453125, -3.821533203125, -3.53662109375, -3.251708984375, -2.966796875, -2.681884765625, -2.39697265625, -2.112060546875, -1.8271484375, -1.542236328125, -1.25732421875, -0.972412109375, -0.6875, -0.402587890625, -0.11767578125, 0.167236328125, 0.4521484375, 0.737060546875, 1.02197265625, 1.306884765625, 1.591796875, 1.876708984375, 2.16162109375, 2.446533203125, 2.7314453125, 3.016357421875, 3.30126953125, 3.586181640625, 3.87109375, 4.156005859375, 4.44091796875, 4.725830078125, 5.0107421875, 5.295654296875, 5.58056640625, 5.865478515625, 6.150390625, 6.435302734375, 6.72021484375, 7.005126953125, 7.2900390625, 7.574951171875, 7.85986328125, 8.144775390625, 8.4296875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 10.0, 20.0, 20.0, 31.0, 48.0, 73.0, 104.0, 190.0, 335.0, 476.0, 671.0, 984.0, 1596.0, 2376.0, 3612.0, 5473.0, 8504.0, 13286.0, 20977.0, 33131.0, 53987.0, 90250.0, 154340.0, 1264957.0, 174459.0, 103169.0, 61633.0, 37325.0, 23043.0, 14643.0, 9583.0, 6059.0, 4064.0, 2684.0, 1694.0, 1077.0, 804.0, 517.0, 307.0, 231.0, 137.0, 91.0, 44.0, 36.0, 29.0, 17.0, 8.0, 11.0, 9.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8246994018554688, -0.7968597412109375, -0.7690200805664062, -0.741180419921875, -0.7133407592773438, -0.6855010986328125, -0.6576614379882812, -0.62982177734375, -0.6019821166992188, -0.5741424560546875, -0.5463027954101562, -0.518463134765625, -0.49062347412109375, -0.4627838134765625, -0.43494415283203125, -0.4071044921875, -0.37926483154296875, -0.3514251708984375, -0.32358551025390625, -0.295745849609375, -0.26790618896484375, -0.2400665283203125, -0.21222686767578125, -0.18438720703125, -0.15654754638671875, -0.1287078857421875, -0.10086822509765625, -0.073028564453125, -0.04518890380859375, -0.0173492431640625, 0.01049041748046875, 0.038330078125, 0.06616973876953125, 0.0940093994140625, 0.12184906005859375, 0.149688720703125, 0.17752838134765625, 0.2053680419921875, 0.23320770263671875, 0.26104736328125, 0.28888702392578125, 0.3167266845703125, 0.34456634521484375, 0.372406005859375, 0.40024566650390625, 0.4280853271484375, 0.45592498779296875, 0.4837646484375, 0.5116043090820312, 0.5394439697265625, 0.5672836303710938, 0.595123291015625, 0.6229629516601562, 0.6508026123046875, 0.6786422729492188, 0.70648193359375, 0.7343215942382812, 0.7621612548828125, 0.7900009155273438, 0.817840576171875, 0.8456802368164062, 0.8735198974609375, 0.9013595581054688, 0.92919921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 3.0, 6.0, 7.0, 11.0, 5.0, 7.0, 14.0, 15.0, 11.0, 13.0, 20.0, 19.0, 40.0, 42.0, 65.0, 95.0, 126.0, 134.0, 95.0, 80.0, 41.0, 34.0, 22.0, 12.0, 18.0, 13.0, 15.0, 11.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.03857421875, -0.03747081756591797, -0.03636741638183594, -0.035264015197753906, -0.034160614013671875, -0.033057212829589844, -0.03195381164550781, -0.03085041046142578, -0.02974700927734375, -0.02864360809326172, -0.027540206909179688, -0.026436805725097656, -0.025333404541015625, -0.024230003356933594, -0.023126602172851562, -0.02202320098876953, -0.0209197998046875, -0.01981639862060547, -0.018712997436523438, -0.017609596252441406, -0.016506195068359375, -0.015402793884277344, -0.014299392700195312, -0.013195991516113281, -0.01209259033203125, -0.010989189147949219, -0.009885787963867188, -0.008782386779785156, -0.007678985595703125, -0.006575584411621094, -0.0054721832275390625, -0.004368782043457031, -0.003265380859375, -0.0021619796752929688, -0.0010585784912109375, 4.482269287109375e-05, 0.001148223876953125, 0.0022516250610351562, 0.0033550262451171875, 0.004458427429199219, 0.00556182861328125, 0.006665229797363281, 0.0077686309814453125, 0.008872032165527344, 0.009975433349609375, 0.011078834533691406, 0.012182235717773438, 0.013285636901855469, 0.0143890380859375, 0.015492439270019531, 0.016595840454101562, 0.017699241638183594, 0.018802642822265625, 0.019906044006347656, 0.021009445190429688, 0.02211284637451172, 0.02321624755859375, 0.02431964874267578, 0.025423049926757812, 0.026526451110839844, 0.027629852294921875, 0.028733253479003906, 0.029836654663085938, 0.03094005584716797, 0.03204345703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 14.0, 15.0, 22.0, 25.0, 32.0, 32.0, 71.0, 84.0, 197.0, 541.0, 7681.0, 974562.0, 63152.0, 1405.0, 242.0, 118.0, 87.0, 53.0, 42.0, 31.0, 27.0, 12.0, 19.0, 9.0, 12.0, 9.0, 10.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6790084838867188, -0.6553802490234375, -0.6317520141601562, -0.608123779296875, -0.5844955444335938, -0.5608673095703125, -0.5372390747070312, -0.51361083984375, -0.48998260498046875, -0.4663543701171875, -0.44272613525390625, -0.419097900390625, -0.39546966552734375, -0.3718414306640625, -0.34821319580078125, -0.3245849609375, -0.30095672607421875, -0.2773284912109375, -0.25370025634765625, -0.230072021484375, -0.20644378662109375, -0.1828155517578125, -0.15918731689453125, -0.13555908203125, -0.11193084716796875, -0.0883026123046875, -0.06467437744140625, -0.041046142578125, -0.01741790771484375, 0.0062103271484375, 0.02983856201171875, 0.053466796875, 0.07709503173828125, 0.1007232666015625, 0.12435150146484375, 0.147979736328125, 0.17160797119140625, 0.1952362060546875, 0.21886444091796875, 0.24249267578125, 0.26612091064453125, 0.2897491455078125, 0.31337738037109375, 0.337005615234375, 0.36063385009765625, 0.3842620849609375, 0.40789031982421875, 0.4315185546875, 0.45514678955078125, 0.4787750244140625, 0.5024032592773438, 0.526031494140625, 0.5496597290039062, 0.5732879638671875, 0.5969161987304688, 0.62054443359375, 0.6441726684570312, 0.6678009033203125, 0.6914291381835938, 0.715057373046875, 0.7386856079101562, 0.7623138427734375, 0.7859420776367188, 0.8095703125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 30.0, 104.0, 576.0, 227.0, 51.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3132428526878357, -0.3014827072620392, -0.2897225618362427, -0.27796244621276855, -0.26620230078697205, -0.25444215536117554, -0.24268202483654022, -0.2309218943119049, -0.2191617488861084, -0.2074016034603119, -0.19564147293567657, -0.18388134241104126, -0.17212119698524475, -0.16036105155944824, -0.14860092103481293, -0.1368407905101776, -0.1250806450843811, -0.11332050710916519, -0.10156036913394928, -0.08980023115873337, -0.07804009318351746, -0.06627995520830154, -0.05451981723308563, -0.04275967925786972, -0.03099954128265381, -0.019239403307437897, -0.007479265332221985, 0.004280872642993927, 0.01604101061820984, 0.02780114859342575, 0.03956128656864166, 0.051321424543857574, 0.06308159232139587, 0.07484173029661179, 0.0866018682718277, 0.09836200624704361, 0.11012214422225952, 0.12188228219747543, 0.13364242017269135, 0.14540255069732666, 0.15716269612312317, 0.16892284154891968, 0.180682972073555, 0.1924431025981903, 0.20420324802398682, 0.21596339344978333, 0.22772352397441864, 0.23948365449905396, 0.25124379992485046, 0.263003945350647, 0.2747640609741211, 0.2865242063999176, 0.2982843518257141, 0.3100444972515106, 0.32180464267730713, 0.33356475830078125, 0.34532490372657776, 0.35708504915237427, 0.3688451647758484, 0.3806053102016449, 0.3923654556274414, 0.4041256010532379, 0.4158857464790344, 0.42764586210250854, 0.43940600752830505]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 8.0, 10.0, 6.0, 12.0, 21.0, 22.0, 18.0, 24.0, 38.0, 34.0, 28.0, 43.0, 43.0, 36.0, 39.0, 33.0, 47.0, 47.0, 36.0, 44.0, 45.0, 40.0, 47.0, 40.0, 31.0, 31.0, 26.0, 22.0, 24.0, 19.0, 18.0, 16.0, 3.0, 10.0, 10.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04542136192321777, -0.04374955594539642, -0.042077746242284775, -0.040405936539173126, -0.038734130561351776, -0.037062324583530426, -0.03539051488041878, -0.03371870517730713, -0.03204689919948578, -0.03037509135901928, -0.02870328351855278, -0.02703147567808628, -0.02535966783761978, -0.023687859997153282, -0.022016052156686783, -0.020344244316220284, -0.018672436475753784, -0.017000628635287285, -0.015328820794820786, -0.013657012954354286, -0.011985205113887787, -0.010313397273421288, -0.008641589432954788, -0.006969781592488289, -0.0052979737520217896, -0.0036261659115552902, -0.001954358071088791, -0.00028255023062229156, 0.0013892576098442078, 0.003061065450310707, 0.004732873290777206, 0.006404681131243706, 0.008076488971710205, 0.009748296812176704, 0.011420104652643204, 0.013091912493109703, 0.014763720333576202, 0.0164355281740427, 0.0181073360145092, 0.0197791438549757, 0.0214509516954422, 0.0231227595359087, 0.0247945673763752, 0.026466375216841698, 0.028138183057308197, 0.029809990897774696, 0.031481798738241196, 0.033153608441352844, 0.034825414419174194, 0.036497220396995544, 0.03816903010010719, 0.03984083980321884, 0.04151264578104019, 0.04318445175886154, 0.04485626146197319, 0.04652807116508484, 0.04819987714290619, 0.04987168312072754, 0.05154349282383919, 0.053215302526950836, 0.054887108504772186, 0.056558914482593536, 0.058230724185705185, 0.059902533888816833, 0.061574339866638184]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 11.0, 14.0, 11.0, 15.0, 14.0, 17.0, 20.0, 22.0, 34.0, 36.0, 36.0, 32.0, 33.0, 37.0, 35.0, 34.0, 41.0, 42.0, 35.0, 39.0, 46.0, 32.0, 33.0, 39.0, 30.0, 27.0, 29.0, 22.0, 22.0, 16.0, 15.0, 22.0, 13.0, 8.0, 11.0, 10.0, 11.0, 8.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.53125, -13.09521484375, -12.6591796875, -12.22314453125, -11.787109375, -11.35107421875, -10.9150390625, -10.47900390625, -10.04296875, -9.60693359375, -9.1708984375, -8.73486328125, -8.298828125, -7.86279296875, -7.4267578125, -6.99072265625, -6.5546875, -6.11865234375, -5.6826171875, -5.24658203125, -4.810546875, -4.37451171875, -3.9384765625, -3.50244140625, -3.06640625, -2.63037109375, -2.1943359375, -1.75830078125, -1.322265625, -0.88623046875, -0.4501953125, -0.01416015625, 0.421875, 0.85791015625, 1.2939453125, 1.72998046875, 2.166015625, 2.60205078125, 3.0380859375, 3.47412109375, 3.91015625, 4.34619140625, 4.7822265625, 5.21826171875, 5.654296875, 6.09033203125, 6.5263671875, 6.96240234375, 7.3984375, 7.83447265625, 8.2705078125, 8.70654296875, 9.142578125, 9.57861328125, 10.0146484375, 10.45068359375, 10.88671875, 11.32275390625, 11.7587890625, 12.19482421875, 12.630859375, 13.06689453125, 13.5029296875, 13.93896484375, 14.375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 15.0, 10.0, 25.0, 18.0, 35.0, 43.0, 38.0, 80.0, 94.0, 183.0, 266.0, 444.0, 778.0, 1567.0, 3197.0, 8605.0, 28732.0, 115311.0, 511916.0, 285972.0, 63427.0, 17201.0, 5452.0, 2356.0, 1080.0, 620.0, 386.0, 199.0, 134.0, 94.0, 62.0, 45.0, 34.0, 22.0, 16.0, 21.0, 12.0, 12.0, 6.0, 4.0, 6.0, 6.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7421875, -12.328369140625, -11.91455078125, -11.500732421875, -11.0869140625, -10.673095703125, -10.25927734375, -9.845458984375, -9.431640625, -9.017822265625, -8.60400390625, -8.190185546875, -7.7763671875, -7.362548828125, -6.94873046875, -6.534912109375, -6.12109375, -5.707275390625, -5.29345703125, -4.879638671875, -4.4658203125, -4.052001953125, -3.63818359375, -3.224365234375, -2.810546875, -2.396728515625, -1.98291015625, -1.569091796875, -1.1552734375, -0.741455078125, -0.32763671875, 0.086181640625, 0.5, 0.913818359375, 1.32763671875, 1.741455078125, 2.1552734375, 2.569091796875, 2.98291015625, 3.396728515625, 3.810546875, 4.224365234375, 4.63818359375, 5.052001953125, 5.4658203125, 5.879638671875, 6.29345703125, 6.707275390625, 7.12109375, 7.534912109375, 7.94873046875, 8.362548828125, 8.7763671875, 9.190185546875, 9.60400390625, 10.017822265625, 10.431640625, 10.845458984375, 11.25927734375, 11.673095703125, 12.0869140625, 12.500732421875, 12.91455078125, 13.328369140625, 13.7421875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 7.0, 1.0, 9.0, 13.0, 10.0, 14.0, 11.0, 10.0, 15.0, 21.0, 29.0, 20.0, 31.0, 36.0, 34.0, 38.0, 44.0, 55.0, 84.0, 309.0, 1680.0, 98.0, 79.0, 49.0, 44.0, 40.0, 36.0, 25.0, 31.0, 35.0, 18.0, 19.0, 20.0, 13.0, 10.0, 9.0, 18.0, 9.0, 11.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5, -34.24072265625, -32.9814453125, -31.72216796875, -30.462890625, -29.20361328125, -27.9443359375, -26.68505859375, -25.42578125, -24.16650390625, -22.9072265625, -21.64794921875, -20.388671875, -19.12939453125, -17.8701171875, -16.61083984375, -15.3515625, -14.09228515625, -12.8330078125, -11.57373046875, -10.314453125, -9.05517578125, -7.7958984375, -6.53662109375, -5.27734375, -4.01806640625, -2.7587890625, -1.49951171875, -0.240234375, 1.01904296875, 2.2783203125, 3.53759765625, 4.796875, 6.05615234375, 7.3154296875, 8.57470703125, 9.833984375, 11.09326171875, 12.3525390625, 13.61181640625, 14.87109375, 16.13037109375, 17.3896484375, 18.64892578125, 19.908203125, 21.16748046875, 22.4267578125, 23.68603515625, 24.9453125, 26.20458984375, 27.4638671875, 28.72314453125, 29.982421875, 31.24169921875, 32.5009765625, 33.76025390625, 35.01953125, 36.27880859375, 37.5380859375, 38.79736328125, 40.056640625, 41.31591796875, 42.5751953125, 43.83447265625, 45.09375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 11.0, 10.0, 10.0, 12.0, 15.0, 16.0, 15.0, 23.0, 37.0, 38.0, 82.0, 84.0, 73.0, 128.0, 127.0, 236.0, 342.0, 782.0, 5367.0, 2787641.0, 345786.0, 3152.0, 661.0, 282.0, 194.0, 139.0, 101.0, 90.0, 52.0, 52.0, 35.0, 24.0, 18.0, 12.0, 17.0, 8.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-76.25, -74.1259765625, -72.001953125, -69.8779296875, -67.75390625, -65.6298828125, -63.505859375, -61.3818359375, -59.2578125, -57.1337890625, -55.009765625, -52.8857421875, -50.76171875, -48.6376953125, -46.513671875, -44.3896484375, -42.265625, -40.1416015625, -38.017578125, -35.8935546875, -33.76953125, -31.6455078125, -29.521484375, -27.3974609375, -25.2734375, -23.1494140625, -21.025390625, -18.9013671875, -16.77734375, -14.6533203125, -12.529296875, -10.4052734375, -8.28125, -6.1572265625, -4.033203125, -1.9091796875, 0.21484375, 2.3388671875, 4.462890625, 6.5869140625, 8.7109375, 10.8349609375, 12.958984375, 15.0830078125, 17.20703125, 19.3310546875, 21.455078125, 23.5791015625, 25.703125, 27.8271484375, 29.951171875, 32.0751953125, 34.19921875, 36.3232421875, 38.447265625, 40.5712890625, 42.6953125, 44.8193359375, 46.943359375, 49.0673828125, 51.19140625, 53.3154296875, 55.439453125, 57.5634765625, 59.6875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [203.0, 807.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.93674373626709, -2.113966941833496, 7.708809852600098, 17.531585693359375, 27.35436248779297, 37.17713928222656, 46.999916076660156, 56.82269287109375, 66.64546966552734, 76.46824645996094, 86.29102325439453, 96.11380004882812, 105.93657684326172, 115.75935363769531, 125.5821304321289, 135.4049072265625, 145.22769165039062, 155.05047607421875, 164.8732452392578, 174.69601440429688, 184.518798828125, 194.34158325195312, 204.1643524169922, 213.98712158203125, 223.80990600585938, 233.6326904296875, 243.45545959472656, 253.27822875976562, 263.10101318359375, 272.9237976074219, 282.74658203125, 292.5693359375, 302.39208984375, 312.2148742675781, 322.03765869140625, 331.86041259765625, 341.6831970214844, 351.5059814453125, 361.3287353515625, 371.1515197753906, 380.97430419921875, 390.7970886230469, 400.619873046875, 410.442626953125, 420.2654113769531, 430.08819580078125, 439.91094970703125, 449.7337341308594, 459.5565185546875, 469.3793029785156, 479.20208740234375, 489.02484130859375, 498.8476257324219, 508.67041015625, 518.4931640625, 528.3159790039062, 538.1387329101562, 547.9614868164062, 557.7843017578125, 567.6070556640625, 577.4298095703125, 587.2526245117188, 597.0753784179688, 606.898193359375, 616.720947265625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 9.0, 16.0, 14.0, 23.0, 20.0, 27.0, 35.0, 32.0, 31.0, 39.0, 42.0, 36.0, 38.0, 53.0, 59.0, 33.0, 44.0, 35.0, 49.0, 37.0, 39.0, 36.0, 27.0, 21.0, 29.0, 22.0, 26.0, 16.0, 25.0, 15.0, 13.0, 8.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-99.80734252929688, -96.58840942382812, -93.3694839477539, -90.15055084228516, -86.9316177368164, -83.71269226074219, -80.49375915527344, -77.27482604980469, -74.05590057373047, -70.83696746826172, -67.6180419921875, -64.39910888671875, -61.180179595947266, -57.96125030517578, -54.74231719970703, -51.52338790893555, -48.3044548034668, -45.08552551269531, -41.86659240722656, -38.64766311645508, -35.428733825683594, -32.209800720214844, -28.99087142944336, -25.771942138671875, -22.553010940551758, -19.33407974243164, -16.115150451660156, -12.896219253540039, -9.677289009094238, -6.4583587646484375, -3.2394275665283203, -0.020498275756835938, 3.1984329223632812, 6.417363166809082, 9.636293411254883, 12.855224609375, 16.074153900146484, 19.2930850982666, 22.51201629638672, 25.730945587158203, 28.94987678527832, 32.16880798339844, 35.38773727416992, 38.606666564941406, 41.825599670410156, 45.04452896118164, 48.263458251953125, 51.482391357421875, 54.70132064819336, 57.920249938964844, 61.139183044433594, 64.35810852050781, 67.57704162597656, 70.79597473144531, 74.01490783691406, 77.23383331298828, 80.45276641845703, 83.67169952392578, 86.890625, 90.10955810546875, 93.3284912109375, 96.54741668701172, 99.76634979248047, 102.98527526855469, 106.20420837402344]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 4.0, 14.0, 7.0, 15.0, 8.0, 13.0, 14.0, 20.0, 21.0, 29.0, 29.0, 33.0, 39.0, 27.0, 33.0, 43.0, 41.0, 33.0, 42.0, 40.0, 29.0, 33.0, 47.0, 52.0, 30.0, 35.0, 29.0, 32.0, 20.0, 27.0, 18.0, 14.0, 17.0, 24.0, 11.0, 15.0, 12.0, 8.0, 7.0, 7.0, 6.0, 2.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.6953125, -13.2537841796875, -12.812255859375, -12.3707275390625, -11.92919921875, -11.4876708984375, -11.046142578125, -10.6046142578125, -10.1630859375, -9.7215576171875, -9.280029296875, -8.8385009765625, -8.39697265625, -7.9554443359375, -7.513916015625, -7.0723876953125, -6.630859375, -6.1893310546875, -5.747802734375, -5.3062744140625, -4.86474609375, -4.4232177734375, -3.981689453125, -3.5401611328125, -3.0986328125, -2.6571044921875, -2.215576171875, -1.7740478515625, -1.33251953125, -0.8909912109375, -0.449462890625, -0.0079345703125, 0.43359375, 0.8751220703125, 1.316650390625, 1.7581787109375, 2.19970703125, 2.6412353515625, 3.082763671875, 3.5242919921875, 3.9658203125, 4.4073486328125, 4.848876953125, 5.2904052734375, 5.73193359375, 6.1734619140625, 6.614990234375, 7.0565185546875, 7.498046875, 7.9395751953125, 8.381103515625, 8.8226318359375, 9.26416015625, 9.7056884765625, 10.147216796875, 10.5887451171875, 11.0302734375, 11.4718017578125, 11.913330078125, 12.3548583984375, 12.79638671875, 13.2379150390625, 13.679443359375, 14.1209716796875, 14.5625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 17.0, 15.0, 22.0, 47.0, 51.0, 57.0, 109.0, 155.0, 172.0, 240.0, 379.0, 567.0, 868.0, 1394.0, 2152.0, 3603.0, 6416.0, 11777.0, 35894.0, 644258.0, 3312807.0, 134022.0, 17523.0, 8507.0, 4757.0, 2791.0, 1800.0, 1181.0, 768.0, 533.0, 379.0, 259.0, 178.0, 144.0, 112.0, 66.0, 63.0, 41.0, 42.0, 20.0, 22.0, 10.0, 19.0, 14.0, 4.0, 4.0, 3.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0], "bins": [-43.09375, -41.7158203125, -40.337890625, -38.9599609375, -37.58203125, -36.2041015625, -34.826171875, -33.4482421875, -32.0703125, -30.6923828125, -29.314453125, -27.9365234375, -26.55859375, -25.1806640625, -23.802734375, -22.4248046875, -21.046875, -19.6689453125, -18.291015625, -16.9130859375, -15.53515625, -14.1572265625, -12.779296875, -11.4013671875, -10.0234375, -8.6455078125, -7.267578125, -5.8896484375, -4.51171875, -3.1337890625, -1.755859375, -0.3779296875, 1.0, 2.3779296875, 3.755859375, 5.1337890625, 6.51171875, 7.8896484375, 9.267578125, 10.6455078125, 12.0234375, 13.4013671875, 14.779296875, 16.1572265625, 17.53515625, 18.9130859375, 20.291015625, 21.6689453125, 23.046875, 24.4248046875, 25.802734375, 27.1806640625, 28.55859375, 29.9365234375, 31.314453125, 32.6923828125, 34.0703125, 35.4482421875, 36.826171875, 38.2041015625, 39.58203125, 40.9599609375, 42.337890625, 43.7158203125, 45.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 11.0, 9.0, 6.0, 7.0, 14.0, 13.0, 18.0, 16.0, 28.0, 46.0, 89.0, 200.0, 402.0, 907.0, 1146.0, 556.0, 278.0, 137.0, 46.0, 42.0, 32.0, 19.0, 13.0, 7.0, 10.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.625, -29.40869140625, -28.1923828125, -26.97607421875, -25.759765625, -24.54345703125, -23.3271484375, -22.11083984375, -20.89453125, -19.67822265625, -18.4619140625, -17.24560546875, -16.029296875, -14.81298828125, -13.5966796875, -12.38037109375, -11.1640625, -9.94775390625, -8.7314453125, -7.51513671875, -6.298828125, -5.08251953125, -3.8662109375, -2.64990234375, -1.43359375, -0.21728515625, 0.9990234375, 2.21533203125, 3.431640625, 4.64794921875, 5.8642578125, 7.08056640625, 8.296875, 9.51318359375, 10.7294921875, 11.94580078125, 13.162109375, 14.37841796875, 15.5947265625, 16.81103515625, 18.02734375, 19.24365234375, 20.4599609375, 21.67626953125, 22.892578125, 24.10888671875, 25.3251953125, 26.54150390625, 27.7578125, 28.97412109375, 30.1904296875, 31.40673828125, 32.623046875, 33.83935546875, 35.0556640625, 36.27197265625, 37.48828125, 38.70458984375, 39.9208984375, 41.13720703125, 42.353515625, 43.56982421875, 44.7861328125, 46.00244140625, 47.21875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 19.0, 25.0, 45.0, 77.0, 139.0, 255.0, 477.0, 1139.0, 3008.0, 9798.0, 44884.0, 3789779.0, 313598.0, 21512.0, 5883.0, 2066.0, 735.0, 347.0, 185.0, 95.0, 54.0, 41.0, 25.0, 24.0, 11.0, 10.0, 9.0, 6.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-133.125, -129.693359375, -126.26171875, -122.830078125, -119.3984375, -115.966796875, -112.53515625, -109.103515625, -105.671875, -102.240234375, -98.80859375, -95.376953125, -91.9453125, -88.513671875, -85.08203125, -81.650390625, -78.21875, -74.787109375, -71.35546875, -67.923828125, -64.4921875, -61.060546875, -57.62890625, -54.197265625, -50.765625, -47.333984375, -43.90234375, -40.470703125, -37.0390625, -33.607421875, -30.17578125, -26.744140625, -23.3125, -19.880859375, -16.44921875, -13.017578125, -9.5859375, -6.154296875, -2.72265625, 0.708984375, 4.140625, 7.572265625, 11.00390625, 14.435546875, 17.8671875, 21.298828125, 24.73046875, 28.162109375, 31.59375, 35.025390625, 38.45703125, 41.888671875, 45.3203125, 48.751953125, 52.18359375, 55.615234375, 59.046875, 62.478515625, 65.91015625, 69.341796875, 72.7734375, 76.205078125, 79.63671875, 83.068359375, 86.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 3.0, 4.0, 7.0, 3.0, 11.0, 12.0, 9.0, 8.0, 13.0, 21.0, 43.0, 58.0, 70.0, 119.0, 122.0, 136.0, 115.0, 65.0, 50.0, 40.0, 27.0, 19.0, 13.0, 5.0, 4.0, 14.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.74673461914062, -79.55815887451172, -76.36959075927734, -73.18101501464844, -69.99243927001953, -66.80386352539062, -63.61529541015625, -60.426719665527344, -57.2381477355957, -54.04957580566406, -50.861000061035156, -47.672428131103516, -44.483856201171875, -41.29528045654297, -38.10670852661133, -34.91813659667969, -31.72956085205078, -28.540987014770508, -25.352413177490234, -22.163841247558594, -18.97526741027832, -15.786693572998047, -12.598121643066406, -9.409547805786133, -6.220973968505859, -3.032400608062744, 0.1561727523803711, 3.344745635986328, 6.533319473266602, 9.721893310546875, 12.910465240478516, 16.09903907775879, 19.28760528564453, 22.476179122924805, 25.664752960205078, 28.85332489013672, 32.041900634765625, 35.230472564697266, 38.419044494628906, 41.60762023925781, 44.79619216918945, 47.984764099121094, 51.17333984375, 54.36191177368164, 57.55048370361328, 60.73905944824219, 63.92763137817383, 67.11620330810547, 70.30477905273438, 73.49335479736328, 76.68192291259766, 79.87049865722656, 83.05907440185547, 86.24765014648438, 89.43621826171875, 92.62479400634766, 95.81336975097656, 99.00194549560547, 102.19051361083984, 105.37908935546875, 108.56766510009766, 111.75624084472656, 114.94480895996094, 118.13338470458984, 121.32195281982422]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 3.0, 20.0, 18.0, 11.0, 14.0, 18.0, 15.0, 23.0, 23.0, 20.0, 24.0, 38.0, 29.0, 21.0, 33.0, 38.0, 45.0, 33.0, 47.0, 44.0, 49.0, 34.0, 36.0, 46.0, 38.0, 28.0, 24.0, 28.0, 29.0, 20.0, 22.0, 18.0, 14.0, 13.0, 9.0, 7.0, 7.0, 7.0, 6.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-87.6893310546875, -85.1355209350586, -82.58171081542969, -80.02790069580078, -77.47409057617188, -74.92028045654297, -72.36647033691406, -69.81266021728516, -67.25885009765625, -64.70503997802734, -62.15122985839844, -59.59741973876953, -57.043609619140625, -54.48979949951172, -51.93598937988281, -49.382179260253906, -46.828369140625, -44.274559020996094, -41.72074890136719, -39.16693878173828, -36.613128662109375, -34.05931854248047, -31.505508422851562, -28.951698303222656, -26.39788818359375, -23.844078063964844, -21.290267944335938, -18.73645782470703, -16.182647705078125, -13.628837585449219, -11.075027465820312, -8.521217346191406, -5.9674072265625, -3.4135971069335938, -0.8597869873046875, 1.6940231323242188, 4.247833251953125, 6.801643371582031, 9.355453491210938, 11.909263610839844, 14.46307373046875, 17.016883850097656, 19.570693969726562, 22.12450408935547, 24.678314208984375, 27.23212432861328, 29.785934448242188, 32.339744567871094, 34.8935546875, 37.447364807128906, 40.00117492675781, 42.55498504638672, 45.108795166015625, 47.66260528564453, 50.21641540527344, 52.770225524902344, 55.32403564453125, 57.877845764160156, 60.43165588378906, 62.98546600341797, 65.53927612304688, 68.09308624267578, 70.64689636230469, 73.2007064819336, 75.7545166015625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 9.0, 7.0, 11.0, 19.0, 18.0, 16.0, 20.0, 15.0, 44.0, 27.0, 41.0, 44.0, 29.0, 41.0, 37.0, 35.0, 47.0, 50.0, 28.0, 41.0, 42.0, 35.0, 26.0, 36.0, 37.0, 34.0, 24.0, 24.0, 20.0, 27.0, 16.0, 12.0, 10.0, 13.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.671875, -13.199462890625, -12.72705078125, -12.254638671875, -11.7822265625, -11.309814453125, -10.83740234375, -10.364990234375, -9.892578125, -9.420166015625, -8.94775390625, -8.475341796875, -8.0029296875, -7.530517578125, -7.05810546875, -6.585693359375, -6.11328125, -5.640869140625, -5.16845703125, -4.696044921875, -4.2236328125, -3.751220703125, -3.27880859375, -2.806396484375, -2.333984375, -1.861572265625, -1.38916015625, -0.916748046875, -0.4443359375, 0.028076171875, 0.50048828125, 0.972900390625, 1.4453125, 1.917724609375, 2.39013671875, 2.862548828125, 3.3349609375, 3.807373046875, 4.27978515625, 4.752197265625, 5.224609375, 5.697021484375, 6.16943359375, 6.641845703125, 7.1142578125, 7.586669921875, 8.05908203125, 8.531494140625, 9.00390625, 9.476318359375, 9.94873046875, 10.421142578125, 10.8935546875, 11.365966796875, 11.83837890625, 12.310791015625, 12.783203125, 13.255615234375, 13.72802734375, 14.200439453125, 14.6728515625, 15.145263671875, 15.61767578125, 16.090087890625, 16.5625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 17.0, 12.0, 20.0, 21.0, 55.0, 66.0, 101.0, 126.0, 208.0, 300.0, 428.0, 614.0, 851.0, 1348.0, 1912.0, 2938.0, 4329.0, 6731.0, 10152.0, 15813.0, 25121.0, 40856.0, 67392.0, 115292.0, 192308.0, 213042.0, 137765.0, 80315.0, 47702.0, 29584.0, 18251.0, 11729.0, 7733.0, 5089.0, 3230.0, 2245.0, 1569.0, 1039.0, 699.0, 511.0, 350.0, 210.0, 159.0, 111.0, 86.0, 47.0, 31.0, 17.0, 17.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.41796875, -1.375213623046875, -1.33245849609375, -1.289703369140625, -1.2469482421875, -1.204193115234375, -1.16143798828125, -1.118682861328125, -1.075927734375, -1.033172607421875, -0.99041748046875, -0.947662353515625, -0.9049072265625, -0.862152099609375, -0.81939697265625, -0.776641845703125, -0.73388671875, -0.691131591796875, -0.64837646484375, -0.605621337890625, -0.5628662109375, -0.520111083984375, -0.47735595703125, -0.434600830078125, -0.391845703125, -0.349090576171875, -0.30633544921875, -0.263580322265625, -0.2208251953125, -0.178070068359375, -0.13531494140625, -0.092559814453125, -0.0498046875, -0.007049560546875, 0.03570556640625, 0.078460693359375, 0.1212158203125, 0.163970947265625, 0.20672607421875, 0.249481201171875, 0.292236328125, 0.334991455078125, 0.37774658203125, 0.420501708984375, 0.4632568359375, 0.506011962890625, 0.54876708984375, 0.591522216796875, 0.63427734375, 0.677032470703125, 0.71978759765625, 0.762542724609375, 0.8052978515625, 0.848052978515625, 0.89080810546875, 0.933563232421875, 0.976318359375, 1.019073486328125, 1.06182861328125, 1.104583740234375, 1.1473388671875, 1.190093994140625, 1.23284912109375, 1.275604248046875, 1.318359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 6.0, 4.0, 7.0, 8.0, 11.0, 15.0, 21.0, 18.0, 25.0, 23.0, 24.0, 27.0, 25.0, 34.0, 53.0, 37.0, 39.0, 37.0, 37.0, 1070.0, 33.0, 31.0, 39.0, 40.0, 41.0, 45.0, 21.0, 33.0, 24.0, 23.0, 17.0, 21.0, 16.0, 13.0, 18.0, 17.0, 15.0, 9.0, 6.0, 11.0, 5.0, 1.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.6640625, -8.3651123046875, -8.066162109375, -7.7672119140625, -7.46826171875, -7.1693115234375, -6.870361328125, -6.5714111328125, -6.2724609375, -5.9735107421875, -5.674560546875, -5.3756103515625, -5.07666015625, -4.7777099609375, -4.478759765625, -4.1798095703125, -3.880859375, -3.5819091796875, -3.282958984375, -2.9840087890625, -2.68505859375, -2.3861083984375, -2.087158203125, -1.7882080078125, -1.4892578125, -1.1903076171875, -0.891357421875, -0.5924072265625, -0.29345703125, 0.0054931640625, 0.304443359375, 0.6033935546875, 0.90234375, 1.2012939453125, 1.500244140625, 1.7991943359375, 2.09814453125, 2.3970947265625, 2.696044921875, 2.9949951171875, 3.2939453125, 3.5928955078125, 3.891845703125, 4.1907958984375, 4.48974609375, 4.7886962890625, 5.087646484375, 5.3865966796875, 5.685546875, 5.9844970703125, 6.283447265625, 6.5823974609375, 6.88134765625, 7.1802978515625, 7.479248046875, 7.7781982421875, 8.0771484375, 8.3760986328125, 8.675048828125, 8.9739990234375, 9.27294921875, 9.5718994140625, 9.870849609375, 10.1697998046875, 10.46875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 10.0, 11.0, 15.0, 24.0, 51.0, 64.0, 113.0, 145.0, 217.0, 374.0, 531.0, 802.0, 1195.0, 1794.0, 2867.0, 4254.0, 6304.0, 9799.0, 14847.0, 23022.0, 35995.0, 59865.0, 102566.0, 172255.0, 1267219.0, 154451.0, 91146.0, 53887.0, 32700.0, 20929.0, 13567.0, 9096.0, 5772.0, 3866.0, 2546.0, 1668.0, 1145.0, 646.0, 481.0, 311.0, 201.0, 149.0, 93.0, 51.0, 40.0, 17.0, 12.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.92724609375, -0.89862060546875, -0.8699951171875, -0.84136962890625, -0.812744140625, -0.78411865234375, -0.7554931640625, -0.72686767578125, -0.6982421875, -0.66961669921875, -0.6409912109375, -0.61236572265625, -0.583740234375, -0.55511474609375, -0.5264892578125, -0.49786376953125, -0.46923828125, -0.44061279296875, -0.4119873046875, -0.38336181640625, -0.354736328125, -0.32611083984375, -0.2974853515625, -0.26885986328125, -0.240234375, -0.21160888671875, -0.1829833984375, -0.15435791015625, -0.125732421875, -0.09710693359375, -0.0684814453125, -0.03985595703125, -0.01123046875, 0.01739501953125, 0.0460205078125, 0.07464599609375, 0.103271484375, 0.13189697265625, 0.1605224609375, 0.18914794921875, 0.2177734375, 0.24639892578125, 0.2750244140625, 0.30364990234375, 0.332275390625, 0.36090087890625, 0.3895263671875, 0.41815185546875, 0.44677734375, 0.47540283203125, 0.5040283203125, 0.53265380859375, 0.561279296875, 0.58990478515625, 0.6185302734375, 0.64715576171875, 0.67578125, 0.70440673828125, 0.7330322265625, 0.76165771484375, 0.790283203125, 0.81890869140625, 0.8475341796875, 0.87615966796875, 0.90478515625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 5.0, 6.0, 5.0, 18.0, 14.0, 19.0, 21.0, 29.0, 37.0, 33.0, 43.0, 75.0, 75.0, 106.0, 124.0, 85.0, 58.0, 42.0, 37.0, 25.0, 27.0, 23.0, 16.0, 13.0, 16.0, 5.0, 5.0, 10.0, 10.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.027130126953125, -0.02639603614807129, -0.025661945343017578, -0.024927854537963867, -0.024193763732910156, -0.023459672927856445, -0.022725582122802734, -0.021991491317749023, -0.021257400512695312, -0.0205233097076416, -0.01978921890258789, -0.01905512809753418, -0.01832103729248047, -0.017586946487426758, -0.016852855682373047, -0.016118764877319336, -0.015384674072265625, -0.014650583267211914, -0.013916492462158203, -0.013182401657104492, -0.012448310852050781, -0.01171422004699707, -0.01098012924194336, -0.010246038436889648, -0.009511947631835938, -0.008777856826782227, -0.008043766021728516, -0.007309675216674805, -0.006575584411621094, -0.005841493606567383, -0.005107402801513672, -0.004373311996459961, -0.00363922119140625, -0.002905130386352539, -0.002171039581298828, -0.0014369487762451172, -0.0007028579711914062, 3.123283386230469e-05, 0.0007653236389160156, 0.0014994144439697266, 0.0022335052490234375, 0.0029675960540771484, 0.0037016868591308594, 0.00443577766418457, 0.005169868469238281, 0.005903959274291992, 0.006638050079345703, 0.007372140884399414, 0.008106231689453125, 0.008840322494506836, 0.009574413299560547, 0.010308504104614258, 0.011042594909667969, 0.01177668571472168, 0.01251077651977539, 0.013244867324829102, 0.013978958129882812, 0.014713048934936523, 0.015447139739990234, 0.016181230545043945, 0.016915321350097656, 0.017649412155151367, 0.018383502960205078, 0.01911759376525879, 0.0198516845703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 10.0, 9.0, 10.0, 20.0, 20.0, 25.0, 38.0, 41.0, 58.0, 109.0, 185.0, 459.0, 1652.0, 10564.0, 820204.0, 207076.0, 5964.0, 1213.0, 349.0, 158.0, 93.0, 65.0, 43.0, 40.0, 24.0, 25.0, 14.0, 12.0, 11.0, 9.0, 8.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374755859375, -0.3608131408691406, -0.34687042236328125, -0.3329277038574219, -0.3189849853515625, -0.3050422668457031, -0.29109954833984375, -0.2771568298339844, -0.263214111328125, -0.24927139282226562, -0.23532867431640625, -0.22138595581054688, -0.2074432373046875, -0.19350051879882812, -0.17955780029296875, -0.16561508178710938, -0.15167236328125, -0.13772964477539062, -0.12378692626953125, -0.10984420776367188, -0.0959014892578125, -0.08195877075195312, -0.06801605224609375, -0.054073333740234375, -0.040130615234375, -0.026187896728515625, -0.01224517822265625, 0.001697540283203125, 0.0156402587890625, 0.029582977294921875, 0.04352569580078125, 0.057468414306640625, 0.0714111328125, 0.08535385131835938, 0.09929656982421875, 0.11323928833007812, 0.1271820068359375, 0.14112472534179688, 0.15506744384765625, 0.16901016235351562, 0.182952880859375, 0.19689559936523438, 0.21083831787109375, 0.22478103637695312, 0.2387237548828125, 0.2526664733886719, 0.26660919189453125, 0.2805519104003906, 0.29449462890625, 0.3084373474121094, 0.32238006591796875, 0.3363227844238281, 0.3502655029296875, 0.3642082214355469, 0.37815093994140625, 0.3920936584472656, 0.406036376953125, 0.4199790954589844, 0.43392181396484375, 0.4478645324707031, 0.4618072509765625, 0.4757499694824219, 0.48969268798828125, 0.5036354064941406, 0.517578125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 5.0, 7.0, 26.0, 51.0, 146.0, 386.0, 225.0, 85.0, 43.0, 13.0, 12.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034176044166088104, -0.029731385409832, -0.025286724790930748, -0.020842064172029495, -0.01639740541577339, -0.011952746659517288, -0.0075080860406160355, -0.0030634254217147827, 0.0013812333345413208, 0.005825893022119999, 0.010270552709698677, 0.014715212397277355, 0.019159872084856033, 0.023604530841112137, 0.02804919146001339, 0.03249385207891464, 0.036938510835170746, 0.04138316959142685, 0.04582782834768295, 0.050272490829229355, 0.05471714958548546, 0.05916180834174156, 0.06360647082328796, 0.06805112957954407, 0.07249578833580017, 0.07694044709205627, 0.08138510584831238, 0.08582976460456848, 0.09027442336082458, 0.09471908211708069, 0.09916374832391739, 0.10360840708017349, 0.108053058385849, 0.1124977171421051, 0.1169423758983612, 0.12138703465461731, 0.1258316934108734, 0.13027635216712952, 0.13472101092338562, 0.13916566967964172, 0.14361032843589783, 0.14805498719215393, 0.15249964594841003, 0.15694430470466614, 0.16138896346092224, 0.16583362221717834, 0.17027828097343445, 0.17472293972969055, 0.17916761338710785, 0.18361227214336395, 0.18805693089962006, 0.19250158965587616, 0.19694624841213226, 0.20139090716838837, 0.20583556592464447, 0.21028023958206177, 0.21472489833831787, 0.21916955709457397, 0.22361421585083008, 0.22805887460708618, 0.23250353336334229, 0.2369481921195984, 0.2413928508758545, 0.2458375096321106, 0.2502821683883667]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 5.0, 7.0, 10.0, 10.0, 10.0, 12.0, 27.0, 16.0, 19.0, 21.0, 26.0, 27.0, 22.0, 43.0, 29.0, 26.0, 38.0, 49.0, 47.0, 43.0, 45.0, 39.0, 42.0, 42.0, 41.0, 40.0, 41.0, 24.0, 18.0, 24.0, 30.0, 25.0, 16.0, 19.0, 15.0, 12.0, 12.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024921059608459473, -0.02416166290640831, -0.023402266204357147, -0.022642869502305984, -0.021883472800254822, -0.02112407609820366, -0.020364679396152496, -0.019605282694101334, -0.01884588599205017, -0.018086489289999008, -0.017327092587947845, -0.016567695885896683, -0.01580829918384552, -0.015048902481794357, -0.014289505779743195, -0.013530109077692032, -0.01277071237564087, -0.012011315673589706, -0.011251918971538544, -0.010492522269487381, -0.009733125567436218, -0.008973728865385056, -0.008214332163333893, -0.00745493546128273, -0.006695538759231567, -0.005936142057180405, -0.005176745355129242, -0.004417348653078079, -0.0036579519510269165, -0.002898555248975754, -0.002139158546924591, -0.0013797618448734283, -0.0006203651428222656, 0.0001390315592288971, 0.0008984282612800598, 0.0016578249633312225, 0.0024172216653823853, 0.003176618367433548, 0.003936015069484711, 0.004695411771535873, 0.005454808473587036, 0.006214205175638199, 0.006973601877689362, 0.007732998579740524, 0.008492395281791687, 0.00925179198384285, 0.010011188685894012, 0.010770585387945175, 0.011529982089996338, 0.0122893787920475, 0.013048775494098663, 0.013808172196149826, 0.014567568898200989, 0.015326965600252151, 0.016086362302303314, 0.016845759004354477, 0.01760515570640564, 0.018364552408456802, 0.019123949110507965, 0.019883345812559128, 0.02064274251461029, 0.021402139216661453, 0.022161535918712616, 0.02292093262076378, 0.02368032932281494]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 9.0, 7.0, 11.0, 18.0, 19.0, 16.0, 20.0, 15.0, 44.0, 27.0, 41.0, 44.0, 28.0, 42.0, 37.0, 35.0, 47.0, 49.0, 29.0, 40.0, 43.0, 34.0, 26.0, 37.0, 36.0, 35.0, 24.0, 24.0, 20.0, 26.0, 17.0, 11.0, 11.0, 13.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6796875, -13.2071533203125, -12.734619140625, -12.2620849609375, -11.78955078125, -11.3170166015625, -10.844482421875, -10.3719482421875, -9.8994140625, -9.4268798828125, -8.954345703125, -8.4818115234375, -8.00927734375, -7.5367431640625, -7.064208984375, -6.5916748046875, -6.119140625, -5.6466064453125, -5.174072265625, -4.7015380859375, -4.22900390625, -3.7564697265625, -3.283935546875, -2.8114013671875, -2.3388671875, -1.8663330078125, -1.393798828125, -0.9212646484375, -0.44873046875, 0.0238037109375, 0.496337890625, 0.9688720703125, 1.44140625, 1.9139404296875, 2.386474609375, 2.8590087890625, 3.33154296875, 3.8040771484375, 4.276611328125, 4.7491455078125, 5.2216796875, 5.6942138671875, 6.166748046875, 6.6392822265625, 7.11181640625, 7.5843505859375, 8.056884765625, 8.5294189453125, 9.001953125, 9.4744873046875, 9.947021484375, 10.4195556640625, 10.89208984375, 11.3646240234375, 11.837158203125, 12.3096923828125, 12.7822265625, 13.2547607421875, 13.727294921875, 14.1998291015625, 14.67236328125, 15.1448974609375, 15.617431640625, 16.0899658203125, 16.5625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 4.0, 8.0, 9.0, 13.0, 14.0, 19.0, 31.0, 28.0, 40.0, 41.0, 79.0, 77.0, 123.0, 193.0, 276.0, 589.0, 1366.0, 4357.0, 24323.0, 459637.0, 523852.0, 25985.0, 4483.0, 1400.0, 562.0, 335.0, 198.0, 117.0, 85.0, 67.0, 50.0, 40.0, 27.0, 19.0, 19.0, 18.0, 11.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.109375, -26.175048828125, -25.24072265625, -24.306396484375, -23.3720703125, -22.437744140625, -21.50341796875, -20.569091796875, -19.634765625, -18.700439453125, -17.76611328125, -16.831787109375, -15.8974609375, -14.963134765625, -14.02880859375, -13.094482421875, -12.16015625, -11.225830078125, -10.29150390625, -9.357177734375, -8.4228515625, -7.488525390625, -6.55419921875, -5.619873046875, -4.685546875, -3.751220703125, -2.81689453125, -1.882568359375, -0.9482421875, -0.013916015625, 0.92041015625, 1.854736328125, 2.7890625, 3.723388671875, 4.65771484375, 5.592041015625, 6.5263671875, 7.460693359375, 8.39501953125, 9.329345703125, 10.263671875, 11.197998046875, 12.13232421875, 13.066650390625, 14.0009765625, 14.935302734375, 15.86962890625, 16.803955078125, 17.73828125, 18.672607421875, 19.60693359375, 20.541259765625, 21.4755859375, 22.409912109375, 23.34423828125, 24.278564453125, 25.212890625, 26.147216796875, 27.08154296875, 28.015869140625, 28.9501953125, 29.884521484375, 30.81884765625, 31.753173828125, 32.6875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 17.0, 17.0, 13.0, 19.0, 23.0, 29.0, 28.0, 35.0, 34.0, 45.0, 46.0, 46.0, 56.0, 80.0, 1538.0, 483.0, 82.0, 63.0, 39.0, 53.0, 35.0, 35.0, 40.0, 35.0, 31.0, 19.0, 18.0, 17.0, 13.0, 8.0, 9.0, 12.0, 3.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.03125, -44.63525390625, -43.2392578125, -41.84326171875, -40.447265625, -39.05126953125, -37.6552734375, -36.25927734375, -34.86328125, -33.46728515625, -32.0712890625, -30.67529296875, -29.279296875, -27.88330078125, -26.4873046875, -25.09130859375, -23.6953125, -22.29931640625, -20.9033203125, -19.50732421875, -18.111328125, -16.71533203125, -15.3193359375, -13.92333984375, -12.52734375, -11.13134765625, -9.7353515625, -8.33935546875, -6.943359375, -5.54736328125, -4.1513671875, -2.75537109375, -1.359375, 0.03662109375, 1.4326171875, 2.82861328125, 4.224609375, 5.62060546875, 7.0166015625, 8.41259765625, 9.80859375, 11.20458984375, 12.6005859375, 13.99658203125, 15.392578125, 16.78857421875, 18.1845703125, 19.58056640625, 20.9765625, 22.37255859375, 23.7685546875, 25.16455078125, 26.560546875, 27.95654296875, 29.3525390625, 30.74853515625, 32.14453125, 33.54052734375, 34.9365234375, 36.33251953125, 37.728515625, 39.12451171875, 40.5205078125, 41.91650390625, 43.3125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 9.0, 9.0, 10.0, 14.0, 20.0, 12.0, 30.0, 34.0, 36.0, 46.0, 74.0, 94.0, 143.0, 250.0, 719.0, 2670.0, 163846.0, 2970994.0, 4839.0, 957.0, 305.0, 165.0, 100.0, 69.0, 49.0, 50.0, 38.0, 22.0, 21.0, 14.0, 21.0, 13.0, 6.0, 3.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.375, -96.1826171875, -92.990234375, -89.7978515625, -86.60546875, -83.4130859375, -80.220703125, -77.0283203125, -73.8359375, -70.6435546875, -67.451171875, -64.2587890625, -61.06640625, -57.8740234375, -54.681640625, -51.4892578125, -48.296875, -45.1044921875, -41.912109375, -38.7197265625, -35.52734375, -32.3349609375, -29.142578125, -25.9501953125, -22.7578125, -19.5654296875, -16.373046875, -13.1806640625, -9.98828125, -6.7958984375, -3.603515625, -0.4111328125, 2.78125, 5.9736328125, 9.166015625, 12.3583984375, 15.55078125, 18.7431640625, 21.935546875, 25.1279296875, 28.3203125, 31.5126953125, 34.705078125, 37.8974609375, 41.08984375, 44.2822265625, 47.474609375, 50.6669921875, 53.859375, 57.0517578125, 60.244140625, 63.4365234375, 66.62890625, 69.8212890625, 73.013671875, 76.2060546875, 79.3984375, 82.5908203125, 85.783203125, 88.9755859375, 92.16796875, 95.3603515625, 98.552734375, 101.7451171875, 104.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 48.0, 670.0, 282.0, 15.0], "bins": [-483.9574279785156, -476.1205749511719, -468.28375244140625, -460.4468994140625, -452.61004638671875, -444.7732238769531, -436.9363708496094, -429.0995178222656, -421.2626953125, -413.42584228515625, -405.5890197753906, -397.7521667480469, -389.9153137207031, -382.0784912109375, -374.24163818359375, -366.40478515625, -358.56793212890625, -350.7310791015625, -342.8942565917969, -335.0574035644531, -327.2205505371094, -319.38372802734375, -311.546875, -303.71002197265625, -295.8731994628906, -288.0363464355469, -280.19952392578125, -272.3626708984375, -264.52581787109375, -256.6889953613281, -248.85214233398438, -241.0153045654297, -233.178466796875, -225.3416290283203, -217.50477600097656, -209.66793823242188, -201.8311004638672, -193.9942626953125, -186.15740966796875, -178.32057189941406, -170.4837188720703, -162.64688110351562, -154.81002807617188, -146.9731903076172, -139.1363525390625, -131.29949951171875, -123.46266174316406, -115.62582397460938, -107.78898620605469, -99.95214080810547, -92.11530303955078, -84.27845764160156, -76.44161987304688, -68.60477447509766, -60.76792907714844, -52.931087493896484, -45.09424591064453, -37.25740432739258, -29.420560836791992, -21.583717346191406, -13.746875762939453, -5.9100341796875, 1.9268112182617188, 9.763652801513672, 17.600496292114258]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 8.0, 5.0, 6.0, 6.0, 8.0, 13.0, 12.0, 12.0, 18.0, 20.0, 25.0, 18.0, 20.0, 27.0, 37.0, 26.0, 25.0, 36.0, 44.0, 32.0, 37.0, 41.0, 39.0, 50.0, 45.0, 33.0, 40.0, 34.0, 42.0, 25.0, 34.0, 25.0, 19.0, 23.0, 21.0, 14.0, 9.0, 9.0, 11.0, 9.0, 13.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-89.78470611572266, -86.94556427001953, -84.10641479492188, -81.26727294921875, -78.42813110351562, -75.58898162841797, -72.74983978271484, -69.91069030761719, -67.07154846191406, -64.23240661621094, -61.39325714111328, -58.554115295410156, -55.714969635009766, -52.875823974609375, -50.03668212890625, -47.19753646850586, -44.35839080810547, -41.51924514770508, -38.68009948730469, -35.84095764160156, -33.00181198120117, -30.16266632080078, -27.323522567749023, -24.484378814697266, -21.645233154296875, -18.806087493896484, -15.966943740844727, -13.127799034118652, -10.288654327392578, -7.449509620666504, -4.61036491394043, -1.7712211608886719, 1.0679168701171875, 3.9070615768432617, 6.746206283569336, 9.58535099029541, 12.424495697021484, 15.263640403747559, 18.102785110473633, 20.94192886352539, 23.78107452392578, 26.620220184326172, 29.45936393737793, 32.29850769042969, 35.13765335083008, 37.97679901123047, 40.815940856933594, 43.655086517333984, 46.494232177734375, 49.333377838134766, 52.172523498535156, 55.01166534423828, 57.85081100463867, 60.68995666503906, 63.52909851074219, 66.36824035644531, 69.20738983154297, 72.0465316772461, 74.88568115234375, 77.72482299804688, 80.56396484375, 83.40311431884766, 86.24225616455078, 89.08140563964844, 91.92054748535156]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 14.0, 14.0, 12.0, 25.0, 21.0, 22.0, 18.0, 39.0, 32.0, 43.0, 31.0, 44.0, 36.0, 50.0, 37.0, 42.0, 51.0, 45.0, 29.0, 40.0, 41.0, 38.0, 33.0, 33.0, 26.0, 24.0, 25.0, 22.0, 12.0, 13.0, 12.0, 14.0, 6.0, 9.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.53125, -14.0341796875, -13.537109375, -13.0400390625, -12.54296875, -12.0458984375, -11.548828125, -11.0517578125, -10.5546875, -10.0576171875, -9.560546875, -9.0634765625, -8.56640625, -8.0693359375, -7.572265625, -7.0751953125, -6.578125, -6.0810546875, -5.583984375, -5.0869140625, -4.58984375, -4.0927734375, -3.595703125, -3.0986328125, -2.6015625, -2.1044921875, -1.607421875, -1.1103515625, -0.61328125, -0.1162109375, 0.380859375, 0.8779296875, 1.375, 1.8720703125, 2.369140625, 2.8662109375, 3.36328125, 3.8603515625, 4.357421875, 4.8544921875, 5.3515625, 5.8486328125, 6.345703125, 6.8427734375, 7.33984375, 7.8369140625, 8.333984375, 8.8310546875, 9.328125, 9.8251953125, 10.322265625, 10.8193359375, 11.31640625, 11.8134765625, 12.310546875, 12.8076171875, 13.3046875, 13.8017578125, 14.298828125, 14.7958984375, 15.29296875, 15.7900390625, 16.287109375, 16.7841796875, 17.28125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 11.0, 21.0, 32.0, 40.0, 66.0, 85.0, 106.0, 159.0, 236.0, 329.0, 470.0, 683.0, 988.0, 1484.0, 2304.0, 3622.0, 6171.0, 11434.0, 30881.0, 435719.0, 3427722.0, 223826.0, 22039.0, 10135.0, 5557.0, 3337.0, 2119.0, 1402.0, 945.0, 675.0, 453.0, 351.0, 222.0, 189.0, 121.0, 85.0, 74.0, 52.0, 40.0, 24.0, 22.0, 15.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.28125, -42.87109375, -41.4609375, -40.05078125, -38.640625, -37.23046875, -35.8203125, -34.41015625, -33.0, -31.58984375, -30.1796875, -28.76953125, -27.359375, -25.94921875, -24.5390625, -23.12890625, -21.71875, -20.30859375, -18.8984375, -17.48828125, -16.078125, -14.66796875, -13.2578125, -11.84765625, -10.4375, -9.02734375, -7.6171875, -6.20703125, -4.796875, -3.38671875, -1.9765625, -0.56640625, 0.84375, 2.25390625, 3.6640625, 5.07421875, 6.484375, 7.89453125, 9.3046875, 10.71484375, 12.125, 13.53515625, 14.9453125, 16.35546875, 17.765625, 19.17578125, 20.5859375, 21.99609375, 23.40625, 24.81640625, 26.2265625, 27.63671875, 29.046875, 30.45703125, 31.8671875, 33.27734375, 34.6875, 36.09765625, 37.5078125, 38.91796875, 40.328125, 41.73828125, 43.1484375, 44.55859375, 45.96875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 7.0, 4.0, 8.0, 7.0, 5.0, 14.0, 17.0, 30.0, 44.0, 74.0, 117.0, 262.0, 568.0, 1033.0, 907.0, 446.0, 191.0, 106.0, 61.0, 40.0, 28.0, 16.0, 24.0, 14.0, 9.0, 9.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.0, -34.8701171875, -33.740234375, -32.6103515625, -31.48046875, -30.3505859375, -29.220703125, -28.0908203125, -26.9609375, -25.8310546875, -24.701171875, -23.5712890625, -22.44140625, -21.3115234375, -20.181640625, -19.0517578125, -17.921875, -16.7919921875, -15.662109375, -14.5322265625, -13.40234375, -12.2724609375, -11.142578125, -10.0126953125, -8.8828125, -7.7529296875, -6.623046875, -5.4931640625, -4.36328125, -3.2333984375, -2.103515625, -0.9736328125, 0.15625, 1.2861328125, 2.416015625, 3.5458984375, 4.67578125, 5.8056640625, 6.935546875, 8.0654296875, 9.1953125, 10.3251953125, 11.455078125, 12.5849609375, 13.71484375, 14.8447265625, 15.974609375, 17.1044921875, 18.234375, 19.3642578125, 20.494140625, 21.6240234375, 22.75390625, 23.8837890625, 25.013671875, 26.1435546875, 27.2734375, 28.4033203125, 29.533203125, 30.6630859375, 31.79296875, 32.9228515625, 34.052734375, 35.1826171875, 36.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 8.0, 24.0, 27.0, 34.0, 52.0, 81.0, 120.0, 164.0, 268.0, 440.0, 739.0, 1366.0, 2609.0, 5369.0, 12553.0, 33772.0, 216700.0, 3723575.0, 145125.0, 29649.0, 11207.0, 4873.0, 2374.0, 1312.0, 705.0, 390.0, 250.0, 150.0, 103.0, 65.0, 52.0, 32.0, 20.0, 21.0, 9.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.23828125, -61.2265625, -59.21484375, -57.203125, -55.19140625, -53.1796875, -51.16796875, -49.15625, -47.14453125, -45.1328125, -43.12109375, -41.109375, -39.09765625, -37.0859375, -35.07421875, -33.0625, -31.05078125, -29.0390625, -27.02734375, -25.015625, -23.00390625, -20.9921875, -18.98046875, -16.96875, -14.95703125, -12.9453125, -10.93359375, -8.921875, -6.91015625, -4.8984375, -2.88671875, -0.875, 1.13671875, 3.1484375, 5.16015625, 7.171875, 9.18359375, 11.1953125, 13.20703125, 15.21875, 17.23046875, 19.2421875, 21.25390625, 23.265625, 25.27734375, 27.2890625, 29.30078125, 31.3125, 33.32421875, 35.3359375, 37.34765625, 39.359375, 41.37109375, 43.3828125, 45.39453125, 47.40625, 49.41796875, 51.4296875, 53.44140625, 55.453125, 57.46484375, 59.4765625, 61.48828125, 63.5]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 6.0, 18.0, 18.0, 18.0, 48.0, 91.0, 189.0, 237.0, 173.0, 80.0, 55.0, 28.0, 16.0, 11.0, 4.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-263.5518798828125, -258.11639404296875, -252.68087768554688, -247.24539184570312, -241.8098907470703, -236.3743896484375, -230.9388885498047, -225.50338745117188, -220.06788635253906, -214.63238525390625, -209.19688415527344, -203.76138305664062, -198.32589721679688, -192.89039611816406, -187.45489501953125, -182.01939392089844, -176.58389282226562, -171.1483917236328, -165.712890625, -160.27740478515625, -154.84190368652344, -149.40640258789062, -143.9709014892578, -138.535400390625, -133.09991455078125, -127.66441345214844, -122.22891998291016, -116.79341888427734, -111.35791778564453, -105.92242431640625, -100.48692321777344, -95.05142211914062, -89.61591339111328, -84.18041229248047, -78.74491882324219, -73.30941772460938, -67.87391662597656, -62.438419342041016, -57.00292205810547, -51.567420959472656, -46.13192367553711, -40.69642639160156, -35.26092529296875, -29.825428009033203, -24.389928817749023, -18.954429626464844, -13.518932342529297, -8.083431243896484, -2.6479339599609375, 2.787564754486084, 8.223063468933105, 13.658561706542969, 19.09406089782715, 24.529560089111328, 29.965057373046875, 35.40055847167969, 40.836055755615234, 46.27155303955078, 51.707054138183594, 57.14255142211914, 62.57804870605469, 68.0135498046875, 73.44905090332031, 78.88455200195312, 84.3200454711914]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 5.0, 4.0, 3.0, 8.0, 11.0, 12.0, 12.0, 18.0, 11.0, 21.0, 26.0, 33.0, 31.0, 26.0, 41.0, 34.0, 33.0, 33.0, 44.0, 44.0, 39.0, 41.0, 38.0, 34.0, 39.0, 22.0, 39.0, 46.0, 36.0, 23.0, 28.0, 24.0, 22.0, 18.0, 11.0, 18.0, 11.0, 9.0, 9.0, 4.0, 8.0, 5.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-76.08663940429688, -73.7289810180664, -71.37132263183594, -69.01365661621094, -66.65599822998047, -64.29833984375, -61.94068145751953, -59.5830192565918, -57.22535705566406, -54.867698669433594, -52.51003646850586, -50.15237808227539, -47.794715881347656, -45.43705749511719, -43.07939910888672, -40.721736907958984, -38.364078521728516, -36.00642013549805, -33.64875793457031, -31.291099548339844, -28.93343734741211, -26.57577896118164, -24.21811866760254, -21.860458374023438, -19.502798080444336, -17.145137786865234, -14.787477493286133, -12.429818153381348, -10.072157859802246, -7.7144975662231445, -5.356838226318359, -2.999177932739258, -0.6415176391601562, 1.7161424160003662, 4.073802471160889, 6.431462287902832, 8.789122581481934, 11.146782875061035, 13.50444221496582, 15.862102508544922, 18.219762802124023, 20.577423095703125, 22.935083389282227, 25.292743682861328, 27.650402069091797, 30.00806427001953, 32.36572265625, 34.72338104248047, 37.0810432434082, 39.43870162963867, 41.796363830566406, 44.154022216796875, 46.51168441772461, 48.86934280395508, 51.22700500488281, 53.58466339111328, 55.94232177734375, 58.29998016357422, 60.65764236450195, 63.01530075073242, 65.37296295166016, 67.73062133789062, 70.0882797241211, 72.44593811035156, 74.80360412597656]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 10.0, 12.0, 14.0, 15.0, 19.0, 19.0, 35.0, 21.0, 27.0, 36.0, 30.0, 54.0, 41.0, 54.0, 38.0, 66.0, 39.0, 36.0, 46.0, 35.0, 33.0, 38.0, 29.0, 31.0, 27.0, 25.0, 28.0, 11.0, 19.0, 18.0, 15.0, 11.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.375, -14.84765625, -14.3203125, -13.79296875, -13.265625, -12.73828125, -12.2109375, -11.68359375, -11.15625, -10.62890625, -10.1015625, -9.57421875, -9.046875, -8.51953125, -7.9921875, -7.46484375, -6.9375, -6.41015625, -5.8828125, -5.35546875, -4.828125, -4.30078125, -3.7734375, -3.24609375, -2.71875, -2.19140625, -1.6640625, -1.13671875, -0.609375, -0.08203125, 0.4453125, 0.97265625, 1.5, 2.02734375, 2.5546875, 3.08203125, 3.609375, 4.13671875, 4.6640625, 5.19140625, 5.71875, 6.24609375, 6.7734375, 7.30078125, 7.828125, 8.35546875, 8.8828125, 9.41015625, 9.9375, 10.46484375, 10.9921875, 11.51953125, 12.046875, 12.57421875, 13.1015625, 13.62890625, 14.15625, 14.68359375, 15.2109375, 15.73828125, 16.265625, 16.79296875, 17.3203125, 17.84765625, 18.375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 19.0, 25.0, 44.0, 82.0, 85.0, 130.0, 209.0, 287.0, 451.0, 628.0, 965.0, 1451.0, 2218.0, 3282.0, 4880.0, 7854.0, 12262.0, 19500.0, 31677.0, 53839.0, 94914.0, 167898.0, 238075.0, 170552.0, 96226.0, 54066.0, 32359.0, 19536.0, 12206.0, 7868.0, 5001.0, 3319.0, 2161.0, 1463.0, 957.0, 654.0, 464.0, 281.0, 200.0, 146.0, 87.0, 67.0, 46.0, 32.0, 19.0, 11.0, 19.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.276092529296875, -1.23284912109375, -1.189605712890625, -1.1463623046875, -1.103118896484375, -1.05987548828125, -1.016632080078125, -0.973388671875, -0.930145263671875, -0.88690185546875, -0.843658447265625, -0.8004150390625, -0.757171630859375, -0.71392822265625, -0.670684814453125, -0.62744140625, -0.584197998046875, -0.54095458984375, -0.497711181640625, -0.4544677734375, -0.411224365234375, -0.36798095703125, -0.324737548828125, -0.281494140625, -0.238250732421875, -0.19500732421875, -0.151763916015625, -0.1085205078125, -0.065277099609375, -0.02203369140625, 0.021209716796875, 0.064453125, 0.107696533203125, 0.15093994140625, 0.194183349609375, 0.2374267578125, 0.280670166015625, 0.32391357421875, 0.367156982421875, 0.410400390625, 0.453643798828125, 0.49688720703125, 0.540130615234375, 0.5833740234375, 0.626617431640625, 0.66986083984375, 0.713104248046875, 0.75634765625, 0.799591064453125, 0.84283447265625, 0.886077880859375, 0.9293212890625, 0.972564697265625, 1.01580810546875, 1.059051513671875, 1.102294921875, 1.145538330078125, 1.18878173828125, 1.232025146484375, 1.2752685546875, 1.318511962890625, 1.36175537109375, 1.404998779296875, 1.4482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 9.0, 6.0, 10.0, 13.0, 9.0, 17.0, 16.0, 19.0, 19.0, 21.0, 32.0, 21.0, 25.0, 43.0, 38.0, 38.0, 30.0, 29.0, 37.0, 1071.0, 37.0, 55.0, 56.0, 31.0, 35.0, 40.0, 31.0, 25.0, 26.0, 23.0, 20.0, 21.0, 16.0, 23.0, 13.0, 13.0, 8.0, 12.0, 3.0, 4.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-10.875, -10.5626220703125, -10.250244140625, -9.9378662109375, -9.62548828125, -9.3131103515625, -9.000732421875, -8.6883544921875, -8.3759765625, -8.0635986328125, -7.751220703125, -7.4388427734375, -7.12646484375, -6.8140869140625, -6.501708984375, -6.1893310546875, -5.876953125, -5.5645751953125, -5.252197265625, -4.9398193359375, -4.62744140625, -4.3150634765625, -4.002685546875, -3.6903076171875, -3.3779296875, -3.0655517578125, -2.753173828125, -2.4407958984375, -2.12841796875, -1.8160400390625, -1.503662109375, -1.1912841796875, -0.87890625, -0.5665283203125, -0.254150390625, 0.0582275390625, 0.37060546875, 0.6829833984375, 0.995361328125, 1.3077392578125, 1.6201171875, 1.9324951171875, 2.244873046875, 2.5572509765625, 2.86962890625, 3.1820068359375, 3.494384765625, 3.8067626953125, 4.119140625, 4.4315185546875, 4.743896484375, 5.0562744140625, 5.36865234375, 5.6810302734375, 5.993408203125, 6.3057861328125, 6.6181640625, 6.9305419921875, 7.242919921875, 7.5552978515625, 7.86767578125, 8.1800537109375, 8.492431640625, 8.8048095703125, 9.1171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 4.0, 18.0, 22.0, 25.0, 44.0, 71.0, 89.0, 114.0, 178.0, 307.0, 369.0, 596.0, 842.0, 1234.0, 1854.0, 2676.0, 4073.0, 6158.0, 9350.0, 14124.0, 21754.0, 34670.0, 56338.0, 94814.0, 159783.0, 1261147.0, 166306.0, 99157.0, 58575.0, 36074.0, 22768.0, 14614.0, 9510.0, 6340.0, 4188.0, 2855.0, 1980.0, 1284.0, 900.0, 637.0, 408.0, 302.0, 178.0, 127.0, 95.0, 56.0, 40.0, 36.0, 14.0, 7.0, 14.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.83935546875, -0.810943603515625, -0.78253173828125, -0.754119873046875, -0.7257080078125, -0.697296142578125, -0.66888427734375, -0.640472412109375, -0.612060546875, -0.583648681640625, -0.55523681640625, -0.526824951171875, -0.4984130859375, -0.470001220703125, -0.44158935546875, -0.413177490234375, -0.384765625, -0.356353759765625, -0.32794189453125, -0.299530029296875, -0.2711181640625, -0.242706298828125, -0.21429443359375, -0.185882568359375, -0.157470703125, -0.129058837890625, -0.10064697265625, -0.072235107421875, -0.0438232421875, -0.015411376953125, 0.01300048828125, 0.041412353515625, 0.06982421875, 0.098236083984375, 0.12664794921875, 0.155059814453125, 0.1834716796875, 0.211883544921875, 0.24029541015625, 0.268707275390625, 0.297119140625, 0.325531005859375, 0.35394287109375, 0.382354736328125, 0.4107666015625, 0.439178466796875, 0.46759033203125, 0.496002197265625, 0.5244140625, 0.552825927734375, 0.58123779296875, 0.609649658203125, 0.6380615234375, 0.666473388671875, 0.69488525390625, 0.723297119140625, 0.751708984375, 0.780120849609375, 0.80853271484375, 0.836944580078125, 0.8653564453125, 0.893768310546875, 0.92218017578125, 0.950592041015625, 0.97900390625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 7.0, 13.0, 16.0, 15.0, 19.0, 23.0, 39.0, 65.0, 62.0, 71.0, 83.0, 85.0, 84.0, 79.0, 52.0, 44.0, 39.0, 33.0, 21.0, 8.0, 11.0, 19.0, 13.0, 15.0, 6.0, 8.0, 3.0, 6.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.01629638671875, -0.015798449516296387, -0.015300512313842773, -0.01480257511138916, -0.014304637908935547, -0.013806700706481934, -0.01330876350402832, -0.012810826301574707, -0.012312889099121094, -0.01181495189666748, -0.011317014694213867, -0.010819077491760254, -0.01032114028930664, -0.009823203086853027, -0.009325265884399414, -0.0088273286819458, -0.008329391479492188, -0.007831454277038574, -0.007333517074584961, -0.006835579872131348, -0.006337642669677734, -0.005839705467224121, -0.005341768264770508, -0.0048438310623168945, -0.004345893859863281, -0.003847956657409668, -0.0033500194549560547, -0.0028520822525024414, -0.002354145050048828, -0.0018562078475952148, -0.0013582706451416016, -0.0008603334426879883, -0.000362396240234375, 0.00013554096221923828, 0.0006334781646728516, 0.0011314153671264648, 0.0016293525695800781, 0.0021272897720336914, 0.0026252269744873047, 0.003123164176940918, 0.0036211013793945312, 0.0041190385818481445, 0.004616975784301758, 0.005114912986755371, 0.005612850189208984, 0.006110787391662598, 0.006608724594116211, 0.007106661796569824, 0.0076045989990234375, 0.00810253620147705, 0.008600473403930664, 0.009098410606384277, 0.00959634780883789, 0.010094285011291504, 0.010592222213745117, 0.01109015941619873, 0.011588096618652344, 0.012086033821105957, 0.01258397102355957, 0.013081908226013184, 0.013579845428466797, 0.01407778263092041, 0.014575719833374023, 0.015073657035827637, 0.01557159423828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 12.0, 5.0, 11.0, 8.0, 16.0, 12.0, 22.0, 16.0, 28.0, 24.0, 30.0, 68.0, 109.0, 142.0, 265.0, 1319.0, 104703.0, 936137.0, 4583.0, 414.0, 189.0, 114.0, 79.0, 51.0, 47.0, 28.0, 21.0, 18.0, 8.0, 17.0, 8.0, 12.0, 4.0, 4.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3623046875, -0.35105133056640625, -0.3397979736328125, -0.32854461669921875, -0.317291259765625, -0.30603790283203125, -0.2947845458984375, -0.28353118896484375, -0.27227783203125, -0.26102447509765625, -0.2497711181640625, -0.23851776123046875, -0.227264404296875, -0.21601104736328125, -0.2047576904296875, -0.19350433349609375, -0.1822509765625, -0.17099761962890625, -0.1597442626953125, -0.14849090576171875, -0.137237548828125, -0.12598419189453125, -0.1147308349609375, -0.10347747802734375, -0.09222412109375, -0.08097076416015625, -0.0697174072265625, -0.05846405029296875, -0.047210693359375, -0.03595733642578125, -0.0247039794921875, -0.01345062255859375, -0.002197265625, 0.00905609130859375, 0.0203094482421875, 0.03156280517578125, 0.042816162109375, 0.05406951904296875, 0.0653228759765625, 0.07657623291015625, 0.08782958984375, 0.09908294677734375, 0.1103363037109375, 0.12158966064453125, 0.132843017578125, 0.14409637451171875, 0.1553497314453125, 0.16660308837890625, 0.1778564453125, 0.18910980224609375, 0.2003631591796875, 0.21161651611328125, 0.222869873046875, 0.23412322998046875, 0.2453765869140625, 0.25662994384765625, 0.26788330078125, 0.27913665771484375, 0.2903900146484375, 0.30164337158203125, 0.312896728515625, 0.32415008544921875, 0.3354034423828125, 0.34665679931640625, 0.35791015625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 446.0, 461.0, 50.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0415981188416481, -0.03640041500329971, -0.031202707439661026, -0.026005001738667488, -0.02080729603767395, -0.015609590336680412, -0.010411884635686874, -0.005214177072048187, -1.6473233699798584e-05, 0.005181232467293739, 0.010378938168287277, 0.015576643869280815, 0.020774349570274353, 0.02597205527126789, 0.03116976097226143, 0.036367468535900116, 0.041565172374248505, 0.04676287621259689, 0.05196058377623558, 0.05715829133987427, 0.062355995178222656, 0.06755369901657104, 0.07275140285491943, 0.07794911414384842, 0.08314681798219681, 0.0883445218205452, 0.09354223310947418, 0.09873993694782257, 0.10393764078617096, 0.10913534462451935, 0.11433304846286774, 0.11953075975179672, 0.12472847104072571, 0.1299261748790741, 0.13512387871742249, 0.14032158255577087, 0.14551928639411926, 0.15071700513362885, 0.15591470897197723, 0.16111241281032562, 0.166310116648674, 0.1715078204870224, 0.1767055243253708, 0.18190322816371918, 0.18710094690322876, 0.19229865074157715, 0.19749635457992554, 0.20269405841827393, 0.20789176225662231, 0.2130894660949707, 0.2182871699333191, 0.22348487377166748, 0.22868257761001587, 0.23388029634952545, 0.23907800018787384, 0.24427570402622223, 0.24947340786457062, 0.2546711266040802, 0.2598688304424286, 0.265066534280777, 0.27026423811912537, 0.27546194195747375, 0.28065964579582214, 0.28585734963417053, 0.2910550534725189]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 13.0, 8.0, 13.0, 13.0, 16.0, 19.0, 18.0, 30.0, 31.0, 37.0, 34.0, 35.0, 40.0, 45.0, 47.0, 46.0, 38.0, 44.0, 51.0, 53.0, 41.0, 46.0, 39.0, 31.0, 21.0, 23.0, 24.0, 29.0, 19.0, 18.0, 16.0, 8.0, 4.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021617889404296875, -0.020996319130063057, -0.02037474885582924, -0.01975317858159542, -0.019131608307361603, -0.018510038033127785, -0.017888467758893967, -0.01726689748466015, -0.01664532721042633, -0.016023756936192513, -0.015402186661958694, -0.014780616387724876, -0.014159046113491058, -0.01353747583925724, -0.012915905565023422, -0.012294335290789604, -0.011672765016555786, -0.011051194742321968, -0.01042962446808815, -0.009808054193854332, -0.009186483919620514, -0.008564913645386696, -0.007943343371152878, -0.00732177309691906, -0.006700202822685242, -0.006078632548451424, -0.005457062274217606, -0.0048354919999837875, -0.0042139217257499695, -0.0035923514515161514, -0.0029707811772823334, -0.0023492109030485153, -0.0017276406288146973, -0.0011060703545808792, -0.00048450008034706116, 0.0001370701938867569, 0.000758640468120575, 0.001380210742354393, 0.002001781016588211, 0.002623351290822029, 0.003244921565055847, 0.0038664918392896652, 0.004488062113523483, 0.005109632387757301, 0.005731202661991119, 0.0063527729362249374, 0.0069743432104587555, 0.0075959134846925735, 0.008217483758926392, 0.00883905403316021, 0.009460624307394028, 0.010082194581627846, 0.010703764855861664, 0.011325335130095482, 0.0119469054043293, 0.012568475678563118, 0.013190045952796936, 0.013811616227030754, 0.014433186501264572, 0.01505475677549839, 0.015676327049732208, 0.016297897323966026, 0.016919467598199844, 0.017541037872433662, 0.01816260814666748]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 10.0, 12.0, 14.0, 15.0, 19.0, 19.0, 35.0, 21.0, 27.0, 36.0, 30.0, 54.0, 41.0, 54.0, 38.0, 66.0, 39.0, 36.0, 46.0, 35.0, 33.0, 38.0, 29.0, 31.0, 27.0, 25.0, 28.0, 11.0, 19.0, 18.0, 15.0, 11.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.375, -14.84765625, -14.3203125, -13.79296875, -13.265625, -12.73828125, -12.2109375, -11.68359375, -11.15625, -10.62890625, -10.1015625, -9.57421875, -9.046875, -8.51953125, -7.9921875, -7.46484375, -6.9375, -6.41015625, -5.8828125, -5.35546875, -4.828125, -4.30078125, -3.7734375, -3.24609375, -2.71875, -2.19140625, -1.6640625, -1.13671875, -0.609375, -0.08203125, 0.4453125, 0.97265625, 1.5, 2.02734375, 2.5546875, 3.08203125, 3.609375, 4.13671875, 4.6640625, 5.19140625, 5.71875, 6.24609375, 6.7734375, 7.30078125, 7.828125, 8.35546875, 8.8828125, 9.41015625, 9.9375, 10.46484375, 10.9921875, 11.51953125, 12.046875, 12.57421875, 13.1015625, 13.62890625, 14.15625, 14.68359375, 15.2109375, 15.73828125, 16.265625, 16.79296875, 17.3203125, 17.84765625, 18.375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 14.0, 18.0, 17.0, 26.0, 26.0, 33.0, 46.0, 60.0, 91.0, 126.0, 176.0, 263.0, 402.0, 604.0, 1109.0, 2096.0, 4891.0, 16219.0, 202429.0, 781536.0, 25821.0, 6502.0, 2583.0, 1268.0, 717.0, 444.0, 282.0, 207.0, 142.0, 96.0, 64.0, 55.0, 30.0, 37.0, 23.0, 20.0, 17.0, 11.0, 11.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.75, -35.48876953125, -34.2275390625, -32.96630859375, -31.705078125, -30.44384765625, -29.1826171875, -27.92138671875, -26.66015625, -25.39892578125, -24.1376953125, -22.87646484375, -21.615234375, -20.35400390625, -19.0927734375, -17.83154296875, -16.5703125, -15.30908203125, -14.0478515625, -12.78662109375, -11.525390625, -10.26416015625, -9.0029296875, -7.74169921875, -6.48046875, -5.21923828125, -3.9580078125, -2.69677734375, -1.435546875, -0.17431640625, 1.0869140625, 2.34814453125, 3.609375, 4.87060546875, 6.1318359375, 7.39306640625, 8.654296875, 9.91552734375, 11.1767578125, 12.43798828125, 13.69921875, 14.96044921875, 16.2216796875, 17.48291015625, 18.744140625, 20.00537109375, 21.2666015625, 22.52783203125, 23.7890625, 25.05029296875, 26.3115234375, 27.57275390625, 28.833984375, 30.09521484375, 31.3564453125, 32.61767578125, 33.87890625, 35.14013671875, 36.4013671875, 37.66259765625, 38.923828125, 40.18505859375, 41.4462890625, 42.70751953125, 43.96875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 2.0, 7.0, 8.0, 3.0, 11.0, 8.0, 11.0, 10.0, 19.0, 16.0, 15.0, 22.0, 29.0, 21.0, 31.0, 42.0, 37.0, 38.0, 44.0, 69.0, 92.0, 1605.0, 382.0, 100.0, 52.0, 44.0, 35.0, 36.0, 30.0, 30.0, 32.0, 26.0, 22.0, 20.0, 26.0, 21.0, 13.0, 12.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5625, -35.341796875, -34.12109375, -32.900390625, -31.6796875, -30.458984375, -29.23828125, -28.017578125, -26.796875, -25.576171875, -24.35546875, -23.134765625, -21.9140625, -20.693359375, -19.47265625, -18.251953125, -17.03125, -15.810546875, -14.58984375, -13.369140625, -12.1484375, -10.927734375, -9.70703125, -8.486328125, -7.265625, -6.044921875, -4.82421875, -3.603515625, -2.3828125, -1.162109375, 0.05859375, 1.279296875, 2.5, 3.720703125, 4.94140625, 6.162109375, 7.3828125, 8.603515625, 9.82421875, 11.044921875, 12.265625, 13.486328125, 14.70703125, 15.927734375, 17.1484375, 18.369140625, 19.58984375, 20.810546875, 22.03125, 23.251953125, 24.47265625, 25.693359375, 26.9140625, 28.134765625, 29.35546875, 30.576171875, 31.796875, 33.017578125, 34.23828125, 35.458984375, 36.6796875, 37.900390625, 39.12109375, 40.341796875, 41.5625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 1.0, 12.0, 5.0, 10.0, 12.0, 16.0, 20.0, 32.0, 24.0, 15.0, 40.0, 37.0, 57.0, 47.0, 82.0, 140.0, 265.0, 747.0, 4257.0, 125838.0, 3002292.0, 9512.0, 1250.0, 332.0, 173.0, 108.0, 66.0, 64.0, 44.0, 22.0, 26.0, 16.0, 17.0, 17.0, 20.0, 14.0, 9.0, 12.0, 9.0, 8.0, 5.0, 4.0, 7.0, 1.0, 6.0, 1.0, 2.0, 4.0], "bins": [-107.4375, -104.4677734375, -101.498046875, -98.5283203125, -95.55859375, -92.5888671875, -89.619140625, -86.6494140625, -83.6796875, -80.7099609375, -77.740234375, -74.7705078125, -71.80078125, -68.8310546875, -65.861328125, -62.8916015625, -59.921875, -56.9521484375, -53.982421875, -51.0126953125, -48.04296875, -45.0732421875, -42.103515625, -39.1337890625, -36.1640625, -33.1943359375, -30.224609375, -27.2548828125, -24.28515625, -21.3154296875, -18.345703125, -15.3759765625, -12.40625, -9.4365234375, -6.466796875, -3.4970703125, -0.52734375, 2.4423828125, 5.412109375, 8.3818359375, 11.3515625, 14.3212890625, 17.291015625, 20.2607421875, 23.23046875, 26.2001953125, 29.169921875, 32.1396484375, 35.109375, 38.0791015625, 41.048828125, 44.0185546875, 46.98828125, 49.9580078125, 52.927734375, 55.8974609375, 58.8671875, 61.8369140625, 64.806640625, 67.7763671875, 70.74609375, 73.7158203125, 76.685546875, 79.6552734375, 82.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 18.0, 19.0, 52.0, 95.0, 171.0, 178.0, 191.0, 116.0, 73.0, 42.0, 30.0, 8.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.6999626159668, -51.271575927734375, -49.84318923950195, -48.41480255126953, -46.986419677734375, -45.55803298950195, -44.12964630126953, -42.70125961303711, -41.27287292480469, -39.844486236572266, -38.416099548339844, -36.98771286010742, -35.559326171875, -34.130943298339844, -32.70255661010742, -31.274169921875, -29.845783233642578, -28.417396545410156, -26.989009857177734, -25.560625076293945, -24.132238388061523, -22.7038516998291, -21.275466918945312, -19.84708023071289, -18.41869354248047, -16.990306854248047, -15.561921119689941, -14.133535385131836, -12.705148696899414, -11.276762008666992, -9.848376274108887, -8.419990539550781, -6.991600036621094, -5.56321382522583, -4.134827613830566, -2.7064414024353027, -1.278055191040039, 0.1503310203552246, 1.5787172317504883, 3.0071029663085938, 4.435489654541016, 5.863875865936279, 7.292262077331543, 8.720647811889648, 10.14903450012207, 11.577421188354492, 13.005806922912598, 14.434192657470703, 15.862579345703125, 17.290966033935547, 18.71935272216797, 20.147737503051758, 21.57612419128418, 23.0045108795166, 24.43289566040039, 25.861282348632812, 27.289669036865234, 28.718055725097656, 30.146442413330078, 31.574827194213867, 33.003211975097656, 34.43159866333008, 35.8599853515625, 37.28837203979492, 38.716758728027344]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 13.0, 3.0, 17.0, 17.0, 9.0, 19.0, 20.0, 24.0, 25.0, 27.0, 24.0, 32.0, 51.0, 33.0, 50.0, 42.0, 60.0, 58.0, 49.0, 48.0, 56.0, 37.0, 45.0, 35.0, 33.0, 30.0, 18.0, 24.0, 24.0, 17.0, 18.0, 11.0, 7.0, 4.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.44855499267578, -112.91067504882812, -109.37279510498047, -105.83491516113281, -102.29703521728516, -98.7591552734375, -95.22127532958984, -91.68339538574219, -88.14551544189453, -84.60763549804688, -81.06975555419922, -77.53187561035156, -73.9939956665039, -70.45611572265625, -66.9182357788086, -63.38035583496094, -59.84247589111328, -56.304595947265625, -52.76671600341797, -49.22883605957031, -45.690956115722656, -42.153076171875, -38.615196228027344, -35.07731628417969, -31.53943634033203, -28.001556396484375, -24.46367645263672, -20.925796508789062, -17.387916564941406, -13.85003662109375, -10.312156677246094, -6.7742767333984375, -3.2363967895507812, 0.301483154296875, 3.8393630981445312, 7.3772430419921875, 10.915122985839844, 14.4530029296875, 17.990882873535156, 21.528762817382812, 25.06664276123047, 28.604522705078125, 32.14240264892578, 35.68028259277344, 39.218162536621094, 42.75604248046875, 46.293922424316406, 49.83180236816406, 53.36968231201172, 56.907562255859375, 60.44544219970703, 63.98332214355469, 67.52120208740234, 71.05908203125, 74.59696197509766, 78.13484191894531, 81.67272186279297, 85.21060180664062, 88.74848175048828, 92.28636169433594, 95.8242416381836, 99.36212158203125, 102.9000015258789, 106.43788146972656, 109.97576141357422]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 9.0, 8.0, 8.0, 18.0, 18.0, 15.0, 22.0, 25.0, 26.0, 25.0, 34.0, 30.0, 58.0, 43.0, 52.0, 56.0, 57.0, 41.0, 35.0, 40.0, 39.0, 33.0, 30.0, 39.0, 34.0, 31.0, 21.0, 18.0, 25.0, 22.0, 15.0, 9.0, 8.0, 12.0, 5.0, 8.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.1717529296875, -14.632568359375, -14.0933837890625, -13.55419921875, -13.0150146484375, -12.475830078125, -11.9366455078125, -11.3974609375, -10.8582763671875, -10.319091796875, -9.7799072265625, -9.24072265625, -8.7015380859375, -8.162353515625, -7.6231689453125, -7.083984375, -6.5447998046875, -6.005615234375, -5.4664306640625, -4.92724609375, -4.3880615234375, -3.848876953125, -3.3096923828125, -2.7705078125, -2.2313232421875, -1.692138671875, -1.1529541015625, -0.61376953125, -0.0745849609375, 0.464599609375, 1.0037841796875, 1.54296875, 2.0821533203125, 2.621337890625, 3.1605224609375, 3.69970703125, 4.2388916015625, 4.778076171875, 5.3172607421875, 5.8564453125, 6.3956298828125, 6.934814453125, 7.4739990234375, 8.01318359375, 8.5523681640625, 9.091552734375, 9.6307373046875, 10.169921875, 10.7091064453125, 11.248291015625, 11.7874755859375, 12.32666015625, 12.8658447265625, 13.405029296875, 13.9442138671875, 14.4833984375, 15.0225830078125, 15.561767578125, 16.1009521484375, 16.64013671875, 17.1793212890625, 17.718505859375, 18.2576904296875, 18.796875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 17.0, 19.0, 35.0, 43.0, 60.0, 78.0, 131.0, 211.0, 235.0, 401.0, 577.0, 762.0, 1144.0, 1702.0, 2490.0, 3921.0, 6220.0, 10670.0, 21423.0, 125635.0, 2499357.0, 1402652.0, 72797.0, 17484.0, 9533.0, 5612.0, 3583.0, 2280.0, 1575.0, 1058.0, 763.0, 498.0, 373.0, 291.0, 181.0, 124.0, 92.0, 79.0, 43.0, 29.0, 26.0, 24.0, 19.0, 5.0, 14.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.4375, -36.14208984375, -34.8466796875, -33.55126953125, -32.255859375, -30.96044921875, -29.6650390625, -28.36962890625, -27.07421875, -25.77880859375, -24.4833984375, -23.18798828125, -21.892578125, -20.59716796875, -19.3017578125, -18.00634765625, -16.7109375, -15.41552734375, -14.1201171875, -12.82470703125, -11.529296875, -10.23388671875, -8.9384765625, -7.64306640625, -6.34765625, -5.05224609375, -3.7568359375, -2.46142578125, -1.166015625, 0.12939453125, 1.4248046875, 2.72021484375, 4.015625, 5.31103515625, 6.6064453125, 7.90185546875, 9.197265625, 10.49267578125, 11.7880859375, 13.08349609375, 14.37890625, 15.67431640625, 16.9697265625, 18.26513671875, 19.560546875, 20.85595703125, 22.1513671875, 23.44677734375, 24.7421875, 26.03759765625, 27.3330078125, 28.62841796875, 29.923828125, 31.21923828125, 32.5146484375, 33.81005859375, 35.10546875, 36.40087890625, 37.6962890625, 38.99169921875, 40.287109375, 41.58251953125, 42.8779296875, 44.17333984375, 45.46875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 10.0, 13.0, 21.0, 25.0, 29.0, 30.0, 43.0, 109.0, 228.0, 451.0, 899.0, 1006.0, 576.0, 267.0, 124.0, 46.0, 41.0, 22.0, 17.0, 17.0, 10.0, 19.0, 10.0, 6.0, 5.0, 5.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-38.9375, -37.7978515625, -36.658203125, -35.5185546875, -34.37890625, -33.2392578125, -32.099609375, -30.9599609375, -29.8203125, -28.6806640625, -27.541015625, -26.4013671875, -25.26171875, -24.1220703125, -22.982421875, -21.8427734375, -20.703125, -19.5634765625, -18.423828125, -17.2841796875, -16.14453125, -15.0048828125, -13.865234375, -12.7255859375, -11.5859375, -10.4462890625, -9.306640625, -8.1669921875, -7.02734375, -5.8876953125, -4.748046875, -3.6083984375, -2.46875, -1.3291015625, -0.189453125, 0.9501953125, 2.08984375, 3.2294921875, 4.369140625, 5.5087890625, 6.6484375, 7.7880859375, 8.927734375, 10.0673828125, 11.20703125, 12.3466796875, 13.486328125, 14.6259765625, 15.765625, 16.9052734375, 18.044921875, 19.1845703125, 20.32421875, 21.4638671875, 22.603515625, 23.7431640625, 24.8828125, 26.0224609375, 27.162109375, 28.3017578125, 29.44140625, 30.5810546875, 31.720703125, 32.8603515625, 34.0]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 7.0, 8.0, 27.0, 30.0, 65.0, 83.0, 152.0, 287.0, 456.0, 891.0, 1724.0, 3470.0, 8036.0, 22015.0, 96617.0, 3747038.0, 260475.0, 32777.0, 10853.0, 4566.0, 2206.0, 1084.0, 621.0, 333.0, 163.0, 104.0, 62.0, 46.0, 21.0, 14.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.5, -74.083984375, -71.66796875, -69.251953125, -66.8359375, -64.419921875, -62.00390625, -59.587890625, -57.171875, -54.755859375, -52.33984375, -49.923828125, -47.5078125, -45.091796875, -42.67578125, -40.259765625, -37.84375, -35.427734375, -33.01171875, -30.595703125, -28.1796875, -25.763671875, -23.34765625, -20.931640625, -18.515625, -16.099609375, -13.68359375, -11.267578125, -8.8515625, -6.435546875, -4.01953125, -1.603515625, 0.8125, 3.228515625, 5.64453125, 8.060546875, 10.4765625, 12.892578125, 15.30859375, 17.724609375, 20.140625, 22.556640625, 24.97265625, 27.388671875, 29.8046875, 32.220703125, 34.63671875, 37.052734375, 39.46875, 41.884765625, 44.30078125, 46.716796875, 49.1328125, 51.548828125, 53.96484375, 56.380859375, 58.796875, 61.212890625, 63.62890625, 66.044921875, 68.4609375, 70.876953125, 73.29296875, 75.708984375, 78.125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 50.0, 829.0, 127.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1635.44873046875, -1597.9898681640625, -1560.531005859375, -1523.072265625, -1485.6134033203125, -1448.154541015625, -1410.69580078125, -1373.2369384765625, -1335.778076171875, -1298.3192138671875, -1260.8603515625, -1223.401611328125, -1185.9427490234375, -1148.48388671875, -1111.025146484375, -1073.5662841796875, -1036.107421875, -998.6485595703125, -961.1897583007812, -923.73095703125, -886.2720947265625, -848.813232421875, -811.3544311523438, -773.8956298828125, -736.436767578125, -698.9779052734375, -661.5191040039062, -624.060302734375, -586.6014404296875, -549.142578125, -511.68377685546875, -474.2249450683594, -436.7659912109375, -399.3071594238281, -361.84832763671875, -324.3894958496094, -286.9306640625, -249.47183227539062, -212.01300048828125, -174.55416870117188, -137.0953369140625, -99.63650512695312, -62.17767333984375, -24.718841552734375, 12.739990234375, 50.198822021484375, 87.65765380859375, 125.11648559570312, 162.5753173828125, 200.03414916992188, 237.49298095703125, 274.9518127441406, 312.41064453125, 349.8694763183594, 387.32830810546875, 424.7871398925781, 462.2459716796875, 499.7048034667969, 537.1636352539062, 574.6224365234375, 612.081298828125, 649.5401611328125, 686.9989624023438, 724.457763671875, 761.9166259765625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 1.0, 13.0, 15.0, 24.0, 11.0, 22.0, 20.0, 20.0, 23.0, 25.0, 28.0, 40.0, 34.0, 36.0, 45.0, 39.0, 50.0, 38.0, 44.0, 36.0, 42.0, 48.0, 31.0, 42.0, 24.0, 28.0, 37.0, 35.0, 20.0, 30.0, 20.0, 17.0, 14.0, 19.0, 10.0, 7.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.83078002929688, -72.99639129638672, -70.16200256347656, -67.32760620117188, -64.49321746826172, -61.65882873535156, -58.824440002441406, -55.99005126953125, -53.15565872192383, -50.32126998901367, -47.48687744140625, -44.652488708496094, -41.81809997558594, -38.983707427978516, -36.14931869506836, -33.31492614746094, -30.48053741455078, -27.646146774291992, -24.811756134033203, -21.977367401123047, -19.142976760864258, -16.30858612060547, -13.474197387695312, -10.639806747436523, -7.805416107177734, -4.9710259437561035, -2.1366357803344727, 0.69775390625, 3.532144546508789, 6.366535186767578, 9.200923919677734, 12.035314559936523, 14.869705200195312, 17.7040958404541, 20.53848648071289, 23.372875213623047, 26.207265853881836, 29.041656494140625, 31.87604522705078, 34.71043395996094, 37.54482650756836, 40.379215240478516, 43.21360778808594, 46.047996520996094, 48.88238525390625, 51.71677780151367, 54.55116653442383, 57.38555908203125, 60.219947814941406, 63.05433654785156, 65.88872528076172, 68.72311401367188, 71.55751037597656, 74.39189910888672, 77.22628784179688, 80.06067657470703, 82.89506530761719, 85.72945404052734, 88.5638427734375, 91.39823913574219, 94.23262786865234, 97.0670166015625, 99.90140533447266, 102.73579406738281, 105.5701904296875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 4.0, 11.0, 6.0, 15.0, 21.0, 15.0, 26.0, 28.0, 38.0, 34.0, 36.0, 38.0, 41.0, 56.0, 47.0, 48.0, 41.0, 55.0, 37.0, 34.0, 37.0, 29.0, 29.0, 34.0, 31.0, 33.0, 20.0, 24.0, 25.0, 18.0, 17.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.0, -16.428955078125, -15.85791015625, -15.286865234375, -14.7158203125, -14.144775390625, -13.57373046875, -13.002685546875, -12.431640625, -11.860595703125, -11.28955078125, -10.718505859375, -10.1474609375, -9.576416015625, -9.00537109375, -8.434326171875, -7.86328125, -7.292236328125, -6.72119140625, -6.150146484375, -5.5791015625, -5.008056640625, -4.43701171875, -3.865966796875, -3.294921875, -2.723876953125, -2.15283203125, -1.581787109375, -1.0107421875, -0.439697265625, 0.13134765625, 0.702392578125, 1.2734375, 1.844482421875, 2.41552734375, 2.986572265625, 3.5576171875, 4.128662109375, 4.69970703125, 5.270751953125, 5.841796875, 6.412841796875, 6.98388671875, 7.554931640625, 8.1259765625, 8.697021484375, 9.26806640625, 9.839111328125, 10.41015625, 10.981201171875, 11.55224609375, 12.123291015625, 12.6943359375, 13.265380859375, 13.83642578125, 14.407470703125, 14.978515625, 15.549560546875, 16.12060546875, 16.691650390625, 17.2626953125, 17.833740234375, 18.40478515625, 18.975830078125, 19.546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 15.0, 18.0, 46.0, 48.0, 71.0, 124.0, 168.0, 230.0, 381.0, 638.0, 940.0, 1517.0, 2458.0, 4013.0, 6551.0, 10620.0, 18128.0, 30339.0, 52715.0, 94724.0, 175377.0, 249634.0, 175765.0, 95123.0, 52520.0, 30402.0, 18007.0, 10777.0, 6476.0, 3963.0, 2450.0, 1579.0, 988.0, 605.0, 415.0, 219.0, 171.0, 93.0, 70.0, 43.0, 45.0, 32.0, 17.0, 13.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-1.732421875, -1.6807098388671875, -1.628997802734375, -1.5772857666015625, -1.52557373046875, -1.4738616943359375, -1.422149658203125, -1.3704376220703125, -1.3187255859375, -1.2670135498046875, -1.215301513671875, -1.1635894775390625, -1.11187744140625, -1.0601654052734375, -1.008453369140625, -0.9567413330078125, -0.905029296875, -0.8533172607421875, -0.801605224609375, -0.7498931884765625, -0.69818115234375, -0.6464691162109375, -0.594757080078125, -0.5430450439453125, -0.4913330078125, -0.4396209716796875, -0.387908935546875, -0.3361968994140625, -0.28448486328125, -0.2327728271484375, -0.181060791015625, -0.1293487548828125, -0.07763671875, -0.0259246826171875, 0.025787353515625, 0.0774993896484375, 0.12921142578125, 0.1809234619140625, 0.232635498046875, 0.2843475341796875, 0.3360595703125, 0.3877716064453125, 0.439483642578125, 0.4911956787109375, 0.54290771484375, 0.5946197509765625, 0.646331787109375, 0.6980438232421875, 0.749755859375, 0.8014678955078125, 0.853179931640625, 0.9048919677734375, 0.95660400390625, 1.0083160400390625, 1.060028076171875, 1.1117401123046875, 1.1634521484375, 1.2151641845703125, 1.266876220703125, 1.3185882568359375, 1.37030029296875, 1.4220123291015625, 1.473724365234375, 1.5254364013671875, 1.5771484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 2.0, 11.0, 11.0, 8.0, 10.0, 8.0, 16.0, 14.0, 19.0, 13.0, 23.0, 18.0, 21.0, 20.0, 29.0, 32.0, 26.0, 38.0, 35.0, 38.0, 44.0, 39.0, 1053.0, 42.0, 48.0, 35.0, 28.0, 31.0, 34.0, 31.0, 27.0, 24.0, 24.0, 23.0, 15.0, 18.0, 12.0, 6.0, 18.0, 22.0, 18.0, 9.0, 7.0, 6.0, 8.0, 1.0, 2.0, 1.0, 4.0], "bins": [-11.2734375, -10.9713134765625, -10.669189453125, -10.3670654296875, -10.06494140625, -9.7628173828125, -9.460693359375, -9.1585693359375, -8.8564453125, -8.5543212890625, -8.252197265625, -7.9500732421875, -7.64794921875, -7.3458251953125, -7.043701171875, -6.7415771484375, -6.439453125, -6.1373291015625, -5.835205078125, -5.5330810546875, -5.23095703125, -4.9288330078125, -4.626708984375, -4.3245849609375, -4.0224609375, -3.7203369140625, -3.418212890625, -3.1160888671875, -2.81396484375, -2.5118408203125, -2.209716796875, -1.9075927734375, -1.60546875, -1.3033447265625, -1.001220703125, -0.6990966796875, -0.39697265625, -0.0948486328125, 0.207275390625, 0.5093994140625, 0.8115234375, 1.1136474609375, 1.415771484375, 1.7178955078125, 2.02001953125, 2.3221435546875, 2.624267578125, 2.9263916015625, 3.228515625, 3.5306396484375, 3.832763671875, 4.1348876953125, 4.43701171875, 4.7391357421875, 5.041259765625, 5.3433837890625, 5.6455078125, 5.9476318359375, 6.249755859375, 6.5518798828125, 6.85400390625, 7.1561279296875, 7.458251953125, 7.7603759765625, 8.0625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 13.0, 27.0, 27.0, 34.0, 54.0, 81.0, 141.0, 220.0, 343.0, 522.0, 837.0, 1266.0, 1989.0, 3107.0, 4716.0, 7361.0, 11002.0, 16892.0, 26878.0, 43223.0, 72961.0, 125473.0, 556828.0, 901353.0, 127222.0, 74001.0, 44220.0, 27248.0, 17078.0, 11029.0, 7285.0, 4732.0, 3177.0, 2074.0, 1339.0, 846.0, 586.0, 334.0, 215.0, 145.0, 72.0, 57.0, 37.0, 35.0, 14.0, 13.0, 9.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.0029296875, -0.9716033935546875, -0.940277099609375, -0.9089508056640625, -0.87762451171875, -0.8462982177734375, -0.814971923828125, -0.7836456298828125, -0.7523193359375, -0.7209930419921875, -0.689666748046875, -0.6583404541015625, -0.62701416015625, -0.5956878662109375, -0.564361572265625, -0.5330352783203125, -0.501708984375, -0.4703826904296875, -0.439056396484375, -0.4077301025390625, -0.37640380859375, -0.3450775146484375, -0.313751220703125, -0.2824249267578125, -0.2510986328125, -0.2197723388671875, -0.188446044921875, -0.1571197509765625, -0.12579345703125, -0.0944671630859375, -0.063140869140625, -0.0318145751953125, -0.00048828125, 0.0308380126953125, 0.062164306640625, 0.0934906005859375, 0.12481689453125, 0.1561431884765625, 0.187469482421875, 0.2187957763671875, 0.2501220703125, 0.2814483642578125, 0.312774658203125, 0.3441009521484375, 0.37542724609375, 0.4067535400390625, 0.438079833984375, 0.4694061279296875, 0.500732421875, 0.5320587158203125, 0.563385009765625, 0.5947113037109375, 0.62603759765625, 0.6573638916015625, 0.688690185546875, 0.7200164794921875, 0.7513427734375, 0.7826690673828125, 0.813995361328125, 0.8453216552734375, 0.87664794921875, 0.9079742431640625, 0.939300537109375, 0.9706268310546875, 1.001953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 7.0, 8.0, 18.0, 20.0, 19.0, 26.0, 32.0, 30.0, 40.0, 55.0, 66.0, 95.0, 104.0, 121.0, 81.0, 52.0, 35.0, 35.0, 33.0, 26.0, 20.0, 15.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04522705078125, -0.043990135192871094, -0.04275321960449219, -0.04151630401611328, -0.040279388427734375, -0.03904247283935547, -0.03780555725097656, -0.036568641662597656, -0.03533172607421875, -0.034094810485839844, -0.03285789489746094, -0.03162097930908203, -0.030384063720703125, -0.02914714813232422, -0.027910232543945312, -0.026673316955566406, -0.0254364013671875, -0.024199485778808594, -0.022962570190429688, -0.02172565460205078, -0.020488739013671875, -0.01925182342529297, -0.018014907836914062, -0.016777992248535156, -0.01554107666015625, -0.014304161071777344, -0.013067245483398438, -0.011830329895019531, -0.010593414306640625, -0.009356498718261719, -0.008119583129882812, -0.006882667541503906, -0.005645751953125, -0.004408836364746094, -0.0031719207763671875, -0.0019350051879882812, -0.000698089599609375, 0.0005388259887695312, 0.0017757415771484375, 0.0030126571655273438, 0.00424957275390625, 0.005486488342285156, 0.0067234039306640625, 0.007960319519042969, 0.009197235107421875, 0.010434150695800781, 0.011671066284179688, 0.012907981872558594, 0.0141448974609375, 0.015381813049316406, 0.016618728637695312, 0.01785564422607422, 0.019092559814453125, 0.02032947540283203, 0.021566390991210938, 0.022803306579589844, 0.02404022216796875, 0.025277137756347656, 0.026514053344726562, 0.02775096893310547, 0.028987884521484375, 0.03022480010986328, 0.03146171569824219, 0.032698631286621094, 0.033935546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 11.0, 11.0, 9.0, 13.0, 15.0, 12.0, 25.0, 30.0, 39.0, 72.0, 97.0, 132.0, 274.0, 647.0, 9911.0, 1032676.0, 3327.0, 549.0, 221.0, 127.0, 90.0, 68.0, 47.0, 41.0, 28.0, 22.0, 14.0, 9.0, 6.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.67181396484375, -0.6463623046875, -0.62091064453125, -0.595458984375, -0.57000732421875, -0.5445556640625, -0.51910400390625, -0.49365234375, -0.46820068359375, -0.4427490234375, -0.41729736328125, -0.391845703125, -0.36639404296875, -0.3409423828125, -0.31549072265625, -0.2900390625, -0.26458740234375, -0.2391357421875, -0.21368408203125, -0.188232421875, -0.16278076171875, -0.1373291015625, -0.11187744140625, -0.08642578125, -0.06097412109375, -0.0355224609375, -0.01007080078125, 0.015380859375, 0.04083251953125, 0.0662841796875, 0.09173583984375, 0.1171875, 0.14263916015625, 0.1680908203125, 0.19354248046875, 0.218994140625, 0.24444580078125, 0.2698974609375, 0.29534912109375, 0.32080078125, 0.34625244140625, 0.3717041015625, 0.39715576171875, 0.422607421875, 0.44805908203125, 0.4735107421875, 0.49896240234375, 0.5244140625, 0.54986572265625, 0.5753173828125, 0.60076904296875, 0.626220703125, 0.65167236328125, 0.6771240234375, 0.70257568359375, 0.72802734375, 0.75347900390625, 0.7789306640625, 0.80438232421875, 0.829833984375, 0.85528564453125, 0.8807373046875, 0.90618896484375, 0.931640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 27.0, 919.0, 65.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15368282794952393, -0.1356232464313507, -0.11756366491317749, -0.09950407594442368, -0.08144449442625046, -0.06338491290807724, -0.045325323939323425, -0.027265742421150208, -0.00920616090297699, 0.008853422477841377, 0.026913005858659744, 0.04497259110212326, 0.06303217262029648, 0.0810917541384697, 0.09915134310722351, 0.11721092462539673, 0.13527050614356995, 0.15333008766174316, 0.17138966917991638, 0.1894492506980896, 0.20750883221626282, 0.22556841373443604, 0.24362801015377045, 0.26168757677078247, 0.2797471880912781, 0.2978067696094513, 0.3158663511276245, 0.33392593264579773, 0.35198551416397095, 0.37004509568214417, 0.3881046772003174, 0.406164288520813, 0.4242238402366638, 0.44228342175483704, 0.46034300327301025, 0.47840258479118347, 0.4964621663093567, 0.5145217776298523, 0.5325813293457031, 0.5506409406661987, 0.5687004923820496, 0.5867601037025452, 0.604819655418396, 0.6228792667388916, 0.6409388184547424, 0.658998429775238, 0.6770579814910889, 0.6951175928115845, 0.7131772041320801, 0.7312368154525757, 0.7492963671684265, 0.7673559784889221, 0.785415530204773, 0.8034751415252686, 0.8215346932411194, 0.839594304561615, 0.8576538562774658, 0.8757134675979614, 0.8937730193138123, 0.9118326306343079, 0.9298921823501587, 0.9479517936706543, 0.9660113453865051, 0.9840709567070007, 1.0021305084228516]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 10.0, 16.0, 13.0, 15.0, 15.0, 23.0, 23.0, 22.0, 45.0, 37.0, 34.0, 40.0, 37.0, 46.0, 49.0, 45.0, 45.0, 46.0, 51.0, 30.0, 40.0, 31.0, 52.0, 31.0, 31.0, 29.0, 25.0, 22.0, 18.0, 15.0, 16.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05918377637863159, -0.05743154510855675, -0.0556793138384819, -0.05392708256840706, -0.052174851298332214, -0.05042262002825737, -0.048670388758182526, -0.04691815748810768, -0.04516592621803284, -0.04341369494795799, -0.04166146367788315, -0.039909232407808304, -0.03815700113773346, -0.036404769867658615, -0.03465253859758377, -0.032900307327508926, -0.031148076057434082, -0.029395844787359238, -0.027643613517284393, -0.02589138224720955, -0.024139150977134705, -0.02238691970705986, -0.020634688436985016, -0.01888245716691017, -0.017130225896835327, -0.015377994626760483, -0.013625763356685638, -0.011873532086610794, -0.01012130081653595, -0.008369069546461105, -0.006616838276386261, -0.004864607006311417, -0.0031123757362365723, -0.001360144466161728, 0.00039208680391311646, 0.002144318073987961, 0.003896549344062805, 0.0056487806141376495, 0.007401011884212494, 0.009153243154287338, 0.010905474424362183, 0.012657705694437027, 0.014409936964511871, 0.016162168234586716, 0.01791439950466156, 0.019666630774736404, 0.02141886204481125, 0.023171093314886093, 0.024923324584960938, 0.026675555855035782, 0.028427787125110626, 0.03018001839518547, 0.031932249665260315, 0.03368448093533516, 0.035436712205410004, 0.03718894347548485, 0.03894117474555969, 0.04069340601563454, 0.04244563728570938, 0.044197868555784225, 0.04595009982585907, 0.047702331095933914, 0.04945456236600876, 0.0512067936360836, 0.05295902490615845]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 4.0, 11.0, 6.0, 15.0, 21.0, 16.0, 25.0, 28.0, 38.0, 34.0, 36.0, 39.0, 41.0, 56.0, 46.0, 48.0, 40.0, 56.0, 37.0, 35.0, 36.0, 29.0, 30.0, 33.0, 31.0, 33.0, 20.0, 24.0, 25.0, 18.0, 17.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.0, -16.428955078125, -15.85791015625, -15.286865234375, -14.7158203125, -14.144775390625, -13.57373046875, -13.002685546875, -12.431640625, -11.860595703125, -11.28955078125, -10.718505859375, -10.1474609375, -9.576416015625, -9.00537109375, -8.434326171875, -7.86328125, -7.292236328125, -6.72119140625, -6.150146484375, -5.5791015625, -5.008056640625, -4.43701171875, -3.865966796875, -3.294921875, -2.723876953125, -2.15283203125, -1.581787109375, -1.0107421875, -0.439697265625, 0.13134765625, 0.702392578125, 1.2734375, 1.844482421875, 2.41552734375, 2.986572265625, 3.5576171875, 4.128662109375, 4.69970703125, 5.270751953125, 5.841796875, 6.412841796875, 6.98388671875, 7.554931640625, 8.1259765625, 8.697021484375, 9.26806640625, 9.839111328125, 10.41015625, 10.981201171875, 11.55224609375, 12.123291015625, 12.6943359375, 13.265380859375, 13.83642578125, 14.407470703125, 14.978515625, 15.549560546875, 16.12060546875, 16.691650390625, 17.2626953125, 17.833740234375, 18.40478515625, 18.975830078125, 19.546875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 11.0, 15.0, 32.0, 35.0, 44.0, 70.0, 62.0, 95.0, 148.0, 251.0, 395.0, 589.0, 953.0, 1624.0, 2853.0, 5709.0, 14598.0, 69026.0, 634492.0, 264938.0, 33080.0, 9590.0, 4166.0, 2164.0, 1310.0, 762.0, 508.0, 284.0, 204.0, 140.0, 113.0, 72.0, 69.0, 35.0, 23.0, 20.0, 17.0, 9.0, 10.0, 10.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.375, -22.563232421875, -21.75146484375, -20.939697265625, -20.1279296875, -19.316162109375, -18.50439453125, -17.692626953125, -16.880859375, -16.069091796875, -15.25732421875, -14.445556640625, -13.6337890625, -12.822021484375, -12.01025390625, -11.198486328125, -10.38671875, -9.574951171875, -8.76318359375, -7.951416015625, -7.1396484375, -6.327880859375, -5.51611328125, -4.704345703125, -3.892578125, -3.080810546875, -2.26904296875, -1.457275390625, -0.6455078125, 0.166259765625, 0.97802734375, 1.789794921875, 2.6015625, 3.413330078125, 4.22509765625, 5.036865234375, 5.8486328125, 6.660400390625, 7.47216796875, 8.283935546875, 9.095703125, 9.907470703125, 10.71923828125, 11.531005859375, 12.3427734375, 13.154541015625, 13.96630859375, 14.778076171875, 15.58984375, 16.401611328125, 17.21337890625, 18.025146484375, 18.8369140625, 19.648681640625, 20.46044921875, 21.272216796875, 22.083984375, 22.895751953125, 23.70751953125, 24.519287109375, 25.3310546875, 26.142822265625, 26.95458984375, 27.766357421875, 28.578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 13.0, 8.0, 16.0, 20.0, 25.0, 26.0, 18.0, 26.0, 44.0, 38.0, 41.0, 66.0, 70.0, 174.0, 1665.0, 231.0, 94.0, 62.0, 54.0, 36.0, 52.0, 37.0, 37.0, 28.0, 24.0, 24.0, 15.0, 17.0, 9.0, 11.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.625, -42.24560546875, -40.8662109375, -39.48681640625, -38.107421875, -36.72802734375, -35.3486328125, -33.96923828125, -32.58984375, -31.21044921875, -29.8310546875, -28.45166015625, -27.072265625, -25.69287109375, -24.3134765625, -22.93408203125, -21.5546875, -20.17529296875, -18.7958984375, -17.41650390625, -16.037109375, -14.65771484375, -13.2783203125, -11.89892578125, -10.51953125, -9.14013671875, -7.7607421875, -6.38134765625, -5.001953125, -3.62255859375, -2.2431640625, -0.86376953125, 0.515625, 1.89501953125, 3.2744140625, 4.65380859375, 6.033203125, 7.41259765625, 8.7919921875, 10.17138671875, 11.55078125, 12.93017578125, 14.3095703125, 15.68896484375, 17.068359375, 18.44775390625, 19.8271484375, 21.20654296875, 22.5859375, 23.96533203125, 25.3447265625, 26.72412109375, 28.103515625, 29.48291015625, 30.8623046875, 32.24169921875, 33.62109375, 35.00048828125, 36.3798828125, 37.75927734375, 39.138671875, 40.51806640625, 41.8974609375, 43.27685546875, 44.65625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 9.0, 17.0, 13.0, 20.0, 32.0, 51.0, 85.0, 114.0, 191.0, 334.0, 873.0, 4387.0, 146614.0, 2975866.0, 14228.0, 1722.0, 467.0, 222.0, 141.0, 95.0, 61.0, 53.0, 34.0, 22.0, 17.0, 11.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.1943359375, -63.763671875, -61.3330078125, -58.90234375, -56.4716796875, -54.041015625, -51.6103515625, -49.1796875, -46.7490234375, -44.318359375, -41.8876953125, -39.45703125, -37.0263671875, -34.595703125, -32.1650390625, -29.734375, -27.3037109375, -24.873046875, -22.4423828125, -20.01171875, -17.5810546875, -15.150390625, -12.7197265625, -10.2890625, -7.8583984375, -5.427734375, -2.9970703125, -0.56640625, 1.8642578125, 4.294921875, 6.7255859375, 9.15625, 11.5869140625, 14.017578125, 16.4482421875, 18.87890625, 21.3095703125, 23.740234375, 26.1708984375, 28.6015625, 31.0322265625, 33.462890625, 35.8935546875, 38.32421875, 40.7548828125, 43.185546875, 45.6162109375, 48.046875, 50.4775390625, 52.908203125, 55.3388671875, 57.76953125, 60.2001953125, 62.630859375, 65.0615234375, 67.4921875, 69.9228515625, 72.353515625, 74.7841796875, 77.21484375, 79.6455078125, 82.076171875, 84.5068359375, 86.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 338.0, 677.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.522544860839844, -45.73832702636719, -30.95410919189453, -16.169891357421875, -1.3856735229492188, 13.398544311523438, 28.182762145996094, 42.96697998046875, 57.751197814941406, 72.53541564941406, 87.31963348388672, 102.10385131835938, 116.88806915283203, 131.6722869873047, 146.45651245117188, 161.24072265625, 176.02493286132812, 190.80914306640625, 205.59336853027344, 220.37759399414062, 235.16180419921875, 249.94601440429688, 264.730224609375, 279.51446533203125, 294.2986755371094, 309.0828857421875, 323.86712646484375, 338.6513366699219, 353.435546875, 368.2197570800781, 383.00396728515625, 397.7882080078125, 412.57244873046875, 427.3566589355469, 442.140869140625, 456.92510986328125, 471.7093200683594, 486.4935302734375, 501.27777099609375, 516.0619506835938, 530.84619140625, 545.6304321289062, 560.4146118164062, 575.1988525390625, 589.9830322265625, 604.7672729492188, 619.551513671875, 634.335693359375, 649.1199340820312, 663.9041748046875, 678.6883544921875, 693.4725952148438, 708.2568359375, 723.041015625, 737.8252563476562, 752.6094360351562, 767.3936767578125, 782.1779174804688, 796.9620971679688, 811.746337890625, 826.530517578125, 841.3147583007812, 856.0989990234375, 870.8831787109375, 885.6674194335938]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 12.0, 5.0, 11.0, 15.0, 12.0, 26.0, 21.0, 17.0, 31.0, 31.0, 35.0, 31.0, 41.0, 37.0, 44.0, 41.0, 32.0, 43.0, 53.0, 43.0, 43.0, 35.0, 29.0, 34.0, 33.0, 38.0, 24.0, 32.0, 23.0, 20.0, 22.0, 14.0, 12.0, 11.0, 7.0, 6.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-98.87551879882812, -96.03118133544922, -93.18684387207031, -90.34249877929688, -87.49816131591797, -84.65382385253906, -81.80948638916016, -78.96514892578125, -76.12080383300781, -73.2764663696289, -70.43212890625, -67.58778381347656, -64.74344635009766, -61.89910888671875, -59.054771423339844, -56.21043395996094, -53.36609649658203, -50.521759033203125, -47.67741775512695, -44.83308029174805, -41.988739013671875, -39.14440155029297, -36.30006408691406, -33.455726623535156, -30.611385345458984, -27.767045974731445, -24.922706604003906, -22.078369140625, -19.23402976989746, -16.389690399169922, -13.545352935791016, -10.701013565063477, -7.8566741943359375, -5.012335300445557, -2.167996406555176, 0.6763420104980469, 3.520681381225586, 6.365020751953125, 9.209358215332031, 12.05369758605957, 14.89803695678711, 17.74237632751465, 20.586715698242188, 23.431053161621094, 26.275392532348633, 29.119731903076172, 31.964069366455078, 34.80841064453125, 37.652748107910156, 40.49708557128906, 43.341426849365234, 46.18576431274414, 49.03010559082031, 51.87444305419922, 54.718780517578125, 57.56311798095703, 60.4074592590332, 63.25179672241211, 66.09613800048828, 68.94047546386719, 71.7848129272461, 74.629150390625, 77.47349548339844, 80.31783294677734, 83.16217041015625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 2.0, 12.0, 8.0, 14.0, 16.0, 14.0, 17.0, 22.0, 40.0, 28.0, 37.0, 30.0, 41.0, 48.0, 39.0, 42.0, 49.0, 34.0, 47.0, 36.0, 49.0, 41.0, 38.0, 21.0, 41.0, 32.0, 15.0, 33.0, 22.0, 19.0, 15.0, 19.0, 15.0, 12.0, 8.0, 10.0, 7.0, 2.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.5, -15.9482421875, -15.396484375, -14.8447265625, -14.29296875, -13.7412109375, -13.189453125, -12.6376953125, -12.0859375, -11.5341796875, -10.982421875, -10.4306640625, -9.87890625, -9.3271484375, -8.775390625, -8.2236328125, -7.671875, -7.1201171875, -6.568359375, -6.0166015625, -5.46484375, -4.9130859375, -4.361328125, -3.8095703125, -3.2578125, -2.7060546875, -2.154296875, -1.6025390625, -1.05078125, -0.4990234375, 0.052734375, 0.6044921875, 1.15625, 1.7080078125, 2.259765625, 2.8115234375, 3.36328125, 3.9150390625, 4.466796875, 5.0185546875, 5.5703125, 6.1220703125, 6.673828125, 7.2255859375, 7.77734375, 8.3291015625, 8.880859375, 9.4326171875, 9.984375, 10.5361328125, 11.087890625, 11.6396484375, 12.19140625, 12.7431640625, 13.294921875, 13.8466796875, 14.3984375, 14.9501953125, 15.501953125, 16.0537109375, 16.60546875, 17.1572265625, 17.708984375, 18.2607421875, 18.8125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 8.0, 7.0, 18.0, 21.0, 45.0, 44.0, 73.0, 105.0, 160.0, 209.0, 356.0, 469.0, 679.0, 1018.0, 1522.0, 2263.0, 3494.0, 6048.0, 12584.0, 60364.0, 1718130.0, 2284184.0, 72465.0, 12715.0, 6125.0, 3715.0, 2447.0, 1598.0, 1102.0, 729.0, 497.0, 337.0, 221.0, 157.0, 103.0, 73.0, 59.0, 39.0, 21.0, 23.0, 14.0, 10.0, 11.0, 3.0, 0.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.75, -42.29345703125, -40.8369140625, -39.38037109375, -37.923828125, -36.46728515625, -35.0107421875, -33.55419921875, -32.09765625, -30.64111328125, -29.1845703125, -27.72802734375, -26.271484375, -24.81494140625, -23.3583984375, -21.90185546875, -20.4453125, -18.98876953125, -17.5322265625, -16.07568359375, -14.619140625, -13.16259765625, -11.7060546875, -10.24951171875, -8.79296875, -7.33642578125, -5.8798828125, -4.42333984375, -2.966796875, -1.51025390625, -0.0537109375, 1.40283203125, 2.859375, 4.31591796875, 5.7724609375, 7.22900390625, 8.685546875, 10.14208984375, 11.5986328125, 13.05517578125, 14.51171875, 15.96826171875, 17.4248046875, 18.88134765625, 20.337890625, 21.79443359375, 23.2509765625, 24.70751953125, 26.1640625, 27.62060546875, 29.0771484375, 30.53369140625, 31.990234375, 33.44677734375, 34.9033203125, 36.35986328125, 37.81640625, 39.27294921875, 40.7294921875, 42.18603515625, 43.642578125, 45.09912109375, 46.5556640625, 48.01220703125, 49.46875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 9.0, 13.0, 24.0, 24.0, 48.0, 77.0, 140.0, 330.0, 861.0, 1323.0, 645.0, 272.0, 98.0, 49.0, 38.0, 26.0, 13.0, 16.0, 9.0, 10.0, 4.0, 4.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.15625, -35.8896484375, -34.623046875, -33.3564453125, -32.08984375, -30.8232421875, -29.556640625, -28.2900390625, -27.0234375, -25.7568359375, -24.490234375, -23.2236328125, -21.95703125, -20.6904296875, -19.423828125, -18.1572265625, -16.890625, -15.6240234375, -14.357421875, -13.0908203125, -11.82421875, -10.5576171875, -9.291015625, -8.0244140625, -6.7578125, -5.4912109375, -4.224609375, -2.9580078125, -1.69140625, -0.4248046875, 0.841796875, 2.1083984375, 3.375, 4.6416015625, 5.908203125, 7.1748046875, 8.44140625, 9.7080078125, 10.974609375, 12.2412109375, 13.5078125, 14.7744140625, 16.041015625, 17.3076171875, 18.57421875, 19.8408203125, 21.107421875, 22.3740234375, 23.640625, 24.9072265625, 26.173828125, 27.4404296875, 28.70703125, 29.9736328125, 31.240234375, 32.5068359375, 33.7734375, 35.0400390625, 36.306640625, 37.5732421875, 38.83984375, 40.1064453125, 41.373046875, 42.6396484375, 43.90625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 14.0, 24.0, 27.0, 33.0, 53.0, 58.0, 95.0, 143.0, 209.0, 319.0, 506.0, 823.0, 1411.0, 2520.0, 4824.0, 9421.0, 21489.0, 66133.0, 1215697.0, 2733632.0, 88540.0, 25078.0, 10891.0, 5312.0, 2731.0, 1638.0, 935.0, 594.0, 388.0, 223.0, 150.0, 106.0, 62.0, 46.0, 40.0, 32.0, 18.0, 12.0, 13.0, 9.0, 8.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-54.34375, -52.794921875, -51.24609375, -49.697265625, -48.1484375, -46.599609375, -45.05078125, -43.501953125, -41.953125, -40.404296875, -38.85546875, -37.306640625, -35.7578125, -34.208984375, -32.66015625, -31.111328125, -29.5625, -28.013671875, -26.46484375, -24.916015625, -23.3671875, -21.818359375, -20.26953125, -18.720703125, -17.171875, -15.623046875, -14.07421875, -12.525390625, -10.9765625, -9.427734375, -7.87890625, -6.330078125, -4.78125, -3.232421875, -1.68359375, -0.134765625, 1.4140625, 2.962890625, 4.51171875, 6.060546875, 7.609375, 9.158203125, 10.70703125, 12.255859375, 13.8046875, 15.353515625, 16.90234375, 18.451171875, 20.0, 21.548828125, 23.09765625, 24.646484375, 26.1953125, 27.744140625, 29.29296875, 30.841796875, 32.390625, 33.939453125, 35.48828125, 37.037109375, 38.5859375, 40.134765625, 41.68359375, 43.232421875, 44.78125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 16.0, 32.0, 65.0, 162.0, 302.0, 212.0, 106.0, 45.0, 21.0, 17.0, 8.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-308.9152526855469, -302.4376525878906, -295.9600830078125, -289.48248291015625, -283.0048828125, -276.52728271484375, -270.0497131347656, -263.5721130371094, -257.0945129394531, -250.61692810058594, -244.1393280029297, -237.6617431640625, -231.18414306640625, -224.70655822753906, -218.2289581298828, -211.75137329101562, -205.27377319335938, -198.7961883544922, -192.31858825683594, -185.84100341796875, -179.3634033203125, -172.8858184814453, -166.40821838378906, -159.93063354492188, -153.4530487060547, -146.9754638671875, -140.49786376953125, -134.02027893066406, -127.54267883300781, -121.06509399414062, -114.58749389648438, -108.10990905761719, -101.63230895996094, -95.15471649169922, -88.6771240234375, -82.19953155517578, -75.72193908691406, -69.24435424804688, -62.76675796508789, -56.28916549682617, -49.81157302856445, -43.333980560302734, -36.856388092041016, -30.37879753112793, -23.90120506286621, -17.423614501953125, -10.946022033691406, -4.4684295654296875, 2.0091629028320312, 8.48675537109375, 14.964346885681152, 21.441938400268555, 27.919530868530273, 34.39712142944336, 40.87471389770508, 47.3523063659668, 53.829898834228516, 60.307491302490234, 66.78507995605469, 73.2626724243164, 79.74026489257812, 86.21785736083984, 92.69544982910156, 99.17304229736328, 105.650634765625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 9.0, 10.0, 12.0, 6.0, 19.0, 22.0, 18.0, 26.0, 37.0, 17.0, 38.0, 36.0, 28.0, 39.0, 46.0, 41.0, 47.0, 44.0, 46.0, 40.0, 53.0, 36.0, 42.0, 44.0, 35.0, 24.0, 17.0, 33.0, 26.0, 14.0, 11.0, 15.0, 10.0, 11.0, 11.0, 5.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.68189239501953, -84.02593994140625, -81.36998748779297, -78.71403503417969, -76.05807495117188, -73.4021224975586, -70.74617004394531, -68.09021759033203, -65.43426513671875, -62.77831268310547, -60.12236022949219, -57.46640396118164, -54.81045150756836, -52.15449905395508, -49.49854278564453, -46.84259033203125, -44.18663787841797, -41.53068542480469, -38.874732971191406, -36.21877670288086, -33.56282424926758, -30.906871795654297, -28.250917434692383, -25.59496307373047, -22.939010620117188, -20.283058166503906, -17.627103805541992, -14.971150398254395, -12.315196990966797, -9.6592435836792, -7.003290176391602, -4.3473358154296875, -1.6913909912109375, 0.9645624160766602, 3.620515823364258, 6.2764692306518555, 8.932422637939453, 11.58837604522705, 14.244329452514648, 16.900283813476562, 19.556236267089844, 22.212188720703125, 24.86814308166504, 27.524097442626953, 30.180049896240234, 32.836002349853516, 35.49195861816406, 38.147911071777344, 40.803863525390625, 43.459815979003906, 46.11576843261719, 48.771724700927734, 51.427677154541016, 54.0836296081543, 56.739585876464844, 59.395538330078125, 62.051490783691406, 64.70744323730469, 67.36339569091797, 70.01934814453125, 72.67530822753906, 75.33126068115234, 77.98721313476562, 80.6431655883789, 83.29911804199219]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 7.0, 6.0, 13.0, 17.0, 27.0, 16.0, 17.0, 27.0, 20.0, 30.0, 41.0, 51.0, 39.0, 36.0, 48.0, 48.0, 50.0, 42.0, 52.0, 46.0, 41.0, 45.0, 37.0, 41.0, 22.0, 29.0, 20.0, 31.0, 15.0, 20.0, 12.0, 15.0, 8.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.390625, -18.769287109375, -18.14794921875, -17.526611328125, -16.9052734375, -16.283935546875, -15.66259765625, -15.041259765625, -14.419921875, -13.798583984375, -13.17724609375, -12.555908203125, -11.9345703125, -11.313232421875, -10.69189453125, -10.070556640625, -9.44921875, -8.827880859375, -8.20654296875, -7.585205078125, -6.9638671875, -6.342529296875, -5.72119140625, -5.099853515625, -4.478515625, -3.857177734375, -3.23583984375, -2.614501953125, -1.9931640625, -1.371826171875, -0.75048828125, -0.129150390625, 0.4921875, 1.113525390625, 1.73486328125, 2.356201171875, 2.9775390625, 3.598876953125, 4.22021484375, 4.841552734375, 5.462890625, 6.084228515625, 6.70556640625, 7.326904296875, 7.9482421875, 8.569580078125, 9.19091796875, 9.812255859375, 10.43359375, 11.054931640625, 11.67626953125, 12.297607421875, 12.9189453125, 13.540283203125, 14.16162109375, 14.782958984375, 15.404296875, 16.025634765625, 16.64697265625, 17.268310546875, 17.8896484375, 18.510986328125, 19.13232421875, 19.753662109375, 20.375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 19.0, 24.0, 25.0, 32.0, 38.0, 60.0, 92.0, 128.0, 196.0, 286.0, 425.0, 646.0, 943.0, 1330.0, 1939.0, 2709.0, 4142.0, 6207.0, 9335.0, 14084.0, 22013.0, 34039.0, 55144.0, 93451.0, 157620.0, 215941.0, 166140.0, 98965.0, 58707.0, 36181.0, 23097.0, 14780.0, 9719.0, 6398.0, 4306.0, 2956.0, 2022.0, 1400.0, 965.0, 631.0, 408.0, 320.0, 227.0, 153.0, 109.0, 61.0, 41.0, 35.0, 16.0, 11.0, 12.0, 11.0, 5.0, 7.0, 6.0], "bins": [-1.5771484375, -1.5315093994140625, -1.485870361328125, -1.4402313232421875, -1.39459228515625, -1.3489532470703125, -1.303314208984375, -1.2576751708984375, -1.2120361328125, -1.1663970947265625, -1.120758056640625, -1.0751190185546875, -1.02947998046875, -0.9838409423828125, -0.938201904296875, -0.8925628662109375, -0.846923828125, -0.8012847900390625, -0.755645751953125, -0.7100067138671875, -0.66436767578125, -0.6187286376953125, -0.573089599609375, -0.5274505615234375, -0.4818115234375, -0.4361724853515625, -0.390533447265625, -0.3448944091796875, -0.29925537109375, -0.2536163330078125, -0.207977294921875, -0.1623382568359375, -0.11669921875, -0.0710601806640625, -0.025421142578125, 0.0202178955078125, 0.06585693359375, 0.1114959716796875, 0.157135009765625, 0.2027740478515625, 0.2484130859375, 0.2940521240234375, 0.339691162109375, 0.3853302001953125, 0.43096923828125, 0.4766082763671875, 0.522247314453125, 0.5678863525390625, 0.613525390625, 0.6591644287109375, 0.704803466796875, 0.7504425048828125, 0.79608154296875, 0.8417205810546875, 0.887359619140625, 0.9329986572265625, 0.9786376953125, 1.0242767333984375, 1.069915771484375, 1.1155548095703125, 1.16119384765625, 1.2068328857421875, 1.252471923828125, 1.2981109619140625, 1.34375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 7.0, 6.0, 4.0, 6.0, 2.0, 10.0, 15.0, 11.0, 18.0, 19.0, 21.0, 24.0, 33.0, 36.0, 30.0, 26.0, 42.0, 48.0, 27.0, 55.0, 36.0, 1065.0, 35.0, 41.0, 38.0, 43.0, 37.0, 38.0, 29.0, 37.0, 23.0, 28.0, 25.0, 21.0, 19.0, 12.0, 7.0, 15.0, 6.0, 5.0, 6.0, 5.0, 8.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.78125, -11.4287109375, -11.076171875, -10.7236328125, -10.37109375, -10.0185546875, -9.666015625, -9.3134765625, -8.9609375, -8.6083984375, -8.255859375, -7.9033203125, -7.55078125, -7.1982421875, -6.845703125, -6.4931640625, -6.140625, -5.7880859375, -5.435546875, -5.0830078125, -4.73046875, -4.3779296875, -4.025390625, -3.6728515625, -3.3203125, -2.9677734375, -2.615234375, -2.2626953125, -1.91015625, -1.5576171875, -1.205078125, -0.8525390625, -0.5, -0.1474609375, 0.205078125, 0.5576171875, 0.91015625, 1.2626953125, 1.615234375, 1.9677734375, 2.3203125, 2.6728515625, 3.025390625, 3.3779296875, 3.73046875, 4.0830078125, 4.435546875, 4.7880859375, 5.140625, 5.4931640625, 5.845703125, 6.1982421875, 6.55078125, 6.9033203125, 7.255859375, 7.6083984375, 7.9609375, 8.3134765625, 8.666015625, 9.0185546875, 9.37109375, 9.7236328125, 10.076171875, 10.4287109375, 10.78125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 18.0, 27.0, 32.0, 52.0, 77.0, 114.0, 178.0, 231.0, 369.0, 581.0, 794.0, 1126.0, 1688.0, 2558.0, 3772.0, 5627.0, 8519.0, 13480.0, 21531.0, 35566.0, 59306.0, 101973.0, 173945.0, 1269289.0, 159732.0, 93371.0, 54483.0, 32078.0, 19914.0, 12514.0, 7935.0, 5312.0, 3533.0, 2400.0, 1531.0, 1113.0, 770.0, 484.0, 359.0, 252.0, 161.0, 110.0, 87.0, 46.0, 35.0, 18.0, 3.0, 7.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-1.05078125, -1.017333984375, -0.98388671875, -0.950439453125, -0.9169921875, -0.883544921875, -0.85009765625, -0.816650390625, -0.783203125, -0.749755859375, -0.71630859375, -0.682861328125, -0.6494140625, -0.615966796875, -0.58251953125, -0.549072265625, -0.515625, -0.482177734375, -0.44873046875, -0.415283203125, -0.3818359375, -0.348388671875, -0.31494140625, -0.281494140625, -0.248046875, -0.214599609375, -0.18115234375, -0.147705078125, -0.1142578125, -0.080810546875, -0.04736328125, -0.013916015625, 0.01953125, 0.052978515625, 0.08642578125, 0.119873046875, 0.1533203125, 0.186767578125, 0.22021484375, 0.253662109375, 0.287109375, 0.320556640625, 0.35400390625, 0.387451171875, 0.4208984375, 0.454345703125, 0.48779296875, 0.521240234375, 0.5546875, 0.588134765625, 0.62158203125, 0.655029296875, 0.6884765625, 0.721923828125, 0.75537109375, 0.788818359375, 0.822265625, 0.855712890625, 0.88916015625, 0.922607421875, 0.9560546875, 0.989501953125, 1.02294921875, 1.056396484375, 1.08984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 11.0, 7.0, 10.0, 14.0, 32.0, 29.0, 38.0, 71.0, 73.0, 97.0, 122.0, 112.0, 86.0, 76.0, 49.0, 26.0, 17.0, 18.0, 10.0, 9.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0310516357421875, -0.030129194259643555, -0.02920675277709961, -0.028284311294555664, -0.02736186981201172, -0.026439428329467773, -0.025516986846923828, -0.024594545364379883, -0.023672103881835938, -0.022749662399291992, -0.021827220916748047, -0.0209047794342041, -0.019982337951660156, -0.01905989646911621, -0.018137454986572266, -0.01721501350402832, -0.016292572021484375, -0.01537013053894043, -0.014447689056396484, -0.013525247573852539, -0.012602806091308594, -0.011680364608764648, -0.010757923126220703, -0.009835481643676758, -0.008913040161132812, -0.007990598678588867, -0.007068157196044922, -0.0061457157135009766, -0.005223274230957031, -0.004300832748413086, -0.0033783912658691406, -0.0024559497833251953, -0.00153350830078125, -0.0006110668182373047, 0.0003113746643066406, 0.001233816146850586, 0.0021562576293945312, 0.0030786991119384766, 0.004001140594482422, 0.004923582077026367, 0.0058460235595703125, 0.006768465042114258, 0.007690906524658203, 0.008613348007202148, 0.009535789489746094, 0.010458230972290039, 0.011380672454833984, 0.01230311393737793, 0.013225555419921875, 0.01414799690246582, 0.015070438385009766, 0.01599287986755371, 0.016915321350097656, 0.0178377628326416, 0.018760204315185547, 0.019682645797729492, 0.020605087280273438, 0.021527528762817383, 0.022449970245361328, 0.023372411727905273, 0.02429485321044922, 0.025217294692993164, 0.02613973617553711, 0.027062177658081055, 0.027984619140625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 5.0, 11.0, 6.0, 12.0, 15.0, 27.0, 16.0, 31.0, 48.0, 49.0, 67.0, 92.0, 189.0, 368.0, 1567.0, 42559.0, 988117.0, 13636.0, 893.0, 265.0, 152.0, 109.0, 78.0, 51.0, 38.0, 28.0, 20.0, 22.0, 9.0, 5.0, 10.0, 6.0, 10.0, 2.0, 8.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5244140625, -0.5059280395507812, -0.4874420166015625, -0.46895599365234375, -0.450469970703125, -0.43198394775390625, -0.4134979248046875, -0.39501190185546875, -0.37652587890625, -0.35803985595703125, -0.3395538330078125, -0.32106781005859375, -0.302581787109375, -0.28409576416015625, -0.2656097412109375, -0.24712371826171875, -0.2286376953125, -0.21015167236328125, -0.1916656494140625, -0.17317962646484375, -0.154693603515625, -0.13620758056640625, -0.1177215576171875, -0.09923553466796875, -0.08074951171875, -0.06226348876953125, -0.0437774658203125, -0.02529144287109375, -0.006805419921875, 0.01168060302734375, 0.0301666259765625, 0.04865264892578125, 0.067138671875, 0.08562469482421875, 0.1041107177734375, 0.12259674072265625, 0.141082763671875, 0.15956878662109375, 0.1780548095703125, 0.19654083251953125, 0.21502685546875, 0.23351287841796875, 0.2519989013671875, 0.27048492431640625, 0.288970947265625, 0.30745697021484375, 0.3259429931640625, 0.34442901611328125, 0.3629150390625, 0.38140106201171875, 0.3998870849609375, 0.41837310791015625, 0.436859130859375, 0.45534515380859375, 0.4738311767578125, 0.49231719970703125, 0.51080322265625, 0.5292892456054688, 0.5477752685546875, 0.5662612915039062, 0.584747314453125, 0.6032333374023438, 0.6217193603515625, 0.6402053833007812, 0.65869140625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 19.0, 82.0, 429.0, 376.0, 76.0, 18.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09516280889511108, -0.08785489201545715, -0.08054696768522263, -0.0732390433549881, -0.06593112647533417, -0.05862320587038994, -0.05131528526544571, -0.04400736466050148, -0.03669944405555725, -0.029391523450613022, -0.022083602845668793, -0.014775682240724564, -0.0074677616357803345, -0.00015984103083610535, 0.007148079574108124, 0.014456000179052353, 0.021763920783996582, 0.02907184138894081, 0.03637976199388504, 0.04368768259882927, 0.0509956032037735, 0.05830352380871773, 0.06561144441366196, 0.07291936874389648, 0.08022728562355042, 0.08753520250320435, 0.09484312683343887, 0.1021510511636734, 0.10945896804332733, 0.11676688492298126, 0.12407480925321579, 0.13138273358345032, 0.13869065046310425, 0.14599856734275818, 0.1533064842224121, 0.16061441600322723, 0.16792233288288116, 0.1752302497625351, 0.18253818154335022, 0.18984609842300415, 0.19715401530265808, 0.204461932182312, 0.21176984906196594, 0.21907778084278107, 0.226385697722435, 0.23369361460208893, 0.24100154638290405, 0.24830946326255798, 0.2556173801422119, 0.26292529702186584, 0.2702332139015198, 0.2775411307811737, 0.28484904766082764, 0.29215699434280396, 0.2994649112224579, 0.3067728281021118, 0.31408074498176575, 0.3213886618614197, 0.3286965787410736, 0.33600449562072754, 0.34331244230270386, 0.3506203591823578, 0.3579282760620117, 0.36523619294166565, 0.3725441098213196]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 13.0, 17.0, 16.0, 14.0, 18.0, 18.0, 24.0, 22.0, 30.0, 28.0, 28.0, 35.0, 38.0, 39.0, 42.0, 41.0, 36.0, 54.0, 38.0, 44.0, 35.0, 38.0, 30.0, 25.0, 35.0, 32.0, 32.0, 24.0, 28.0, 23.0, 18.0, 14.0, 12.0, 13.0, 9.0, 5.0, 4.0, 8.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023150980472564697, -0.02247793599963188, -0.021804893389344215, -0.02113185077905655, -0.020458806306123734, -0.019785761833190918, -0.01911271922290325, -0.018439676612615585, -0.01776663213968277, -0.017093587666749954, -0.016420545056462288, -0.01574750244617462, -0.015074457973241806, -0.014401414431631565, -0.013728370890021324, -0.013055327348411083, -0.012382283806800842, -0.011709240265190601, -0.01103619672358036, -0.01036315318197012, -0.009690109640359879, -0.009017066098749638, -0.008344022557139397, -0.007670979015529156, -0.006997935473918915, -0.006324891932308674, -0.005651848390698433, -0.004978804849088192, -0.004305761307477951, -0.00363271776586771, -0.002959674224257469, -0.0022866306826472282, -0.0016135871410369873, -0.0009405435994267464, -0.00026750005781650543, 0.0004055434837937355, 0.0010785870254039764, 0.0017516305670142174, 0.0024246741086244583, 0.0030977176502346992, 0.00377076119184494, 0.004443804733455181, 0.005116848275065422, 0.005789891816675663, 0.006462935358285904, 0.007135978899896145, 0.007809022441506386, 0.008482065983116627, 0.009155109524726868, 0.009828153066337109, 0.01050119660794735, 0.01117424014955759, 0.011847283691167831, 0.012520327232778072, 0.013193370774388313, 0.013866414315998554, 0.014539457857608795, 0.015212501399219036, 0.015885544940829277, 0.016558587551116943, 0.01723163202404976, 0.017904676496982574, 0.01857771910727024, 0.019250761717557907, 0.019923806190490723]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 9.0, 6.0, 13.0, 16.0, 27.0, 17.0, 17.0, 27.0, 20.0, 30.0, 40.0, 51.0, 39.0, 37.0, 47.0, 49.0, 50.0, 40.0, 54.0, 46.0, 41.0, 45.0, 36.0, 41.0, 22.0, 29.0, 21.0, 31.0, 15.0, 19.0, 13.0, 15.0, 8.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.40625, -18.78466796875, -18.1630859375, -17.54150390625, -16.919921875, -16.29833984375, -15.6767578125, -15.05517578125, -14.43359375, -13.81201171875, -13.1904296875, -12.56884765625, -11.947265625, -11.32568359375, -10.7041015625, -10.08251953125, -9.4609375, -8.83935546875, -8.2177734375, -7.59619140625, -6.974609375, -6.35302734375, -5.7314453125, -5.10986328125, -4.48828125, -3.86669921875, -3.2451171875, -2.62353515625, -2.001953125, -1.38037109375, -0.7587890625, -0.13720703125, 0.484375, 1.10595703125, 1.7275390625, 2.34912109375, 2.970703125, 3.59228515625, 4.2138671875, 4.83544921875, 5.45703125, 6.07861328125, 6.7001953125, 7.32177734375, 7.943359375, 8.56494140625, 9.1865234375, 9.80810546875, 10.4296875, 11.05126953125, 11.6728515625, 12.29443359375, 12.916015625, 13.53759765625, 14.1591796875, 14.78076171875, 15.40234375, 16.02392578125, 16.6455078125, 17.26708984375, 17.888671875, 18.51025390625, 19.1318359375, 19.75341796875, 20.375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 14.0, 13.0, 22.0, 44.0, 45.0, 75.0, 115.0, 153.0, 211.0, 318.0, 399.0, 644.0, 992.0, 1492.0, 2295.0, 3649.0, 6111.0, 10691.0, 22904.0, 81049.0, 553788.0, 278153.0, 46526.0, 16545.0, 8434.0, 4942.0, 3054.0, 1929.0, 1272.0, 869.0, 542.0, 379.0, 245.0, 172.0, 141.0, 92.0, 59.0, 49.0, 25.0, 29.0, 12.0, 15.0, 10.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-24.71875, -23.91650390625, -23.1142578125, -22.31201171875, -21.509765625, -20.70751953125, -19.9052734375, -19.10302734375, -18.30078125, -17.49853515625, -16.6962890625, -15.89404296875, -15.091796875, -14.28955078125, -13.4873046875, -12.68505859375, -11.8828125, -11.08056640625, -10.2783203125, -9.47607421875, -8.673828125, -7.87158203125, -7.0693359375, -6.26708984375, -5.46484375, -4.66259765625, -3.8603515625, -3.05810546875, -2.255859375, -1.45361328125, -0.6513671875, 0.15087890625, 0.953125, 1.75537109375, 2.5576171875, 3.35986328125, 4.162109375, 4.96435546875, 5.7666015625, 6.56884765625, 7.37109375, 8.17333984375, 8.9755859375, 9.77783203125, 10.580078125, 11.38232421875, 12.1845703125, 12.98681640625, 13.7890625, 14.59130859375, 15.3935546875, 16.19580078125, 16.998046875, 17.80029296875, 18.6025390625, 19.40478515625, 20.20703125, 21.00927734375, 21.8115234375, 22.61376953125, 23.416015625, 24.21826171875, 25.0205078125, 25.82275390625, 26.625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 9.0, 14.0, 12.0, 11.0, 13.0, 15.0, 12.0, 25.0, 26.0, 26.0, 25.0, 31.0, 38.0, 32.0, 48.0, 69.0, 89.0, 220.0, 1584.0, 208.0, 99.0, 58.0, 44.0, 51.0, 25.0, 33.0, 34.0, 19.0, 16.0, 23.0, 15.0, 17.0, 15.0, 18.0, 11.0, 8.0, 10.0, 10.0, 4.0, 4.0, 2.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.65625, -36.53076171875, -35.4052734375, -34.27978515625, -33.154296875, -32.02880859375, -30.9033203125, -29.77783203125, -28.65234375, -27.52685546875, -26.4013671875, -25.27587890625, -24.150390625, -23.02490234375, -21.8994140625, -20.77392578125, -19.6484375, -18.52294921875, -17.3974609375, -16.27197265625, -15.146484375, -14.02099609375, -12.8955078125, -11.77001953125, -10.64453125, -9.51904296875, -8.3935546875, -7.26806640625, -6.142578125, -5.01708984375, -3.8916015625, -2.76611328125, -1.640625, -0.51513671875, 0.6103515625, 1.73583984375, 2.861328125, 3.98681640625, 5.1123046875, 6.23779296875, 7.36328125, 8.48876953125, 9.6142578125, 10.73974609375, 11.865234375, 12.99072265625, 14.1162109375, 15.24169921875, 16.3671875, 17.49267578125, 18.6181640625, 19.74365234375, 20.869140625, 21.99462890625, 23.1201171875, 24.24560546875, 25.37109375, 26.49658203125, 27.6220703125, 28.74755859375, 29.873046875, 30.99853515625, 32.1240234375, 33.24951171875, 34.375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 11.0, 17.0, 26.0, 39.0, 55.0, 78.0, 146.0, 256.0, 631.0, 3047.0, 45225.0, 3072325.0, 20743.0, 1993.0, 480.0, 247.0, 126.0, 74.0, 47.0, 36.0, 20.0, 17.0, 10.0, 9.0, 6.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.75, -88.400390625, -85.05078125, -81.701171875, -78.3515625, -75.001953125, -71.65234375, -68.302734375, -64.953125, -61.603515625, -58.25390625, -54.904296875, -51.5546875, -48.205078125, -44.85546875, -41.505859375, -38.15625, -34.806640625, -31.45703125, -28.107421875, -24.7578125, -21.408203125, -18.05859375, -14.708984375, -11.359375, -8.009765625, -4.66015625, -1.310546875, 2.0390625, 5.388671875, 8.73828125, 12.087890625, 15.4375, 18.787109375, 22.13671875, 25.486328125, 28.8359375, 32.185546875, 35.53515625, 38.884765625, 42.234375, 45.583984375, 48.93359375, 52.283203125, 55.6328125, 58.982421875, 62.33203125, 65.681640625, 69.03125, 72.380859375, 75.73046875, 79.080078125, 82.4296875, 85.779296875, 89.12890625, 92.478515625, 95.828125, 99.177734375, 102.52734375, 105.876953125, 109.2265625, 112.576171875, 115.92578125, 119.275390625, 122.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 18.0, 142.0, 495.0, 294.0, 61.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.3460578918457, -46.34069061279297, -40.33531951904297, -34.32994842529297, -28.324581146240234, -22.319211959838867, -16.3138427734375, -10.308475494384766, -4.303104400634766, 1.7022647857666016, 7.707633972167969, 13.713003158569336, 19.718372344970703, 25.72374153137207, 31.729110717773438, 37.73447799682617, 43.73984909057617, 49.745216369628906, 55.750587463378906, 61.755958557128906, 67.76132202148438, 73.76669311523438, 79.77206420898438, 85.77743530273438, 91.78280639648438, 97.78817749023438, 103.79354858398438, 109.79891204833984, 115.80428314208984, 121.80965423583984, 127.81501770019531, 133.8203887939453, 139.82574462890625, 145.83111572265625, 151.83648681640625, 157.84185791015625, 163.84722900390625, 169.8525848388672, 175.8579559326172, 181.8633270263672, 187.8686981201172, 193.8740692138672, 199.8794403076172, 205.8848114013672, 211.89016723632812, 217.89553833007812, 223.90090942382812, 229.90628051757812, 235.91165161132812, 241.91702270507812, 247.92239379882812, 253.92776489257812, 259.9331359863281, 265.9385070800781, 271.9438781738281, 277.94921875, 283.95458984375, 289.9599609375, 295.96533203125, 301.970703125, 307.97607421875, 313.9814453125, 319.98681640625, 325.9921875, 331.99755859375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 12.0, 8.0, 10.0, 8.0, 15.0, 19.0, 22.0, 23.0, 29.0, 25.0, 27.0, 32.0, 42.0, 27.0, 39.0, 36.0, 40.0, 51.0, 44.0, 35.0, 41.0, 39.0, 33.0, 34.0, 26.0, 33.0, 38.0, 31.0, 29.0, 15.0, 22.0, 12.0, 10.0, 17.0, 11.0, 9.0, 11.0, 8.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.37543487548828, -68.8658447265625, -66.35624694824219, -63.84665298461914, -61.337059020996094, -58.82746887207031, -56.317874908447266, -53.80828094482422, -51.29868698120117, -48.789093017578125, -46.27949905395508, -43.76990509033203, -41.26031494140625, -38.75071716308594, -36.241127014160156, -33.73153305053711, -31.221939086914062, -28.712345123291016, -26.20275115966797, -23.693159103393555, -21.183565139770508, -18.67397117614746, -16.164379119873047, -13.65478515625, -11.145191192626953, -8.635597229003906, -6.126004219055176, -3.616410732269287, -1.1068172454833984, 1.4027767181396484, 3.912369728088379, 6.421962738037109, 8.931556701660156, 11.441150665283203, 13.950743675231934, 16.460336685180664, 18.96993064880371, 21.479524612426758, 23.989116668701172, 26.49871063232422, 29.008304595947266, 31.517898559570312, 34.02749252319336, 36.537086486816406, 39.04667663574219, 41.5562744140625, 44.06586456298828, 46.57545852661133, 49.085052490234375, 51.59464645385742, 54.10424041748047, 56.613834381103516, 59.12342834472656, 61.633018493652344, 64.14261627197266, 66.65220642089844, 69.16180419921875, 71.67139434814453, 74.18099212646484, 76.69058227539062, 79.20018005371094, 81.70977020263672, 84.21936798095703, 86.72895812988281, 89.2385482788086]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 13.0, 6.0, 12.0, 15.0, 21.0, 19.0, 21.0, 34.0, 20.0, 31.0, 37.0, 38.0, 37.0, 42.0, 46.0, 42.0, 47.0, 50.0, 55.0, 44.0, 43.0, 39.0, 44.0, 27.0, 27.0, 30.0, 19.0, 17.0, 23.0, 27.0, 14.0, 13.0, 8.0, 11.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.750244140625, -17.14111328125, -16.531982421875, -15.9228515625, -15.313720703125, -14.70458984375, -14.095458984375, -13.486328125, -12.877197265625, -12.26806640625, -11.658935546875, -11.0498046875, -10.440673828125, -9.83154296875, -9.222412109375, -8.61328125, -8.004150390625, -7.39501953125, -6.785888671875, -6.1767578125, -5.567626953125, -4.95849609375, -4.349365234375, -3.740234375, -3.131103515625, -2.52197265625, -1.912841796875, -1.3037109375, -0.694580078125, -0.08544921875, 0.523681640625, 1.1328125, 1.741943359375, 2.35107421875, 2.960205078125, 3.5693359375, 4.178466796875, 4.78759765625, 5.396728515625, 6.005859375, 6.614990234375, 7.22412109375, 7.833251953125, 8.4423828125, 9.051513671875, 9.66064453125, 10.269775390625, 10.87890625, 11.488037109375, 12.09716796875, 12.706298828125, 13.3154296875, 13.924560546875, 14.53369140625, 15.142822265625, 15.751953125, 16.361083984375, 16.97021484375, 17.579345703125, 18.1884765625, 18.797607421875, 19.40673828125, 20.015869140625, 20.625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 10.0, 7.0, 11.0, 9.0, 9.0, 24.0, 15.0, 21.0, 30.0, 26.0, 38.0, 47.0, 55.0, 97.0, 107.0, 158.0, 244.0, 363.0, 784.0, 2674.0, 29914.0, 4142420.0, 13330.0, 1981.0, 686.0, 365.0, 223.0, 149.0, 102.0, 87.0, 54.0, 40.0, 49.0, 28.0, 29.0, 16.0, 16.0, 14.0, 10.0, 13.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-186.5, -180.365234375, -174.23046875, -168.095703125, -161.9609375, -155.826171875, -149.69140625, -143.556640625, -137.421875, -131.287109375, -125.15234375, -119.017578125, -112.8828125, -106.748046875, -100.61328125, -94.478515625, -88.34375, -82.208984375, -76.07421875, -69.939453125, -63.8046875, -57.669921875, -51.53515625, -45.400390625, -39.265625, -33.130859375, -26.99609375, -20.861328125, -14.7265625, -8.591796875, -2.45703125, 3.677734375, 9.8125, 15.947265625, 22.08203125, 28.216796875, 34.3515625, 40.486328125, 46.62109375, 52.755859375, 58.890625, 65.025390625, 71.16015625, 77.294921875, 83.4296875, 89.564453125, 95.69921875, 101.833984375, 107.96875, 114.103515625, 120.23828125, 126.373046875, 132.5078125, 138.642578125, 144.77734375, 150.912109375, 157.046875, 163.181640625, 169.31640625, 175.451171875, 181.5859375, 187.720703125, 193.85546875, 199.990234375, 206.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 10.0, 9.0, 11.0, 25.0, 23.0, 29.0, 47.0, 59.0, 92.0, 166.0, 342.0, 676.0, 1184.0, 643.0, 312.0, 165.0, 74.0, 45.0, 37.0, 21.0, 15.0, 15.0, 6.0, 6.0, 7.0, 6.0, 8.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.75, -37.65576171875, -36.5615234375, -35.46728515625, -34.373046875, -33.27880859375, -32.1845703125, -31.09033203125, -29.99609375, -28.90185546875, -27.8076171875, -26.71337890625, -25.619140625, -24.52490234375, -23.4306640625, -22.33642578125, -21.2421875, -20.14794921875, -19.0537109375, -17.95947265625, -16.865234375, -15.77099609375, -14.6767578125, -13.58251953125, -12.48828125, -11.39404296875, -10.2998046875, -9.20556640625, -8.111328125, -7.01708984375, -5.9228515625, -4.82861328125, -3.734375, -2.64013671875, -1.5458984375, -0.45166015625, 0.642578125, 1.73681640625, 2.8310546875, 3.92529296875, 5.01953125, 6.11376953125, 7.2080078125, 8.30224609375, 9.396484375, 10.49072265625, 11.5849609375, 12.67919921875, 13.7734375, 14.86767578125, 15.9619140625, 17.05615234375, 18.150390625, 19.24462890625, 20.3388671875, 21.43310546875, 22.52734375, 23.62158203125, 24.7158203125, 25.81005859375, 26.904296875, 27.99853515625, 29.0927734375, 30.18701171875, 31.28125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 4.0, 8.0, 14.0, 13.0, 7.0, 10.0, 25.0, 34.0, 40.0, 67.0, 125.0, 290.0, 626.0, 1800.0, 5757.0, 28107.0, 1850415.0, 2269737.0, 28446.0, 5746.0, 1787.0, 617.0, 261.0, 126.0, 65.0, 38.0, 23.0, 34.0, 12.0, 8.0, 10.0, 9.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.8125, -88.4130859375, -85.013671875, -81.6142578125, -78.21484375, -74.8154296875, -71.416015625, -68.0166015625, -64.6171875, -61.2177734375, -57.818359375, -54.4189453125, -51.01953125, -47.6201171875, -44.220703125, -40.8212890625, -37.421875, -34.0224609375, -30.623046875, -27.2236328125, -23.82421875, -20.4248046875, -17.025390625, -13.6259765625, -10.2265625, -6.8271484375, -3.427734375, -0.0283203125, 3.37109375, 6.7705078125, 10.169921875, 13.5693359375, 16.96875, 20.3681640625, 23.767578125, 27.1669921875, 30.56640625, 33.9658203125, 37.365234375, 40.7646484375, 44.1640625, 47.5634765625, 50.962890625, 54.3623046875, 57.76171875, 61.1611328125, 64.560546875, 67.9599609375, 71.359375, 74.7587890625, 78.158203125, 81.5576171875, 84.95703125, 88.3564453125, 91.755859375, 95.1552734375, 98.5546875, 101.9541015625, 105.353515625, 108.7529296875, 112.15234375, 115.5517578125, 118.951171875, 122.3505859375, 125.75]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 13.0, 27.0, 65.0, 212.0, 398.0, 191.0, 69.0, 22.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.3038330078125, -269.4793395996094, -260.6548156738281, -251.830322265625, -243.0058135986328, -234.18130493164062, -225.3568115234375, -216.5323028564453, -207.70779418945312, -198.88328552246094, -190.0587921142578, -181.23428344726562, -172.40977478027344, -163.58526611328125, -154.76077270507812, -145.93626403808594, -137.1117706298828, -128.28726196289062, -119.46276092529297, -110.63825988769531, -101.81375122070312, -92.98925018310547, -84.16474914550781, -75.34024047851562, -66.51573944091797, -57.69123458862305, -48.866729736328125, -40.04222869873047, -31.217723846435547, -22.393218994140625, -13.568717956542969, -4.744213104248047, 4.080291748046875, 12.90479564666748, 21.729299545288086, 30.553802490234375, 39.3783073425293, 48.20281219482422, 57.027313232421875, 65.85182189941406, 74.67632293701172, 83.50082397460938, 92.32533264160156, 101.14983367919922, 109.97433471679688, 118.79884338378906, 127.62334442138672, 136.44784545898438, 145.27235412597656, 154.09686279296875, 162.92135620117188, 171.74586486816406, 180.57037353515625, 189.39486694335938, 198.21937561035156, 207.04388427734375, 215.86837768554688, 224.69288635253906, 233.5173797607422, 242.34188842773438, 251.16639709472656, 259.99090576171875, 268.8153991699219, 277.639892578125, 286.46441650390625]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 10.0, 10.0, 13.0, 10.0, 15.0, 25.0, 22.0, 36.0, 19.0, 41.0, 35.0, 37.0, 43.0, 43.0, 50.0, 40.0, 38.0, 52.0, 39.0, 37.0, 39.0, 34.0, 42.0, 32.0, 36.0, 30.0, 30.0, 20.0, 14.0, 21.0, 16.0, 13.0, 5.0, 9.0, 5.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.40347290039062, -79.65919494628906, -76.9149169921875, -74.17063903808594, -71.4263687133789, -68.68209075927734, -65.93781280517578, -63.19353485107422, -60.44926071166992, -57.70498275756836, -54.96070861816406, -52.2164306640625, -49.47215270996094, -46.72787857055664, -43.98360061645508, -41.23932647705078, -38.49504852294922, -35.750770568847656, -33.00649642944336, -30.262218475341797, -27.517942428588867, -24.773666381835938, -22.029388427734375, -19.285112380981445, -16.540836334228516, -13.796560287475586, -11.05228328704834, -8.308006286621094, -5.563730239868164, -2.8194541931152344, -0.07517623901367188, 2.669099807739258, 5.4133758544921875, 8.157651901245117, 10.901928901672363, 13.64620590209961, 16.39048194885254, 19.13475799560547, 21.87903594970703, 24.62331199645996, 27.36758804321289, 30.11186408996582, 32.85614013671875, 35.60041809082031, 38.344696044921875, 41.08897018432617, 43.833248138427734, 46.57752227783203, 49.321800231933594, 52.066078186035156, 54.81035232543945, 57.554630279541016, 60.29890441894531, 63.043182373046875, 65.78746032714844, 68.53173828125, 71.27601623535156, 74.02029418945312, 76.76457214355469, 79.50885009765625, 82.25312042236328, 84.99739837646484, 87.7416763305664, 90.48595428466797, 93.230224609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 13.0, 10.0, 18.0, 16.0, 23.0, 14.0, 32.0, 34.0, 18.0, 31.0, 32.0, 31.0, 42.0, 51.0, 44.0, 52.0, 49.0, 40.0, 44.0, 54.0, 33.0, 49.0, 30.0, 30.0, 32.0, 25.0, 21.0, 21.0, 18.0, 17.0, 11.0, 7.0, 12.0, 9.0, 10.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.8525390625, -18.267578125, -17.6826171875, -17.09765625, -16.5126953125, -15.927734375, -15.3427734375, -14.7578125, -14.1728515625, -13.587890625, -13.0029296875, -12.41796875, -11.8330078125, -11.248046875, -10.6630859375, -10.078125, -9.4931640625, -8.908203125, -8.3232421875, -7.73828125, -7.1533203125, -6.568359375, -5.9833984375, -5.3984375, -4.8134765625, -4.228515625, -3.6435546875, -3.05859375, -2.4736328125, -1.888671875, -1.3037109375, -0.71875, -0.1337890625, 0.451171875, 1.0361328125, 1.62109375, 2.2060546875, 2.791015625, 3.3759765625, 3.9609375, 4.5458984375, 5.130859375, 5.7158203125, 6.30078125, 6.8857421875, 7.470703125, 8.0556640625, 8.640625, 9.2255859375, 9.810546875, 10.3955078125, 10.98046875, 11.5654296875, 12.150390625, 12.7353515625, 13.3203125, 13.9052734375, 14.490234375, 15.0751953125, 15.66015625, 16.2451171875, 16.830078125, 17.4150390625, 18.0]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 4.0, 11.0, 12.0, 23.0, 47.0, 46.0, 73.0, 105.0, 154.0, 240.0, 300.0, 464.0, 716.0, 1100.0, 1648.0, 2436.0, 3658.0, 5589.0, 8692.0, 13253.0, 20918.0, 32707.0, 53066.0, 89208.0, 154854.0, 225520.0, 173058.0, 99829.0, 59173.0, 36252.0, 22969.0, 14702.0, 9523.0, 6118.0, 4036.0, 2607.0, 1808.0, 1191.0, 789.0, 513.0, 366.0, 253.0, 170.0, 100.0, 70.0, 56.0, 40.0, 34.0, 13.0, 15.0, 4.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0], "bins": [-1.576171875, -1.52783203125, -1.4794921875, -1.43115234375, -1.3828125, -1.33447265625, -1.2861328125, -1.23779296875, -1.189453125, -1.14111328125, -1.0927734375, -1.04443359375, -0.99609375, -0.94775390625, -0.8994140625, -0.85107421875, -0.802734375, -0.75439453125, -0.7060546875, -0.65771484375, -0.609375, -0.56103515625, -0.5126953125, -0.46435546875, -0.416015625, -0.36767578125, -0.3193359375, -0.27099609375, -0.22265625, -0.17431640625, -0.1259765625, -0.07763671875, -0.029296875, 0.01904296875, 0.0673828125, 0.11572265625, 0.1640625, 0.21240234375, 0.2607421875, 0.30908203125, 0.357421875, 0.40576171875, 0.4541015625, 0.50244140625, 0.55078125, 0.59912109375, 0.6474609375, 0.69580078125, 0.744140625, 0.79248046875, 0.8408203125, 0.88916015625, 0.9375, 0.98583984375, 1.0341796875, 1.08251953125, 1.130859375, 1.17919921875, 1.2275390625, 1.27587890625, 1.32421875, 1.37255859375, 1.4208984375, 1.46923828125, 1.517578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 8.0, 7.0, 5.0, 7.0, 5.0, 19.0, 6.0, 16.0, 24.0, 14.0, 23.0, 22.0, 19.0, 32.0, 34.0, 25.0, 31.0, 40.0, 31.0, 39.0, 49.0, 1059.0, 38.0, 37.0, 39.0, 41.0, 32.0, 43.0, 33.0, 24.0, 26.0, 30.0, 20.0, 24.0, 21.0, 20.0, 18.0, 17.0, 11.0, 2.0, 7.0, 2.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.9453125, -10.601318359375, -10.25732421875, -9.913330078125, -9.5693359375, -9.225341796875, -8.88134765625, -8.537353515625, -8.193359375, -7.849365234375, -7.50537109375, -7.161376953125, -6.8173828125, -6.473388671875, -6.12939453125, -5.785400390625, -5.44140625, -5.097412109375, -4.75341796875, -4.409423828125, -4.0654296875, -3.721435546875, -3.37744140625, -3.033447265625, -2.689453125, -2.345458984375, -2.00146484375, -1.657470703125, -1.3134765625, -0.969482421875, -0.62548828125, -0.281494140625, 0.0625, 0.406494140625, 0.75048828125, 1.094482421875, 1.4384765625, 1.782470703125, 2.12646484375, 2.470458984375, 2.814453125, 3.158447265625, 3.50244140625, 3.846435546875, 4.1904296875, 4.534423828125, 4.87841796875, 5.222412109375, 5.56640625, 5.910400390625, 6.25439453125, 6.598388671875, 6.9423828125, 7.286376953125, 7.63037109375, 7.974365234375, 8.318359375, 8.662353515625, 9.00634765625, 9.350341796875, 9.6943359375, 10.038330078125, 10.38232421875, 10.726318359375, 11.0703125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 9.0, 25.0, 24.0, 48.0, 81.0, 123.0, 179.0, 252.0, 403.0, 644.0, 997.0, 1518.0, 2223.0, 3570.0, 5444.0, 8385.0, 12857.0, 19980.0, 32106.0, 52542.0, 90823.0, 157514.0, 1276082.0, 174760.0, 101002.0, 58478.0, 35340.0, 21875.0, 13921.0, 8896.0, 5931.0, 3876.0, 2470.0, 1655.0, 1127.0, 685.0, 446.0, 295.0, 186.0, 133.0, 82.0, 45.0, 31.0, 22.0, 13.0, 9.0, 8.0, 7.0, 5.0, 4.0, 1.0], "bins": [-1.2529296875, -1.2177352905273438, -1.1825408935546875, -1.1473464965820312, -1.112152099609375, -1.0769577026367188, -1.0417633056640625, -1.0065689086914062, -0.97137451171875, -0.9361801147460938, -0.9009857177734375, -0.8657913208007812, -0.830596923828125, -0.7954025268554688, -0.7602081298828125, -0.7250137329101562, -0.6898193359375, -0.6546249389648438, -0.6194305419921875, -0.5842361450195312, -0.549041748046875, -0.5138473510742188, -0.4786529541015625, -0.44345855712890625, -0.40826416015625, -0.37306976318359375, -0.3378753662109375, -0.30268096923828125, -0.267486572265625, -0.23229217529296875, -0.1970977783203125, -0.16190338134765625, -0.126708984375, -0.09151458740234375, -0.0563201904296875, -0.02112579345703125, 0.014068603515625, 0.04926300048828125, 0.0844573974609375, 0.11965179443359375, 0.15484619140625, 0.19004058837890625, 0.2252349853515625, 0.26042938232421875, 0.295623779296875, 0.33081817626953125, 0.3660125732421875, 0.40120697021484375, 0.4364013671875, 0.47159576416015625, 0.5067901611328125, 0.5419845581054688, 0.577178955078125, 0.6123733520507812, 0.6475677490234375, 0.6827621459960938, 0.71795654296875, 0.7531509399414062, 0.7883453369140625, 0.8235397338867188, 0.858734130859375, 0.8939285278320312, 0.9291229248046875, 0.9643173217773438, 0.99951171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 8.0, 3.0, 18.0, 14.0, 13.0, 14.0, 20.0, 22.0, 22.0, 34.0, 63.0, 71.0, 88.0, 96.0, 107.0, 80.0, 55.0, 47.0, 37.0, 23.0, 17.0, 27.0, 17.0, 9.0, 19.0, 12.0, 10.0, 4.0, 7.0, 2.0, 3.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0250701904296875, -0.02422618865966797, -0.023382186889648438, -0.022538185119628906, -0.021694183349609375, -0.020850181579589844, -0.020006179809570312, -0.01916217803955078, -0.01831817626953125, -0.01747417449951172, -0.016630172729492188, -0.015786170959472656, -0.014942169189453125, -0.014098167419433594, -0.013254165649414062, -0.012410163879394531, -0.011566162109375, -0.010722160339355469, -0.009878158569335938, -0.009034156799316406, -0.008190155029296875, -0.007346153259277344, -0.0065021514892578125, -0.005658149719238281, -0.00481414794921875, -0.003970146179199219, -0.0031261444091796875, -0.0022821426391601562, -0.001438140869140625, -0.0005941390991210938, 0.0002498626708984375, 0.0010938644409179688, 0.0019378662109375, 0.0027818679809570312, 0.0036258697509765625, 0.004469871520996094, 0.005313873291015625, 0.006157875061035156, 0.0070018768310546875, 0.007845878601074219, 0.00868988037109375, 0.009533882141113281, 0.010377883911132812, 0.011221885681152344, 0.012065887451171875, 0.012909889221191406, 0.013753890991210938, 0.014597892761230469, 0.01544189453125, 0.01628589630126953, 0.017129898071289062, 0.017973899841308594, 0.018817901611328125, 0.019661903381347656, 0.020505905151367188, 0.02134990692138672, 0.02219390869140625, 0.02303791046142578, 0.023881912231445312, 0.024725914001464844, 0.025569915771484375, 0.026413917541503906, 0.027257919311523438, 0.02810192108154297, 0.0289459228515625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 7.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 7.0, 15.0, 15.0, 16.0, 29.0, 27.0, 37.0, 50.0, 95.0, 91.0, 136.0, 277.0, 796.0, 5227.0, 147355.0, 876603.0, 15167.0, 1585.0, 405.0, 166.0, 92.0, 66.0, 55.0, 49.0, 31.0, 23.0, 19.0, 13.0, 9.0, 13.0, 2.0, 7.0, 7.0, 3.0, 8.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5251922607421875, -0.508880615234375, -0.4925689697265625, -0.47625732421875, -0.4599456787109375, -0.443634033203125, -0.4273223876953125, -0.4110107421875, -0.3946990966796875, -0.378387451171875, -0.3620758056640625, -0.34576416015625, -0.3294525146484375, -0.313140869140625, -0.2968292236328125, -0.280517578125, -0.2642059326171875, -0.247894287109375, -0.2315826416015625, -0.21527099609375, -0.1989593505859375, -0.182647705078125, -0.1663360595703125, -0.1500244140625, -0.1337127685546875, -0.117401123046875, -0.1010894775390625, -0.08477783203125, -0.0684661865234375, -0.052154541015625, -0.0358428955078125, -0.01953125, -0.0032196044921875, 0.013092041015625, 0.0294036865234375, 0.04571533203125, 0.0620269775390625, 0.078338623046875, 0.0946502685546875, 0.1109619140625, 0.1272735595703125, 0.143585205078125, 0.1598968505859375, 0.17620849609375, 0.1925201416015625, 0.208831787109375, 0.2251434326171875, 0.241455078125, 0.2577667236328125, 0.274078369140625, 0.2903900146484375, 0.30670166015625, 0.3230133056640625, 0.339324951171875, 0.3556365966796875, 0.3719482421875, 0.3882598876953125, 0.404571533203125, 0.4208831787109375, 0.43719482421875, 0.4535064697265625, 0.469818115234375, 0.4861297607421875, 0.50244140625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 14.0, 40.0, 127.0, 391.0, 297.0, 90.0, 32.0, 11.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07173629850149155, -0.06513958424329758, -0.058542877435684204, -0.051946163177490234, -0.04534945636987686, -0.03875274211168289, -0.03215603157877922, -0.02555932104587555, -0.018962610512971878, -0.012365899980068207, -0.005769188515841961, 0.000827522948384285, 0.007424233481287956, 0.014020945876836777, 0.020617656409740448, 0.02721436694264412, 0.03381107747554779, 0.04040778800845146, 0.04700449854135513, 0.0536012127995491, 0.060197919607162476, 0.06679463386535645, 0.07339134812355042, 0.07998805493116379, 0.08658476173877716, 0.09318147599697113, 0.0997781828045845, 0.10637489706277847, 0.11297160387039185, 0.11956831812858582, 0.12616503238677979, 0.13276174664497375, 0.13935844600200653, 0.1459551602602005, 0.15255187451839447, 0.15914857387542725, 0.16574528813362122, 0.17234200239181519, 0.17893871665000916, 0.18553543090820312, 0.1921321302652359, 0.19872884452342987, 0.20532555878162384, 0.21192225813865662, 0.21851897239685059, 0.22511568665504456, 0.23171240091323853, 0.2383091151714325, 0.24490582942962646, 0.25150254368782043, 0.2580992579460144, 0.2646959722042084, 0.27129268646240234, 0.2778893709182739, 0.2844860851764679, 0.29108279943466187, 0.29767951369285583, 0.3042762279510498, 0.3108729422092438, 0.31746965646743774, 0.3240663707256317, 0.3306630849838257, 0.33725976943969727, 0.34385648369789124, 0.3504531979560852]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 8.0, 19.0, 16.0, 24.0, 18.0, 33.0, 27.0, 37.0, 22.0, 41.0, 34.0, 42.0, 45.0, 56.0, 43.0, 49.0, 61.0, 34.0, 60.0, 41.0, 32.0, 47.0, 30.0, 20.0, 29.0, 33.0, 18.0, 12.0, 9.0, 12.0, 4.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020522117614746094, -0.019879672676324844, -0.019237225875258446, -0.018594779074192047, -0.017952334135770798, -0.01730988919734955, -0.01666744239628315, -0.01602499559521675, -0.015382550656795502, -0.014740104787051678, -0.014097658917307854, -0.01345521304756403, -0.012812767177820206, -0.012170321308076382, -0.011527875438332558, -0.010885429568588734, -0.01024298369884491, -0.009600537829101086, -0.008958091959357262, -0.008315646089613438, -0.007673200219869614, -0.00703075435012579, -0.006388308480381966, -0.005745862610638142, -0.005103416740894318, -0.004460970871150494, -0.0038185250014066696, -0.0031760791316628456, -0.0025336332619190216, -0.0018911873921751976, -0.0012487415224313736, -0.0006062956526875496, 3.6150217056274414e-05, 0.0006785960868000984, 0.0013210419565439224, 0.0019634878262877464, 0.0026059336960315704, 0.0032483795657753944, 0.0038908254355192184, 0.0045332713052630424, 0.0051757171750068665, 0.0058181630447506905, 0.0064606089144945145, 0.0071030547842383385, 0.0077455006539821625, 0.008387946523725986, 0.00903039239346981, 0.009672838263213634, 0.010315284132957458, 0.010957730002701283, 0.011600175872445107, 0.01224262174218893, 0.012885067611932755, 0.013527513481676579, 0.014169959351420403, 0.014812405221164227, 0.01545485109090805, 0.0160972960293293, 0.0167397428303957, 0.017382189631462097, 0.018024634569883347, 0.018667079508304596, 0.019309526309370995, 0.019951973110437393, 0.020594418048858643]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 13.0, 10.0, 18.0, 16.0, 23.0, 14.0, 32.0, 34.0, 18.0, 31.0, 32.0, 31.0, 42.0, 51.0, 44.0, 52.0, 49.0, 40.0, 44.0, 54.0, 33.0, 49.0, 30.0, 30.0, 32.0, 25.0, 21.0, 21.0, 18.0, 17.0, 11.0, 7.0, 12.0, 9.0, 10.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.8525390625, -18.267578125, -17.6826171875, -17.09765625, -16.5126953125, -15.927734375, -15.3427734375, -14.7578125, -14.1728515625, -13.587890625, -13.0029296875, -12.41796875, -11.8330078125, -11.248046875, -10.6630859375, -10.078125, -9.4931640625, -8.908203125, -8.3232421875, -7.73828125, -7.1533203125, -6.568359375, -5.9833984375, -5.3984375, -4.8134765625, -4.228515625, -3.6435546875, -3.05859375, -2.4736328125, -1.888671875, -1.3037109375, -0.71875, -0.1337890625, 0.451171875, 1.0361328125, 1.62109375, 2.2060546875, 2.791015625, 3.3759765625, 3.9609375, 4.5458984375, 5.130859375, 5.7158203125, 6.30078125, 6.8857421875, 7.470703125, 8.0556640625, 8.640625, 9.2255859375, 9.810546875, 10.3955078125, 10.98046875, 11.5654296875, 12.150390625, 12.7353515625, 13.3203125, 13.9052734375, 14.490234375, 15.0751953125, 15.66015625, 16.2451171875, 16.830078125, 17.4150390625, 18.0]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 11.0, 9.0, 12.0, 20.0, 19.0, 37.0, 48.0, 57.0, 83.0, 127.0, 157.0, 220.0, 370.0, 473.0, 724.0, 1042.0, 1647.0, 2476.0, 4712.0, 10504.0, 37189.0, 272088.0, 608668.0, 75917.0, 16479.0, 6354.0, 3186.0, 1974.0, 1226.0, 821.0, 544.0, 392.0, 277.0, 199.0, 146.0, 80.0, 75.0, 48.0, 41.0, 30.0, 27.0, 14.0, 3.0, 4.0, 13.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-33.8125, -32.794189453125, -31.77587890625, -30.757568359375, -29.7392578125, -28.720947265625, -27.70263671875, -26.684326171875, -25.666015625, -24.647705078125, -23.62939453125, -22.611083984375, -21.5927734375, -20.574462890625, -19.55615234375, -18.537841796875, -17.51953125, -16.501220703125, -15.48291015625, -14.464599609375, -13.4462890625, -12.427978515625, -11.40966796875, -10.391357421875, -9.373046875, -8.354736328125, -7.33642578125, -6.318115234375, -5.2998046875, -4.281494140625, -3.26318359375, -2.244873046875, -1.2265625, -0.208251953125, 0.81005859375, 1.828369140625, 2.8466796875, 3.864990234375, 4.88330078125, 5.901611328125, 6.919921875, 7.938232421875, 8.95654296875, 9.974853515625, 10.9931640625, 12.011474609375, 13.02978515625, 14.048095703125, 15.06640625, 16.084716796875, 17.10302734375, 18.121337890625, 19.1396484375, 20.157958984375, 21.17626953125, 22.194580078125, 23.212890625, 24.231201171875, 25.24951171875, 26.267822265625, 27.2861328125, 28.304443359375, 29.32275390625, 30.341064453125, 31.359375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 4.0, 4.0, 6.0, 11.0, 15.0, 12.0, 10.0, 21.0, 29.0, 23.0, 43.0, 23.0, 33.0, 30.0, 48.0, 55.0, 77.0, 165.0, 1599.0, 252.0, 99.0, 68.0, 74.0, 48.0, 35.0, 41.0, 35.0, 34.0, 24.0, 21.0, 14.0, 19.0, 8.0, 11.0, 6.0, 15.0, 9.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.84375, -35.71484375, -34.5859375, -33.45703125, -32.328125, -31.19921875, -30.0703125, -28.94140625, -27.8125, -26.68359375, -25.5546875, -24.42578125, -23.296875, -22.16796875, -21.0390625, -19.91015625, -18.78125, -17.65234375, -16.5234375, -15.39453125, -14.265625, -13.13671875, -12.0078125, -10.87890625, -9.75, -8.62109375, -7.4921875, -6.36328125, -5.234375, -4.10546875, -2.9765625, -1.84765625, -0.71875, 0.41015625, 1.5390625, 2.66796875, 3.796875, 4.92578125, 6.0546875, 7.18359375, 8.3125, 9.44140625, 10.5703125, 11.69921875, 12.828125, 13.95703125, 15.0859375, 16.21484375, 17.34375, 18.47265625, 19.6015625, 20.73046875, 21.859375, 22.98828125, 24.1171875, 25.24609375, 26.375, 27.50390625, 28.6328125, 29.76171875, 30.890625, 32.01953125, 33.1484375, 34.27734375, 35.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 10.0, 11.0, 5.0, 17.0, 11.0, 16.0, 21.0, 33.0, 47.0, 61.0, 98.0, 157.0, 270.0, 564.0, 1626.0, 263323.0, 2875949.0, 2103.0, 603.0, 268.0, 166.0, 97.0, 62.0, 32.0, 29.0, 19.0, 15.0, 20.0, 9.0, 15.0, 14.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-144.125, -139.16796875, -134.2109375, -129.25390625, -124.296875, -119.33984375, -114.3828125, -109.42578125, -104.46875, -99.51171875, -94.5546875, -89.59765625, -84.640625, -79.68359375, -74.7265625, -69.76953125, -64.8125, -59.85546875, -54.8984375, -49.94140625, -44.984375, -40.02734375, -35.0703125, -30.11328125, -25.15625, -20.19921875, -15.2421875, -10.28515625, -5.328125, -0.37109375, 4.5859375, 9.54296875, 14.5, 19.45703125, 24.4140625, 29.37109375, 34.328125, 39.28515625, 44.2421875, 49.19921875, 54.15625, 59.11328125, 64.0703125, 69.02734375, 73.984375, 78.94140625, 83.8984375, 88.85546875, 93.8125, 98.76953125, 103.7265625, 108.68359375, 113.640625, 118.59765625, 123.5546875, 128.51171875, 133.46875, 138.42578125, 143.3828125, 148.33984375, 153.296875, 158.25390625, 163.2109375, 168.16796875, 173.125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 41.0, 250.0, 466.0, 196.0, 35.0, 14.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-224.83074951171875, -218.1095428466797, -211.38832092285156, -204.6671142578125, -197.94589233398438, -191.2246856689453, -184.50347900390625, -177.78225708007812, -171.06105041503906, -164.33984375, -157.61862182617188, -150.8974151611328, -144.17620849609375, -137.45498657226562, -130.73377990722656, -124.01256561279297, -117.29135131835938, -110.57013702392578, -103.84892272949219, -97.12771606445312, -90.40650177001953, -83.68528747558594, -76.96408081054688, -70.24286651611328, -63.52165222167969, -56.800437927246094, -50.079227447509766, -43.35801696777344, -36.636802673339844, -29.91558837890625, -23.194377899169922, -16.473167419433594, -9.751968383789062, -3.0307559967041016, 3.6904563903808594, 10.41166877746582, 17.13288116455078, 23.854095458984375, 30.575305938720703, 37.29651641845703, 44.017730712890625, 50.73894500732422, 57.46015548706055, 64.18136596679688, 70.90258026123047, 77.62379455566406, 84.34500122070312, 91.06621551513672, 97.78742980957031, 104.5086441040039, 111.2298583984375, 117.95106506347656, 124.67227935791016, 131.39349365234375, 138.1147003173828, 144.83590698242188, 151.55712890625, 158.27833557128906, 164.9995574951172, 171.72076416015625, 178.44198608398438, 185.16319274902344, 191.8843994140625, 198.60562133789062, 205.3268280029297]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 6.0, 8.0, 8.0, 14.0, 8.0, 19.0, 17.0, 19.0, 16.0, 22.0, 28.0, 31.0, 37.0, 44.0, 38.0, 47.0, 43.0, 47.0, 46.0, 53.0, 40.0, 46.0, 36.0, 41.0, 27.0, 31.0, 31.0, 20.0, 27.0, 24.0, 18.0, 16.0, 20.0, 9.0, 12.0, 9.0, 6.0, 8.0, 4.0, 2.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.90000915527344, -89.84323120117188, -86.78644561767578, -83.72966766357422, -80.67288208007812, -77.61610412597656, -74.55931854248047, -71.5025405883789, -68.44575500488281, -65.38897705078125, -62.332191467285156, -59.27540969848633, -56.2186279296875, -53.16184616088867, -50.105064392089844, -47.04828643798828, -43.99150466918945, -40.934722900390625, -37.8779411315918, -34.82115936279297, -31.76437759399414, -28.707595825195312, -25.650815963745117, -22.59403419494629, -19.53725242614746, -16.480470657348633, -13.423688888549805, -10.366908073425293, -7.310126304626465, -4.253344535827637, -1.196563720703125, 1.8602180480957031, 4.916999816894531, 7.973781585693359, 11.030563354492188, 14.0873441696167, 17.144126892089844, 20.200908660888672, 23.257688522338867, 26.314470291137695, 29.371252059936523, 32.42803192138672, 35.48481369018555, 38.541595458984375, 41.5983772277832, 44.65515899658203, 47.71194076538086, 50.76872253417969, 53.825504302978516, 56.882286071777344, 59.93906784057617, 62.995849609375, 66.05262756347656, 69.10941314697266, 72.16619110107422, 75.22297668457031, 78.27975463867188, 81.33653259277344, 84.39331817626953, 87.4500961303711, 90.50688171386719, 93.56365966796875, 96.62044525146484, 99.6772232055664, 102.7340087890625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 9.0, 11.0, 13.0, 23.0, 25.0, 16.0, 23.0, 33.0, 30.0, 28.0, 25.0, 42.0, 38.0, 41.0, 52.0, 48.0, 41.0, 63.0, 36.0, 54.0, 41.0, 34.0, 38.0, 30.0, 23.0, 25.0, 24.0, 23.0, 10.0, 19.0, 13.0, 14.0, 11.0, 7.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.234375, -18.65576171875, -18.0771484375, -17.49853515625, -16.919921875, -16.34130859375, -15.7626953125, -15.18408203125, -14.60546875, -14.02685546875, -13.4482421875, -12.86962890625, -12.291015625, -11.71240234375, -11.1337890625, -10.55517578125, -9.9765625, -9.39794921875, -8.8193359375, -8.24072265625, -7.662109375, -7.08349609375, -6.5048828125, -5.92626953125, -5.34765625, -4.76904296875, -4.1904296875, -3.61181640625, -3.033203125, -2.45458984375, -1.8759765625, -1.29736328125, -0.71875, -0.14013671875, 0.4384765625, 1.01708984375, 1.595703125, 2.17431640625, 2.7529296875, 3.33154296875, 3.91015625, 4.48876953125, 5.0673828125, 5.64599609375, 6.224609375, 6.80322265625, 7.3818359375, 7.96044921875, 8.5390625, 9.11767578125, 9.6962890625, 10.27490234375, 10.853515625, 11.43212890625, 12.0107421875, 12.58935546875, 13.16796875, 13.74658203125, 14.3251953125, 14.90380859375, 15.482421875, 16.06103515625, 16.6396484375, 17.21826171875, 17.796875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 13.0, 5.0, 15.0, 21.0, 21.0, 36.0, 53.0, 74.0, 106.0, 144.0, 162.0, 296.0, 418.0, 633.0, 1145.0, 2125.0, 5014.0, 15315.0, 165816.0, 3441290.0, 524654.0, 24264.0, 6603.0, 2576.0, 1335.0, 703.0, 410.0, 305.0, 238.0, 128.0, 104.0, 57.0, 55.0, 27.0, 23.0, 32.0, 17.0, 8.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.40625, -57.529296875, -55.65234375, -53.775390625, -51.8984375, -50.021484375, -48.14453125, -46.267578125, -44.390625, -42.513671875, -40.63671875, -38.759765625, -36.8828125, -35.005859375, -33.12890625, -31.251953125, -29.375, -27.498046875, -25.62109375, -23.744140625, -21.8671875, -19.990234375, -18.11328125, -16.236328125, -14.359375, -12.482421875, -10.60546875, -8.728515625, -6.8515625, -4.974609375, -3.09765625, -1.220703125, 0.65625, 2.533203125, 4.41015625, 6.287109375, 8.1640625, 10.041015625, 11.91796875, 13.794921875, 15.671875, 17.548828125, 19.42578125, 21.302734375, 23.1796875, 25.056640625, 26.93359375, 28.810546875, 30.6875, 32.564453125, 34.44140625, 36.318359375, 38.1953125, 40.072265625, 41.94921875, 43.826171875, 45.703125, 47.580078125, 49.45703125, 51.333984375, 53.2109375, 55.087890625, 56.96484375, 58.841796875, 60.71875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 10.0, 12.0, 7.0, 11.0, 27.0, 14.0, 16.0, 34.0, 38.0, 49.0, 65.0, 103.0, 121.0, 197.0, 294.0, 530.0, 742.0, 619.0, 375.0, 256.0, 151.0, 90.0, 79.0, 53.0, 44.0, 29.0, 22.0, 17.0, 14.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.53125, -28.5673828125, -27.603515625, -26.6396484375, -25.67578125, -24.7119140625, -23.748046875, -22.7841796875, -21.8203125, -20.8564453125, -19.892578125, -18.9287109375, -17.96484375, -17.0009765625, -16.037109375, -15.0732421875, -14.109375, -13.1455078125, -12.181640625, -11.2177734375, -10.25390625, -9.2900390625, -8.326171875, -7.3623046875, -6.3984375, -5.4345703125, -4.470703125, -3.5068359375, -2.54296875, -1.5791015625, -0.615234375, 0.3486328125, 1.3125, 2.2763671875, 3.240234375, 4.2041015625, 5.16796875, 6.1318359375, 7.095703125, 8.0595703125, 9.0234375, 9.9873046875, 10.951171875, 11.9150390625, 12.87890625, 13.8427734375, 14.806640625, 15.7705078125, 16.734375, 17.6982421875, 18.662109375, 19.6259765625, 20.58984375, 21.5537109375, 22.517578125, 23.4814453125, 24.4453125, 25.4091796875, 26.373046875, 27.3369140625, 28.30078125, 29.2646484375, 30.228515625, 31.1923828125, 32.15625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 11.0, 16.0, 20.0, 34.0, 48.0, 73.0, 129.0, 204.0, 373.0, 763.0, 1420.0, 2985.0, 6859.0, 17269.0, 53578.0, 331777.0, 3439139.0, 264005.0, 47595.0, 15713.0, 6299.0, 2913.0, 1381.0, 715.0, 371.0, 208.0, 126.0, 70.0, 53.0, 34.0, 21.0, 21.0, 13.0, 8.0, 5.0, 1.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.96875, -49.3984375, -47.828125, -46.2578125, -44.6875, -43.1171875, -41.546875, -39.9765625, -38.40625, -36.8359375, -35.265625, -33.6953125, -32.125, -30.5546875, -28.984375, -27.4140625, -25.84375, -24.2734375, -22.703125, -21.1328125, -19.5625, -17.9921875, -16.421875, -14.8515625, -13.28125, -11.7109375, -10.140625, -8.5703125, -7.0, -5.4296875, -3.859375, -2.2890625, -0.71875, 0.8515625, 2.421875, 3.9921875, 5.5625, 7.1328125, 8.703125, 10.2734375, 11.84375, 13.4140625, 14.984375, 16.5546875, 18.125, 19.6953125, 21.265625, 22.8359375, 24.40625, 25.9765625, 27.546875, 29.1171875, 30.6875, 32.2578125, 33.828125, 35.3984375, 36.96875, 38.5390625, 40.109375, 41.6796875, 43.25, 44.8203125, 46.390625, 47.9609375, 49.53125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [7.0, 11.0, 30.0, 154.0, 541.0, 228.0, 36.0, 10.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.45288848876953, -64.00987243652344, -46.56685256958008, -29.12383270263672, -11.680816650390625, 5.762199401855469, 23.205223083496094, 40.64823913574219, 58.09125518798828, 75.53427124023438, 92.977294921875, 110.4203109741211, 127.86332702636719, 145.30633544921875, 162.74935913085938, 180.1923828125, 197.63540649414062, 215.07843017578125, 232.5214385986328, 249.96446228027344, 267.407470703125, 284.8504943847656, 302.29351806640625, 319.7365417480469, 337.1795349121094, 354.62255859375, 372.0655822753906, 389.50860595703125, 406.95159912109375, 424.3946228027344, 441.837646484375, 459.2806701660156, 476.72369384765625, 494.1667175292969, 511.6097412109375, 529.052734375, 546.4957885742188, 563.9387817382812, 581.3818359375, 598.8248291015625, 616.267822265625, 633.7108154296875, 651.1538696289062, 668.5968627929688, 686.0399169921875, 703.48291015625, 720.9259033203125, 738.3689575195312, 755.81201171875, 773.2550048828125, 790.6980590820312, 808.1410522460938, 825.5841064453125, 843.027099609375, 860.4700927734375, 877.9131469726562, 895.3561401367188, 912.7991333007812, 930.2421875, 947.6851806640625, 965.1282348632812, 982.5712280273438, 1000.0142822265625, 1017.457275390625, 1034.9002685546875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 4.0, 6.0, 8.0, 14.0, 9.0, 13.0, 17.0, 18.0, 12.0, 21.0, 19.0, 35.0, 24.0, 30.0, 47.0, 36.0, 39.0, 41.0, 38.0, 44.0, 42.0, 40.0, 37.0, 39.0, 28.0, 30.0, 31.0, 32.0, 30.0, 33.0, 28.0, 21.0, 23.0, 13.0, 18.0, 15.0, 12.0, 7.0, 11.0, 11.0, 6.0, 5.0, 2.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-104.64703369140625, -101.5959701538086, -98.54490661621094, -95.49384307861328, -92.44277954101562, -89.39170837402344, -86.34064483642578, -83.28958129882812, -80.23851776123047, -77.18745422363281, -74.13639068603516, -71.0853271484375, -68.03425598144531, -64.98319244384766, -61.93212890625, -58.881065368652344, -55.83000183105469, -52.77893829345703, -49.727874755859375, -46.67680740356445, -43.6257438659668, -40.57468032836914, -37.52361297607422, -34.47254943847656, -31.421485900878906, -28.37042236328125, -25.31935691833496, -22.268291473388672, -19.217227935791016, -16.16616439819336, -13.11509895324707, -10.064033508300781, -7.012977600097656, -3.9619131088256836, -0.9108486175537109, 2.1402158737182617, 5.191280364990234, 8.242344856262207, 11.29340934753418, 14.344474792480469, 17.395538330078125, 20.44660186767578, 23.49766731262207, 26.54873275756836, 29.599796295166016, 32.65085983276367, 35.701927185058594, 38.75299072265625, 41.804054260253906, 44.85511779785156, 47.90618133544922, 50.95724868774414, 54.0083122253418, 57.05937576293945, 60.110443115234375, 63.16150665283203, 66.21257019042969, 69.26363372802734, 72.314697265625, 75.36576080322266, 78.41682434082031, 81.4678955078125, 84.51895904541016, 87.57002258300781, 90.62108612060547]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 13.0, 7.0, 11.0, 16.0, 12.0, 21.0, 25.0, 27.0, 34.0, 27.0, 27.0, 29.0, 46.0, 47.0, 54.0, 34.0, 40.0, 43.0, 34.0, 42.0, 41.0, 45.0, 31.0, 27.0, 29.0, 35.0, 28.0, 14.0, 20.0, 18.0, 16.0, 22.0, 12.0, 13.0, 7.0, 11.0, 6.0, 5.0, 7.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0], "bins": [-16.484375, -16.031982421875, -15.57958984375, -15.127197265625, -14.6748046875, -14.222412109375, -13.77001953125, -13.317626953125, -12.865234375, -12.412841796875, -11.96044921875, -11.508056640625, -11.0556640625, -10.603271484375, -10.15087890625, -9.698486328125, -9.24609375, -8.793701171875, -8.34130859375, -7.888916015625, -7.4365234375, -6.984130859375, -6.53173828125, -6.079345703125, -5.626953125, -5.174560546875, -4.72216796875, -4.269775390625, -3.8173828125, -3.364990234375, -2.91259765625, -2.460205078125, -2.0078125, -1.555419921875, -1.10302734375, -0.650634765625, -0.1982421875, 0.254150390625, 0.70654296875, 1.158935546875, 1.611328125, 2.063720703125, 2.51611328125, 2.968505859375, 3.4208984375, 3.873291015625, 4.32568359375, 4.778076171875, 5.23046875, 5.682861328125, 6.13525390625, 6.587646484375, 7.0400390625, 7.492431640625, 7.94482421875, 8.397216796875, 8.849609375, 9.302001953125, 9.75439453125, 10.206787109375, 10.6591796875, 11.111572265625, 11.56396484375, 12.016357421875, 12.46875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 9.0, 9.0, 16.0, 23.0, 32.0, 43.0, 64.0, 69.0, 106.0, 158.0, 220.0, 336.0, 401.0, 636.0, 868.0, 1219.0, 1773.0, 2450.0, 3421.0, 4995.0, 7503.0, 10808.0, 16294.0, 25545.0, 40969.0, 68014.0, 115877.0, 190097.0, 208026.0, 135451.0, 79268.0, 47248.0, 28878.0, 18615.0, 12172.0, 8079.0, 5680.0, 3843.0, 2708.0, 1916.0, 1384.0, 975.0, 712.0, 462.0, 340.0, 242.0, 152.0, 115.0, 92.0, 74.0, 67.0, 31.0, 35.0, 18.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0], "bins": [-1.1904296875, -1.1522064208984375, -1.113983154296875, -1.0757598876953125, -1.03753662109375, -0.9993133544921875, -0.961090087890625, -0.9228668212890625, -0.8846435546875, -0.8464202880859375, -0.808197021484375, -0.7699737548828125, -0.73175048828125, -0.6935272216796875, -0.655303955078125, -0.6170806884765625, -0.578857421875, -0.5406341552734375, -0.502410888671875, -0.4641876220703125, -0.42596435546875, -0.3877410888671875, -0.349517822265625, -0.3112945556640625, -0.2730712890625, -0.2348480224609375, -0.196624755859375, -0.1584014892578125, -0.12017822265625, -0.0819549560546875, -0.043731689453125, -0.0055084228515625, 0.03271484375, 0.0709381103515625, 0.109161376953125, 0.1473846435546875, 0.18560791015625, 0.2238311767578125, 0.262054443359375, 0.3002777099609375, 0.3385009765625, 0.3767242431640625, 0.414947509765625, 0.4531707763671875, 0.49139404296875, 0.5296173095703125, 0.567840576171875, 0.6060638427734375, 0.644287109375, 0.6825103759765625, 0.720733642578125, 0.7589569091796875, 0.79718017578125, 0.8354034423828125, 0.873626708984375, 0.9118499755859375, 0.9500732421875, 0.9882965087890625, 1.026519775390625, 1.0647430419921875, 1.10296630859375, 1.1411895751953125, 1.179412841796875, 1.2176361083984375, 1.255859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 9.0, 15.0, 16.0, 16.0, 18.0, 25.0, 30.0, 19.0, 30.0, 20.0, 40.0, 29.0, 41.0, 44.0, 38.0, 35.0, 36.0, 1067.0, 32.0, 40.0, 38.0, 32.0, 35.0, 27.0, 28.0, 27.0, 31.0, 29.0, 26.0, 24.0, 18.0, 14.0, 20.0, 13.0, 6.0, 5.0, 8.0, 7.0, 4.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.61505126953125, -7.3355712890625, -7.05609130859375, -6.776611328125, -6.49713134765625, -6.2176513671875, -5.93817138671875, -5.65869140625, -5.37921142578125, -5.0997314453125, -4.82025146484375, -4.540771484375, -4.26129150390625, -3.9818115234375, -3.70233154296875, -3.4228515625, -3.14337158203125, -2.8638916015625, -2.58441162109375, -2.304931640625, -2.02545166015625, -1.7459716796875, -1.46649169921875, -1.18701171875, -0.90753173828125, -0.6280517578125, -0.34857177734375, -0.069091796875, 0.21038818359375, 0.4898681640625, 0.76934814453125, 1.048828125, 1.32830810546875, 1.6077880859375, 1.88726806640625, 2.166748046875, 2.44622802734375, 2.7257080078125, 3.00518798828125, 3.28466796875, 3.56414794921875, 3.8436279296875, 4.12310791015625, 4.402587890625, 4.68206787109375, 4.9615478515625, 5.24102783203125, 5.5205078125, 5.79998779296875, 6.0794677734375, 6.35894775390625, 6.638427734375, 6.91790771484375, 7.1973876953125, 7.47686767578125, 7.75634765625, 8.03582763671875, 8.3153076171875, 8.59478759765625, 8.874267578125, 9.15374755859375, 9.4332275390625, 9.71270751953125, 9.9921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 9.0, 12.0, 29.0, 43.0, 85.0, 86.0, 176.0, 237.0, 347.0, 554.0, 869.0, 1271.0, 1965.0, 2933.0, 4677.0, 7070.0, 11015.0, 17273.0, 27320.0, 44258.0, 75096.0, 128919.0, 991983.0, 463480.0, 125859.0, 73787.0, 43609.0, 26605.0, 16813.0, 10748.0, 6813.0, 4598.0, 3052.0, 1876.0, 1256.0, 806.0, 603.0, 323.0, 219.0, 158.0, 101.0, 59.0, 44.0, 31.0, 26.0, 7.0, 12.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-1.029296875, -0.9998703002929688, -0.9704437255859375, -0.9410171508789062, -0.911590576171875, -0.8821640014648438, -0.8527374267578125, -0.8233108520507812, -0.79388427734375, -0.7644577026367188, -0.7350311279296875, -0.7056045532226562, -0.676177978515625, -0.6467514038085938, -0.6173248291015625, -0.5878982543945312, -0.5584716796875, -0.5290451049804688, -0.4996185302734375, -0.47019195556640625, -0.440765380859375, -0.41133880615234375, -0.3819122314453125, -0.35248565673828125, -0.32305908203125, -0.29363250732421875, -0.2642059326171875, -0.23477935791015625, -0.205352783203125, -0.17592620849609375, -0.1464996337890625, -0.11707305908203125, -0.087646484375, -0.05821990966796875, -0.0287933349609375, 0.00063323974609375, 0.030059814453125, 0.05948638916015625, 0.0889129638671875, 0.11833953857421875, 0.14776611328125, 0.17719268798828125, 0.2066192626953125, 0.23604583740234375, 0.265472412109375, 0.29489898681640625, 0.3243255615234375, 0.35375213623046875, 0.3831787109375, 0.41260528564453125, 0.4420318603515625, 0.47145843505859375, 0.500885009765625, 0.5303115844726562, 0.5597381591796875, 0.5891647338867188, 0.61859130859375, 0.6480178833007812, 0.6774444580078125, 0.7068710327148438, 0.736297607421875, 0.7657241821289062, 0.7951507568359375, 0.8245773315429688, 0.85400390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 4.0, 10.0, 8.0, 9.0, 17.0, 16.0, 19.0, 29.0, 53.0, 67.0, 94.0, 121.0, 128.0, 99.0, 82.0, 65.0, 38.0, 33.0, 19.0, 13.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031494140625, -0.03055095672607422, -0.029607772827148438, -0.028664588928222656, -0.027721405029296875, -0.026778221130371094, -0.025835037231445312, -0.02489185333251953, -0.02394866943359375, -0.02300548553466797, -0.022062301635742188, -0.021119117736816406, -0.020175933837890625, -0.019232749938964844, -0.018289566040039062, -0.01734638214111328, -0.0164031982421875, -0.015460014343261719, -0.014516830444335938, -0.013573646545410156, -0.012630462646484375, -0.011687278747558594, -0.010744094848632812, -0.009800910949707031, -0.00885772705078125, -0.007914543151855469, -0.0069713592529296875, -0.006028175354003906, -0.005084991455078125, -0.004141807556152344, -0.0031986236572265625, -0.0022554397583007812, -0.001312255859375, -0.00036907196044921875, 0.0005741119384765625, 0.0015172958374023438, 0.002460479736328125, 0.0034036636352539062, 0.0043468475341796875, 0.005290031433105469, 0.00623321533203125, 0.007176399230957031, 0.008119583129882812, 0.009062767028808594, 0.010005950927734375, 0.010949134826660156, 0.011892318725585938, 0.012835502624511719, 0.0137786865234375, 0.014721870422363281, 0.015665054321289062, 0.016608238220214844, 0.017551422119140625, 0.018494606018066406, 0.019437789916992188, 0.02038097381591797, 0.02132415771484375, 0.02226734161376953, 0.023210525512695312, 0.024153709411621094, 0.025096893310546875, 0.026040077209472656, 0.026983261108398438, 0.02792644500732422, 0.02886962890625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 5.0, 5.0, 7.0, 8.0, 5.0, 11.0, 8.0, 11.0, 13.0, 21.0, 27.0, 40.0, 65.0, 120.0, 178.0, 361.0, 1271.0, 187414.0, 855840.0, 2070.0, 431.0, 218.0, 104.0, 63.0, 51.0, 48.0, 33.0, 21.0, 14.0, 17.0, 13.0, 8.0, 7.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.591796875, -0.5727615356445312, -0.5537261962890625, -0.5346908569335938, -0.515655517578125, -0.49662017822265625, -0.4775848388671875, -0.45854949951171875, -0.43951416015625, -0.42047882080078125, -0.4014434814453125, -0.38240814208984375, -0.363372802734375, -0.34433746337890625, -0.3253021240234375, -0.30626678466796875, -0.2872314453125, -0.26819610595703125, -0.2491607666015625, -0.23012542724609375, -0.211090087890625, -0.19205474853515625, -0.1730194091796875, -0.15398406982421875, -0.13494873046875, -0.11591339111328125, -0.0968780517578125, -0.07784271240234375, -0.058807373046875, -0.03977203369140625, -0.0207366943359375, -0.00170135498046875, 0.017333984375, 0.03636932373046875, 0.0554046630859375, 0.07444000244140625, 0.093475341796875, 0.11251068115234375, 0.1315460205078125, 0.15058135986328125, 0.16961669921875, 0.18865203857421875, 0.2076873779296875, 0.22672271728515625, 0.245758056640625, 0.26479339599609375, 0.2838287353515625, 0.30286407470703125, 0.3218994140625, 0.34093475341796875, 0.3599700927734375, 0.37900543212890625, 0.398040771484375, 0.41707611083984375, 0.4361114501953125, 0.45514678955078125, 0.47418212890625, 0.49321746826171875, 0.5122528076171875, 0.5312881469726562, 0.550323486328125, 0.5693588256835938, 0.5883941650390625, 0.6074295043945312, 0.62646484375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 18.0, 88.0, 633.0, 237.0, 29.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15334580838680267, -0.14595602452754974, -0.138566255569458, -0.13117647171020508, -0.12378668785095215, -0.11639690399169922, -0.10900712758302689, -0.10161735117435455, -0.09422756731510162, -0.0868377834558487, -0.07944800704717636, -0.07205823063850403, -0.0646684467792511, -0.05727866664528847, -0.049888886511325836, -0.042499106377363205, -0.035109326243400574, -0.027719546109437943, -0.02032976597547531, -0.01293998584151268, -0.005550205707550049, 0.0018395744264125824, 0.009229354560375214, 0.016619134694337845, 0.024008914828300476, 0.03139869496226311, 0.03878847509622574, 0.04617825523018837, 0.053568035364151, 0.06095781549811363, 0.06834759563207626, 0.0757373720407486, 0.08312717080116272, 0.09051695466041565, 0.09790673106908798, 0.10529650747776031, 0.11268629133701324, 0.12007607519626617, 0.1274658441543579, 0.13485562801361084, 0.14224541187286377, 0.1496351957321167, 0.15702497959136963, 0.16441474854946136, 0.1718045324087143, 0.17919431626796722, 0.18658408522605896, 0.1939738690853119, 0.20136365294456482, 0.20875343680381775, 0.21614322066307068, 0.22353298962116241, 0.23092277348041534, 0.23831255733966827, 0.24570232629776, 0.25309211015701294, 0.26048189401626587, 0.2678716778755188, 0.27526146173477173, 0.28265124559402466, 0.2900410294532776, 0.29743078351020813, 0.30482056736946106, 0.312210351228714, 0.3196001350879669]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 5.0, 11.0, 5.0, 9.0, 11.0, 15.0, 20.0, 14.0, 17.0, 23.0, 25.0, 32.0, 30.0, 37.0, 40.0, 47.0, 53.0, 50.0, 32.0, 50.0, 36.0, 35.0, 45.0, 44.0, 38.0, 31.0, 28.0, 32.0, 34.0, 30.0, 19.0, 15.0, 15.0, 19.0, 13.0, 9.0, 4.0, 11.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.03445249795913696, -0.033480700105428696, -0.03250890225172043, -0.03153710812330246, -0.030565310269594193, -0.029593512415885925, -0.028621716424822807, -0.02764992043375969, -0.026678122580051422, -0.025706324726343155, -0.024734528735280037, -0.02376273274421692, -0.02279093489050865, -0.021819137036800385, -0.020847341045737267, -0.01987554505467415, -0.01890374720096588, -0.017931949347257614, -0.016960153356194496, -0.015988357365131378, -0.015016559511423111, -0.014044762589037418, -0.013072965666651726, -0.012101168744266033, -0.01112937182188034, -0.010157574899494648, -0.009185777977108955, -0.008213981054723263, -0.00724218413233757, -0.006270387209951878, -0.005298590287566185, -0.004326793365180492, -0.0033549964427948, -0.002383199520409107, -0.0014114025980234146, -0.000439605675637722, 0.0005321912467479706, 0.0015039881691336632, 0.0024757850915193558, 0.0034475820139050484, 0.004419378936290741, 0.0053911758586764336, 0.006362972781062126, 0.007334769703447819, 0.008306566625833511, 0.009278363548219204, 0.010250160470604897, 0.01122195739299059, 0.012193754315376282, 0.013165551237761974, 0.014137348160147667, 0.01510914508253336, 0.016080942004919052, 0.01705273985862732, 0.018024535849690437, 0.018996331840753555, 0.019968129694461823, 0.02093992754817009, 0.021911723539233208, 0.022883519530296326, 0.023855317384004593, 0.02482711523771286, 0.025798911228775978, 0.026770707219839096, 0.027742505073547363]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 13.0, 7.0, 11.0, 16.0, 12.0, 21.0, 25.0, 28.0, 35.0, 25.0, 29.0, 28.0, 46.0, 47.0, 54.0, 33.0, 40.0, 43.0, 34.0, 42.0, 41.0, 46.0, 30.0, 27.0, 29.0, 36.0, 27.0, 14.0, 20.0, 18.0, 16.0, 22.0, 12.0, 13.0, 7.0, 11.0, 6.0, 5.0, 7.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0], "bins": [-16.46875, -16.0166015625, -15.564453125, -15.1123046875, -14.66015625, -14.2080078125, -13.755859375, -13.3037109375, -12.8515625, -12.3994140625, -11.947265625, -11.4951171875, -11.04296875, -10.5908203125, -10.138671875, -9.6865234375, -9.234375, -8.7822265625, -8.330078125, -7.8779296875, -7.42578125, -6.9736328125, -6.521484375, -6.0693359375, -5.6171875, -5.1650390625, -4.712890625, -4.2607421875, -3.80859375, -3.3564453125, -2.904296875, -2.4521484375, -2.0, -1.5478515625, -1.095703125, -0.6435546875, -0.19140625, 0.2607421875, 0.712890625, 1.1650390625, 1.6171875, 2.0693359375, 2.521484375, 2.9736328125, 3.42578125, 3.8779296875, 4.330078125, 4.7822265625, 5.234375, 5.6865234375, 6.138671875, 6.5908203125, 7.04296875, 7.4951171875, 7.947265625, 8.3994140625, 8.8515625, 9.3037109375, 9.755859375, 10.2080078125, 10.66015625, 11.1123046875, 11.564453125, 12.0166015625, 12.46875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 4.0, 13.0, 17.0, 23.0, 19.0, 39.0, 44.0, 70.0, 106.0, 162.0, 163.0, 290.0, 403.0, 596.0, 922.0, 1416.0, 2101.0, 3629.0, 6746.0, 16619.0, 97672.0, 787589.0, 96610.0, 16574.0, 6632.0, 3565.0, 2215.0, 1434.0, 919.0, 602.0, 418.0, 264.0, 198.0, 136.0, 101.0, 66.0, 38.0, 33.0, 22.0, 29.0, 15.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.47998046875, -33.1787109375, -31.87744140625, -30.576171875, -29.27490234375, -27.9736328125, -26.67236328125, -25.37109375, -24.06982421875, -22.7685546875, -21.46728515625, -20.166015625, -18.86474609375, -17.5634765625, -16.26220703125, -14.9609375, -13.65966796875, -12.3583984375, -11.05712890625, -9.755859375, -8.45458984375, -7.1533203125, -5.85205078125, -4.55078125, -3.24951171875, -1.9482421875, -0.64697265625, 0.654296875, 1.95556640625, 3.2568359375, 4.55810546875, 5.859375, 7.16064453125, 8.4619140625, 9.76318359375, 11.064453125, 12.36572265625, 13.6669921875, 14.96826171875, 16.26953125, 17.57080078125, 18.8720703125, 20.17333984375, 21.474609375, 22.77587890625, 24.0771484375, 25.37841796875, 26.6796875, 27.98095703125, 29.2822265625, 30.58349609375, 31.884765625, 33.18603515625, 34.4873046875, 35.78857421875, 37.08984375, 38.39111328125, 39.6923828125, 40.99365234375, 42.294921875, 43.59619140625, 44.8974609375, 46.19873046875, 47.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 10.0, 5.0, 19.0, 14.0, 19.0, 19.0, 29.0, 29.0, 34.0, 42.0, 54.0, 61.0, 63.0, 98.0, 142.0, 367.0, 1395.0, 132.0, 81.0, 59.0, 72.0, 46.0, 43.0, 40.0, 30.0, 17.0, 22.0, 22.0, 11.0, 11.0, 5.0, 8.0, 1.0, 5.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.303955078125, -29.32666015625, -28.349365234375, -27.3720703125, -26.394775390625, -25.41748046875, -24.440185546875, -23.462890625, -22.485595703125, -21.50830078125, -20.531005859375, -19.5537109375, -18.576416015625, -17.59912109375, -16.621826171875, -15.64453125, -14.667236328125, -13.68994140625, -12.712646484375, -11.7353515625, -10.758056640625, -9.78076171875, -8.803466796875, -7.826171875, -6.848876953125, -5.87158203125, -4.894287109375, -3.9169921875, -2.939697265625, -1.96240234375, -0.985107421875, -0.0078125, 0.969482421875, 1.94677734375, 2.924072265625, 3.9013671875, 4.878662109375, 5.85595703125, 6.833251953125, 7.810546875, 8.787841796875, 9.76513671875, 10.742431640625, 11.7197265625, 12.697021484375, 13.67431640625, 14.651611328125, 15.62890625, 16.606201171875, 17.58349609375, 18.560791015625, 19.5380859375, 20.515380859375, 21.49267578125, 22.469970703125, 23.447265625, 24.424560546875, 25.40185546875, 26.379150390625, 27.3564453125, 28.333740234375, 29.31103515625, 30.288330078125, 31.265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 1.0, 2.0, 14.0, 5.0, 13.0, 20.0, 35.0, 58.0, 55.0, 90.0, 137.0, 300.0, 739.0, 3143.0, 3055820.0, 82441.0, 1569.0, 564.0, 261.0, 138.0, 85.0, 53.0, 44.0, 25.0, 21.0, 16.0, 9.0, 8.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.75, -128.943359375, -124.13671875, -119.330078125, -114.5234375, -109.716796875, -104.91015625, -100.103515625, -95.296875, -90.490234375, -85.68359375, -80.876953125, -76.0703125, -71.263671875, -66.45703125, -61.650390625, -56.84375, -52.037109375, -47.23046875, -42.423828125, -37.6171875, -32.810546875, -28.00390625, -23.197265625, -18.390625, -13.583984375, -8.77734375, -3.970703125, 0.8359375, 5.642578125, 10.44921875, 15.255859375, 20.0625, 24.869140625, 29.67578125, 34.482421875, 39.2890625, 44.095703125, 48.90234375, 53.708984375, 58.515625, 63.322265625, 68.12890625, 72.935546875, 77.7421875, 82.548828125, 87.35546875, 92.162109375, 96.96875, 101.775390625, 106.58203125, 111.388671875, 116.1953125, 121.001953125, 125.80859375, 130.615234375, 135.421875, 140.228515625, 145.03515625, 149.841796875, 154.6484375, 159.455078125, 164.26171875, 169.068359375, 173.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 21.0, 32.0, 70.0, 208.0, 307.0, 224.0, 83.0, 37.0, 15.0, 4.0, 7.0], "bins": [-392.7497253417969, -385.93365478515625, -379.11761474609375, -372.3015441894531, -365.4854736328125, -358.66943359375, -351.8533630371094, -345.03729248046875, -338.22125244140625, -331.4051818847656, -324.5891418457031, -317.7730712890625, -310.9570007324219, -304.1409606933594, -297.32489013671875, -290.50885009765625, -283.6927795410156, -276.876708984375, -270.0606689453125, -263.2445983886719, -256.42852783203125, -249.61248779296875, -242.79641723632812, -235.98036193847656, -229.16429138183594, -222.34823608398438, -215.53216552734375, -208.7161102294922, -201.90005493164062, -195.083984375, -188.26792907714844, -181.45187377929688, -174.63580322265625, -167.8197479248047, -161.00367736816406, -154.1876220703125, -147.37156677246094, -140.55551147460938, -133.73944091796875, -126.92338562011719, -120.10733032226562, -113.29126739501953, -106.47521209716797, -99.65914916992188, -92.84309387207031, -86.02703094482422, -79.21096801757812, -72.39491271972656, -65.578857421875, -58.76279830932617, -51.946739196777344, -45.13067626953125, -38.31462097167969, -31.498558044433594, -24.682498931884766, -17.866439819335938, -11.050376892089844, -4.234317302703857, 2.581742286682129, 9.397802352905273, 16.2138614654541, 23.029922485351562, 29.84598159790039, 36.66204071044922, 43.47809982299805]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 11.0, 20.0, 17.0, 16.0, 13.0, 19.0, 24.0, 30.0, 29.0, 39.0, 32.0, 39.0, 43.0, 32.0, 46.0, 41.0, 42.0, 38.0, 49.0, 38.0, 43.0, 45.0, 37.0, 26.0, 31.0, 25.0, 17.0, 17.0, 25.0, 17.0, 11.0, 9.0, 10.0, 11.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.37979888916016, -83.68284606933594, -80.98590087890625, -78.28894805908203, -75.59200286865234, -72.89505004882812, -70.19810485839844, -67.50115203857422, -64.80419921875, -62.10725021362305, -59.410301208496094, -56.713348388671875, -54.01640319824219, -51.31945037841797, -48.622501373291016, -45.92555236816406, -43.228607177734375, -40.53165817260742, -37.83470916748047, -35.13775634765625, -32.44081115722656, -29.743860244750977, -27.04690933227539, -24.349960327148438, -21.653011322021484, -18.95606231689453, -16.259113311767578, -13.562162399291992, -10.865213394165039, -8.168264389038086, -5.4713134765625, -2.774364471435547, -0.077423095703125, 2.6195263862609863, 5.316475868225098, 8.013425827026367, 10.71037483215332, 13.407323837280273, 16.10427474975586, 18.801223754882812, 21.498172760009766, 24.19512176513672, 26.892070770263672, 29.589021682739258, 32.285972595214844, 34.98291778564453, 37.67987060546875, 40.3768196105957, 43.073768615722656, 45.77071762084961, 48.46766662597656, 51.16461944580078, 53.86156463623047, 56.55851745605469, 59.25546646118164, 61.952415466308594, 64.64936828613281, 67.34632110595703, 70.04326629638672, 72.74021911621094, 75.43716430664062, 78.13411712646484, 80.83106994628906, 83.52801513671875, 86.22496032714844]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 11.0, 15.0, 26.0, 19.0, 13.0, 22.0, 25.0, 29.0, 35.0, 43.0, 33.0, 31.0, 39.0, 42.0, 44.0, 35.0, 55.0, 37.0, 47.0, 51.0, 32.0, 33.0, 31.0, 30.0, 24.0, 28.0, 26.0, 27.0, 24.0, 19.0, 17.0, 5.0, 6.0, 8.0, 4.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.5501708984375, -15.053466796875, -14.5567626953125, -14.06005859375, -13.5633544921875, -13.066650390625, -12.5699462890625, -12.0732421875, -11.5765380859375, -11.079833984375, -10.5831298828125, -10.08642578125, -9.5897216796875, -9.093017578125, -8.5963134765625, -8.099609375, -7.6029052734375, -7.106201171875, -6.6094970703125, -6.11279296875, -5.6160888671875, -5.119384765625, -4.6226806640625, -4.1259765625, -3.6292724609375, -3.132568359375, -2.6358642578125, -2.13916015625, -1.6424560546875, -1.145751953125, -0.6490478515625, -0.15234375, 0.3443603515625, 0.841064453125, 1.3377685546875, 1.83447265625, 2.3311767578125, 2.827880859375, 3.3245849609375, 3.8212890625, 4.3179931640625, 4.814697265625, 5.3114013671875, 5.80810546875, 6.3048095703125, 6.801513671875, 7.2982177734375, 7.794921875, 8.2916259765625, 8.788330078125, 9.2850341796875, 9.78173828125, 10.2784423828125, 10.775146484375, 11.2718505859375, 11.7685546875, 12.2652587890625, 12.761962890625, 13.2586669921875, 13.75537109375, 14.2520751953125, 14.748779296875, 15.2454833984375, 15.7421875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 10.0, 8.0, 18.0, 20.0, 15.0, 33.0, 38.0, 31.0, 60.0, 64.0, 97.0, 113.0, 153.0, 192.0, 290.0, 424.0, 725.0, 1456.0, 4214.0, 35970.0, 3367529.0, 765848.0, 11419.0, 2571.0, 1054.0, 583.0, 354.0, 240.0, 178.0, 133.0, 92.0, 88.0, 43.0, 46.0, 36.0, 30.0, 30.0, 5.0, 13.0, 14.0, 6.0, 10.0, 6.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-73.625, -71.380859375, -69.13671875, -66.892578125, -64.6484375, -62.404296875, -60.16015625, -57.916015625, -55.671875, -53.427734375, -51.18359375, -48.939453125, -46.6953125, -44.451171875, -42.20703125, -39.962890625, -37.71875, -35.474609375, -33.23046875, -30.986328125, -28.7421875, -26.498046875, -24.25390625, -22.009765625, -19.765625, -17.521484375, -15.27734375, -13.033203125, -10.7890625, -8.544921875, -6.30078125, -4.056640625, -1.8125, 0.431640625, 2.67578125, 4.919921875, 7.1640625, 9.408203125, 11.65234375, 13.896484375, 16.140625, 18.384765625, 20.62890625, 22.873046875, 25.1171875, 27.361328125, 29.60546875, 31.849609375, 34.09375, 36.337890625, 38.58203125, 40.826171875, 43.0703125, 45.314453125, 47.55859375, 49.802734375, 52.046875, 54.291015625, 56.53515625, 58.779296875, 61.0234375, 63.267578125, 65.51171875, 67.755859375, 70.0]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 13.0, 24.0, 34.0, 66.0, 101.0, 182.0, 302.0, 579.0, 1024.0, 740.0, 417.0, 222.0, 122.0, 78.0, 51.0, 32.0, 23.0, 13.0, 9.0, 3.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.54638671875, -39.3427734375, -38.13916015625, -36.935546875, -35.73193359375, -34.5283203125, -33.32470703125, -32.12109375, -30.91748046875, -29.7138671875, -28.51025390625, -27.306640625, -26.10302734375, -24.8994140625, -23.69580078125, -22.4921875, -21.28857421875, -20.0849609375, -18.88134765625, -17.677734375, -16.47412109375, -15.2705078125, -14.06689453125, -12.86328125, -11.65966796875, -10.4560546875, -9.25244140625, -8.048828125, -6.84521484375, -5.6416015625, -4.43798828125, -3.234375, -2.03076171875, -0.8271484375, 0.37646484375, 1.580078125, 2.78369140625, 3.9873046875, 5.19091796875, 6.39453125, 7.59814453125, 8.8017578125, 10.00537109375, 11.208984375, 12.41259765625, 13.6162109375, 14.81982421875, 16.0234375, 17.22705078125, 18.4306640625, 19.63427734375, 20.837890625, 22.04150390625, 23.2451171875, 24.44873046875, 25.65234375, 26.85595703125, 28.0595703125, 29.26318359375, 30.466796875, 31.67041015625, 32.8740234375, 34.07763671875, 35.28125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 8.0, 14.0, 21.0, 45.0, 69.0, 100.0, 224.0, 544.0, 1699.0, 8714.0, 174263.0, 3954268.0, 47831.0, 4588.0, 1149.0, 368.0, 164.0, 77.0, 51.0, 26.0, 13.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5, -80.6533203125, -77.806640625, -74.9599609375, -72.11328125, -69.2666015625, -66.419921875, -63.5732421875, -60.7265625, -57.8798828125, -55.033203125, -52.1865234375, -49.33984375, -46.4931640625, -43.646484375, -40.7998046875, -37.953125, -35.1064453125, -32.259765625, -29.4130859375, -26.56640625, -23.7197265625, -20.873046875, -18.0263671875, -15.1796875, -12.3330078125, -9.486328125, -6.6396484375, -3.79296875, -0.9462890625, 1.900390625, 4.7470703125, 7.59375, 10.4404296875, 13.287109375, 16.1337890625, 18.98046875, 21.8271484375, 24.673828125, 27.5205078125, 30.3671875, 33.2138671875, 36.060546875, 38.9072265625, 41.75390625, 44.6005859375, 47.447265625, 50.2939453125, 53.140625, 55.9873046875, 58.833984375, 61.6806640625, 64.52734375, 67.3740234375, 70.220703125, 73.0673828125, 75.9140625, 78.7607421875, 81.607421875, 84.4541015625, 87.30078125, 90.1474609375, 92.994140625, 95.8408203125, 98.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 11.0, 266.0, 696.0, 35.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1320.40576171875, -1294.0941162109375, -1267.7823486328125, -1241.470703125, -1215.158935546875, -1188.8472900390625, -1162.5355224609375, -1136.223876953125, -1109.912109375, -1083.6004638671875, -1057.2886962890625, -1030.97705078125, -1004.665283203125, -978.3535766601562, -952.0418701171875, -925.7301635742188, -899.41845703125, -873.1067504882812, -846.7950439453125, -820.4833374023438, -794.171630859375, -767.8599243164062, -741.5482177734375, -715.2365112304688, -688.9248657226562, -662.6131591796875, -636.3014526367188, -609.98974609375, -583.6780395507812, -557.3663330078125, -531.0546264648438, -504.742919921875, -478.4312438964844, -452.1195373535156, -425.8078308105469, -399.4961242675781, -373.1844177246094, -346.87274169921875, -320.56103515625, -294.24932861328125, -267.9376220703125, -241.62591552734375, -215.314208984375, -189.00250244140625, -162.6907958984375, -136.3791046142578, -110.06739807128906, -83.75569152832031, -57.4439697265625, -31.132265090942383, -4.820560455322266, 21.49114227294922, 47.80284881591797, 74.11454772949219, 100.42625427246094, 126.73796081542969, 153.04966735839844, 179.3613739013672, 205.67308044433594, 231.98477172851562, 258.2964782714844, 284.6081848144531, 310.9198913574219, 337.2315979003906, 363.5433044433594]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 8.0, 8.0, 15.0, 16.0, 12.0, 29.0, 23.0, 24.0, 27.0, 25.0, 32.0, 40.0, 33.0, 43.0, 37.0, 44.0, 36.0, 41.0, 39.0, 48.0, 37.0, 49.0, 32.0, 43.0, 28.0, 21.0, 29.0, 26.0, 26.0, 13.0, 18.0, 16.0, 18.0, 11.0, 10.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-85.37924194335938, -82.60194396972656, -79.82464599609375, -77.04734802246094, -74.27005004882812, -71.49275207519531, -68.7154541015625, -65.93815612792969, -63.160858154296875, -60.38356018066406, -57.60626220703125, -54.82896423339844, -52.051666259765625, -49.27436828613281, -46.4970703125, -43.71977233886719, -40.942474365234375, -38.16517639160156, -35.38787841796875, -32.61058044433594, -29.833282470703125, -27.055984497070312, -24.2786865234375, -21.501388549804688, -18.724090576171875, -15.946792602539062, -13.16949462890625, -10.392196655273438, -7.614898681640625, -4.8376007080078125, -2.060302734375, 0.7169952392578125, 3.4942855834960938, 6.271583557128906, 9.048881530761719, 11.826179504394531, 14.603477478027344, 17.380775451660156, 20.15807342529297, 22.93537139892578, 25.712669372558594, 28.489967346191406, 31.26726531982422, 34.04456329345703, 36.821861267089844, 39.599159240722656, 42.37645721435547, 45.15375518798828, 47.931053161621094, 50.708351135253906, 53.48564910888672, 56.26294708251953, 59.040245056152344, 61.817543029785156, 64.59484100341797, 67.37213897705078, 70.1494369506836, 72.9267349243164, 75.70403289794922, 78.48133087158203, 81.25862884521484, 84.03592681884766, 86.81322479248047, 89.59052276611328, 92.3678207397461]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 7.0, 10.0, 6.0, 11.0, 12.0, 14.0, 12.0, 20.0, 18.0, 21.0, 22.0, 14.0, 21.0, 39.0, 38.0, 37.0, 29.0, 36.0, 39.0, 36.0, 46.0, 39.0, 33.0, 22.0, 36.0, 35.0, 30.0, 22.0, 30.0, 35.0, 31.0, 16.0, 24.0, 24.0, 15.0, 17.0, 19.0, 8.0, 10.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.5, -11.15380859375, -10.8076171875, -10.46142578125, -10.115234375, -9.76904296875, -9.4228515625, -9.07666015625, -8.73046875, -8.38427734375, -8.0380859375, -7.69189453125, -7.345703125, -6.99951171875, -6.6533203125, -6.30712890625, -5.9609375, -5.61474609375, -5.2685546875, -4.92236328125, -4.576171875, -4.22998046875, -3.8837890625, -3.53759765625, -3.19140625, -2.84521484375, -2.4990234375, -2.15283203125, -1.806640625, -1.46044921875, -1.1142578125, -0.76806640625, -0.421875, -0.07568359375, 0.2705078125, 0.61669921875, 0.962890625, 1.30908203125, 1.6552734375, 2.00146484375, 2.34765625, 2.69384765625, 3.0400390625, 3.38623046875, 3.732421875, 4.07861328125, 4.4248046875, 4.77099609375, 5.1171875, 5.46337890625, 5.8095703125, 6.15576171875, 6.501953125, 6.84814453125, 7.1943359375, 7.54052734375, 7.88671875, 8.23291015625, 8.5791015625, 8.92529296875, 9.271484375, 9.61767578125, 9.9638671875, 10.31005859375, 10.65625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 5.0, 17.0, 19.0, 33.0, 37.0, 64.0, 59.0, 118.0, 162.0, 236.0, 345.0, 575.0, 768.0, 1061.0, 1571.0, 2426.0, 3478.0, 5184.0, 7708.0, 11616.0, 17659.0, 27557.0, 43728.0, 72365.0, 123112.0, 199415.0, 201466.0, 126433.0, 74051.0, 44815.0, 27941.0, 18318.0, 11786.0, 7727.0, 5460.0, 3555.0, 2446.0, 1709.0, 1075.0, 745.0, 520.0, 388.0, 227.0, 192.0, 139.0, 85.0, 54.0, 35.0, 21.0, 15.0, 13.0, 9.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9560546875, -0.9262008666992188, -0.8963470458984375, -0.8664932250976562, -0.836639404296875, -0.8067855834960938, -0.7769317626953125, -0.7470779418945312, -0.71722412109375, -0.6873703002929688, -0.6575164794921875, -0.6276626586914062, -0.597808837890625, -0.5679550170898438, -0.5381011962890625, -0.5082473754882812, -0.4783935546875, -0.44853973388671875, -0.4186859130859375, -0.38883209228515625, -0.358978271484375, -0.32912445068359375, -0.2992706298828125, -0.26941680908203125, -0.23956298828125, -0.20970916748046875, -0.1798553466796875, -0.15000152587890625, -0.120147705078125, -0.09029388427734375, -0.0604400634765625, -0.03058624267578125, -0.000732421875, 0.02912139892578125, 0.0589752197265625, 0.08882904052734375, 0.118682861328125, 0.14853668212890625, 0.1783905029296875, 0.20824432373046875, 0.23809814453125, 0.26795196533203125, 0.2978057861328125, 0.32765960693359375, 0.357513427734375, 0.38736724853515625, 0.4172210693359375, 0.44707489013671875, 0.4769287109375, 0.5067825317382812, 0.5366363525390625, 0.5664901733398438, 0.596343994140625, 0.6261978149414062, 0.6560516357421875, 0.6859054565429688, 0.71575927734375, 0.7456130981445312, 0.7754669189453125, 0.8053207397460938, 0.835174560546875, 0.8650283813476562, 0.8948822021484375, 0.9247360229492188, 0.95458984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 5.0, 6.0, 17.0, 12.0, 12.0, 17.0, 15.0, 30.0, 30.0, 37.0, 34.0, 35.0, 24.0, 26.0, 49.0, 37.0, 50.0, 40.0, 1063.0, 42.0, 50.0, 40.0, 20.0, 35.0, 36.0, 30.0, 23.0, 22.0, 29.0, 20.0, 18.0, 20.0, 17.0, 13.0, 10.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.07720947265625, -7.8262939453125, -7.57537841796875, -7.324462890625, -7.07354736328125, -6.8226318359375, -6.57171630859375, -6.32080078125, -6.06988525390625, -5.8189697265625, -5.56805419921875, -5.317138671875, -5.06622314453125, -4.8153076171875, -4.56439208984375, -4.3134765625, -4.06256103515625, -3.8116455078125, -3.56072998046875, -3.309814453125, -3.05889892578125, -2.8079833984375, -2.55706787109375, -2.30615234375, -2.05523681640625, -1.8043212890625, -1.55340576171875, -1.302490234375, -1.05157470703125, -0.8006591796875, -0.54974365234375, -0.298828125, -0.04791259765625, 0.2030029296875, 0.45391845703125, 0.704833984375, 0.95574951171875, 1.2066650390625, 1.45758056640625, 1.70849609375, 1.95941162109375, 2.2103271484375, 2.46124267578125, 2.712158203125, 2.96307373046875, 3.2139892578125, 3.46490478515625, 3.7158203125, 3.96673583984375, 4.2176513671875, 4.46856689453125, 4.719482421875, 4.97039794921875, 5.2213134765625, 5.47222900390625, 5.72314453125, 5.97406005859375, 6.2249755859375, 6.47589111328125, 6.726806640625, 6.97772216796875, 7.2286376953125, 7.47955322265625, 7.73046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 17.0, 24.0, 38.0, 53.0, 86.0, 160.0, 204.0, 325.0, 407.0, 739.0, 1075.0, 1566.0, 2420.0, 3554.0, 5319.0, 8284.0, 12411.0, 18667.0, 29423.0, 47370.0, 80212.0, 137386.0, 1251425.0, 200020.0, 114381.0, 66735.0, 41130.0, 25567.0, 16204.0, 10771.0, 7063.0, 4578.0, 3190.0, 2105.0, 1461.0, 925.0, 615.0, 447.0, 276.0, 158.0, 119.0, 76.0, 44.0, 37.0, 18.0, 11.0, 8.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.714813232421875, -0.69085693359375, -0.666900634765625, -0.6429443359375, -0.618988037109375, -0.59503173828125, -0.571075439453125, -0.547119140625, -0.523162841796875, -0.49920654296875, -0.475250244140625, -0.4512939453125, -0.427337646484375, -0.40338134765625, -0.379425048828125, -0.35546875, -0.331512451171875, -0.30755615234375, -0.283599853515625, -0.2596435546875, -0.235687255859375, -0.21173095703125, -0.187774658203125, -0.163818359375, -0.139862060546875, -0.11590576171875, -0.091949462890625, -0.0679931640625, -0.044036865234375, -0.02008056640625, 0.003875732421875, 0.02783203125, 0.051788330078125, 0.07574462890625, 0.099700927734375, 0.1236572265625, 0.147613525390625, 0.17156982421875, 0.195526123046875, 0.219482421875, 0.243438720703125, 0.26739501953125, 0.291351318359375, 0.3153076171875, 0.339263916015625, 0.36322021484375, 0.387176513671875, 0.4111328125, 0.435089111328125, 0.45904541015625, 0.483001708984375, 0.5069580078125, 0.530914306640625, 0.55487060546875, 0.578826904296875, 0.602783203125, 0.626739501953125, 0.65069580078125, 0.674652099609375, 0.6986083984375, 0.722564697265625, 0.74652099609375, 0.770477294921875, 0.79443359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 14.0, 10.0, 23.0, 18.0, 55.0, 108.0, 206.0, 273.0, 111.0, 66.0, 32.0, 15.0, 13.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033782958984375, -0.032663822174072266, -0.03154468536376953, -0.030425548553466797, -0.029306411743164062, -0.028187274932861328, -0.027068138122558594, -0.02594900131225586, -0.024829864501953125, -0.02371072769165039, -0.022591590881347656, -0.021472454071044922, -0.020353317260742188, -0.019234180450439453, -0.01811504364013672, -0.016995906829833984, -0.01587677001953125, -0.014757633209228516, -0.013638496398925781, -0.012519359588623047, -0.011400222778320312, -0.010281085968017578, -0.009161949157714844, -0.00804281234741211, -0.006923675537109375, -0.005804538726806641, -0.004685401916503906, -0.003566265106201172, -0.0024471282958984375, -0.0013279914855957031, -0.00020885467529296875, 0.0009102821350097656, 0.0020294189453125, 0.0031485557556152344, 0.004267692565917969, 0.005386829376220703, 0.0065059661865234375, 0.007625102996826172, 0.008744239807128906, 0.00986337661743164, 0.010982513427734375, 0.01210165023803711, 0.013220787048339844, 0.014339923858642578, 0.015459060668945312, 0.016578197479248047, 0.01769733428955078, 0.018816471099853516, 0.01993560791015625, 0.021054744720458984, 0.02217388153076172, 0.023293018341064453, 0.024412155151367188, 0.025531291961669922, 0.026650428771972656, 0.02776956558227539, 0.028888702392578125, 0.03000783920288086, 0.031126976013183594, 0.03224611282348633, 0.03336524963378906, 0.0344843864440918, 0.03560352325439453, 0.036722660064697266, 0.037841796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 3.0, 6.0, 14.0, 20.0, 21.0, 33.0, 55.0, 114.0, 267.0, 1041.0, 1030052.0, 15914.0, 497.0, 197.0, 90.0, 62.0, 41.0, 24.0, 20.0, 11.0, 6.0, 12.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.744140625, -0.7221145629882812, -0.7000885009765625, -0.6780624389648438, -0.656036376953125, -0.6340103149414062, -0.6119842529296875, -0.5899581909179688, -0.56793212890625, -0.5459060668945312, -0.5238800048828125, -0.5018539428710938, -0.479827880859375, -0.45780181884765625, -0.4357757568359375, -0.41374969482421875, -0.3917236328125, -0.36969757080078125, -0.3476715087890625, -0.32564544677734375, -0.303619384765625, -0.28159332275390625, -0.2595672607421875, -0.23754119873046875, -0.21551513671875, -0.19348907470703125, -0.1714630126953125, -0.14943695068359375, -0.127410888671875, -0.10538482666015625, -0.0833587646484375, -0.06133270263671875, -0.039306640625, -0.01728057861328125, 0.0047454833984375, 0.02677154541015625, 0.048797607421875, 0.07082366943359375, 0.0928497314453125, 0.11487579345703125, 0.13690185546875, 0.15892791748046875, 0.1809539794921875, 0.20298004150390625, 0.225006103515625, 0.24703216552734375, 0.2690582275390625, 0.29108428955078125, 0.3131103515625, 0.33513641357421875, 0.3571624755859375, 0.37918853759765625, 0.401214599609375, 0.42324066162109375, 0.4452667236328125, 0.46729278564453125, 0.48931884765625, 0.5113449096679688, 0.5333709716796875, 0.5553970336914062, 0.577423095703125, 0.5994491577148438, 0.6214752197265625, 0.6435012817382812, 0.66552734375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 1000.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177730530500412, -0.16547609865665436, -0.15322166681289673, -0.1409672349691391, -0.12871280312538147, -0.11645837128162384, -0.10420393943786621, -0.09194950759410858, -0.07969507575035095, -0.06744064390659332, -0.05518621206283569, -0.042931780219078064, -0.030677348375320435, -0.018422916531562805, -0.006168484687805176, 0.006085947155952454, 0.018340378999710083, 0.030594810843467712, 0.04284924268722534, 0.05510367453098297, 0.0673581063747406, 0.07961253821849823, 0.09186697006225586, 0.10412140190601349, 0.11637583374977112, 0.12863026559352875, 0.14088469743728638, 0.153139129281044, 0.16539356112480164, 0.17764799296855927, 0.1899024248123169, 0.20215685665607452, 0.21441125869750977, 0.2266656905412674, 0.23892012238502502, 0.25117456912994385, 0.2634289860725403, 0.2756834030151367, 0.28793784976005554, 0.30019229650497437, 0.3124467134475708, 0.32470113039016724, 0.33695557713508606, 0.3492100238800049, 0.3614644408226013, 0.37371885776519775, 0.3859733045101166, 0.3982277512550354, 0.41048216819763184, 0.42273658514022827, 0.4349910318851471, 0.4472454786300659, 0.45949989557266235, 0.4717543125152588, 0.4840087592601776, 0.49626320600509644, 0.5085176229476929, 0.5207720398902893, 0.5330264568328857, 0.545280933380127, 0.5575353503227234, 0.5697897672653198, 0.582044243812561, 0.5942986607551575, 0.6065530776977539]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 19.0, 31.0, 33.0, 59.0, 68.0, 67.0, 68.0, 71.0, 91.0, 64.0, 71.0, 75.0, 60.0, 41.0, 47.0, 32.0, 25.0, 21.0, 12.0, 10.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027426540851593018, -0.026311088353395462, -0.025195635855197906, -0.02408018335700035, -0.022964730858802795, -0.02184927836060524, -0.020733825862407684, -0.01961837336421013, -0.018502920866012573, -0.017387468367815018, -0.016272015869617462, -0.015156563371419907, -0.014041110873222351, -0.012925658375024796, -0.01181020587682724, -0.010694753378629684, -0.009579300880432129, -0.008463848382234573, -0.007348395884037018, -0.006232943385839462, -0.005117490887641907, -0.004002038389444351, -0.0028865858912467957, -0.0017711333930492401, -0.0006556808948516846, 0.00045977160334587097, 0.0015752241015434265, 0.002690676599740982, 0.0038061290979385376, 0.004921581596136093, 0.006037034094333649, 0.007152486592531204, 0.00826793909072876, 0.009383391588926315, 0.01049884408712387, 0.011614296585321426, 0.012729749083518982, 0.013845201581716537, 0.014960654079914093, 0.01607610657811165, 0.017191559076309204, 0.01830701157450676, 0.019422464072704315, 0.02053791657090187, 0.021653369069099426, 0.022768821567296982, 0.023884274065494537, 0.024999726563692093, 0.02611517906188965, 0.027230631560087204, 0.02834608405828476, 0.029461536556482315, 0.03057698905467987, 0.031692441552877426, 0.03280789405107498, 0.03392334654927254, 0.03503879904747009, 0.03615425154566765, 0.037269704043865204, 0.03838515654206276, 0.039500609040260315, 0.04061606153845787, 0.041731514036655426, 0.04284696653485298, 0.04396241903305054]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 7.0, 10.0, 6.0, 11.0, 12.0, 14.0, 12.0, 20.0, 17.0, 22.0, 22.0, 14.0, 19.0, 41.0, 38.0, 36.0, 30.0, 35.0, 39.0, 36.0, 47.0, 38.0, 34.0, 22.0, 35.0, 36.0, 30.0, 22.0, 29.0, 36.0, 31.0, 15.0, 25.0, 24.0, 15.0, 17.0, 19.0, 8.0, 10.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.5078125, -11.1614990234375, -10.815185546875, -10.4688720703125, -10.12255859375, -9.7762451171875, -9.429931640625, -9.0836181640625, -8.7373046875, -8.3909912109375, -8.044677734375, -7.6983642578125, -7.35205078125, -7.0057373046875, -6.659423828125, -6.3131103515625, -5.966796875, -5.6204833984375, -5.274169921875, -4.9278564453125, -4.58154296875, -4.2352294921875, -3.888916015625, -3.5426025390625, -3.1962890625, -2.8499755859375, -2.503662109375, -2.1573486328125, -1.81103515625, -1.4647216796875, -1.118408203125, -0.7720947265625, -0.42578125, -0.0794677734375, 0.266845703125, 0.6131591796875, 0.95947265625, 1.3057861328125, 1.652099609375, 1.9984130859375, 2.3447265625, 2.6910400390625, 3.037353515625, 3.3836669921875, 3.72998046875, 4.0762939453125, 4.422607421875, 4.7689208984375, 5.115234375, 5.4615478515625, 5.807861328125, 6.1541748046875, 6.50048828125, 6.8468017578125, 7.193115234375, 7.5394287109375, 7.8857421875, 8.2320556640625, 8.578369140625, 8.9246826171875, 9.27099609375, 9.6173095703125, 9.963623046875, 10.3099365234375, 10.65625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 5.0, 8.0, 13.0, 13.0, 23.0, 30.0, 30.0, 42.0, 50.0, 75.0, 105.0, 123.0, 164.0, 205.0, 326.0, 389.0, 670.0, 944.0, 1500.0, 2559.0, 5138.0, 12417.0, 43865.0, 252024.0, 592589.0, 95843.0, 22281.0, 7774.0, 3511.0, 1981.0, 1140.0, 752.0, 534.0, 376.0, 262.0, 179.0, 140.0, 117.0, 101.0, 57.0, 45.0, 34.0, 37.0, 24.0, 19.0, 10.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-20.171875, -19.565185546875, -18.95849609375, -18.351806640625, -17.7451171875, -17.138427734375, -16.53173828125, -15.925048828125, -15.318359375, -14.711669921875, -14.10498046875, -13.498291015625, -12.8916015625, -12.284912109375, -11.67822265625, -11.071533203125, -10.46484375, -9.858154296875, -9.25146484375, -8.644775390625, -8.0380859375, -7.431396484375, -6.82470703125, -6.218017578125, -5.611328125, -5.004638671875, -4.39794921875, -3.791259765625, -3.1845703125, -2.577880859375, -1.97119140625, -1.364501953125, -0.7578125, -0.151123046875, 0.45556640625, 1.062255859375, 1.6689453125, 2.275634765625, 2.88232421875, 3.489013671875, 4.095703125, 4.702392578125, 5.30908203125, 5.915771484375, 6.5224609375, 7.129150390625, 7.73583984375, 8.342529296875, 8.94921875, 9.555908203125, 10.16259765625, 10.769287109375, 11.3759765625, 11.982666015625, 12.58935546875, 13.196044921875, 13.802734375, 14.409423828125, 15.01611328125, 15.622802734375, 16.2294921875, 16.836181640625, 17.44287109375, 18.049560546875, 18.65625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 5.0, 9.0, 6.0, 8.0, 16.0, 7.0, 17.0, 20.0, 17.0, 14.0, 36.0, 24.0, 30.0, 60.0, 47.0, 72.0, 87.0, 138.0, 1438.0, 387.0, 135.0, 87.0, 68.0, 49.0, 47.0, 26.0, 39.0, 23.0, 22.0, 16.0, 18.0, 11.0, 16.0, 9.0, 8.0, 9.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.34375, -24.468505859375, -23.59326171875, -22.718017578125, -21.8427734375, -20.967529296875, -20.09228515625, -19.217041015625, -18.341796875, -17.466552734375, -16.59130859375, -15.716064453125, -14.8408203125, -13.965576171875, -13.09033203125, -12.215087890625, -11.33984375, -10.464599609375, -9.58935546875, -8.714111328125, -7.8388671875, -6.963623046875, -6.08837890625, -5.213134765625, -4.337890625, -3.462646484375, -2.58740234375, -1.712158203125, -0.8369140625, 0.038330078125, 0.91357421875, 1.788818359375, 2.6640625, 3.539306640625, 4.41455078125, 5.289794921875, 6.1650390625, 7.040283203125, 7.91552734375, 8.790771484375, 9.666015625, 10.541259765625, 11.41650390625, 12.291748046875, 13.1669921875, 14.042236328125, 14.91748046875, 15.792724609375, 16.66796875, 17.543212890625, 18.41845703125, 19.293701171875, 20.1689453125, 21.044189453125, 21.91943359375, 22.794677734375, 23.669921875, 24.545166015625, 25.42041015625, 26.295654296875, 27.1708984375, 28.046142578125, 28.92138671875, 29.796630859375, 30.671875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 9.0, 9.0, 16.0, 19.0, 18.0, 26.0, 35.0, 34.0, 55.0, 80.0, 94.0, 157.0, 213.0, 419.0, 817.0, 2068.0, 32692.0, 3084225.0, 20926.0, 1850.0, 699.0, 418.0, 225.0, 142.0, 115.0, 65.0, 55.0, 48.0, 41.0, 20.0, 23.0, 12.0, 14.0, 15.0, 9.0, 3.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.6875, -59.89697265625, -58.1064453125, -56.31591796875, -54.525390625, -52.73486328125, -50.9443359375, -49.15380859375, -47.36328125, -45.57275390625, -43.7822265625, -41.99169921875, -40.201171875, -38.41064453125, -36.6201171875, -34.82958984375, -33.0390625, -31.24853515625, -29.4580078125, -27.66748046875, -25.876953125, -24.08642578125, -22.2958984375, -20.50537109375, -18.71484375, -16.92431640625, -15.1337890625, -13.34326171875, -11.552734375, -9.76220703125, -7.9716796875, -6.18115234375, -4.390625, -2.60009765625, -0.8095703125, 0.98095703125, 2.771484375, 4.56201171875, 6.3525390625, 8.14306640625, 9.93359375, 11.72412109375, 13.5146484375, 15.30517578125, 17.095703125, 18.88623046875, 20.6767578125, 22.46728515625, 24.2578125, 26.04833984375, 27.8388671875, 29.62939453125, 31.419921875, 33.21044921875, 35.0009765625, 36.79150390625, 38.58203125, 40.37255859375, 42.1630859375, 43.95361328125, 45.744140625, 47.53466796875, 49.3251953125, 51.11572265625, 52.90625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 47.0, 697.0, 254.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-653.3788452148438, -640.7673950195312, -628.1559448242188, -615.5444946289062, -602.9330444335938, -590.3215942382812, -577.7101440429688, -565.0986938476562, -552.4872436523438, -539.8757934570312, -527.2643432617188, -514.6528930664062, -502.04144287109375, -489.42999267578125, -476.81854248046875, -464.20709228515625, -451.59564208984375, -438.98419189453125, -426.37274169921875, -413.76129150390625, -401.14984130859375, -388.53839111328125, -375.92694091796875, -363.31549072265625, -350.70404052734375, -338.09259033203125, -325.48114013671875, -312.86968994140625, -300.25823974609375, -287.64678955078125, -275.03533935546875, -262.42388916015625, -249.81240844726562, -237.20095825195312, -224.58950805664062, -211.97805786132812, -199.36660766601562, -186.75515747070312, -174.14370727539062, -161.53225708007812, -148.92080688476562, -136.30935668945312, -123.69790649414062, -111.08645629882812, -98.47500610351562, -85.86355590820312, -73.25210571289062, -60.640655517578125, -48.029205322265625, -35.417755126953125, -22.806304931640625, -10.194854736328125, 2.416595458984375, 15.028045654296875, 27.639495849609375, 40.250946044921875, 52.862396240234375, 65.47384643554688, 78.08529663085938, 90.69674682617188, 103.30819702148438, 115.91964721679688, 128.53109741210938, 141.14254760742188, 153.75399780273438]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 5.0, 13.0, 8.0, 16.0, 10.0, 13.0, 21.0, 22.0, 20.0, 27.0, 22.0, 20.0, 23.0, 30.0, 35.0, 37.0, 32.0, 38.0, 35.0, 52.0, 38.0, 41.0, 32.0, 37.0, 32.0, 38.0, 27.0, 28.0, 21.0, 28.0, 30.0, 20.0, 22.0, 10.0, 18.0, 22.0, 13.0, 8.0, 9.0, 16.0, 9.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.07286071777344, -66.01931762695312, -63.96577835083008, -61.91223907470703, -59.85869598388672, -57.805152893066406, -55.75161361694336, -53.69807434082031, -51.64453125, -49.59098815917969, -47.53744888305664, -45.483909606933594, -43.43036651611328, -41.37682342529297, -39.32328414916992, -37.269744873046875, -35.21620178222656, -33.16265869140625, -31.109119415283203, -29.055578231811523, -27.002037048339844, -24.948495864868164, -22.894954681396484, -20.841413497924805, -18.787872314453125, -16.734331130981445, -14.680789947509766, -12.627248764038086, -10.573707580566406, -8.520166397094727, -6.466625213623047, -4.413084030151367, -2.3595352172851562, -0.30599403381347656, 1.7475471496582031, 3.801088333129883, 5.8546295166015625, 7.908170700073242, 9.961711883544922, 12.015253067016602, 14.068794250488281, 16.12233543395996, 18.17587661743164, 20.22941780090332, 22.282958984375, 24.33650016784668, 26.39004135131836, 28.44358253479004, 30.49712371826172, 32.55066680908203, 34.60420608520508, 36.657745361328125, 38.71128845214844, 40.76483154296875, 42.8183708190918, 44.871910095214844, 46.925453186035156, 48.97899627685547, 51.032535552978516, 53.08607482910156, 55.139617919921875, 57.19316101074219, 59.246700286865234, 61.30023956298828, 63.353782653808594]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 15.0, 11.0, 6.0, 13.0, 15.0, 18.0, 24.0, 20.0, 16.0, 27.0, 22.0, 38.0, 30.0, 33.0, 32.0, 41.0, 39.0, 32.0, 38.0, 46.0, 38.0, 30.0, 40.0, 39.0, 29.0, 33.0, 20.0, 36.0, 28.0, 25.0, 23.0, 17.0, 14.0, 11.0, 12.0, 6.0, 11.0, 7.0, 6.0, 11.0, 5.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.0703125, -11.6793212890625, -11.288330078125, -10.8973388671875, -10.50634765625, -10.1153564453125, -9.724365234375, -9.3333740234375, -8.9423828125, -8.5513916015625, -8.160400390625, -7.7694091796875, -7.37841796875, -6.9874267578125, -6.596435546875, -6.2054443359375, -5.814453125, -5.4234619140625, -5.032470703125, -4.6414794921875, -4.25048828125, -3.8594970703125, -3.468505859375, -3.0775146484375, -2.6865234375, -2.2955322265625, -1.904541015625, -1.5135498046875, -1.12255859375, -0.7315673828125, -0.340576171875, 0.0504150390625, 0.44140625, 0.8323974609375, 1.223388671875, 1.6143798828125, 2.00537109375, 2.3963623046875, 2.787353515625, 3.1783447265625, 3.5693359375, 3.9603271484375, 4.351318359375, 4.7423095703125, 5.13330078125, 5.5242919921875, 5.915283203125, 6.3062744140625, 6.697265625, 7.0882568359375, 7.479248046875, 7.8702392578125, 8.26123046875, 8.6522216796875, 9.043212890625, 9.4342041015625, 9.8251953125, 10.2161865234375, 10.607177734375, 10.9981689453125, 11.38916015625, 11.7801513671875, 12.171142578125, 12.5621337890625, 12.953125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 4.0, 3.0, 11.0, 15.0, 16.0, 13.0, 17.0, 25.0, 47.0, 63.0, 68.0, 119.0, 144.0, 225.0, 328.0, 508.0, 794.0, 1334.0, 2559.0, 5559.0, 14167.0, 106854.0, 3422785.0, 600437.0, 22613.0, 7833.0, 3291.0, 1732.0, 890.0, 571.0, 370.0, 241.0, 177.0, 130.0, 88.0, 62.0, 45.0, 32.0, 27.0, 19.0, 10.0, 15.0, 4.0, 6.0, 6.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-63.0625, -61.072265625, -59.08203125, -57.091796875, -55.1015625, -53.111328125, -51.12109375, -49.130859375, -47.140625, -45.150390625, -43.16015625, -41.169921875, -39.1796875, -37.189453125, -35.19921875, -33.208984375, -31.21875, -29.228515625, -27.23828125, -25.248046875, -23.2578125, -21.267578125, -19.27734375, -17.287109375, -15.296875, -13.306640625, -11.31640625, -9.326171875, -7.3359375, -5.345703125, -3.35546875, -1.365234375, 0.625, 2.615234375, 4.60546875, 6.595703125, 8.5859375, 10.576171875, 12.56640625, 14.556640625, 16.546875, 18.537109375, 20.52734375, 22.517578125, 24.5078125, 26.498046875, 28.48828125, 30.478515625, 32.46875, 34.458984375, 36.44921875, 38.439453125, 40.4296875, 42.419921875, 44.41015625, 46.400390625, 48.390625, 50.380859375, 52.37109375, 54.361328125, 56.3515625, 58.341796875, 60.33203125, 62.322265625, 64.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 7.0, 4.0, 12.0, 9.0, 14.0, 22.0, 42.0, 42.0, 67.0, 107.0, 203.0, 428.0, 888.0, 967.0, 579.0, 264.0, 136.0, 82.0, 52.0, 32.0, 33.0, 24.0, 19.0, 8.0, 11.0, 9.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.37939453125, -35.0400390625, -33.70068359375, -32.361328125, -31.02197265625, -29.6826171875, -28.34326171875, -27.00390625, -25.66455078125, -24.3251953125, -22.98583984375, -21.646484375, -20.30712890625, -18.9677734375, -17.62841796875, -16.2890625, -14.94970703125, -13.6103515625, -12.27099609375, -10.931640625, -9.59228515625, -8.2529296875, -6.91357421875, -5.57421875, -4.23486328125, -2.8955078125, -1.55615234375, -0.216796875, 1.12255859375, 2.4619140625, 3.80126953125, 5.140625, 6.47998046875, 7.8193359375, 9.15869140625, 10.498046875, 11.83740234375, 13.1767578125, 14.51611328125, 15.85546875, 17.19482421875, 18.5341796875, 19.87353515625, 21.212890625, 22.55224609375, 23.8916015625, 25.23095703125, 26.5703125, 27.90966796875, 29.2490234375, 30.58837890625, 31.927734375, 33.26708984375, 34.6064453125, 35.94580078125, 37.28515625, 38.62451171875, 39.9638671875, 41.30322265625, 42.642578125, 43.98193359375, 45.3212890625, 46.66064453125, 48.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 10.0, 5.0, 17.0, 18.0, 42.0, 51.0, 92.0, 118.0, 189.0, 252.0, 447.0, 806.0, 1493.0, 2918.0, 6039.0, 13054.0, 32025.0, 104986.0, 1057356.0, 2712195.0, 182830.0, 45878.0, 17612.0, 7819.0, 3687.0, 1875.0, 1014.0, 523.0, 309.0, 204.0, 108.0, 66.0, 69.0, 37.0, 37.0, 30.0, 18.0, 9.0, 9.0, 9.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-32.84375, -31.853515625, -30.86328125, -29.873046875, -28.8828125, -27.892578125, -26.90234375, -25.912109375, -24.921875, -23.931640625, -22.94140625, -21.951171875, -20.9609375, -19.970703125, -18.98046875, -17.990234375, -17.0, -16.009765625, -15.01953125, -14.029296875, -13.0390625, -12.048828125, -11.05859375, -10.068359375, -9.078125, -8.087890625, -7.09765625, -6.107421875, -5.1171875, -4.126953125, -3.13671875, -2.146484375, -1.15625, -0.166015625, 0.82421875, 1.814453125, 2.8046875, 3.794921875, 4.78515625, 5.775390625, 6.765625, 7.755859375, 8.74609375, 9.736328125, 10.7265625, 11.716796875, 12.70703125, 13.697265625, 14.6875, 15.677734375, 16.66796875, 17.658203125, 18.6484375, 19.638671875, 20.62890625, 21.619140625, 22.609375, 23.599609375, 24.58984375, 25.580078125, 26.5703125, 27.560546875, 28.55078125, 29.541015625, 30.53125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 13.0, 16.0, 15.0, 36.0, 35.0, 66.0, 74.0, 80.0, 112.0, 127.0, 103.0, 74.0, 70.0, 34.0, 29.0, 21.0, 20.0, 15.0, 12.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.45872497558594, -152.8987579345703, -146.33877563476562, -139.77880859375, -133.21884155273438, -126.65885925292969, -120.09889221191406, -113.5389175415039, -106.97894287109375, -100.4189682006836, -93.85899353027344, -87.29902648925781, -80.73905181884766, -74.1790771484375, -67.61911010742188, -61.05913543701172, -54.49916076660156, -47.939186096191406, -41.379215240478516, -34.819244384765625, -28.25926971435547, -21.699295043945312, -15.139324188232422, -8.579353332519531, -2.019378662109375, 4.540594100952148, 11.100566864013672, 17.660539627075195, 24.22051239013672, 30.780487060546875, 37.340457916259766, 43.900428771972656, 50.460418701171875, 57.02039337158203, 63.58036422729492, 70.14033508300781, 76.70030975341797, 83.26028442382812, 89.82025146484375, 96.3802261352539, 102.94020080566406, 109.50017547607422, 116.06015014648438, 122.6201171875, 129.18008422851562, 135.7400665283203, 142.30003356933594, 148.86001586914062, 155.41998291015625, 161.97994995117188, 168.53993225097656, 175.0998992919922, 181.65988159179688, 188.2198486328125, 194.77981567382812, 201.33978271484375, 207.89976501464844, 214.45973205566406, 221.01971435546875, 227.57968139648438, 234.1396484375, 240.6996307373047, 247.2595977783203, 253.819580078125, 260.3795471191406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 1.0, 3.0, 10.0, 7.0, 7.0, 16.0, 11.0, 15.0, 11.0, 14.0, 16.0, 24.0, 38.0, 24.0, 34.0, 39.0, 48.0, 34.0, 30.0, 42.0, 47.0, 39.0, 34.0, 34.0, 37.0, 34.0, 34.0, 32.0, 33.0, 32.0, 29.0, 30.0, 19.0, 22.0, 17.0, 22.0, 11.0, 15.0, 12.0, 7.0, 9.0, 8.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-123.80955505371094, -120.26142120361328, -116.71328735351562, -113.16515350341797, -109.61701965332031, -106.06888580322266, -102.520751953125, -98.97261810302734, -95.42448425292969, -91.87635040283203, -88.32821655273438, -84.78008270263672, -81.23194885253906, -77.6838150024414, -74.13568115234375, -70.5875473022461, -67.03941345214844, -63.49127960205078, -59.943145751953125, -56.39501190185547, -52.84687805175781, -49.298744201660156, -45.7506103515625, -42.202476501464844, -38.65434265136719, -35.10620880126953, -31.558074951171875, -28.00994110107422, -24.461807250976562, -20.913673400878906, -17.36553955078125, -13.817405700683594, -10.269271850585938, -6.721138000488281, -3.173004150390625, 0.37512969970703125, 3.9232635498046875, 7.471397399902344, 11.01953125, 14.567665100097656, 18.115798950195312, 21.66393280029297, 25.212066650390625, 28.76020050048828, 32.30833435058594, 35.856468200683594, 39.40460205078125, 42.952735900878906, 46.50086975097656, 50.04900360107422, 53.597137451171875, 57.14527130126953, 60.69340515136719, 64.24153900146484, 67.7896728515625, 71.33780670166016, 74.88594055175781, 78.43407440185547, 81.98220825195312, 85.53034210205078, 89.07847595214844, 92.6266098022461, 96.17474365234375, 99.7228775024414, 103.27101135253906]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 10.0, 6.0, 6.0, 8.0, 6.0, 16.0, 15.0, 16.0, 26.0, 13.0, 28.0, 29.0, 24.0, 38.0, 37.0, 44.0, 48.0, 43.0, 48.0, 41.0, 43.0, 41.0, 40.0, 45.0, 37.0, 33.0, 34.0, 29.0, 33.0, 20.0, 20.0, 27.0, 15.0, 16.0, 8.0, 14.0, 10.0, 9.0, 9.0, 10.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-223.75, -217.376953125, -211.00390625, -204.630859375, -198.2578125, -191.884765625, -185.51171875, -179.138671875, -172.765625, -166.392578125, -160.01953125, -153.646484375, -147.2734375, -140.900390625, -134.52734375, -128.154296875, -121.78125, -115.408203125, -109.03515625, -102.662109375, -96.2890625, -89.916015625, -83.54296875, -77.169921875, -70.796875, -64.423828125, -58.05078125, -51.677734375, -45.3046875, -38.931640625, -32.55859375, -26.185546875, -19.8125, -13.439453125, -7.06640625, -0.693359375, 5.6796875, 12.052734375, 18.42578125, 24.798828125, 31.171875, 37.544921875, 43.91796875, 50.291015625, 56.6640625, 63.037109375, 69.41015625, 75.783203125, 82.15625, 88.529296875, 94.90234375, 101.275390625, 107.6484375, 114.021484375, 120.39453125, 126.767578125, 133.140625, 139.513671875, 145.88671875, 152.259765625, 158.6328125, 165.005859375, 171.37890625, 177.751953125, 184.125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 10.0, 13.0, 16.0, 25.0, 36.0, 40.0, 51.0, 106.0, 160.0, 207.0, 302.0, 477.0, 686.0, 986.0, 1346.0, 2002.0, 3098.0, 4438.0, 6575.0, 9885.0, 14992.0, 23254.0, 37012.0, 61449.0, 109662.0, 196985.0, 230691.0, 139597.0, 77254.0, 45613.0, 28054.0, 17712.0, 11649.0, 7761.0, 5209.0, 3585.0, 2421.0, 1615.0, 1195.0, 786.0, 486.0, 350.0, 255.0, 180.0, 119.0, 68.0, 51.0, 35.0, 23.0, 19.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-12.015625, -11.6177978515625, -11.219970703125, -10.8221435546875, -10.42431640625, -10.0264892578125, -9.628662109375, -9.2308349609375, -8.8330078125, -8.4351806640625, -8.037353515625, -7.6395263671875, -7.24169921875, -6.8438720703125, -6.446044921875, -6.0482177734375, -5.650390625, -5.2525634765625, -4.854736328125, -4.4569091796875, -4.05908203125, -3.6612548828125, -3.263427734375, -2.8656005859375, -2.4677734375, -2.0699462890625, -1.672119140625, -1.2742919921875, -0.87646484375, -0.4786376953125, -0.080810546875, 0.3170166015625, 0.71484375, 1.1126708984375, 1.510498046875, 1.9083251953125, 2.30615234375, 2.7039794921875, 3.101806640625, 3.4996337890625, 3.8974609375, 4.2952880859375, 4.693115234375, 5.0909423828125, 5.48876953125, 5.8865966796875, 6.284423828125, 6.6822509765625, 7.080078125, 7.4779052734375, 7.875732421875, 8.2735595703125, 8.67138671875, 9.0692138671875, 9.467041015625, 9.8648681640625, 10.2626953125, 10.6605224609375, 11.058349609375, 11.4561767578125, 11.85400390625, 12.2518310546875, 12.649658203125, 13.0474853515625, 13.4453125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 5.0, 3.0, 5.0, 10.0, 12.0, 11.0, 14.0, 18.0, 18.0, 13.0, 23.0, 24.0, 22.0, 33.0, 28.0, 35.0, 30.0, 32.0, 47.0, 30.0, 34.0, 36.0, 1056.0, 30.0, 33.0, 28.0, 41.0, 36.0, 36.0, 30.0, 21.0, 33.0, 17.0, 22.0, 22.0, 20.0, 19.0, 8.0, 13.0, 13.0, 12.0, 12.0, 8.0, 6.0, 3.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-109.1875, -105.744140625, -102.30078125, -98.857421875, -95.4140625, -91.970703125, -88.52734375, -85.083984375, -81.640625, -78.197265625, -74.75390625, -71.310546875, -67.8671875, -64.423828125, -60.98046875, -57.537109375, -54.09375, -50.650390625, -47.20703125, -43.763671875, -40.3203125, -36.876953125, -33.43359375, -29.990234375, -26.546875, -23.103515625, -19.66015625, -16.216796875, -12.7734375, -9.330078125, -5.88671875, -2.443359375, 1.0, 4.443359375, 7.88671875, 11.330078125, 14.7734375, 18.216796875, 21.66015625, 25.103515625, 28.546875, 31.990234375, 35.43359375, 38.876953125, 42.3203125, 45.763671875, 49.20703125, 52.650390625, 56.09375, 59.537109375, 62.98046875, 66.423828125, 69.8671875, 73.310546875, 76.75390625, 80.197265625, 83.640625, 87.083984375, 90.52734375, 93.970703125, 97.4140625, 100.857421875, 104.30078125, 107.744140625, 111.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 13.0, 15.0, 17.0, 36.0, 70.0, 111.0, 127.0, 197.0, 297.0, 459.0, 732.0, 1142.0, 1793.0, 2666.0, 3924.0, 6093.0, 9155.0, 14557.0, 23135.0, 37010.0, 62570.0, 110490.0, 206754.0, 1266801.0, 143441.0, 80766.0, 46151.0, 28147.0, 17691.0, 11460.0, 7217.0, 4746.0, 3294.0, 2039.0, 1388.0, 868.0, 621.0, 400.0, 258.0, 161.0, 116.0, 74.0, 40.0, 32.0, 18.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.1043701171875, -10.724365234375, -10.3443603515625, -9.96435546875, -9.5843505859375, -9.204345703125, -8.8243408203125, -8.4443359375, -8.0643310546875, -7.684326171875, -7.3043212890625, -6.92431640625, -6.5443115234375, -6.164306640625, -5.7843017578125, -5.404296875, -5.0242919921875, -4.644287109375, -4.2642822265625, -3.88427734375, -3.5042724609375, -3.124267578125, -2.7442626953125, -2.3642578125, -1.9842529296875, -1.604248046875, -1.2242431640625, -0.84423828125, -0.4642333984375, -0.084228515625, 0.2957763671875, 0.67578125, 1.0557861328125, 1.435791015625, 1.8157958984375, 2.19580078125, 2.5758056640625, 2.955810546875, 3.3358154296875, 3.7158203125, 4.0958251953125, 4.475830078125, 4.8558349609375, 5.23583984375, 5.6158447265625, 5.995849609375, 6.3758544921875, 6.755859375, 7.1358642578125, 7.515869140625, 7.8958740234375, 8.27587890625, 8.6558837890625, 9.035888671875, 9.4158935546875, 9.7958984375, 10.1759033203125, 10.555908203125, 10.9359130859375, 11.31591796875, 11.6959228515625, 12.075927734375, 12.4559326171875, 12.8359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 11.0, 3.0, 8.0, 7.0, 7.0, 14.0, 21.0, 15.0, 32.0, 20.0, 30.0, 39.0, 52.0, 73.0, 103.0, 77.0, 86.0, 59.0, 59.0, 43.0, 41.0, 30.0, 30.0, 21.0, 20.0, 18.0, 8.0, 18.0, 8.0, 6.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.10626220703125, -0.10278892517089844, -0.09931564331054688, -0.09584236145019531, -0.09236907958984375, -0.08889579772949219, -0.08542251586914062, -0.08194923400878906, -0.0784759521484375, -0.07500267028808594, -0.07152938842773438, -0.06805610656738281, -0.06458282470703125, -0.06110954284667969, -0.057636260986328125, -0.05416297912597656, -0.050689697265625, -0.04721641540527344, -0.043743133544921875, -0.04026985168457031, -0.03679656982421875, -0.03332328796386719, -0.029850006103515625, -0.026376724243164062, -0.0229034423828125, -0.019430160522460938, -0.015956878662109375, -0.012483596801757812, -0.00901031494140625, -0.0055370330810546875, -0.002063751220703125, 0.0014095306396484375, 0.0048828125, 0.008356094360351562, 0.011829376220703125, 0.015302658081054688, 0.01877593994140625, 0.022249221801757812, 0.025722503662109375, 0.029195785522460938, 0.0326690673828125, 0.03614234924316406, 0.039615631103515625, 0.04308891296386719, 0.04656219482421875, 0.05003547668457031, 0.053508758544921875, 0.05698204040527344, 0.060455322265625, 0.06392860412597656, 0.06740188598632812, 0.07087516784667969, 0.07434844970703125, 0.07782173156738281, 0.08129501342773438, 0.08476829528808594, 0.0882415771484375, 0.09171485900878906, 0.09518814086914062, 0.09866142272949219, 0.10213470458984375, 0.10560798645019531, 0.10908126831054688, 0.11255455017089844, 0.11602783203125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 5.0, 9.0, 9.0, 12.0, 16.0, 21.0, 33.0, 37.0, 26.0, 62.0, 64.0, 81.0, 105.0, 188.0, 274.0, 449.0, 752.0, 1277.0, 2652.0, 5324.0, 12013.0, 30273.0, 90976.0, 393859.0, 371929.0, 86638.0, 28870.0, 11612.0, 5134.0, 2510.0, 1264.0, 761.0, 444.0, 263.0, 165.0, 108.0, 77.0, 64.0, 31.0, 38.0, 27.0, 26.0, 17.0, 14.0, 7.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.60986328125, -0.59136962890625, -0.5728759765625, -0.55438232421875, -0.535888671875, -0.51739501953125, -0.4989013671875, -0.48040771484375, -0.4619140625, -0.44342041015625, -0.4249267578125, -0.40643310546875, -0.387939453125, -0.36944580078125, -0.3509521484375, -0.33245849609375, -0.31396484375, -0.29547119140625, -0.2769775390625, -0.25848388671875, -0.239990234375, -0.22149658203125, -0.2030029296875, -0.18450927734375, -0.166015625, -0.14752197265625, -0.1290283203125, -0.11053466796875, -0.092041015625, -0.07354736328125, -0.0550537109375, -0.03656005859375, -0.01806640625, 0.00042724609375, 0.0189208984375, 0.03741455078125, 0.055908203125, 0.07440185546875, 0.0928955078125, 0.11138916015625, 0.1298828125, 0.14837646484375, 0.1668701171875, 0.18536376953125, 0.203857421875, 0.22235107421875, 0.2408447265625, 0.25933837890625, 0.27783203125, 0.29632568359375, 0.3148193359375, 0.33331298828125, 0.351806640625, 0.37030029296875, 0.3887939453125, 0.40728759765625, 0.42578125, 0.44427490234375, 0.4627685546875, 0.48126220703125, 0.499755859375, 0.51824951171875, 0.5367431640625, 0.55523681640625, 0.57373046875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 14.0, 41.0, 94.0, 205.0, 225.0, 155.0, 88.0, 52.0, 41.0, 22.0, 22.0, 7.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11078447103500366, -0.09978906810283661, -0.08879366517066956, -0.0777982547879219, -0.06680285185575485, -0.0558074489235878, -0.04481203854084015, -0.033816635608673096, -0.022821232676506042, -0.01182582788169384, -0.0008304230868816376, 0.010164983570575714, 0.021160386502742767, 0.03215578943490982, 0.04315119981765747, 0.054146602749824524, 0.06514200568199158, 0.07613740861415863, 0.08713281154632568, 0.09812822192907333, 0.10912362486124039, 0.12011902779340744, 0.1311144381761551, 0.14210984110832214, 0.1531052440404892, 0.16410064697265625, 0.1750960499048233, 0.18609145283699036, 0.1970868706703186, 0.20808225870132446, 0.2190776765346527, 0.23007307946681976, 0.24106848239898682, 0.25206390023231506, 0.2630592882633209, 0.27405470609664917, 0.28505009412765503, 0.2960455119609833, 0.3070409297943115, 0.3180363178253174, 0.32903170585632324, 0.3400271236896515, 0.35102251172065735, 0.3620179295539856, 0.37301331758499146, 0.3840087354183197, 0.39500415325164795, 0.4059995412826538, 0.41699495911598206, 0.4279903769493103, 0.43898576498031616, 0.4499811828136444, 0.46097657084465027, 0.4719719886779785, 0.4829673767089844, 0.4939627945423126, 0.5049582123756409, 0.5159536004066467, 0.5269490480422974, 0.5379444360733032, 0.5489398241043091, 0.5599352121353149, 0.5709306597709656, 0.5819260478019714, 0.5929214358329773]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 7.0, 7.0, 8.0, 12.0, 13.0, 14.0, 14.0, 14.0, 18.0, 39.0, 28.0, 19.0, 18.0, 34.0, 34.0, 39.0, 33.0, 34.0, 39.0, 36.0, 29.0, 36.0, 45.0, 39.0, 38.0, 33.0, 21.0, 28.0, 24.0, 32.0, 24.0, 28.0, 20.0, 18.0, 15.0, 13.0, 12.0, 8.0, 19.0, 16.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.11677920818328857, -0.11341586709022522, -0.11005252599716187, -0.10668918490409851, -0.10332584381103516, -0.0999625027179718, -0.09659916907548904, -0.09323582798242569, -0.08987248688936234, -0.08650914579629898, -0.08314580470323563, -0.07978246361017227, -0.07641912996768951, -0.07305578887462616, -0.0696924477815628, -0.06632910668849945, -0.0629657655954361, -0.05960242450237274, -0.05623908340930939, -0.05287574604153633, -0.04951240494847298, -0.04614906385540962, -0.042785726487636566, -0.03942238539457321, -0.03605904430150986, -0.0326957032084465, -0.029332363978028297, -0.025969024747610092, -0.022605683654546738, -0.019242342561483383, -0.015879003331065178, -0.012515664100646973, -0.009152323007583618, -0.005788982845842838, -0.0024256426841020584, 0.0009376974776387215, 0.004301037639379501, 0.007664378732442856, 0.011027717962861061, 0.014391057193279266, 0.01775439828634262, 0.021117739379405975, 0.02448107860982418, 0.027844417840242386, 0.03120775893330574, 0.034571100026369095, 0.03793443739414215, 0.041297778487205505, 0.04466111958026886, 0.048024460673332214, 0.05138780176639557, 0.054751139134168625, 0.05811448022723198, 0.061477821320295334, 0.06484115868806839, 0.06820449978113174, 0.0715678408741951, 0.07493118196725845, 0.07829452306032181, 0.08165786415338516, 0.08502119779586792, 0.08838453888893127, 0.09174787998199463, 0.09511122107505798, 0.09847456216812134]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 10.0, 5.0, 7.0, 8.0, 6.0, 16.0, 15.0, 16.0, 25.0, 14.0, 30.0, 27.0, 24.0, 38.0, 36.0, 44.0, 50.0, 42.0, 49.0, 40.0, 43.0, 43.0, 37.0, 46.0, 37.0, 32.0, 36.0, 27.0, 33.0, 21.0, 21.0, 27.0, 14.0, 17.0, 7.0, 14.0, 10.0, 9.0, 9.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-223.75, -217.376953125, -211.00390625, -204.630859375, -198.2578125, -191.884765625, -185.51171875, -179.138671875, -172.765625, -166.392578125, -160.01953125, -153.646484375, -147.2734375, -140.900390625, -134.52734375, -128.154296875, -121.78125, -115.408203125, -109.03515625, -102.662109375, -96.2890625, -89.916015625, -83.54296875, -77.169921875, -70.796875, -64.423828125, -58.05078125, -51.677734375, -45.3046875, -38.931640625, -32.55859375, -26.185546875, -19.8125, -13.439453125, -7.06640625, -0.693359375, 5.6796875, 12.052734375, 18.42578125, 24.798828125, 31.171875, 37.544921875, 43.91796875, 50.291015625, 56.6640625, 63.037109375, 69.41015625, 75.783203125, 82.15625, 88.529296875, 94.90234375, 101.275390625, 107.6484375, 114.021484375, 120.39453125, 126.767578125, 133.140625, 139.513671875, 145.88671875, 152.259765625, 158.6328125, 165.005859375, 171.37890625, 177.751953125, 184.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 11.0, 11.0, 10.0, 17.0, 25.0, 16.0, 37.0, 28.0, 34.0, 44.0, 52.0, 80.0, 111.0, 176.0, 304.0, 570.0, 1349.0, 3523.0, 11027.0, 44139.0, 279682.0, 586974.0, 91421.0, 19160.0, 5717.0, 2010.0, 819.0, 431.0, 232.0, 136.0, 74.0, 67.0, 51.0, 41.0, 26.0, 29.0, 25.0, 19.0, 19.0, 11.0, 14.0, 13.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-41.71875, -40.49951171875, -39.2802734375, -38.06103515625, -36.841796875, -35.62255859375, -34.4033203125, -33.18408203125, -31.96484375, -30.74560546875, -29.5263671875, -28.30712890625, -27.087890625, -25.86865234375, -24.6494140625, -23.43017578125, -22.2109375, -20.99169921875, -19.7724609375, -18.55322265625, -17.333984375, -16.11474609375, -14.8955078125, -13.67626953125, -12.45703125, -11.23779296875, -10.0185546875, -8.79931640625, -7.580078125, -6.36083984375, -5.1416015625, -3.92236328125, -2.703125, -1.48388671875, -0.2646484375, 0.95458984375, 2.173828125, 3.39306640625, 4.6123046875, 5.83154296875, 7.05078125, 8.27001953125, 9.4892578125, 10.70849609375, 11.927734375, 13.14697265625, 14.3662109375, 15.58544921875, 16.8046875, 18.02392578125, 19.2431640625, 20.46240234375, 21.681640625, 22.90087890625, 24.1201171875, 25.33935546875, 26.55859375, 27.77783203125, 28.9970703125, 30.21630859375, 31.435546875, 32.65478515625, 33.8740234375, 35.09326171875, 36.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 14.0, 14.0, 20.0, 35.0, 49.0, 38.0, 43.0, 67.0, 75.0, 60.0, 2101.0, 96.0, 67.0, 75.0, 57.0, 50.0, 34.0, 37.0, 25.0, 21.0, 9.0, 14.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-328.0, -316.15625, -304.3125, -292.46875, -280.625, -268.78125, -256.9375, -245.09375, -233.25, -221.40625, -209.5625, -197.71875, -185.875, -174.03125, -162.1875, -150.34375, -138.5, -126.65625, -114.8125, -102.96875, -91.125, -79.28125, -67.4375, -55.59375, -43.75, -31.90625, -20.0625, -8.21875, 3.625, 15.46875, 27.3125, 39.15625, 51.0, 62.84375, 74.6875, 86.53125, 98.375, 110.21875, 122.0625, 133.90625, 145.75, 157.59375, 169.4375, 181.28125, 193.125, 204.96875, 216.8125, 228.65625, 240.5, 252.34375, 264.1875, 276.03125, 287.875, 299.71875, 311.5625, 323.40625, 335.25, 347.09375, 358.9375, 370.78125, 382.625, 394.46875, 406.3125, 418.15625, 430.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 9.0, 15.0, 25.0, 29.0, 46.0, 79.0, 140.0, 236.0, 409.0, 1015.0, 2612.0, 17733.0, 2813542.0, 296379.0, 9680.0, 2055.0, 788.0, 389.0, 210.0, 90.0, 81.0, 40.0, 27.0, 22.0, 12.0, 12.0, 0.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-86.5, -84.154296875, -81.80859375, -79.462890625, -77.1171875, -74.771484375, -72.42578125, -70.080078125, -67.734375, -65.388671875, -63.04296875, -60.697265625, -58.3515625, -56.005859375, -53.66015625, -51.314453125, -48.96875, -46.623046875, -44.27734375, -41.931640625, -39.5859375, -37.240234375, -34.89453125, -32.548828125, -30.203125, -27.857421875, -25.51171875, -23.166015625, -20.8203125, -18.474609375, -16.12890625, -13.783203125, -11.4375, -9.091796875, -6.74609375, -4.400390625, -2.0546875, 0.291015625, 2.63671875, 4.982421875, 7.328125, 9.673828125, 12.01953125, 14.365234375, 16.7109375, 19.056640625, 21.40234375, 23.748046875, 26.09375, 28.439453125, 30.78515625, 33.130859375, 35.4765625, 37.822265625, 40.16796875, 42.513671875, 44.859375, 47.205078125, 49.55078125, 51.896484375, 54.2421875, 56.587890625, 58.93359375, 61.279296875, 63.625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 18.0, 16.0, 17.0, 67.0, 93.0, 184.0, 192.0, 174.0, 92.0, 49.0, 29.0, 15.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-541.301513671875, -526.8113403320312, -512.3211669921875, -497.83099365234375, -483.3407897949219, -468.8506164550781, -454.3604431152344, -439.8702697753906, -425.38006591796875, -410.889892578125, -396.39971923828125, -381.9095458984375, -367.4193420410156, -352.9291687011719, -338.4389953613281, -323.9488220214844, -309.4586486816406, -294.9684753417969, -280.4783020019531, -265.98809814453125, -251.4979248046875, -237.00775146484375, -222.517578125, -208.02740478515625, -193.53721618652344, -179.0470428466797, -164.55685424804688, -150.06668090820312, -135.57650756835938, -121.08631896972656, -106.59614562988281, -92.10596466064453, -77.61578369140625, -63.12560272216797, -48.63542556762695, -34.14524841308594, -19.655067443847656, -5.164886474609375, 9.325286865234375, 23.815467834472656, 38.30564880371094, 52.79582977294922, 67.2860107421875, 81.77618408203125, 96.26636505126953, 110.75654602050781, 125.24671936035156, 139.73690795898438, 154.22708129882812, 168.71725463867188, 183.2074432373047, 197.69761657714844, 212.18780517578125, 226.677978515625, 241.16815185546875, 255.6583251953125, 270.14849853515625, 284.638671875, 299.12884521484375, 313.6190185546875, 328.1092224121094, 342.5993957519531, 357.0895690917969, 371.5797424316406, 386.0699462890625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 8.0, 19.0, 24.0, 29.0, 32.0, 31.0, 30.0, 43.0, 44.0, 46.0, 39.0, 57.0, 57.0, 50.0, 43.0, 45.0, 57.0, 32.0, 41.0, 47.0, 26.0, 35.0, 23.0, 24.0, 19.0, 9.0, 13.0, 2.0, 8.0, 6.0, 5.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-411.3312072753906, -399.6236267089844, -387.9160461425781, -376.2084655761719, -364.5008850097656, -352.7933349609375, -341.08575439453125, -329.378173828125, -317.67059326171875, -305.9630126953125, -294.25543212890625, -282.5478515625, -270.84027099609375, -259.1326904296875, -247.4251251220703, -235.71755981445312, -224.0099639892578, -212.30238342285156, -200.5948028564453, -188.88723754882812, -177.17965698242188, -165.47207641601562, -153.76449584960938, -142.05691528320312, -130.34933471679688, -118.64175415039062, -106.9341812133789, -95.22660064697266, -83.51902770996094, -71.81144714355469, -60.10386657714844, -48.39629364013672, -36.688720703125, -24.981143951416016, -13.273565292358398, -1.5659866333007812, 10.141590118408203, 21.849166870117188, 33.55674743652344, 45.264320373535156, 56.971900939941406, 68.67948150634766, 80.38705444335938, 92.09463500976562, 103.80221557617188, 115.5097885131836, 127.21736907958984, 138.92494201660156, 150.6325225830078, 162.34010314941406, 174.0476837158203, 185.7552490234375, 197.46282958984375, 209.17041015625, 220.87799072265625, 232.5855712890625, 244.29315185546875, 256.000732421875, 267.70831298828125, 279.4158935546875, 291.12347412109375, 302.8310546875, 314.53863525390625, 326.2461853027344, 337.9537658691406]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 1.0, 8.0, 10.0, 12.0, 15.0, 9.0, 20.0, 24.0, 12.0, 28.0, 23.0, 34.0, 44.0, 55.0, 86.0, 153.0, 302.0, 612.0, 1125.0, 1041124.0, 2352.0, 1047.0, 616.0, 288.0, 151.0, 82.0, 49.0, 48.0, 35.0, 19.0, 26.0, 23.0, 20.0, 15.0, 17.0, 11.0, 8.0, 9.0, 10.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-183.59390258789062, -178.02786254882812, -172.46182250976562, -166.89578247070312, -161.32974243164062, -155.7637176513672, -150.1976776123047, -144.6316375732422, -139.0655975341797, -133.4995574951172, -127.93351745605469, -122.36748504638672, -116.80144500732422, -111.23540496826172, -105.66937255859375, -100.10333251953125, -94.53729248046875, -88.97125244140625, -83.40521240234375, -77.83917999267578, -72.27313995361328, -66.70709991455078, -61.14106369018555, -55.57502746582031, -50.00898742675781, -44.44294738769531, -38.87691116333008, -33.310874938964844, -27.744834899902344, -22.178796768188477, -16.61275863647461, -11.046722412109375, -5.4806976318359375, 0.08534049987792969, 5.651378631591797, 11.217416763305664, 16.78345489501953, 22.3494930267334, 27.915531158447266, 33.4815673828125, 39.047607421875, 44.6136474609375, 50.179683685302734, 55.74571990966797, 61.31175994873047, 66.87779998779297, 72.44383239746094, 78.00987243652344, 83.57591247558594, 89.14195251464844, 94.70799255371094, 100.2740249633789, 105.8400650024414, 111.4061050415039, 116.97213745117188, 122.53817749023438, 128.10421752929688, 133.67025756835938, 139.23629760742188, 144.80233764648438, 150.36837768554688, 155.9344024658203, 161.5004425048828, 167.0664825439453, 172.6325225830078]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 6.0, 8.0, 14.0, 13.0, 15.0, 28.0, 35.0, 78.0, 349.0, 51441860.0, 20352.0, 273.0, 50.0, 29.0, 17.0, 7.0, 7.0, 6.0, 9.0, 1.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2284.1474609375, -2216.785888671875, -2149.424072265625, -2082.0625, -2014.70068359375, -1947.339111328125, -1879.9774169921875, -1812.61572265625, -1745.2540283203125, -1677.892333984375, -1610.5306396484375, -1543.1689453125, -1475.807373046875, -1408.445556640625, -1341.083984375, -1273.7222900390625, -1206.360595703125, -1138.9989013671875, -1071.63720703125, -1004.2755737304688, -936.9138793945312, -869.5521850585938, -802.1905517578125, -734.828857421875, -667.4671630859375, -600.10546875, -532.7437744140625, -465.38214111328125, -398.02044677734375, -330.65875244140625, -263.2970886230469, -195.9354248046875, -128.57373046875, -61.21205139160156, 6.149627685546875, 73.51130676269531, 140.87298583984375, 208.23468017578125, 275.5963439941406, 342.9580078125, 410.3197021484375, 477.681396484375, 545.0430908203125, 612.4047241210938, 679.7664184570312, 747.1281127929688, 814.48974609375, 881.8514404296875, 949.213134765625, 1016.5748291015625, 1083.9365234375, 1151.2982177734375, 1218.659912109375, 1286.021484375, 1353.3831787109375, 1420.744873046875, 1488.1065673828125, 1555.46826171875, 1622.8299560546875, 1690.191650390625, 1757.55322265625, 1824.9150390625, 1892.276611328125, 1959.6383056640625, 2027.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 13.0, 29.0, 37.0, 47.0, 80.0, 153.0, 202.0, 307.0, 556.0, 870.0, 1315.0, 1966.0, 3094.0, 4846.0, 7423.0, 11045.0, 17809.0, 28319.0, 45431.0, 73579.0, 125278.0, 219306.0, 390510.0, 1635331.0, 2751805.0, 408674.0, 227935.0, 130027.0, 77588.0, 47348.0, 29040.0, 18273.0, 11620.0, 7698.0, 4893.0, 3057.0, 2082.0, 1341.0, 875.0, 560.0, 358.0, 258.0, 163.0, 105.0, 73.0, 39.0, 29.0, 19.0, 9.0, 9.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.525390625, -3.41180419921875, -3.2982177734375, -3.18463134765625, -3.071044921875, -2.95745849609375, -2.8438720703125, -2.73028564453125, -2.61669921875, -2.50311279296875, -2.3895263671875, -2.27593994140625, -2.162353515625, -2.04876708984375, -1.9351806640625, -1.82159423828125, -1.7080078125, -1.59442138671875, -1.4808349609375, -1.36724853515625, -1.253662109375, -1.14007568359375, -1.0264892578125, -0.91290283203125, -0.79931640625, -0.68572998046875, -0.5721435546875, -0.45855712890625, -0.344970703125, -0.23138427734375, -0.1177978515625, -0.00421142578125, 0.109375, 0.22296142578125, 0.3365478515625, 0.45013427734375, 0.563720703125, 0.67730712890625, 0.7908935546875, 0.90447998046875, 1.01806640625, 1.13165283203125, 1.2452392578125, 1.35882568359375, 1.472412109375, 1.58599853515625, 1.6995849609375, 1.81317138671875, 1.9267578125, 2.04034423828125, 2.1539306640625, 2.26751708984375, 2.381103515625, 2.49468994140625, 2.6082763671875, 2.72186279296875, 2.83544921875, 2.94903564453125, 3.0626220703125, 3.17620849609375, 3.289794921875, 3.40338134765625, 3.5169677734375, 3.63055419921875, 3.744140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 12.0, 10.0, 11.0, 10.0, 7.0, 11.0, 16.0, 17.0, 14.0, 22.0, 26.0, 30.0, 30.0, 36.0, 24.0, 35.0, 29.0, 41.0, 44.0, 120.0, 955.0, 83.0, 39.0, 28.0, 28.0, 33.0, 41.0, 31.0, 40.0, 29.0, 20.0, 17.0, 13.0, 23.0, 17.0, 13.0, 14.0, 15.0, 4.0, 5.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.71533203125, -31.4306640625, -30.14599609375, -28.861328125, -27.57666015625, -26.2919921875, -25.00732421875, -23.72265625, -22.43798828125, -21.1533203125, -19.86865234375, -18.583984375, -17.29931640625, -16.0146484375, -14.72998046875, -13.4453125, -12.16064453125, -10.8759765625, -9.59130859375, -8.306640625, -7.02197265625, -5.7373046875, -4.45263671875, -3.16796875, -1.88330078125, -0.5986328125, 0.68603515625, 1.970703125, 3.25537109375, 4.5400390625, 5.82470703125, 7.109375, 8.39404296875, 9.6787109375, 10.96337890625, 12.248046875, 13.53271484375, 14.8173828125, 16.10205078125, 17.38671875, 18.67138671875, 19.9560546875, 21.24072265625, 22.525390625, 23.81005859375, 25.0947265625, 26.37939453125, 27.6640625, 28.94873046875, 30.2333984375, 31.51806640625, 32.802734375, 34.08740234375, 35.3720703125, 36.65673828125, 37.94140625, 39.22607421875, 40.5107421875, 41.79541015625, 43.080078125, 44.36474609375, 45.6494140625, 46.93408203125, 48.21875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 20.0, 15.0, 30.0, 32.0, 64.0, 95.0, 170.0, 277.0, 479.0, 690.0, 1100.0, 1759.0, 2853.0, 4622.0, 7351.0, 11619.0, 18706.0, 30237.0, 48658.0, 79088.0, 131886.0, 218741.0, 340194.0, 506527.0, 3615205.0, 452069.0, 312398.0, 197273.0, 119950.0, 72053.0, 44687.0, 27303.0, 17087.0, 10303.0, 6690.0, 4244.0, 2609.0, 1678.0, 926.0, 654.0, 408.0, 220.0, 156.0, 109.0, 75.0, 39.0, 32.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0], "bins": [-2.775390625, -2.689727783203125, -2.60406494140625, -2.518402099609375, -2.4327392578125, -2.347076416015625, -2.26141357421875, -2.175750732421875, -2.090087890625, -2.004425048828125, -1.91876220703125, -1.833099365234375, -1.7474365234375, -1.661773681640625, -1.57611083984375, -1.490447998046875, -1.40478515625, -1.319122314453125, -1.23345947265625, -1.147796630859375, -1.0621337890625, -0.976470947265625, -0.89080810546875, -0.805145263671875, -0.719482421875, -0.633819580078125, -0.54815673828125, -0.462493896484375, -0.3768310546875, -0.291168212890625, -0.20550537109375, -0.119842529296875, -0.0341796875, 0.051483154296875, 0.13714599609375, 0.222808837890625, 0.3084716796875, 0.394134521484375, 0.47979736328125, 0.565460205078125, 0.651123046875, 0.736785888671875, 0.82244873046875, 0.908111572265625, 0.9937744140625, 1.079437255859375, 1.16510009765625, 1.250762939453125, 1.33642578125, 1.422088623046875, 1.50775146484375, 1.593414306640625, 1.6790771484375, 1.764739990234375, 1.85040283203125, 1.936065673828125, 2.021728515625, 2.107391357421875, 2.19305419921875, 2.278717041015625, 2.3643798828125, 2.450042724609375, 2.53570556640625, 2.621368408203125, 2.70703125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 4.0, 5.0, 5.0, 12.0, 9.0, 13.0, 18.0, 22.0, 23.0, 21.0, 28.0, 29.0, 25.0, 34.0, 44.0, 28.0, 33.0, 40.0, 34.0, 125.0, 966.0, 49.0, 36.0, 37.0, 39.0, 41.0, 27.0, 36.0, 25.0, 25.0, 29.0, 23.0, 15.0, 17.0, 12.0, 15.0, 11.0, 13.0, 15.0, 7.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-31.125, -30.165283203125, -29.20556640625, -28.245849609375, -27.2861328125, -26.326416015625, -25.36669921875, -24.406982421875, -23.447265625, -22.487548828125, -21.52783203125, -20.568115234375, -19.6083984375, -18.648681640625, -17.68896484375, -16.729248046875, -15.76953125, -14.809814453125, -13.85009765625, -12.890380859375, -11.9306640625, -10.970947265625, -10.01123046875, -9.051513671875, -8.091796875, -7.132080078125, -6.17236328125, -5.212646484375, -4.2529296875, -3.293212890625, -2.33349609375, -1.373779296875, -0.4140625, 0.545654296875, 1.50537109375, 2.465087890625, 3.4248046875, 4.384521484375, 5.34423828125, 6.303955078125, 7.263671875, 8.223388671875, 9.18310546875, 10.142822265625, 11.1025390625, 12.062255859375, 13.02197265625, 13.981689453125, 14.94140625, 15.901123046875, 16.86083984375, 17.820556640625, 18.7802734375, 19.739990234375, 20.69970703125, 21.659423828125, 22.619140625, 23.578857421875, 24.53857421875, 25.498291015625, 26.4580078125, 27.417724609375, 28.37744140625, 29.337158203125, 30.296875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 12.0, 9.0, 7.0, 12.0, 17.0, 25.0, 28.0, 28.0, 51.0, 93.0, 123.0, 188.0, 208.0, 270.0, 397.0, 577.0, 1012.0, 1630.0, 3041.0, 5997.0, 12029.0, 24706.0, 52903.0, 114482.0, 5659354.0, 243140.0, 88709.0, 41753.0, 19955.0, 9637.0, 4693.0, 2520.0, 1286.0, 774.0, 486.0, 364.0, 261.0, 164.0, 143.0, 98.0, 74.0, 52.0, 29.0, 25.0, 21.0, 13.0, 14.0, 14.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0], "bins": [-10.3984375, -10.0999755859375, -9.801513671875, -9.5030517578125, -9.20458984375, -8.9061279296875, -8.607666015625, -8.3092041015625, -8.0107421875, -7.7122802734375, -7.413818359375, -7.1153564453125, -6.81689453125, -6.5184326171875, -6.219970703125, -5.9215087890625, -5.623046875, -5.3245849609375, -5.026123046875, -4.7276611328125, -4.42919921875, -4.1307373046875, -3.832275390625, -3.5338134765625, -3.2353515625, -2.9368896484375, -2.638427734375, -2.3399658203125, -2.04150390625, -1.7430419921875, -1.444580078125, -1.1461181640625, -0.84765625, -0.5491943359375, -0.250732421875, 0.0477294921875, 0.34619140625, 0.6446533203125, 0.943115234375, 1.2415771484375, 1.5400390625, 1.8385009765625, 2.136962890625, 2.4354248046875, 2.73388671875, 3.0323486328125, 3.330810546875, 3.6292724609375, 3.927734375, 4.2261962890625, 4.524658203125, 4.8231201171875, 5.12158203125, 5.4200439453125, 5.718505859375, 6.0169677734375, 6.3154296875, 6.6138916015625, 6.912353515625, 7.2108154296875, 7.50927734375, 7.8077392578125, 8.106201171875, 8.4046630859375, 8.703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 4.0, 8.0, 10.0, 13.0, 12.0, 11.0, 15.0, 13.0, 20.0, 26.0, 28.0, 35.0, 33.0, 28.0, 20.0, 29.0, 36.0, 44.0, 35.0, 566.0, 556.0, 38.0, 32.0, 42.0, 38.0, 29.0, 43.0, 31.0, 35.0, 32.0, 21.0, 20.0, 23.0, 14.0, 14.0, 20.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671875, -21.801513671875, -20.93115234375, -20.060791015625, -19.1904296875, -18.320068359375, -17.44970703125, -16.579345703125, -15.708984375, -14.838623046875, -13.96826171875, -13.097900390625, -12.2275390625, -11.357177734375, -10.48681640625, -9.616455078125, -8.74609375, -7.875732421875, -7.00537109375, -6.135009765625, -5.2646484375, -4.394287109375, -3.52392578125, -2.653564453125, -1.783203125, -0.912841796875, -0.04248046875, 0.827880859375, 1.6982421875, 2.568603515625, 3.43896484375, 4.309326171875, 5.1796875, 6.050048828125, 6.92041015625, 7.790771484375, 8.6611328125, 9.531494140625, 10.40185546875, 11.272216796875, 12.142578125, 13.012939453125, 13.88330078125, 14.753662109375, 15.6240234375, 16.494384765625, 17.36474609375, 18.235107421875, 19.10546875, 19.975830078125, 20.84619140625, 21.716552734375, 22.5869140625, 23.457275390625, 24.32763671875, 25.197998046875, 26.068359375, 26.938720703125, 27.80908203125, 28.679443359375, 29.5498046875, 30.420166015625, 31.29052734375, 32.160888671875, 33.03125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 18.0, 34.0, 78.0, 238.0, 380.0, 157.0, 55.0, 26.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.63021850585938, -165.21250915527344, -160.79481506347656, -156.37710571289062, -151.9593963623047, -147.54168701171875, -143.12399291992188, -138.70628356933594, -134.28857421875, -129.87086486816406, -125.45316314697266, -121.03546142578125, -116.61775207519531, -112.2000503540039, -107.7823486328125, -103.36463928222656, -98.94693756103516, -94.52923583984375, -90.11152648925781, -85.6938247680664, -81.27611541748047, -76.85841369628906, -72.44070434570312, -68.02300262451172, -63.60529708862305, -59.187591552734375, -54.7698860168457, -50.35218048095703, -45.934478759765625, -41.51676940917969, -37.09906768798828, -32.68136215209961, -28.263656616210938, -23.845951080322266, -19.428245544433594, -15.010541915893555, -10.592836380004883, -6.175130844116211, -1.7574272155761719, 2.6602783203125, 7.077983856201172, 11.495689392089844, 15.9133939743042, 20.331098556518555, 24.748804092407227, 29.1665096282959, 33.58421325683594, 38.00191879272461, 42.41962432861328, 46.83732986450195, 51.255035400390625, 55.67273712158203, 60.09044647216797, 64.50814819335938, 68.92585754394531, 73.34355926513672, 77.76126098632812, 82.17896270751953, 86.59667205810547, 91.01437377929688, 95.43208312988281, 99.84978485107422, 104.26748657226562, 108.68519592285156, 113.1029052734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 14.0, 19.0, 27.0, 17.0, 29.0, 34.0, 39.0, 45.0, 52.0, 40.0, 57.0, 49.0, 55.0, 48.0, 47.0, 40.0, 45.0, 49.0, 29.0, 35.0, 40.0, 28.0, 21.0, 16.0, 11.0, 18.0, 9.0, 13.0, 6.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.93032836914062, -71.72845458984375, -69.5265884399414, -67.32471466064453, -65.12284851074219, -62.92097473144531, -60.71910095214844, -58.51723098754883, -56.31536102294922, -54.11349105834961, -51.91162109375, -49.709747314453125, -47.507877349853516, -45.306007385253906, -43.10413360595703, -40.90226364135742, -38.70039367675781, -36.4985237121582, -34.296653747558594, -32.09477996826172, -29.89291000366211, -27.6910400390625, -25.489168167114258, -23.287296295166016, -21.085426330566406, -18.883556365966797, -16.681684494018555, -14.479813575744629, -12.277942657470703, -10.076071739196777, -7.874200820922852, -5.672329902648926, -3.470458984375, -1.2685880661010742, 0.9332828521728516, 3.1351537704467773, 5.337024688720703, 7.538895606994629, 9.740766525268555, 11.94263744354248, 14.144508361816406, 16.346378326416016, 18.548250198364258, 20.7501220703125, 22.95199203491211, 25.15386199951172, 27.35573387145996, 29.557605743408203, 31.759475708007812, 33.96134567260742, 36.16321563720703, 38.365089416503906, 40.566959381103516, 42.768829345703125, 44.970703125, 47.17257308959961, 49.37444305419922, 51.57631301879883, 53.77818298339844, 55.98005676269531, 58.18192672729492, 60.38379669189453, 62.585670471191406, 64.78753662109375, 66.98941040039062]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 13.0, 11.0, 9.0, 24.0, 17.0, 17.0, 31.0, 54.0, 56.0, 94.0, 120.0, 153.0, 215.0, 302.0, 401.0, 614.0, 1117.0, 1989.0, 4024.0, 10613.0, 46441.0, 3963256.0, 131930.0, 18634.0, 6440.0, 2994.0, 1554.0, 956.0, 573.0, 434.0, 281.0, 196.0, 149.0, 101.0, 101.0, 78.0, 51.0, 56.0, 33.0, 27.0, 17.0, 25.0, 15.0, 10.0, 8.0, 8.0, 11.0, 9.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.56640625, -0.5473403930664062, -0.5282745361328125, -0.5092086791992188, -0.490142822265625, -0.47107696533203125, -0.4520111083984375, -0.43294525146484375, -0.41387939453125, -0.39481353759765625, -0.3757476806640625, -0.35668182373046875, -0.337615966796875, -0.31855010986328125, -0.2994842529296875, -0.28041839599609375, -0.2613525390625, -0.24228668212890625, -0.2232208251953125, -0.20415496826171875, -0.185089111328125, -0.16602325439453125, -0.1469573974609375, -0.12789154052734375, -0.10882568359375, -0.08975982666015625, -0.0706939697265625, -0.05162811279296875, -0.032562255859375, -0.01349639892578125, 0.0055694580078125, 0.02463531494140625, 0.043701171875, 0.06276702880859375, 0.0818328857421875, 0.10089874267578125, 0.119964599609375, 0.13903045654296875, 0.1580963134765625, 0.17716217041015625, 0.19622802734375, 0.21529388427734375, 0.2343597412109375, 0.25342559814453125, 0.272491455078125, 0.29155731201171875, 0.3106231689453125, 0.32968902587890625, 0.3487548828125, 0.36782073974609375, 0.3868865966796875, 0.40595245361328125, 0.425018310546875, 0.44408416748046875, 0.4631500244140625, 0.48221588134765625, 0.50128173828125, 0.5203475952148438, 0.5394134521484375, 0.5584793090820312, 0.577545166015625, 0.5966110229492188, 0.6156768798828125, 0.6347427368164062, 0.65380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 2.0, 10.0, 5.0, 7.0, 13.0, 17.0, 14.0, 23.0, 759.0, 24.0, 15.0, 11.0, 12.0, 6.0, 7.0, 8.0, 5.0, 5.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.25269317626953125, -0.2439117431640625, -0.23513031005859375, -0.226348876953125, -0.21756744384765625, -0.2087860107421875, -0.20000457763671875, -0.19122314453125, -0.18244171142578125, -0.1736602783203125, -0.16487884521484375, -0.156097412109375, -0.14731597900390625, -0.1385345458984375, -0.12975311279296875, -0.1209716796875, -0.11219024658203125, -0.1034088134765625, -0.09462738037109375, -0.085845947265625, -0.07706451416015625, -0.0682830810546875, -0.05950164794921875, -0.05072021484375, -0.04193878173828125, -0.0331573486328125, -0.02437591552734375, -0.015594482421875, -0.00681304931640625, 0.0019683837890625, 0.01074981689453125, 0.01953125, 0.02831268310546875, 0.0370941162109375, 0.04587554931640625, 0.054656982421875, 0.06343841552734375, 0.0722198486328125, 0.08100128173828125, 0.08978271484375, 0.09856414794921875, 0.1073455810546875, 0.11612701416015625, 0.124908447265625, 0.13368988037109375, 0.1424713134765625, 0.15125274658203125, 0.1600341796875, 0.16881561279296875, 0.1775970458984375, 0.18637847900390625, 0.195159912109375, 0.20394134521484375, 0.2127227783203125, 0.22150421142578125, 0.23028564453125, 0.23906707763671875, 0.2478485107421875, 0.25662994384765625, 0.265411376953125, 0.27419281005859375, 0.2829742431640625, 0.29175567626953125, 0.300537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 1.0, 5.0, 9.0, 17.0, 11.0, 16.0, 34.0, 36.0, 71.0, 100.0, 145.0, 228.0, 303.0, 549.0, 892.0, 1734.0, 3424.0, 8993.0, 32504.0, 379314.0, 3632159.0, 103446.0, 18123.0, 5969.0, 2522.0, 1382.0, 795.0, 498.0, 333.0, 221.0, 154.0, 81.0, 55.0, 43.0, 34.0, 19.0, 13.0, 10.0, 7.0, 10.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6402511596679688, -0.6183929443359375, -0.5965347290039062, -0.574676513671875, -0.5528182983398438, -0.5309600830078125, -0.5091018676757812, -0.48724365234375, -0.46538543701171875, -0.4435272216796875, -0.42166900634765625, -0.399810791015625, -0.37795257568359375, -0.3560943603515625, -0.33423614501953125, -0.3123779296875, -0.29051971435546875, -0.2686614990234375, -0.24680328369140625, -0.224945068359375, -0.20308685302734375, -0.1812286376953125, -0.15937042236328125, -0.13751220703125, -0.11565399169921875, -0.0937957763671875, -0.07193756103515625, -0.050079345703125, -0.02822113037109375, -0.0063629150390625, 0.01549530029296875, 0.037353515625, 0.05921173095703125, 0.0810699462890625, 0.10292816162109375, 0.124786376953125, 0.14664459228515625, 0.1685028076171875, 0.19036102294921875, 0.21221923828125, 0.23407745361328125, 0.2559356689453125, 0.27779388427734375, 0.299652099609375, 0.32151031494140625, 0.3433685302734375, 0.36522674560546875, 0.3870849609375, 0.40894317626953125, 0.4308013916015625, 0.45265960693359375, 0.474517822265625, 0.49637603759765625, 0.5182342529296875, 0.5400924682617188, 0.56195068359375, 0.5838088989257812, 0.6056671142578125, 0.6275253295898438, 0.649383544921875, 0.6712417602539062, 0.6930999755859375, 0.7149581909179688, 0.73681640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 9.0, 5.0, 13.0, 9.0, 22.0, 45.0, 62.0, 162.0, 797.0, 2140.0, 514.0, 130.0, 58.0, 37.0, 19.0, 12.0, 6.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.4912109375, -0.4760284423828125, -0.460845947265625, -0.4456634521484375, -0.43048095703125, -0.4152984619140625, -0.400115966796875, -0.3849334716796875, -0.3697509765625, -0.3545684814453125, -0.339385986328125, -0.3242034912109375, -0.30902099609375, -0.2938385009765625, -0.278656005859375, -0.2634735107421875, -0.248291015625, -0.2331085205078125, -0.217926025390625, -0.2027435302734375, -0.18756103515625, -0.1723785400390625, -0.157196044921875, -0.1420135498046875, -0.1268310546875, -0.1116485595703125, -0.096466064453125, -0.0812835693359375, -0.06610107421875, -0.0509185791015625, -0.035736083984375, -0.0205535888671875, -0.00537109375, 0.0098114013671875, 0.024993896484375, 0.0401763916015625, 0.05535888671875, 0.0705413818359375, 0.085723876953125, 0.1009063720703125, 0.1160888671875, 0.1312713623046875, 0.146453857421875, 0.1616363525390625, 0.17681884765625, 0.1920013427734375, 0.207183837890625, 0.2223663330078125, 0.237548828125, 0.2527313232421875, 0.267913818359375, 0.2830963134765625, 0.29827880859375, 0.3134613037109375, 0.328643798828125, 0.3438262939453125, 0.3590087890625, 0.3741912841796875, 0.389373779296875, 0.4045562744140625, 0.41973876953125, 0.4349212646484375, 0.450103759765625, 0.4652862548828125, 0.48046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 14.0, 39.0, 115.0, 316.0, 324.0, 117.0, 39.0, 14.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6542479991912842, -1.5881787538528442, -1.5221095085144043, -1.4560402631759644, -1.3899710178375244, -1.3239017724990845, -1.2578325271606445, -1.1917634010314941, -1.1256940364837646, -1.0596247911453247, -0.9935555458068848, -0.9274863004684448, -0.8614170551300049, -0.7953478097915649, -0.7292786240577698, -0.6632093787193298, -0.5971401929855347, -0.5310709476470947, -0.4650017023086548, -0.39893248677253723, -0.3328632414340973, -0.26679399609565735, -0.2007247805595398, -0.13465553522109985, -0.06858628988265991, -0.0025170519948005676, 0.06355218589305878, 0.12962141633033752, 0.19569066166877747, 0.2617599070072174, 0.32782912254333496, 0.3938983678817749, 0.45996761322021484, 0.5260368585586548, 0.5921061038970947, 0.6581753492355347, 0.7242445945739746, 0.7903138399124146, 0.8563830256462097, 0.9224522709846497, 0.9885215163230896, 1.0545907020568848, 1.1206599473953247, 1.1867291927337646, 1.2527984380722046, 1.3188676834106445, 1.3849369287490845, 1.4510061740875244, 1.5170754194259644, 1.5831446647644043, 1.6492139101028442, 1.7152831554412842, 1.7813524007797241, 1.847421646118164, 1.9134907722473145, 1.979560136795044, 2.0456292629241943, 2.1116983890533447, 2.177767753601074, 2.2438368797302246, 2.309906244277954, 2.3759753704071045, 2.442044734954834, 2.5081138610839844, 2.574183225631714]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 5.0, 6.0, 17.0, 7.0, 21.0, 22.0, 24.0, 38.0, 36.0, 48.0, 55.0, 79.0, 64.0, 59.0, 66.0, 77.0, 61.0, 49.0, 43.0, 40.0, 29.0, 18.0, 18.0, 20.0, 14.0, 10.0, 14.0, 13.0, 7.0, 3.0, 11.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0924677848815918, -1.0598351955413818, -1.0272026062011719, -0.9945700764656067, -0.9619375467300415, -0.9293049573898315, -0.8966723680496216, -0.8640397787094116, -0.8314072489738464, -0.7987746596336365, -0.7661421298980713, -0.7335095405578613, -0.7008769512176514, -0.6682444214820862, -0.6356118321418762, -0.602979302406311, -0.5703467130661011, -0.5377141237258911, -0.5050815939903259, -0.47244900465011597, -0.4398164451122284, -0.4071838855743408, -0.37455129623413086, -0.3419187366962433, -0.3092861771583557, -0.27665361762046814, -0.24402104318141937, -0.2113884687423706, -0.17875590920448303, -0.14612334966659546, -0.11349077522754669, -0.08085820078849792, -0.0482257604598999, -0.015593193471431732, 0.017039373517036438, 0.04967194050550461, 0.08230450749397278, 0.11493706703186035, 0.14756964147090912, 0.18020221590995789, 0.21283477544784546, 0.24546733498573303, 0.2780998945236206, 0.31073248386383057, 0.34336504340171814, 0.3759976029396057, 0.4086301922798157, 0.44126275181770325, 0.4738953113555908, 0.5065279006958008, 0.539160430431366, 0.5717930197715759, 0.6044255495071411, 0.6370581388473511, 0.669690728187561, 0.702323317527771, 0.7349558472633362, 0.7675884366035461, 0.8002209663391113, 0.8328535556793213, 0.8654861450195312, 0.8981186747550964, 0.9307512640953064, 0.9633837938308716, 0.9960163831710815]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 1.0, 8.0, 11.0, 12.0, 19.0, 20.0, 45.0, 55.0, 94.0, 132.0, 225.0, 301.0, 412.0, 610.0, 884.0, 1380.0, 2053.0, 3015.0, 4951.0, 8374.0, 16038.0, 35675.0, 857250.0, 64900.0, 22650.0, 11574.0, 6562.0, 3926.0, 2469.0, 1567.0, 1032.0, 740.0, 499.0, 352.0, 236.0, 166.0, 87.0, 70.0, 53.0, 41.0, 25.0, 11.0, 14.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.337738037109375, -1.29559326171875, -1.253448486328125, -1.2113037109375, -1.169158935546875, -1.12701416015625, -1.084869384765625, -1.042724609375, -1.000579833984375, -0.95843505859375, -0.916290283203125, -0.8741455078125, -0.832000732421875, -0.78985595703125, -0.747711181640625, -0.70556640625, -0.663421630859375, -0.62127685546875, -0.579132080078125, -0.5369873046875, -0.494842529296875, -0.45269775390625, -0.410552978515625, -0.368408203125, -0.326263427734375, -0.28411865234375, -0.241973876953125, -0.1998291015625, -0.157684326171875, -0.11553955078125, -0.073394775390625, -0.03125, 0.010894775390625, 0.05303955078125, 0.095184326171875, 0.1373291015625, 0.179473876953125, 0.22161865234375, 0.263763427734375, 0.305908203125, 0.348052978515625, 0.39019775390625, 0.432342529296875, 0.4744873046875, 0.516632080078125, 0.55877685546875, 0.600921630859375, 0.64306640625, 0.685211181640625, 0.72735595703125, 0.769500732421875, 0.8116455078125, 0.853790283203125, 0.89593505859375, 0.938079833984375, 0.980224609375, 1.022369384765625, 1.06451416015625, 1.106658935546875, 1.1488037109375, 1.190948486328125, 1.23309326171875, 1.275238037109375, 1.3173828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 4.0, 2.0, 5.0, 9.0, 4.0, 5.0, 10.0, 13.0, 14.0, 20.0, 162.0, 616.0, 25.0, 16.0, 8.0, 14.0, 7.0, 3.0, 10.0, 4.0, 3.0, 6.0, 10.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.2333087921142578, -0.22479629516601562, -0.21628379821777344, -0.20777130126953125, -0.19925880432128906, -0.19074630737304688, -0.1822338104248047, -0.1737213134765625, -0.1652088165283203, -0.15669631958007812, -0.14818382263183594, -0.13967132568359375, -0.13115882873535156, -0.12264633178710938, -0.11413383483886719, -0.105621337890625, -0.09710884094238281, -0.08859634399414062, -0.08008384704589844, -0.07157135009765625, -0.06305885314941406, -0.054546356201171875, -0.04603385925292969, -0.0375213623046875, -0.029008865356445312, -0.020496368408203125, -0.011983871459960938, -0.00347137451171875, 0.0050411224365234375, 0.013553619384765625, 0.022066116333007812, 0.03057861328125, 0.03909111022949219, 0.047603607177734375, 0.05611610412597656, 0.06462860107421875, 0.07314109802246094, 0.08165359497070312, 0.09016609191894531, 0.0986785888671875, 0.10719108581542969, 0.11570358276367188, 0.12421607971191406, 0.13272857666015625, 0.14124107360839844, 0.14975357055664062, 0.1582660675048828, 0.166778564453125, 0.1752910614013672, 0.18380355834960938, 0.19231605529785156, 0.20082855224609375, 0.20934104919433594, 0.21785354614257812, 0.2263660430908203, 0.2348785400390625, 0.2433910369873047, 0.2519035339355469, 0.26041603088378906, 0.26892852783203125, 0.27744102478027344, 0.2859535217285156, 0.2944660186767578, 0.302978515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 10.0, 14.0, 17.0, 25.0, 30.0, 33.0, 48.0, 63.0, 92.0, 127.0, 196.0, 260.0, 436.0, 636.0, 1249.0, 2555.0, 5588.0, 13293.0, 35240.0, 106623.0, 366738.0, 353034.0, 103668.0, 34334.0, 13083.0, 5448.0, 2427.0, 1256.0, 707.0, 434.0, 247.0, 156.0, 118.0, 95.0, 68.0, 67.0, 41.0, 26.0, 21.0, 14.0, 16.0, 8.0, 2.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.71234130859375, -0.6868896484375, -0.66143798828125, -0.635986328125, -0.61053466796875, -0.5850830078125, -0.55963134765625, -0.5341796875, -0.50872802734375, -0.4832763671875, -0.45782470703125, -0.432373046875, -0.40692138671875, -0.3814697265625, -0.35601806640625, -0.33056640625, -0.30511474609375, -0.2796630859375, -0.25421142578125, -0.228759765625, -0.20330810546875, -0.1778564453125, -0.15240478515625, -0.126953125, -0.10150146484375, -0.0760498046875, -0.05059814453125, -0.025146484375, 0.00030517578125, 0.0257568359375, 0.05120849609375, 0.07666015625, 0.10211181640625, 0.1275634765625, 0.15301513671875, 0.178466796875, 0.20391845703125, 0.2293701171875, 0.25482177734375, 0.2802734375, 0.30572509765625, 0.3311767578125, 0.35662841796875, 0.382080078125, 0.40753173828125, 0.4329833984375, 0.45843505859375, 0.48388671875, 0.50933837890625, 0.5347900390625, 0.56024169921875, 0.585693359375, 0.61114501953125, 0.6365966796875, 0.66204833984375, 0.6875, 0.71295166015625, 0.7384033203125, 0.76385498046875, 0.789306640625, 0.81475830078125, 0.8402099609375, 0.86566162109375, 0.89111328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 4.0, 4.0, 9.0, 9.0, 22.0, 15.0, 8.0, 16.0, 14.0, 20.0, 31.0, 26.0, 26.0, 31.0, 25.0, 33.0, 32.0, 31.0, 39.0, 29.0, 34.0, 37.0, 33.0, 38.0, 34.0, 35.0, 26.0, 34.0, 21.0, 33.0, 36.0, 30.0, 24.0, 20.0, 28.0, 18.0, 9.0, 14.0, 9.0, 11.0, 8.0, 6.0, 8.0, 6.0, 8.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.8380355834960938, -0.8098602294921875, -0.7816848754882812, -0.753509521484375, -0.7253341674804688, -0.6971588134765625, -0.6689834594726562, -0.64080810546875, -0.6126327514648438, -0.5844573974609375, -0.5562820434570312, -0.528106689453125, -0.49993133544921875, -0.4717559814453125, -0.44358062744140625, -0.4154052734375, -0.38722991943359375, -0.3590545654296875, -0.33087921142578125, -0.302703857421875, -0.27452850341796875, -0.2463531494140625, -0.21817779541015625, -0.19000244140625, -0.16182708740234375, -0.1336517333984375, -0.10547637939453125, -0.077301025390625, -0.04912567138671875, -0.0209503173828125, 0.00722503662109375, 0.035400390625, 0.06357574462890625, 0.0917510986328125, 0.11992645263671875, 0.148101806640625, 0.17627716064453125, 0.2044525146484375, 0.23262786865234375, 0.26080322265625, 0.28897857666015625, 0.3171539306640625, 0.34532928466796875, 0.373504638671875, 0.40167999267578125, 0.4298553466796875, 0.45803070068359375, 0.4862060546875, 0.5143814086914062, 0.5425567626953125, 0.5707321166992188, 0.598907470703125, 0.6270828247070312, 0.6552581787109375, 0.6834335327148438, 0.71160888671875, 0.7397842407226562, 0.7679595947265625, 0.7961349487304688, 0.824310302734375, 0.8524856567382812, 0.8806610107421875, 0.9088363647460938, 0.93701171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 2.0, 5.0, 4.0, 6.0, 13.0, 15.0, 18.0, 24.0, 39.0, 56.0, 52.0, 103.0, 138.0, 212.0, 374.0, 641.0, 1137.0, 2883.0, 8051.0, 41367.0, 814926.0, 154539.0, 15740.0, 4335.0, 1757.0, 826.0, 467.0, 286.0, 188.0, 95.0, 76.0, 42.0, 36.0, 22.0, 22.0, 13.0, 12.0, 6.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.99560546875, -0.9597091674804688, -0.9238128662109375, -0.8879165649414062, -0.852020263671875, -0.8161239624023438, -0.7802276611328125, -0.7443313598632812, -0.70843505859375, -0.6725387573242188, -0.6366424560546875, -0.6007461547851562, -0.564849853515625, -0.5289535522460938, -0.4930572509765625, -0.45716094970703125, -0.4212646484375, -0.38536834716796875, -0.3494720458984375, -0.31357574462890625, -0.277679443359375, -0.24178314208984375, -0.2058868408203125, -0.16999053955078125, -0.13409423828125, -0.09819793701171875, -0.0623016357421875, -0.02640533447265625, 0.009490966796875, 0.04538726806640625, 0.0812835693359375, 0.11717987060546875, 0.153076171875, 0.18897247314453125, 0.2248687744140625, 0.26076507568359375, 0.296661376953125, 0.33255767822265625, 0.3684539794921875, 0.40435028076171875, 0.44024658203125, 0.47614288330078125, 0.5120391845703125, 0.5479354858398438, 0.583831787109375, 0.6197280883789062, 0.6556243896484375, 0.6915206909179688, 0.7274169921875, 0.7633132934570312, 0.7992095947265625, 0.8351058959960938, 0.871002197265625, 0.9068984985351562, 0.9427947998046875, 0.9786911010742188, 1.01458740234375, 1.0504837036132812, 1.0863800048828125, 1.1222763061523438, 1.158172607421875, 1.1940689086914062, 1.2299652099609375, 1.2658615112304688, 1.3017578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 10.0, 18.0, 15.0, 27.0, 33.0, 56.0, 66.0, 83.0, 93.0, 96.0, 120.0, 98.0, 85.0, 55.0, 33.0, 27.0, 23.0, 15.0, 6.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.765127182006836e-05, -6.594602018594742e-05, -6.424076855182648e-05, -6.253551691770554e-05, -6.0830265283584595e-05, -5.9125013649463654e-05, -5.741976201534271e-05, -5.571451038122177e-05, -5.400925874710083e-05, -5.230400711297989e-05, -5.059875547885895e-05, -4.8893503844738007e-05, -4.7188252210617065e-05, -4.5483000576496124e-05, -4.377774894237518e-05, -4.207249730825424e-05, -4.03672456741333e-05, -3.866199404001236e-05, -3.695674240589142e-05, -3.525149077177048e-05, -3.3546239137649536e-05, -3.1840987503528595e-05, -3.0135735869407654e-05, -2.8430484235286713e-05, -2.672523260116577e-05, -2.501998096704483e-05, -2.331472933292389e-05, -2.1609477698802948e-05, -1.9904226064682007e-05, -1.8198974430561066e-05, -1.6493722796440125e-05, -1.4788471162319183e-05, -1.3083219528198242e-05, -1.1377967894077301e-05, -9.67271625995636e-06, -7.967464625835419e-06, -6.2622129917144775e-06, -4.556961357593536e-06, -2.8517097234725952e-06, -1.146458089351654e-06, 5.587935447692871e-07, 2.2640451788902283e-06, 3.9692968130111694e-06, 5.674548447132111e-06, 7.379800081253052e-06, 9.085051715373993e-06, 1.0790303349494934e-05, 1.2495554983615875e-05, 1.4200806617736816e-05, 1.5906058251857758e-05, 1.76113098859787e-05, 1.931656152009964e-05, 2.102181315422058e-05, 2.2727064788341522e-05, 2.4432316422462463e-05, 2.6137568056583405e-05, 2.7842819690704346e-05, 2.9548071324825287e-05, 3.125332295894623e-05, 3.295857459306717e-05, 3.466382622718811e-05, 3.636907786130905e-05, 3.807432949542999e-05, 3.9779581129550934e-05, 4.1484832763671875e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 6.0, 5.0, 18.0, 34.0, 19.0, 66.0, 83.0, 131.0, 216.0, 338.0, 667.0, 1204.0, 2546.0, 5680.0, 16447.0, 93561.0, 799687.0, 99189.0, 17108.0, 5954.0, 2554.0, 1338.0, 679.0, 359.0, 219.0, 149.0, 93.0, 61.0, 29.0, 20.0, 14.0, 19.0, 11.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.158203125, -1.1161041259765625, -1.074005126953125, -1.0319061279296875, -0.98980712890625, -0.9477081298828125, -0.905609130859375, -0.8635101318359375, -0.8214111328125, -0.7793121337890625, -0.737213134765625, -0.6951141357421875, -0.65301513671875, -0.6109161376953125, -0.568817138671875, -0.5267181396484375, -0.484619140625, -0.4425201416015625, -0.400421142578125, -0.3583221435546875, -0.31622314453125, -0.2741241455078125, -0.232025146484375, -0.1899261474609375, -0.1478271484375, -0.1057281494140625, -0.063629150390625, -0.0215301513671875, 0.02056884765625, 0.0626678466796875, 0.104766845703125, 0.1468658447265625, 0.18896484375, 0.2310638427734375, 0.273162841796875, 0.3152618408203125, 0.35736083984375, 0.3994598388671875, 0.441558837890625, 0.4836578369140625, 0.5257568359375, 0.5678558349609375, 0.609954833984375, 0.6520538330078125, 0.69415283203125, 0.7362518310546875, 0.778350830078125, 0.8204498291015625, 0.862548828125, 0.9046478271484375, 0.946746826171875, 0.9888458251953125, 1.03094482421875, 1.0730438232421875, 1.115142822265625, 1.1572418212890625, 1.1993408203125, 1.2414398193359375, 1.283538818359375, 1.3256378173828125, 1.36773681640625, 1.4098358154296875, 1.451934814453125, 1.4940338134765625, 1.5361328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 6.0, 8.0, 8.0, 7.0, 12.0, 26.0, 21.0, 44.0, 66.0, 63.0, 102.0, 115.0, 104.0, 114.0, 60.0, 49.0, 39.0, 39.0, 16.0, 17.0, 19.0, 5.0, 11.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4140625, -1.3710784912109375, -1.328094482421875, -1.2851104736328125, -1.24212646484375, -1.1991424560546875, -1.156158447265625, -1.1131744384765625, -1.0701904296875, -1.0272064208984375, -0.984222412109375, -0.9412384033203125, -0.89825439453125, -0.8552703857421875, -0.812286376953125, -0.7693023681640625, -0.726318359375, -0.6833343505859375, -0.640350341796875, -0.5973663330078125, -0.55438232421875, -0.5113983154296875, -0.468414306640625, -0.4254302978515625, -0.3824462890625, -0.3394622802734375, -0.296478271484375, -0.2534942626953125, -0.21051025390625, -0.1675262451171875, -0.124542236328125, -0.0815582275390625, -0.03857421875, 0.0044097900390625, 0.047393798828125, 0.0903778076171875, 0.13336181640625, 0.1763458251953125, 0.219329833984375, 0.2623138427734375, 0.3052978515625, 0.3482818603515625, 0.391265869140625, 0.4342498779296875, 0.47723388671875, 0.5202178955078125, 0.563201904296875, 0.6061859130859375, 0.649169921875, 0.6921539306640625, 0.735137939453125, 0.7781219482421875, 0.82110595703125, 0.8640899658203125, 0.907073974609375, 0.9500579833984375, 0.9930419921875, 1.0360260009765625, 1.079010009765625, 1.1219940185546875, 1.16497802734375, 1.2079620361328125, 1.250946044921875, 1.2939300537109375, 1.3369140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 16.0, 28.0, 144.0, 483.0, 228.0, 59.0, 20.0, 9.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.70941925048828, -16.927597045898438, -16.145774841308594, -15.363953590393066, -14.582131385803223, -13.800310134887695, -13.018487930297852, -12.236665725708008, -11.454843521118164, -10.67302131652832, -9.891200065612793, -9.10937786102295, -8.327555656433105, -7.54573392868042, -6.763912200927734, -5.982089996337891, -5.200268745422363, -4.418447017669678, -3.636624813079834, -2.8548030853271484, -2.072981119155884, -1.2911591529846191, -0.5093374252319336, 0.27248477935791016, 1.0543065071105957, 1.8361284732818604, 2.617950439453125, 3.3997721672058105, 4.181593894958496, 4.96341609954834, 5.745237827301025, 6.527060031890869, 7.308881759643555, 8.090703964233398, 8.872525215148926, 9.65434741973877, 10.436169624328613, 11.21799087524414, 11.999813079833984, 12.781635284423828, 13.563457489013672, 14.345279693603516, 15.127100944519043, 15.908923149108887, 16.690744400024414, 17.472566604614258, 18.2543888092041, 19.036211013793945, 19.818031311035156, 20.599853515625, 21.381675720214844, 22.163497924804688, 22.9453182220459, 23.727140426635742, 24.508962631225586, 25.29078483581543, 26.072607040405273, 26.854429244995117, 27.63625144958496, 28.418071746826172, 29.199893951416016, 29.98171615600586, 30.763538360595703, 31.545360565185547, 32.32718276977539]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 10.0, 6.0, 6.0, 12.0, 17.0, 24.0, 43.0, 71.0, 73.0, 121.0, 111.0, 95.0, 97.0, 73.0, 61.0, 39.0, 15.0, 25.0, 11.0, 10.0, 6.0, 4.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-15.543840408325195, -15.022405624389648, -14.500970840454102, -13.979536056518555, -13.458101272583008, -12.936666488647461, -12.415230751037598, -11.89379596710205, -11.372361183166504, -10.850926399230957, -10.32949161529541, -9.808056831359863, -9.28662109375, -8.765186309814453, -8.243751525878906, -7.722316741943359, -7.2008819580078125, -6.679447174072266, -6.158012390136719, -5.636577129364014, -5.115142345428467, -4.59370756149292, -4.072272300720215, -3.550837516784668, -3.029402732849121, -2.507967948913574, -1.9865329265594482, -1.4650980234146118, -0.9436631202697754, -0.4222283363342285, 0.09920668601989746, 0.6206417083740234, 1.1420783996582031, 1.6635133028030396, 2.184948205947876, 2.706383228302002, 3.227818012237549, 3.7492527961730957, 4.270688056945801, 4.792122840881348, 5.3135576248168945, 5.834992408752441, 6.356427192687988, 6.877862453460693, 7.39929723739624, 7.920732021331787, 8.442167282104492, 8.963602066040039, 9.485036849975586, 10.006471633911133, 10.52790641784668, 11.049341201782227, 11.570775985717773, 12.09221076965332, 12.613646507263184, 13.13508129119873, 13.656516075134277, 14.177950859069824, 14.699385643005371, 15.220820426940918, 15.742256164550781, 16.263690948486328, 16.785125732421875, 17.306560516357422, 17.82799530029297]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 10.0, 14.0, 21.0, 20.0, 40.0, 54.0, 86.0, 98.0, 172.0, 278.0, 393.0, 718.0, 1172.0, 2013.0, 3684.0, 7468.0, 18054.0, 66999.0, 3765508.0, 261350.0, 36599.0, 13686.0, 6860.0, 3580.0, 2055.0, 1211.0, 821.0, 450.0, 281.0, 198.0, 120.0, 93.0, 47.0, 42.0, 25.0, 23.0, 12.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.9609375, -1.9028778076171875, -1.844818115234375, -1.7867584228515625, -1.72869873046875, -1.6706390380859375, -1.612579345703125, -1.5545196533203125, -1.4964599609375, -1.4384002685546875, -1.380340576171875, -1.3222808837890625, -1.26422119140625, -1.2061614990234375, -1.148101806640625, -1.0900421142578125, -1.031982421875, -0.9739227294921875, -0.915863037109375, -0.8578033447265625, -0.79974365234375, -0.7416839599609375, -0.683624267578125, -0.6255645751953125, -0.5675048828125, -0.5094451904296875, -0.451385498046875, -0.3933258056640625, -0.33526611328125, -0.2772064208984375, -0.219146728515625, -0.1610870361328125, -0.10302734375, -0.0449676513671875, 0.013092041015625, 0.0711517333984375, 0.12921142578125, 0.1872711181640625, 0.245330810546875, 0.3033905029296875, 0.3614501953125, 0.4195098876953125, 0.477569580078125, 0.5356292724609375, 0.59368896484375, 0.6517486572265625, 0.709808349609375, 0.7678680419921875, 0.825927734375, 0.8839874267578125, 0.942047119140625, 1.0001068115234375, 1.05816650390625, 1.1162261962890625, 1.174285888671875, 1.2323455810546875, 1.2904052734375, 1.3484649658203125, 1.406524658203125, 1.4645843505859375, 1.52264404296875, 1.5807037353515625, 1.638763427734375, 1.6968231201171875, 1.7548828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 7.0, 4.0, 0.0, 4.0, 9.0, 10.0, 9.0, 9.0, 12.0, 28.0, 51.0, 145.0, 270.0, 214.0, 77.0, 37.0, 20.0, 10.0, 7.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2041015625, -0.1980915069580078, -0.19208145141601562, -0.18607139587402344, -0.18006134033203125, -0.17405128479003906, -0.16804122924804688, -0.1620311737060547, -0.1560211181640625, -0.1500110626220703, -0.14400100708007812, -0.13799095153808594, -0.13198089599609375, -0.12597084045410156, -0.11996078491210938, -0.11395072937011719, -0.107940673828125, -0.10193061828613281, -0.09592056274414062, -0.08991050720214844, -0.08390045166015625, -0.07789039611816406, -0.07188034057617188, -0.06587028503417969, -0.0598602294921875, -0.05385017395019531, -0.047840118408203125, -0.04183006286621094, -0.03582000732421875, -0.029809951782226562, -0.023799896240234375, -0.017789840698242188, -0.01177978515625, -0.0057697296142578125, 0.000240325927734375, 0.0062503814697265625, 0.01226043701171875, 0.018270492553710938, 0.024280548095703125, 0.030290603637695312, 0.0363006591796875, 0.04231071472167969, 0.048320770263671875, 0.05433082580566406, 0.06034088134765625, 0.06635093688964844, 0.07236099243164062, 0.07837104797363281, 0.084381103515625, 0.09039115905761719, 0.09640121459960938, 0.10241127014160156, 0.10842132568359375, 0.11443138122558594, 0.12044143676757812, 0.1264514923095703, 0.1324615478515625, 0.1384716033935547, 0.14448165893554688, 0.15049171447753906, 0.15650177001953125, 0.16251182556152344, 0.16852188110351562, 0.1745319366455078, 0.1805419921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 13.0, 12.0, 24.0, 33.0, 45.0, 55.0, 96.0, 132.0, 185.0, 340.0, 601.0, 1042.0, 2229.0, 5329.0, 15178.0, 57765.0, 580572.0, 3356868.0, 131879.0, 26991.0, 8156.0, 3301.0, 1484.0, 788.0, 404.0, 235.0, 161.0, 108.0, 60.0, 45.0, 33.0, 30.0, 17.0, 11.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0531158447265625, -1.014434814453125, -0.9757537841796875, -0.93707275390625, -0.8983917236328125, -0.859710693359375, -0.8210296630859375, -0.7823486328125, -0.7436676025390625, -0.704986572265625, -0.6663055419921875, -0.62762451171875, -0.5889434814453125, -0.550262451171875, -0.5115814208984375, -0.472900390625, -0.4342193603515625, -0.395538330078125, -0.3568572998046875, -0.31817626953125, -0.2794952392578125, -0.240814208984375, -0.2021331787109375, -0.1634521484375, -0.1247711181640625, -0.086090087890625, -0.0474090576171875, -0.00872802734375, 0.0299530029296875, 0.068634033203125, 0.1073150634765625, 0.14599609375, 0.1846771240234375, 0.223358154296875, 0.2620391845703125, 0.30072021484375, 0.3394012451171875, 0.378082275390625, 0.4167633056640625, 0.4554443359375, 0.4941253662109375, 0.532806396484375, 0.5714874267578125, 0.61016845703125, 0.6488494873046875, 0.687530517578125, 0.7262115478515625, 0.764892578125, 0.8035736083984375, 0.842254638671875, 0.8809356689453125, 0.91961669921875, 0.9582977294921875, 0.996978759765625, 1.0356597900390625, 1.0743408203125, 1.1130218505859375, 1.151702880859375, 1.1903839111328125, 1.22906494140625, 1.2677459716796875, 1.306427001953125, 1.3451080322265625, 1.3837890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 7.0, 11.0, 14.0, 15.0, 31.0, 28.0, 41.0, 56.0, 92.0, 150.0, 462.0, 1523.0, 806.0, 331.0, 161.0, 85.0, 56.0, 36.0, 41.0, 23.0, 21.0, 10.0, 15.0, 10.0, 4.0, 3.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2669963836669922, -0.2588462829589844, -0.25069618225097656, -0.24254608154296875, -0.23439598083496094, -0.22624588012695312, -0.2180957794189453, -0.2099456787109375, -0.2017955780029297, -0.19364547729492188, -0.18549537658691406, -0.17734527587890625, -0.16919517517089844, -0.16104507446289062, -0.1528949737548828, -0.144744873046875, -0.1365947723388672, -0.12844467163085938, -0.12029457092285156, -0.11214447021484375, -0.10399436950683594, -0.09584426879882812, -0.08769416809082031, -0.0795440673828125, -0.07139396667480469, -0.06324386596679688, -0.05509376525878906, -0.04694366455078125, -0.03879356384277344, -0.030643463134765625, -0.022493362426757812, -0.01434326171875, -0.0061931610107421875, 0.001956939697265625, 0.010107040405273438, 0.01825714111328125, 0.026407241821289062, 0.034557342529296875, 0.04270744323730469, 0.0508575439453125, 0.05900764465332031, 0.06715774536132812, 0.07530784606933594, 0.08345794677734375, 0.09160804748535156, 0.09975814819335938, 0.10790824890136719, 0.116058349609375, 0.12420845031738281, 0.13235855102539062, 0.14050865173339844, 0.14865875244140625, 0.15680885314941406, 0.16495895385742188, 0.1731090545654297, 0.1812591552734375, 0.1894092559814453, 0.19755935668945312, 0.20570945739746094, 0.21385955810546875, 0.22200965881347656, 0.23015975952148438, 0.2383098602294922, 0.2464599609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 32.0, 344.0, 486.0, 92.0, 14.0, 9.0, 8.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.371602535247803, -5.226481914520264, -5.081361293792725, -4.936240196228027, -4.791119575500488, -4.645998954772949, -4.50087833404541, -4.355757713317871, -4.210637092590332, -4.065516471862793, -3.920395612716675, -3.7752749919891357, -3.6301541328430176, -3.4850335121154785, -3.3399128913879395, -3.1947922706604004, -3.049671173095703, -2.904550552368164, -2.759429693222046, -2.614309072494507, -2.4691882133483887, -2.3240675926208496, -2.1789469718933105, -2.0338263511657715, -1.8887054920196533, -1.7435847520828247, -1.598464012145996, -1.453343391418457, -1.3082226514816284, -1.1631019115447998, -1.0179812908172607, -0.8728605508804321, -0.7277393341064453, -0.5826185941696167, -0.43749791383743286, -0.29237720370292664, -0.1472564935684204, -0.002135753631591797, 0.14298492670059204, 0.2881056070327759, 0.4332263469696045, 0.5783470869064331, 0.7234677672386169, 0.8685884475708008, 1.0137091875076294, 1.158829927444458, 1.303950548171997, 1.4490712881088257, 1.5941920280456543, 1.739312767982483, 1.8844335079193115, 2.0295541286468506, 2.1746749877929688, 2.319795608520508, 2.464916229248047, 2.610036849975586, 2.755157709121704, 2.900278329849243, 3.0453991889953613, 3.1905198097229004, 3.3356404304504395, 3.4807612895965576, 3.6258819103240967, 3.771002769470215, 3.916123390197754]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 13.0, 9.0, 8.0, 25.0, 17.0, 28.0, 30.0, 43.0, 60.0, 63.0, 69.0, 66.0, 79.0, 75.0, 64.0, 56.0, 60.0, 39.0, 49.0, 31.0, 28.0, 22.0, 13.0, 14.0, 9.0, 5.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4345269203186035, -1.3878427743911743, -1.3411585092544556, -1.2944743633270264, -1.2477902173995972, -1.201106071472168, -1.1544218063354492, -1.10773766040802, -1.0610535144805908, -1.0143693685531616, -0.9676851630210876, -0.9210009574890137, -0.8743168115615845, -0.8276326060295105, -0.7809484004974365, -0.7342642545700073, -0.6875800490379333, -0.6408958435058594, -0.5942116975784302, -0.5475274920463562, -0.500843346118927, -0.454159140586853, -0.40747496485710144, -0.36079078912734985, -0.31410661339759827, -0.2674224376678467, -0.2207382619380951, -0.1740540713071823, -0.12736989557743073, -0.08068571984767914, -0.03400152921676636, 0.01268264651298523, 0.059366822242736816, 0.1060509979724884, 0.15273517370224, 0.19941936433315277, 0.24610354006290436, 0.29278773069381714, 0.3394719064235687, 0.3861560821533203, 0.4328402578830719, 0.4795244336128235, 0.5262086391448975, 0.5728927850723267, 0.6195769906044006, 0.6662611365318298, 0.7129453420639038, 0.759629487991333, 0.806313693523407, 0.852997899055481, 0.8996820449829102, 0.9463662505149841, 0.9930503964424133, 1.0397346019744873, 1.0864187479019165, 1.1331028938293457, 1.1797871589660645, 1.2264713048934937, 1.2731555700302124, 1.3198397159576416, 1.3665238618850708, 1.4132080078125, 1.4598922729492188, 1.506576418876648, 1.5532605648040771]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 11.0, 22.0, 36.0, 47.0, 65.0, 91.0, 149.0, 205.0, 339.0, 487.0, 662.0, 1020.0, 1659.0, 2344.0, 3585.0, 5686.0, 9206.0, 17101.0, 41404.0, 332349.0, 528745.0, 55804.0, 19354.0, 10292.0, 6136.0, 3869.0, 2615.0, 1760.0, 1158.0, 736.0, 497.0, 373.0, 220.0, 176.0, 112.0, 70.0, 47.0, 39.0, 18.0, 12.0, 6.0, 9.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0227813720703125, -0.989898681640625, -0.9570159912109375, -0.92413330078125, -0.8912506103515625, -0.858367919921875, -0.8254852294921875, -0.7926025390625, -0.7597198486328125, -0.726837158203125, -0.6939544677734375, -0.66107177734375, -0.6281890869140625, -0.595306396484375, -0.5624237060546875, -0.529541015625, -0.4966583251953125, -0.463775634765625, -0.4308929443359375, -0.39801025390625, -0.3651275634765625, -0.332244873046875, -0.2993621826171875, -0.2664794921875, -0.2335968017578125, -0.200714111328125, -0.1678314208984375, -0.13494873046875, -0.1020660400390625, -0.069183349609375, -0.0363006591796875, -0.00341796875, 0.0294647216796875, 0.062347412109375, 0.0952301025390625, 0.12811279296875, 0.1609954833984375, 0.193878173828125, 0.2267608642578125, 0.2596435546875, 0.2925262451171875, 0.325408935546875, 0.3582916259765625, 0.39117431640625, 0.4240570068359375, 0.456939697265625, 0.4898223876953125, 0.522705078125, 0.5555877685546875, 0.588470458984375, 0.6213531494140625, 0.65423583984375, 0.6871185302734375, 0.720001220703125, 0.7528839111328125, 0.7857666015625, 0.8186492919921875, 0.851531982421875, 0.8844146728515625, 0.91729736328125, 0.9501800537109375, 0.983062744140625, 1.0159454345703125, 1.048828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 7.0, 13.0, 3.0, 12.0, 17.0, 19.0, 49.0, 132.0, 192.0, 188.0, 140.0, 77.0, 36.0, 16.0, 17.0, 6.0, 8.0, 3.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1898193359375, -0.18430709838867188, -0.17879486083984375, -0.17328262329101562, -0.1677703857421875, -0.16225814819335938, -0.15674591064453125, -0.15123367309570312, -0.145721435546875, -0.14020919799804688, -0.13469696044921875, -0.12918472290039062, -0.1236724853515625, -0.11816024780273438, -0.11264801025390625, -0.10713577270507812, -0.10162353515625, -0.09611129760742188, -0.09059906005859375, -0.08508682250976562, -0.0795745849609375, -0.07406234741210938, -0.06855010986328125, -0.06303787231445312, -0.057525634765625, -0.052013397216796875, -0.04650115966796875, -0.040988922119140625, -0.0354766845703125, -0.029964447021484375, -0.02445220947265625, -0.018939971923828125, -0.013427734375, -0.007915496826171875, -0.00240325927734375, 0.003108978271484375, 0.0086212158203125, 0.014133453369140625, 0.01964569091796875, 0.025157928466796875, 0.030670166015625, 0.036182403564453125, 0.04169464111328125, 0.047206878662109375, 0.0527191162109375, 0.058231353759765625, 0.06374359130859375, 0.06925582885742188, 0.07476806640625, 0.08028030395507812, 0.08579254150390625, 0.09130477905273438, 0.0968170166015625, 0.10232925415039062, 0.10784149169921875, 0.11335372924804688, 0.118865966796875, 0.12437820434570312, 0.12989044189453125, 0.13540267944335938, 0.1409149169921875, 0.14642715454101562, 0.15193939208984375, 0.15745162963867188, 0.1629638671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 6.0, 19.0, 41.0, 92.0, 402.0, 1458.0, 15261.0, 596680.0, 422476.0, 10426.0, 1197.0, 319.0, 106.0, 30.0, 19.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.876953125, -2.789642333984375, -2.70233154296875, -2.615020751953125, -2.5277099609375, -2.440399169921875, -2.35308837890625, -2.265777587890625, -2.178466796875, -2.091156005859375, -2.00384521484375, -1.916534423828125, -1.8292236328125, -1.741912841796875, -1.65460205078125, -1.567291259765625, -1.47998046875, -1.392669677734375, -1.30535888671875, -1.218048095703125, -1.1307373046875, -1.043426513671875, -0.95611572265625, -0.868804931640625, -0.781494140625, -0.694183349609375, -0.60687255859375, -0.519561767578125, -0.4322509765625, -0.344940185546875, -0.25762939453125, -0.170318603515625, -0.0830078125, 0.004302978515625, 0.09161376953125, 0.178924560546875, 0.2662353515625, 0.353546142578125, 0.44085693359375, 0.528167724609375, 0.615478515625, 0.702789306640625, 0.79010009765625, 0.877410888671875, 0.9647216796875, 1.052032470703125, 1.13934326171875, 1.226654052734375, 1.31396484375, 1.401275634765625, 1.48858642578125, 1.575897216796875, 1.6632080078125, 1.750518798828125, 1.83782958984375, 1.925140380859375, 2.012451171875, 2.099761962890625, 2.18707275390625, 2.274383544921875, 2.3616943359375, 2.449005126953125, 2.53631591796875, 2.623626708984375, 2.7109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 9.0, 14.0, 12.0, 15.0, 13.0, 26.0, 20.0, 24.0, 31.0, 25.0, 22.0, 32.0, 37.0, 35.0, 31.0, 48.0, 36.0, 48.0, 38.0, 53.0, 35.0, 51.0, 31.0, 40.0, 27.0, 45.0, 25.0, 22.0, 19.0, 15.0, 17.0, 17.0, 9.0, 10.0, 14.0, 11.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5877609252929688, -0.5685882568359375, -0.5494155883789062, -0.530242919921875, -0.5110702514648438, -0.4918975830078125, -0.47272491455078125, -0.45355224609375, -0.43437957763671875, -0.4152069091796875, -0.39603424072265625, -0.376861572265625, -0.35768890380859375, -0.3385162353515625, -0.31934356689453125, -0.3001708984375, -0.28099822998046875, -0.2618255615234375, -0.24265289306640625, -0.223480224609375, -0.20430755615234375, -0.1851348876953125, -0.16596221923828125, -0.14678955078125, -0.12761688232421875, -0.1084442138671875, -0.08927154541015625, -0.070098876953125, -0.05092620849609375, -0.0317535400390625, -0.01258087158203125, 0.006591796875, 0.02576446533203125, 0.0449371337890625, 0.06410980224609375, 0.083282470703125, 0.10245513916015625, 0.1216278076171875, 0.14080047607421875, 0.15997314453125, 0.17914581298828125, 0.1983184814453125, 0.21749114990234375, 0.236663818359375, 0.25583648681640625, 0.2750091552734375, 0.29418182373046875, 0.3133544921875, 0.33252716064453125, 0.3516998291015625, 0.37087249755859375, 0.390045166015625, 0.40921783447265625, 0.4283905029296875, 0.44756317138671875, 0.46673583984375, 0.48590850830078125, 0.5050811767578125, 0.5242538452148438, 0.543426513671875, 0.5625991821289062, 0.5817718505859375, 0.6009445190429688, 0.6201171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 16.0, 18.0, 23.0, 38.0, 50.0, 53.0, 109.0, 215.0, 418.0, 949.0, 2604.0, 12306.0, 383541.0, 627735.0, 15453.0, 2916.0, 996.0, 449.0, 237.0, 136.0, 84.0, 59.0, 28.0, 27.0, 16.0, 12.0, 12.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.146484375, -2.0834503173828125, -2.020416259765625, -1.9573822021484375, -1.89434814453125, -1.8313140869140625, -1.768280029296875, -1.7052459716796875, -1.6422119140625, -1.5791778564453125, -1.516143798828125, -1.4531097412109375, -1.39007568359375, -1.3270416259765625, -1.264007568359375, -1.2009735107421875, -1.137939453125, -1.0749053955078125, -1.011871337890625, -0.9488372802734375, -0.88580322265625, -0.8227691650390625, -0.759735107421875, -0.6967010498046875, -0.6336669921875, -0.5706329345703125, -0.507598876953125, -0.4445648193359375, -0.38153076171875, -0.3184967041015625, -0.255462646484375, -0.1924285888671875, -0.12939453125, -0.0663604736328125, -0.003326416015625, 0.0597076416015625, 0.12274169921875, 0.1857757568359375, 0.248809814453125, 0.3118438720703125, 0.3748779296875, 0.4379119873046875, 0.500946044921875, 0.5639801025390625, 0.62701416015625, 0.6900482177734375, 0.753082275390625, 0.8161163330078125, 0.879150390625, 0.9421844482421875, 1.005218505859375, 1.0682525634765625, 1.13128662109375, 1.1943206787109375, 1.257354736328125, 1.3203887939453125, 1.3834228515625, 1.4464569091796875, 1.509490966796875, 1.5725250244140625, 1.63555908203125, 1.6985931396484375, 1.761627197265625, 1.8246612548828125, 1.8876953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 14.0, 11.0, 16.0, 23.0, 36.0, 49.0, 81.0, 134.0, 159.0, 147.0, 112.0, 67.0, 46.0, 37.0, 16.0, 20.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.791685104370117e-05, -8.463207632303238e-05, -8.134730160236359e-05, -7.80625268816948e-05, -7.4777752161026e-05, -7.149297744035721e-05, -6.820820271968842e-05, -6.492342799901962e-05, -6.163865327835083e-05, -5.835387855768204e-05, -5.5069103837013245e-05, -5.178432911634445e-05, -4.849955439567566e-05, -4.5214779675006866e-05, -4.1930004954338074e-05, -3.864523023366928e-05, -3.536045551300049e-05, -3.2075680792331696e-05, -2.8790906071662903e-05, -2.550613135099411e-05, -2.2221356630325317e-05, -1.8936581909656525e-05, -1.5651807188987732e-05, -1.236703246831894e-05, -9.082257747650146e-06, -5.797483026981354e-06, -2.512708306312561e-06, 7.720664143562317e-07, 4.056841135025024e-06, 7.341615855693817e-06, 1.062639057636261e-05, 1.3911165297031403e-05, 1.7195940017700195e-05, 2.0480714738368988e-05, 2.376548945903778e-05, 2.7050264179706573e-05, 3.0335038900375366e-05, 3.361981362104416e-05, 3.690458834171295e-05, 4.0189363062381744e-05, 4.347413778305054e-05, 4.675891250371933e-05, 5.004368722438812e-05, 5.3328461945056915e-05, 5.661323666572571e-05, 5.98980113863945e-05, 6.31827861070633e-05, 6.646756082773209e-05, 6.975233554840088e-05, 7.303711026906967e-05, 7.632188498973846e-05, 7.960665971040726e-05, 8.289143443107605e-05, 8.617620915174484e-05, 8.946098387241364e-05, 9.274575859308243e-05, 9.603053331375122e-05, 9.931530803442001e-05, 0.0001026000827550888, 0.0001058848574757576, 0.00010916963219642639, 0.00011245440691709518, 0.00011573918163776398, 0.00011902395635843277, 0.00012230873107910156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 15.0, 26.0, 18.0, 50.0, 74.0, 108.0, 178.0, 281.0, 569.0, 1318.0, 3701.0, 13090.0, 87029.0, 793038.0, 125490.0, 16202.0, 4440.0, 1517.0, 640.0, 321.0, 153.0, 105.0, 58.0, 46.0, 17.0, 20.0, 11.0, 8.0, 3.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.40087890625, -1.3603515625, -1.31982421875, -1.279296875, -1.23876953125, -1.1982421875, -1.15771484375, -1.1171875, -1.07666015625, -1.0361328125, -0.99560546875, -0.955078125, -0.91455078125, -0.8740234375, -0.83349609375, -0.79296875, -0.75244140625, -0.7119140625, -0.67138671875, -0.630859375, -0.59033203125, -0.5498046875, -0.50927734375, -0.46875, -0.42822265625, -0.3876953125, -0.34716796875, -0.306640625, -0.26611328125, -0.2255859375, -0.18505859375, -0.14453125, -0.10400390625, -0.0634765625, -0.02294921875, 0.017578125, 0.05810546875, 0.0986328125, 0.13916015625, 0.1796875, 0.22021484375, 0.2607421875, 0.30126953125, 0.341796875, 0.38232421875, 0.4228515625, 0.46337890625, 0.50390625, 0.54443359375, 0.5849609375, 0.62548828125, 0.666015625, 0.70654296875, 0.7470703125, 0.78759765625, 0.828125, 0.86865234375, 0.9091796875, 0.94970703125, 0.990234375, 1.03076171875, 1.0712890625, 1.11181640625, 1.15234375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 9.0, 9.0, 6.0, 17.0, 18.0, 24.0, 50.0, 70.0, 118.0, 120.0, 135.0, 114.0, 90.0, 69.0, 47.0, 30.0, 17.0, 18.0, 6.0, 8.0, 10.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.2306365966796875, -1.198577880859375, -1.1665191650390625, -1.13446044921875, -1.1024017333984375, -1.070343017578125, -1.0382843017578125, -1.0062255859375, -0.9741668701171875, -0.942108154296875, -0.9100494384765625, -0.87799072265625, -0.8459320068359375, -0.813873291015625, -0.7818145751953125, -0.749755859375, -0.7176971435546875, -0.685638427734375, -0.6535797119140625, -0.62152099609375, -0.5894622802734375, -0.557403564453125, -0.5253448486328125, -0.4932861328125, -0.4612274169921875, -0.429168701171875, -0.3971099853515625, -0.36505126953125, -0.3329925537109375, -0.300933837890625, -0.2688751220703125, -0.23681640625, -0.2047576904296875, -0.172698974609375, -0.1406402587890625, -0.10858154296875, -0.0765228271484375, -0.044464111328125, -0.0124053955078125, 0.0196533203125, 0.0517120361328125, 0.083770751953125, 0.1158294677734375, 0.14788818359375, 0.1799468994140625, 0.212005615234375, 0.2440643310546875, 0.276123046875, 0.3081817626953125, 0.340240478515625, 0.3722991943359375, 0.40435791015625, 0.4364166259765625, 0.468475341796875, 0.5005340576171875, 0.5325927734375, 0.5646514892578125, 0.596710205078125, 0.6287689208984375, 0.66082763671875, 0.6928863525390625, 0.724945068359375, 0.7570037841796875, 0.7890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 12.0, 59.0, 433.0, 399.0, 59.0, 15.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.027870178222656, -20.369081497192383, -19.71029281616211, -19.051504135131836, -18.392715454101562, -17.73392677307129, -17.075138092041016, -16.416349411010742, -15.757560729980469, -15.098772048950195, -14.439983367919922, -13.781194686889648, -13.122406005859375, -12.463617324829102, -11.804828643798828, -11.146039962768555, -10.487252235412598, -9.828463554382324, -9.16967487335205, -8.510886192321777, -7.852097511291504, -7.1933088302612305, -6.534520626068115, -5.875731945037842, -5.216943264007568, -4.558154582977295, -3.8993659019470215, -3.240577459335327, -2.5817887783050537, -1.9230000972747803, -1.264211654663086, -0.6054229736328125, 0.05336570739746094, 0.7121543288230896, 1.3709429502487183, 2.029731512069702, 2.6885201930999756, 3.347308874130249, 4.006097316741943, 4.664885997772217, 5.32367467880249, 5.982463359832764, 6.641252040863037, 7.300040245056152, 7.958828926086426, 8.6176176071167, 9.276406288146973, 9.935194969177246, 10.59398365020752, 11.252772331237793, 11.911561012268066, 12.57034969329834, 13.229138374328613, 13.887927055358887, 14.546714782714844, 15.205503463745117, 15.86429214477539, 16.523080825805664, 17.181869506835938, 17.84065818786621, 18.499446868896484, 19.158235549926758, 19.81702423095703, 20.475812911987305, 21.134601593017578]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 4.0, 2.0, 5.0, 8.0, 8.0, 20.0, 19.0, 41.0, 61.0, 61.0, 92.0, 96.0, 109.0, 98.0, 68.0, 65.0, 59.0, 46.0, 32.0, 17.0, 14.0, 19.0, 8.0, 5.0, 12.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-9.805558204650879, -9.537004470825195, -9.268450736999512, -8.999897003173828, -8.731342315673828, -8.462788581848145, -8.194234848022461, -7.925681114196777, -7.657127380371094, -7.38857364654541, -7.120019912719727, -6.851465702056885, -6.582911968231201, -6.314358234405518, -6.045804023742676, -5.777250289916992, -5.508696556091309, -5.240142822265625, -4.971589088439941, -4.7030348777771, -4.434481143951416, -4.165927410125732, -3.8973734378814697, -3.628819465637207, -3.3602657318115234, -3.09171199798584, -2.823158025741577, -2.5546040534973145, -2.286050319671631, -2.0174965858459473, -1.7489426136016846, -1.4803887605667114, -1.2118349075317383, -0.9432810544967651, -0.674727201461792, -0.40617334842681885, -0.1376194953918457, 0.13093435764312744, 0.3994882106781006, 0.6680420637130737, 0.9365959167480469, 1.20514976978302, 1.4737036228179932, 1.7422574758529663, 2.0108113288879395, 2.279365062713623, 2.5479190349578857, 2.8164730072021484, 3.085026741027832, 3.3535804748535156, 3.6221344470977783, 3.890688419342041, 4.159242153167725, 4.427795886993408, 4.69635009765625, 4.964903831481934, 5.233457565307617, 5.502011299133301, 5.770565032958984, 6.039119243621826, 6.30767297744751, 6.576226711273193, 6.844780921936035, 7.113334655761719, 7.381888389587402]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 4.0, 12.0, 14.0, 14.0, 17.0, 32.0, 32.0, 38.0, 64.0, 72.0, 120.0, 165.0, 247.0, 459.0, 792.0, 1626.0, 4307.0, 21349.0, 4037364.0, 112071.0, 9387.0, 3026.0, 1250.0, 688.0, 393.0, 231.0, 172.0, 99.0, 54.0, 60.0, 37.0, 20.0, 19.0, 11.0, 7.0, 8.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.26971435546875, -5.1136474609375, -4.95758056640625, -4.801513671875, -4.64544677734375, -4.4893798828125, -4.33331298828125, -4.17724609375, -4.02117919921875, -3.8651123046875, -3.70904541015625, -3.552978515625, -3.39691162109375, -3.2408447265625, -3.08477783203125, -2.9287109375, -2.77264404296875, -2.6165771484375, -2.46051025390625, -2.304443359375, -2.14837646484375, -1.9923095703125, -1.83624267578125, -1.68017578125, -1.52410888671875, -1.3680419921875, -1.21197509765625, -1.055908203125, -0.89984130859375, -0.7437744140625, -0.58770751953125, -0.431640625, -0.27557373046875, -0.1195068359375, 0.03656005859375, 0.192626953125, 0.34869384765625, 0.5047607421875, 0.66082763671875, 0.81689453125, 0.97296142578125, 1.1290283203125, 1.28509521484375, 1.441162109375, 1.59722900390625, 1.7532958984375, 1.90936279296875, 2.0654296875, 2.22149658203125, 2.3775634765625, 2.53363037109375, 2.689697265625, 2.84576416015625, 3.0018310546875, 3.15789794921875, 3.31396484375, 3.47003173828125, 3.6260986328125, 3.78216552734375, 3.938232421875, 4.09429931640625, 4.2503662109375, 4.40643310546875, 4.5625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 14.0, 17.0, 26.0, 69.0, 125.0, 178.0, 187.0, 144.0, 79.0, 44.0, 19.0, 17.0, 19.0, 5.0, 5.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.22590065002441406, -0.21950149536132812, -0.2131023406982422, -0.20670318603515625, -0.2003040313720703, -0.19390487670898438, -0.18750572204589844, -0.1811065673828125, -0.17470741271972656, -0.16830825805664062, -0.1619091033935547, -0.15550994873046875, -0.1491107940673828, -0.14271163940429688, -0.13631248474121094, -0.129913330078125, -0.12351417541503906, -0.11711502075195312, -0.11071586608886719, -0.10431671142578125, -0.09791755676269531, -0.09151840209960938, -0.08511924743652344, -0.0787200927734375, -0.07232093811035156, -0.06592178344726562, -0.05952262878417969, -0.05312347412109375, -0.04672431945800781, -0.040325164794921875, -0.03392601013183594, -0.02752685546875, -0.021127700805664062, -0.014728546142578125, -0.008329391479492188, -0.00193023681640625, 0.0044689178466796875, 0.010868072509765625, 0.017267227172851562, 0.0236663818359375, 0.030065536499023438, 0.036464691162109375, 0.04286384582519531, 0.04926300048828125, 0.05566215515136719, 0.062061309814453125, 0.06846046447753906, 0.074859619140625, 0.08125877380371094, 0.08765792846679688, 0.09405708312988281, 0.10045623779296875, 0.10685539245605469, 0.11325454711914062, 0.11965370178222656, 0.1260528564453125, 0.13245201110839844, 0.13885116577148438, 0.1452503204345703, 0.15164947509765625, 0.1580486297607422, 0.16444778442382812, 0.17084693908691406, 0.17724609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 6.0, 10.0, 14.0, 18.0, 24.0, 32.0, 67.0, 116.0, 442.0, 2888.0, 136169.0, 4044204.0, 8973.0, 853.0, 177.0, 101.0, 51.0, 29.0, 19.0, 9.0, 16.0, 9.0, 10.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.07421875, -5.8912353515625, -5.708251953125, -5.5252685546875, -5.34228515625, -5.1593017578125, -4.976318359375, -4.7933349609375, -4.6103515625, -4.4273681640625, -4.244384765625, -4.0614013671875, -3.87841796875, -3.6954345703125, -3.512451171875, -3.3294677734375, -3.146484375, -2.9635009765625, -2.780517578125, -2.5975341796875, -2.41455078125, -2.2315673828125, -2.048583984375, -1.8656005859375, -1.6826171875, -1.4996337890625, -1.316650390625, -1.1336669921875, -0.95068359375, -0.7677001953125, -0.584716796875, -0.4017333984375, -0.21875, -0.0357666015625, 0.147216796875, 0.3302001953125, 0.51318359375, 0.6961669921875, 0.879150390625, 1.0621337890625, 1.2451171875, 1.4281005859375, 1.611083984375, 1.7940673828125, 1.97705078125, 2.1600341796875, 2.343017578125, 2.5260009765625, 2.708984375, 2.8919677734375, 3.074951171875, 3.2579345703125, 3.44091796875, 3.6239013671875, 3.806884765625, 3.9898681640625, 4.1728515625, 4.3558349609375, 4.538818359375, 4.7218017578125, 4.90478515625, 5.0877685546875, 5.270751953125, 5.4537353515625, 5.63671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 7.0, 4.0, 9.0, 13.0, 11.0, 16.0, 22.0, 39.0, 60.0, 90.0, 167.0, 368.0, 964.0, 1480.0, 360.0, 152.0, 92.0, 59.0, 35.0, 21.0, 14.0, 22.0, 11.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2315673828125, -0.22388267517089844, -0.21619796752929688, -0.2085132598876953, -0.20082855224609375, -0.1931438446044922, -0.18545913696289062, -0.17777442932128906, -0.1700897216796875, -0.16240501403808594, -0.15472030639648438, -0.1470355987548828, -0.13935089111328125, -0.1316661834716797, -0.12398147583007812, -0.11629676818847656, -0.108612060546875, -0.10092735290527344, -0.09324264526367188, -0.08555793762207031, -0.07787322998046875, -0.07018852233886719, -0.06250381469726562, -0.05481910705566406, -0.0471343994140625, -0.03944969177246094, -0.031764984130859375, -0.024080276489257812, -0.01639556884765625, -0.008710861206054688, -0.001026153564453125, 0.0066585540771484375, 0.01434326171875, 0.022027969360351562, 0.029712677001953125, 0.03739738464355469, 0.04508209228515625, 0.05276679992675781, 0.060451507568359375, 0.06813621520996094, 0.0758209228515625, 0.08350563049316406, 0.09119033813476562, 0.09887504577636719, 0.10655975341796875, 0.11424446105957031, 0.12192916870117188, 0.12961387634277344, 0.137298583984375, 0.14498329162597656, 0.15266799926757812, 0.1603527069091797, 0.16803741455078125, 0.1757221221923828, 0.18340682983398438, 0.19109153747558594, 0.1987762451171875, 0.20646095275878906, 0.21414566040039062, 0.2218303680419922, 0.22951507568359375, 0.2371997833251953, 0.24488449096679688, 0.25256919860839844, 0.26025390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 9.0, 11.0, 29.0, 175.0, 540.0, 195.0, 31.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.672968864440918, -3.5300850868225098, -3.3872010707855225, -3.2443172931671143, -3.101433277130127, -2.9585494995117188, -2.8156657218933105, -2.6727819442749023, -2.529897928237915, -2.387014150619507, -2.2441301345825195, -2.1012463569641113, -1.9583624601364136, -1.8154785633087158, -1.6725947856903076, -1.5297108888626099, -1.386826992034912, -1.2439430952072144, -1.1010591983795166, -0.9581754207611084, -0.8152915239334106, -0.6724076271057129, -0.5295237898826599, -0.38663995265960693, -0.24375605583190918, -0.10087218880653381, 0.04201167821884155, 0.18489554524421692, 0.3277794122695923, 0.47066330909729004, 0.613547146320343, 0.756430983543396, 0.899315357208252, 1.0421992540359497, 1.1850831508636475, 1.3279669284820557, 1.4708508253097534, 1.6137347221374512, 1.7566184997558594, 1.8995023965835571, 2.042386293411255, 2.185270071029663, 2.3281540870666504, 2.4710378646850586, 2.613921642303467, 2.756805658340454, 2.8996894359588623, 3.0425734519958496, 3.185457229614258, 3.328341007232666, 3.4712250232696533, 3.6141088008880615, 3.756992816925049, 3.899876594543457, 4.042760372161865, 4.185644149780273, 4.32852840423584, 4.471412181854248, 4.614295959472656, 4.757180213928223, 4.900063991546631, 5.042947769165039, 5.185831546783447, 5.3287153244018555, 5.471599102020264]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 9.0, 25.0, 28.0, 31.0, 49.0, 59.0, 60.0, 70.0, 83.0, 102.0, 96.0, 71.0, 59.0, 58.0, 52.0, 29.0, 29.0, 17.0, 15.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.363701343536377, -1.3197206258773804, -1.2757399082183838, -1.2317591905593872, -1.1877784729003906, -1.143797755241394, -1.0998170375823975, -1.0558363199234009, -1.0118556022644043, -0.9678748846054077, -0.9238941669464111, -0.8799134492874146, -0.835932731628418, -0.7919520139694214, -0.7479712963104248, -0.7039905786514282, -0.6600098609924316, -0.6160291433334351, -0.5720484256744385, -0.5280677080154419, -0.4840869903564453, -0.44010627269744873, -0.39612555503845215, -0.35214483737945557, -0.308164119720459, -0.2641834020614624, -0.22020268440246582, -0.17622196674346924, -0.13224124908447266, -0.08826053142547607, -0.04427981376647949, -0.00029909610748291016, 0.04368162155151367, 0.08766233921051025, 0.13164305686950684, 0.17562377452850342, 0.2196044921875, 0.2635852098464966, 0.30756592750549316, 0.35154664516448975, 0.39552736282348633, 0.4395080804824829, 0.4834887981414795, 0.5274695158004761, 0.5714502334594727, 0.6154309511184692, 0.6594116687774658, 0.7033923864364624, 0.747373104095459, 0.7913538217544556, 0.8353345394134521, 0.8793152570724487, 0.9232959747314453, 0.9672766923904419, 1.0112574100494385, 1.055238127708435, 1.0992188453674316, 1.1431995630264282, 1.1871802806854248, 1.2311609983444214, 1.275141716003418, 1.3191224336624146, 1.3631031513214111, 1.4070838689804077, 1.4510645866394043]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 3.0, 4.0, 6.0, 7.0, 15.0, 31.0, 27.0, 40.0, 60.0, 119.0, 228.0, 398.0, 957.0, 2472.0, 11183.0, 380327.0, 634140.0, 13606.0, 2883.0, 996.0, 459.0, 231.0, 125.0, 72.0, 52.0, 37.0, 13.0, 12.0, 16.0, 5.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.275390625, -3.169921875, -3.064453125, -2.958984375, -2.853515625, -2.748046875, -2.642578125, -2.537109375, -2.431640625, -2.326171875, -2.220703125, -2.115234375, -2.009765625, -1.904296875, -1.798828125, -1.693359375, -1.587890625, -1.482421875, -1.376953125, -1.271484375, -1.166015625, -1.060546875, -0.955078125, -0.849609375, -0.744140625, -0.638671875, -0.533203125, -0.427734375, -0.322265625, -0.216796875, -0.111328125, -0.005859375, 0.099609375, 0.205078125, 0.310546875, 0.416015625, 0.521484375, 0.626953125, 0.732421875, 0.837890625, 0.943359375, 1.048828125, 1.154296875, 1.259765625, 1.365234375, 1.470703125, 1.576171875, 1.681640625, 1.787109375, 1.892578125, 1.998046875, 2.103515625, 2.208984375, 2.314453125, 2.419921875, 2.525390625, 2.630859375, 2.736328125, 2.841796875, 2.947265625, 3.052734375, 3.158203125, 3.263671875, 3.369140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 8.0, 10.0, 25.0, 66.0, 162.0, 227.0, 234.0, 130.0, 56.0, 34.0, 16.0, 4.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2188720703125, -0.2107715606689453, -0.20267105102539062, -0.19457054138183594, -0.18647003173828125, -0.17836952209472656, -0.17026901245117188, -0.1621685028076172, -0.1540679931640625, -0.1459674835205078, -0.13786697387695312, -0.12976646423339844, -0.12166595458984375, -0.11356544494628906, -0.10546493530273438, -0.09736442565917969, -0.089263916015625, -0.08116340637207031, -0.07306289672851562, -0.06496238708496094, -0.05686187744140625, -0.04876136779785156, -0.040660858154296875, -0.03256034851074219, -0.0244598388671875, -0.016359329223632812, -0.008258819580078125, -0.0001583099365234375, 0.00794219970703125, 0.016042709350585938, 0.024143218994140625, 0.03224372863769531, 0.04034423828125, 0.04844474792480469, 0.056545257568359375, 0.06464576721191406, 0.07274627685546875, 0.08084678649902344, 0.08894729614257812, 0.09704780578613281, 0.1051483154296875, 0.11324882507324219, 0.12134933471679688, 0.12944984436035156, 0.13755035400390625, 0.14565086364746094, 0.15375137329101562, 0.1618518829345703, 0.169952392578125, 0.1780529022216797, 0.18615341186523438, 0.19425392150878906, 0.20235443115234375, 0.21045494079589844, 0.21855545043945312, 0.2266559600830078, 0.2347564697265625, 0.2428569793701172, 0.2509574890136719, 0.25905799865722656, 0.26715850830078125, 0.27525901794433594, 0.2833595275878906, 0.2914600372314453, 0.299560546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 11.0, 13.0, 20.0, 14.0, 24.0, 23.0, 48.0, 55.0, 70.0, 97.0, 152.0, 209.0, 331.0, 617.0, 1320.0, 3335.0, 10852.0, 44925.0, 242481.0, 550616.0, 151407.0, 29387.0, 7594.0, 2496.0, 992.0, 494.0, 284.0, 187.0, 134.0, 84.0, 71.0, 47.0, 37.0, 36.0, 19.0, 24.0, 18.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.345703125, -1.30279541015625, -1.2598876953125, -1.21697998046875, -1.174072265625, -1.13116455078125, -1.0882568359375, -1.04534912109375, -1.00244140625, -0.95953369140625, -0.9166259765625, -0.87371826171875, -0.830810546875, -0.78790283203125, -0.7449951171875, -0.70208740234375, -0.6591796875, -0.61627197265625, -0.5733642578125, -0.53045654296875, -0.487548828125, -0.44464111328125, -0.4017333984375, -0.35882568359375, -0.31591796875, -0.27301025390625, -0.2301025390625, -0.18719482421875, -0.144287109375, -0.10137939453125, -0.0584716796875, -0.01556396484375, 0.02734375, 0.07025146484375, 0.1131591796875, 0.15606689453125, 0.198974609375, 0.24188232421875, 0.2847900390625, 0.32769775390625, 0.37060546875, 0.41351318359375, 0.4564208984375, 0.49932861328125, 0.542236328125, 0.58514404296875, 0.6280517578125, 0.67095947265625, 0.7138671875, 0.75677490234375, 0.7996826171875, 0.84259033203125, 0.885498046875, 0.92840576171875, 0.9713134765625, 1.01422119140625, 1.05712890625, 1.10003662109375, 1.1429443359375, 1.18585205078125, 1.228759765625, 1.27166748046875, 1.3145751953125, 1.35748291015625, 1.400390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 9.0, 14.0, 17.0, 19.0, 23.0, 16.0, 33.0, 38.0, 35.0, 46.0, 48.0, 51.0, 51.0, 46.0, 54.0, 55.0, 56.0, 51.0, 41.0, 47.0, 37.0, 45.0, 26.0, 21.0, 22.0, 18.0, 14.0, 11.0, 9.0, 7.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6233596801757812, -0.6007232666015625, -0.5780868530273438, -0.555450439453125, -0.5328140258789062, -0.5101776123046875, -0.48754119873046875, -0.46490478515625, -0.44226837158203125, -0.4196319580078125, -0.39699554443359375, -0.374359130859375, -0.35172271728515625, -0.3290863037109375, -0.30644989013671875, -0.2838134765625, -0.26117706298828125, -0.2385406494140625, -0.21590423583984375, -0.193267822265625, -0.17063140869140625, -0.1479949951171875, -0.12535858154296875, -0.10272216796875, -0.08008575439453125, -0.0574493408203125, -0.03481292724609375, -0.012176513671875, 0.01045989990234375, 0.0330963134765625, 0.05573272705078125, 0.078369140625, 0.10100555419921875, 0.1236419677734375, 0.14627838134765625, 0.168914794921875, 0.19155120849609375, 0.2141876220703125, 0.23682403564453125, 0.25946044921875, 0.28209686279296875, 0.3047332763671875, 0.32736968994140625, 0.350006103515625, 0.37264251708984375, 0.3952789306640625, 0.41791534423828125, 0.4405517578125, 0.46318817138671875, 0.4858245849609375, 0.5084609985351562, 0.531097412109375, 0.5537338256835938, 0.5763702392578125, 0.5990066528320312, 0.62164306640625, 0.6442794799804688, 0.6669158935546875, 0.6895523071289062, 0.712188720703125, 0.7348251342773438, 0.7574615478515625, 0.7800979614257812, 0.802734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 12.0, 11.0, 30.0, 35.0, 57.0, 109.0, 208.0, 509.0, 1594.0, 6596.0, 56877.0, 893023.0, 78706.0, 7720.0, 1923.0, 612.0, 242.0, 105.0, 67.0, 30.0, 20.0, 19.0, 12.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.26446533203125, -2.2086181640625, -2.15277099609375, -2.096923828125, -2.04107666015625, -1.9852294921875, -1.92938232421875, -1.87353515625, -1.81768798828125, -1.7618408203125, -1.70599365234375, -1.650146484375, -1.59429931640625, -1.5384521484375, -1.48260498046875, -1.4267578125, -1.37091064453125, -1.3150634765625, -1.25921630859375, -1.203369140625, -1.14752197265625, -1.0916748046875, -1.03582763671875, -0.97998046875, -0.92413330078125, -0.8682861328125, -0.81243896484375, -0.756591796875, -0.70074462890625, -0.6448974609375, -0.58905029296875, -0.533203125, -0.47735595703125, -0.4215087890625, -0.36566162109375, -0.309814453125, -0.25396728515625, -0.1981201171875, -0.14227294921875, -0.08642578125, -0.03057861328125, 0.0252685546875, 0.08111572265625, 0.136962890625, 0.19281005859375, 0.2486572265625, 0.30450439453125, 0.3603515625, 0.41619873046875, 0.4720458984375, 0.52789306640625, 0.583740234375, 0.63958740234375, 0.6954345703125, 0.75128173828125, 0.80712890625, 0.86297607421875, 0.9188232421875, 0.97467041015625, 1.030517578125, 1.08636474609375, 1.1422119140625, 1.19805908203125, 1.25390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 7.0, 15.0, 20.0, 15.0, 41.0, 53.0, 92.0, 154.0, 157.0, 131.0, 99.0, 70.0, 46.0, 28.0, 15.0, 11.0, 12.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001633167266845703, -0.00015886686742305756, -0.0001544170081615448, -0.00014996714890003204, -0.0001455172896385193, -0.00014106743037700653, -0.00013661757111549377, -0.00013216771185398102, -0.00012771785259246826, -0.0001232679933309555, -0.00011881813406944275, -0.00011436827480792999, -0.00010991841554641724, -0.00010546855628490448, -0.00010101869702339172, -9.656883776187897e-05, -9.211897850036621e-05, -8.766911923885345e-05, -8.32192599773407e-05, -7.876940071582794e-05, -7.431954145431519e-05, -6.986968219280243e-05, -6.541982293128967e-05, -6.0969963669776917e-05, -5.652010440826416e-05, -5.2070245146751404e-05, -4.762038588523865e-05, -4.317052662372589e-05, -3.8720667362213135e-05, -3.427080810070038e-05, -2.9820948839187622e-05, -2.5371089577674866e-05, -2.092123031616211e-05, -1.6471371054649353e-05, -1.2021511793136597e-05, -7.57165253162384e-06, -3.121793270111084e-06, 1.3280659914016724e-06, 5.777925252914429e-06, 1.0227784514427185e-05, 1.4677643775939941e-05, 1.9127503037452698e-05, 2.3577362298965454e-05, 2.802722156047821e-05, 3.247708082199097e-05, 3.692694008350372e-05, 4.137679934501648e-05, 4.5826658606529236e-05, 5.027651786804199e-05, 5.472637712955475e-05, 5.9176236391067505e-05, 6.362609565258026e-05, 6.807595491409302e-05, 7.252581417560577e-05, 7.697567343711853e-05, 8.142553269863129e-05, 8.587539196014404e-05, 9.03252512216568e-05, 9.477511048316956e-05, 9.922496974468231e-05, 0.00010367482900619507, 0.00010812468826770782, 0.00011257454752922058, 0.00011702440679073334, 0.0001214742660522461]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 9.0, 3.0, 11.0, 21.0, 19.0, 28.0, 55.0, 80.0, 142.0, 287.0, 550.0, 1240.0, 3328.0, 10246.0, 69096.0, 842185.0, 102637.0, 12274.0, 3658.0, 1414.0, 587.0, 282.0, 164.0, 76.0, 51.0, 36.0, 21.0, 15.0, 7.0, 12.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.826171875, -1.7762298583984375, -1.726287841796875, -1.6763458251953125, -1.62640380859375, -1.5764617919921875, -1.526519775390625, -1.4765777587890625, -1.4266357421875, -1.3766937255859375, -1.326751708984375, -1.2768096923828125, -1.22686767578125, -1.1769256591796875, -1.126983642578125, -1.0770416259765625, -1.027099609375, -0.9771575927734375, -0.927215576171875, -0.8772735595703125, -0.82733154296875, -0.7773895263671875, -0.727447509765625, -0.6775054931640625, -0.6275634765625, -0.5776214599609375, -0.527679443359375, -0.4777374267578125, -0.42779541015625, -0.3778533935546875, -0.327911376953125, -0.2779693603515625, -0.22802734375, -0.1780853271484375, -0.128143310546875, -0.0782012939453125, -0.02825927734375, 0.0216827392578125, 0.071624755859375, 0.1215667724609375, 0.1715087890625, 0.2214508056640625, 0.271392822265625, 0.3213348388671875, 0.37127685546875, 0.4212188720703125, 0.471160888671875, 0.5211029052734375, 0.571044921875, 0.6209869384765625, 0.670928955078125, 0.7208709716796875, 0.77081298828125, 0.8207550048828125, 0.870697021484375, 0.9206390380859375, 0.9705810546875, 1.0205230712890625, 1.070465087890625, 1.1204071044921875, 1.17034912109375, 1.2202911376953125, 1.270233154296875, 1.3201751708984375, 1.3701171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 6.0, 13.0, 11.0, 14.0, 16.0, 21.0, 30.0, 49.0, 48.0, 73.0, 85.0, 106.0, 89.0, 82.0, 78.0, 68.0, 58.0, 33.0, 28.0, 23.0, 11.0, 13.0, 8.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.443359375, -0.428192138671875, -0.41302490234375, -0.397857666015625, -0.3826904296875, -0.367523193359375, -0.35235595703125, -0.337188720703125, -0.322021484375, -0.306854248046875, -0.29168701171875, -0.276519775390625, -0.2613525390625, -0.246185302734375, -0.23101806640625, -0.215850830078125, -0.20068359375, -0.185516357421875, -0.17034912109375, -0.155181884765625, -0.1400146484375, -0.124847412109375, -0.10968017578125, -0.094512939453125, -0.079345703125, -0.064178466796875, -0.04901123046875, -0.033843994140625, -0.0186767578125, -0.003509521484375, 0.01165771484375, 0.026824951171875, 0.0419921875, 0.057159423828125, 0.07232666015625, 0.087493896484375, 0.1026611328125, 0.117828369140625, 0.13299560546875, 0.148162841796875, 0.163330078125, 0.178497314453125, 0.19366455078125, 0.208831787109375, 0.2239990234375, 0.239166259765625, 0.25433349609375, 0.269500732421875, 0.28466796875, 0.299835205078125, 0.31500244140625, 0.330169677734375, 0.3453369140625, 0.360504150390625, 0.37567138671875, 0.390838623046875, 0.406005859375, 0.421173095703125, 0.43634033203125, 0.451507568359375, 0.4666748046875, 0.481842041015625, 0.49700927734375, 0.512176513671875, 0.52734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 12.0, 41.0, 159.0, 469.0, 232.0, 67.0, 13.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.33147621154785, -15.641979217529297, -14.952482223510742, -14.262985229492188, -13.573487281799316, -12.883990287780762, -12.194493293762207, -11.504995346069336, -10.815498352050781, -10.126001358032227, -9.436504364013672, -8.747007369995117, -8.057509422302246, -7.368012428283691, -6.678515434265137, -5.989017963409424, -5.299521446228027, -4.610024452209473, -3.9205269813537598, -3.231029987335205, -2.5415327548980713, -1.8520355224609375, -1.1625385284423828, -0.4730410575866699, 0.21645593643188477, 0.9059531092643738, 1.5954502820968628, 2.284947395324707, 2.974444627761841, 3.6639418601989746, 4.353438854217529, 5.042936325073242, 5.732433319091797, 6.421930313110352, 7.1114277839660645, 7.800924777984619, 8.490422248840332, 9.179919242858887, 9.869416236877441, 10.558914184570312, 11.248411178588867, 11.937908172607422, 12.627405166625977, 13.316902160644531, 14.006400108337402, 14.695897102355957, 15.385394096374512, 16.074892044067383, 16.764389038085938, 17.453886032104492, 18.143383026123047, 18.8328800201416, 19.522377014160156, 20.211875915527344, 20.901371002197266, 21.590869903564453, 22.280364990234375, 22.96986198425293, 23.659358978271484, 24.34885597229004, 25.038352966308594, 25.72785186767578, 26.417346954345703, 27.10684585571289, 27.796342849731445]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 9.0, 12.0, 18.0, 24.0, 36.0, 40.0, 46.0, 37.0, 60.0, 61.0, 78.0, 58.0, 59.0, 64.0, 66.0, 57.0, 46.0, 34.0, 40.0, 38.0, 26.0, 17.0, 9.0, 11.0, 11.0, 6.0, 11.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.256053924560547, -5.034274101257324, -4.812494277954102, -4.590714454650879, -4.3689351081848145, -4.147155284881592, -3.925375461578369, -3.7035956382751465, -3.481815814971924, -3.260035991668701, -3.0382564067840576, -2.816476583480835, -2.5946967601776123, -2.3729171752929688, -2.151137351989746, -1.9293575286865234, -1.7075779438018799, -1.4857982397079468, -1.2640184164047241, -1.042238712310791, -0.8204589486122131, -0.5986791849136353, -0.37689948081970215, -0.1551196575164795, 0.06666004657745361, 0.2884398102760315, 0.5102195739746094, 0.7319992780685425, 0.9537790417671204, 1.1755588054656982, 1.3973385095596313, 1.619118332862854, 1.840898036956787, 2.0626778602600098, 2.2844574451446533, 2.506237268447876, 2.7280170917510986, 2.949796676635742, 3.171576499938965, 3.3933563232421875, 3.61513614654541, 3.836915969848633, 4.0586957931518555, 4.280475616455078, 4.502254962921143, 4.724034786224365, 4.945814609527588, 5.1675944328308105, 5.389373779296875, 5.611153602600098, 5.83293342590332, 6.054713249206543, 6.276492595672607, 6.49827241897583, 6.720052242279053, 6.941832065582275, 7.163611888885498, 7.385391712188721, 7.607171535491943, 7.828950881958008, 8.05073070526123, 8.272510528564453, 8.494290351867676, 8.716070175170898, 8.937849998474121]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 20.0, 31.0, 93.0, 201.0, 563.0, 4911.0, 4160226.0, 26140.0, 1261.0, 393.0, 177.0, 100.0, 59.0, 30.0, 16.0, 11.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.4901123046875, -11.089599609375, -10.6890869140625, -10.28857421875, -9.8880615234375, -9.487548828125, -9.0870361328125, -8.6865234375, -8.2860107421875, -7.885498046875, -7.4849853515625, -7.08447265625, -6.6839599609375, -6.283447265625, -5.8829345703125, -5.482421875, -5.0819091796875, -4.681396484375, -4.2808837890625, -3.88037109375, -3.4798583984375, -3.079345703125, -2.6788330078125, -2.2783203125, -1.8778076171875, -1.477294921875, -1.0767822265625, -0.67626953125, -0.2757568359375, 0.124755859375, 0.5252685546875, 0.92578125, 1.3262939453125, 1.726806640625, 2.1273193359375, 2.52783203125, 2.9283447265625, 3.328857421875, 3.7293701171875, 4.1298828125, 4.5303955078125, 4.930908203125, 5.3314208984375, 5.73193359375, 6.1324462890625, 6.532958984375, 6.9334716796875, 7.333984375, 7.7344970703125, 8.135009765625, 8.5355224609375, 8.93603515625, 9.3365478515625, 9.737060546875, 10.1375732421875, 10.5380859375, 10.9385986328125, 11.339111328125, 11.7396240234375, 12.14013671875, 12.5406494140625, 12.941162109375, 13.3416748046875, 13.7421875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 12.0, 14.0, 39.0, 62.0, 114.0, 143.0, 155.0, 160.0, 102.0, 80.0, 37.0, 29.0, 14.0, 12.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26171875, -0.252593994140625, -0.24346923828125, -0.234344482421875, -0.2252197265625, -0.216094970703125, -0.20697021484375, -0.197845458984375, -0.188720703125, -0.179595947265625, -0.17047119140625, -0.161346435546875, -0.1522216796875, -0.143096923828125, -0.13397216796875, -0.124847412109375, -0.11572265625, -0.106597900390625, -0.09747314453125, -0.088348388671875, -0.0792236328125, -0.070098876953125, -0.06097412109375, -0.051849365234375, -0.042724609375, -0.033599853515625, -0.02447509765625, -0.015350341796875, -0.0062255859375, 0.002899169921875, 0.01202392578125, 0.021148681640625, 0.0302734375, 0.039398193359375, 0.04852294921875, 0.057647705078125, 0.0667724609375, 0.075897216796875, 0.08502197265625, 0.094146728515625, 0.103271484375, 0.112396240234375, 0.12152099609375, 0.130645751953125, 0.1397705078125, 0.148895263671875, 0.15802001953125, 0.167144775390625, 0.17626953125, 0.185394287109375, 0.19451904296875, 0.203643798828125, 0.2127685546875, 0.221893310546875, 0.23101806640625, 0.240142822265625, 0.249267578125, 0.258392333984375, 0.26751708984375, 0.276641845703125, 0.2857666015625, 0.294891357421875, 0.30401611328125, 0.313140869140625, 0.322265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 14.0, 15.0, 30.0, 37.0, 34.0, 44.0, 73.0, 87.0, 109.0, 119.0, 163.0, 1075.0, 463141.0, 3726703.0, 1601.0, 267.0, 142.0, 107.0, 85.0, 70.0, 76.0, 52.0, 57.0, 39.0, 35.0, 26.0, 21.0, 15.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.6953125, -12.3331298828125, -11.970947265625, -11.6087646484375, -11.24658203125, -10.8843994140625, -10.522216796875, -10.1600341796875, -9.7978515625, -9.4356689453125, -9.073486328125, -8.7113037109375, -8.34912109375, -7.9869384765625, -7.624755859375, -7.2625732421875, -6.900390625, -6.5382080078125, -6.176025390625, -5.8138427734375, -5.45166015625, -5.0894775390625, -4.727294921875, -4.3651123046875, -4.0029296875, -3.6407470703125, -3.278564453125, -2.9163818359375, -2.55419921875, -2.1920166015625, -1.829833984375, -1.4676513671875, -1.10546875, -0.7432861328125, -0.381103515625, -0.0189208984375, 0.34326171875, 0.7054443359375, 1.067626953125, 1.4298095703125, 1.7919921875, 2.1541748046875, 2.516357421875, 2.8785400390625, 3.24072265625, 3.6029052734375, 3.965087890625, 4.3272705078125, 4.689453125, 5.0516357421875, 5.413818359375, 5.7760009765625, 6.13818359375, 6.5003662109375, 6.862548828125, 7.2247314453125, 7.5869140625, 7.9490966796875, 8.311279296875, 8.6734619140625, 9.03564453125, 9.3978271484375, 9.760009765625, 10.1221923828125, 10.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 8.0, 10.0, 34.0, 78.0, 319.0, 2847.0, 609.0, 113.0, 35.0, 11.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.3125762939453125, -0.276519775390625, -0.2404632568359375, -0.20440673828125, -0.1683502197265625, -0.132293701171875, -0.0962371826171875, -0.0601806640625, -0.0241241455078125, 0.011932373046875, 0.0479888916015625, 0.08404541015625, 0.1201019287109375, 0.156158447265625, 0.1922149658203125, 0.228271484375, 0.2643280029296875, 0.300384521484375, 0.3364410400390625, 0.37249755859375, 0.4085540771484375, 0.444610595703125, 0.4806671142578125, 0.5167236328125, 0.5527801513671875, 0.588836669921875, 0.6248931884765625, 0.66094970703125, 0.6970062255859375, 0.733062744140625, 0.7691192626953125, 0.80517578125, 0.8412322998046875, 0.877288818359375, 0.9133453369140625, 0.94940185546875, 0.9854583740234375, 1.021514892578125, 1.0575714111328125, 1.0936279296875, 1.1296844482421875, 1.165740966796875, 1.2017974853515625, 1.23785400390625, 1.2739105224609375, 1.309967041015625, 1.3460235595703125, 1.382080078125, 1.4181365966796875, 1.454193115234375, 1.4902496337890625, 1.52630615234375, 1.5623626708984375, 1.598419189453125, 1.6344757080078125, 1.6705322265625, 1.7065887451171875, 1.742645263671875, 1.7787017822265625, 1.81475830078125, 1.8508148193359375, 1.886871337890625, 1.9229278564453125, 1.958984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 13.0, 35.0, 88.0, 542.0, 248.0, 53.0, 15.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.062538146972656, -11.574601173400879, -11.086664199829102, -10.598726272583008, -10.11078929901123, -9.622852325439453, -9.134915351867676, -8.646978378295898, -8.159040451049805, -7.671103477478027, -7.183166027069092, -6.6952290534973145, -6.207291603088379, -5.719354629516602, -5.231417655944824, -4.743480682373047, -4.2555437088012695, -3.767606496810913, -3.2796692848205566, -2.7917323112487793, -2.303795099258423, -1.8158578872680664, -1.327920913696289, -0.8399837017059326, -0.35204648971557617, 0.1358906626701355, 0.6238278150558472, 1.111764907836914, 1.5997021198272705, 2.087639331817627, 2.5755763053894043, 3.0635135173797607, 3.551450729370117, 4.0393877029418945, 4.52732515335083, 5.015262126922607, 5.503199577331543, 5.99113655090332, 6.479073524475098, 6.967010498046875, 7.4549479484558105, 7.942884922027588, 8.430822372436523, 8.9187593460083, 9.406696319580078, 9.894634246826172, 10.382570266723633, 10.870508193969727, 11.358445167541504, 11.846382141113281, 12.334319114685059, 12.822256088256836, 13.31019401550293, 13.798130989074707, 14.286067962646484, 14.774004936218262, 15.261941909790039, 15.749878883361816, 16.237815856933594, 16.725753784179688, 17.21368980407715, 17.701627731323242, 18.189563751220703, 18.677501678466797, 19.16543960571289]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 14.0, 25.0, 53.0, 88.0, 75.0, 117.0, 128.0, 134.0, 126.0, 94.0, 59.0, 37.0, 22.0, 14.0, 8.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.903992652893066, -5.729015827178955, -5.554039001464844, -5.379061698913574, -5.204084873199463, -5.029108047485352, -4.85413122177124, -4.679154396057129, -4.504177570343018, -4.329200744628906, -4.154223918914795, -3.9792468547821045, -3.804270029067993, -3.6292929649353027, -3.4543161392211914, -3.27933931350708, -3.1043622493743896, -2.9293854236602783, -2.754408359527588, -2.5794315338134766, -2.4044547080993652, -2.229477882385254, -2.0545008182525635, -1.8795239925384521, -1.7045470476150513, -1.5295701026916504, -1.354593276977539, -1.1796163320541382, -1.0046393871307373, -0.829662561416626, -0.6546856164932251, -0.47970879077911377, -0.3047318458557129, -0.1297549456357956, 0.045221954584121704, 0.2201988697052002, 0.3951757550239563, 0.5701526403427124, 0.7451295852661133, 0.9201064109802246, 1.0950833559036255, 1.2700603008270264, 1.4450371265411377, 1.6200140714645386, 1.7949910163879395, 1.9699678421020508, 2.144944667816162, 2.3199214935302734, 2.494898557662964, 2.669875383377075, 2.8448524475097656, 3.019829273223877, 3.1948060989379883, 3.3697829246520996, 3.54475998878479, 3.7197368144989014, 3.894713878631592, 4.069690704345703, 4.2446675300598145, 4.419644355773926, 4.594621658325195, 4.769598484039307, 4.944575309753418, 5.119552135467529, 5.294528961181641]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 11.0, 3.0, 9.0, 5.0, 10.0, 15.0, 10.0, 33.0, 49.0, 71.0, 92.0, 199.0, 413.0, 938.0, 2667.0, 11728.0, 134652.0, 818723.0, 67396.0, 7918.0, 2032.0, 752.0, 337.0, 184.0, 103.0, 61.0, 34.0, 31.0, 19.0, 16.0, 12.0, 8.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.62890625, -4.505096435546875, -4.38128662109375, -4.257476806640625, -4.1336669921875, -4.009857177734375, -3.88604736328125, -3.762237548828125, -3.638427734375, -3.514617919921875, -3.39080810546875, -3.266998291015625, -3.1431884765625, -3.019378662109375, -2.89556884765625, -2.771759033203125, -2.64794921875, -2.524139404296875, -2.40032958984375, -2.276519775390625, -2.1527099609375, -2.028900146484375, -1.90509033203125, -1.781280517578125, -1.657470703125, -1.533660888671875, -1.40985107421875, -1.286041259765625, -1.1622314453125, -1.038421630859375, -0.91461181640625, -0.790802001953125, -0.6669921875, -0.543182373046875, -0.41937255859375, -0.295562744140625, -0.1717529296875, -0.047943115234375, 0.07586669921875, 0.199676513671875, 0.323486328125, 0.447296142578125, 0.57110595703125, 0.694915771484375, 0.8187255859375, 0.942535400390625, 1.06634521484375, 1.190155029296875, 1.31396484375, 1.437774658203125, 1.56158447265625, 1.685394287109375, 1.8092041015625, 1.933013916015625, 2.05682373046875, 2.180633544921875, 2.304443359375, 2.428253173828125, 2.55206298828125, 2.675872802734375, 2.7996826171875, 2.923492431640625, 3.04730224609375, 3.171112060546875, 3.294921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 21.0, 42.0, 64.0, 107.0, 119.0, 161.0, 120.0, 108.0, 87.0, 66.0, 35.0, 17.0, 13.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.27957916259765625, -0.2683868408203125, -0.25719451904296875, -0.246002197265625, -0.23480987548828125, -0.2236175537109375, -0.21242523193359375, -0.20123291015625, -0.19004058837890625, -0.1788482666015625, -0.16765594482421875, -0.156463623046875, -0.14527130126953125, -0.1340789794921875, -0.12288665771484375, -0.1116943359375, -0.10050201416015625, -0.0893096923828125, -0.07811737060546875, -0.066925048828125, -0.05573272705078125, -0.0445404052734375, -0.03334808349609375, -0.02215576171875, -0.01096343994140625, 0.0002288818359375, 0.01142120361328125, 0.022613525390625, 0.03380584716796875, 0.0449981689453125, 0.05619049072265625, 0.0673828125, 0.07857513427734375, 0.0897674560546875, 0.10095977783203125, 0.112152099609375, 0.12334442138671875, 0.1345367431640625, 0.14572906494140625, 0.15692138671875, 0.16811370849609375, 0.1793060302734375, 0.19049835205078125, 0.201690673828125, 0.21288299560546875, 0.2240753173828125, 0.23526763916015625, 0.2464599609375, 0.25765228271484375, 0.2688446044921875, 0.28003692626953125, 0.291229248046875, 0.30242156982421875, 0.3136138916015625, 0.32480621337890625, 0.33599853515625, 0.34719085693359375, 0.3583831787109375, 0.36957550048828125, 0.380767822265625, 0.39196014404296875, 0.4031524658203125, 0.41434478759765625, 0.425537109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 4.0, 18.0, 22.0, 23.0, 39.0, 48.0, 81.0, 88.0, 158.0, 217.0, 360.0, 650.0, 1258.0, 3017.0, 8533.0, 31487.0, 142713.0, 500468.0, 277310.0, 59049.0, 14721.0, 4582.0, 1654.0, 763.0, 478.0, 250.0, 161.0, 126.0, 75.0, 61.0, 41.0, 32.0, 13.0, 13.0, 7.0, 11.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.7490234375, -1.698638916015625, -1.64825439453125, -1.597869873046875, -1.5474853515625, -1.497100830078125, -1.44671630859375, -1.396331787109375, -1.345947265625, -1.295562744140625, -1.24517822265625, -1.194793701171875, -1.1444091796875, -1.094024658203125, -1.04364013671875, -0.993255615234375, -0.94287109375, -0.892486572265625, -0.84210205078125, -0.791717529296875, -0.7413330078125, -0.690948486328125, -0.64056396484375, -0.590179443359375, -0.539794921875, -0.489410400390625, -0.43902587890625, -0.388641357421875, -0.3382568359375, -0.287872314453125, -0.23748779296875, -0.187103271484375, -0.13671875, -0.086334228515625, -0.03594970703125, 0.014434814453125, 0.0648193359375, 0.115203857421875, 0.16558837890625, 0.215972900390625, 0.266357421875, 0.316741943359375, 0.36712646484375, 0.417510986328125, 0.4678955078125, 0.518280029296875, 0.56866455078125, 0.619049072265625, 0.66943359375, 0.719818115234375, 0.77020263671875, 0.820587158203125, 0.8709716796875, 0.921356201171875, 0.97174072265625, 1.022125244140625, 1.072509765625, 1.122894287109375, 1.17327880859375, 1.223663330078125, 1.2740478515625, 1.324432373046875, 1.37481689453125, 1.425201416015625, 1.4755859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 5.0, 8.0, 9.0, 11.0, 11.0, 20.0, 20.0, 31.0, 34.0, 36.0, 48.0, 50.0, 56.0, 63.0, 76.0, 63.0, 67.0, 48.0, 66.0, 47.0, 40.0, 42.0, 25.0, 37.0, 20.0, 21.0, 17.0, 7.0, 13.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.9374847412109375, -0.903289794921875, -0.8690948486328125, -0.83489990234375, -0.8007049560546875, -0.766510009765625, -0.7323150634765625, -0.6981201171875, -0.6639251708984375, -0.629730224609375, -0.5955352783203125, -0.56134033203125, -0.5271453857421875, -0.492950439453125, -0.4587554931640625, -0.424560546875, -0.3903656005859375, -0.356170654296875, -0.3219757080078125, -0.28778076171875, -0.2535858154296875, -0.219390869140625, -0.1851959228515625, -0.1510009765625, -0.1168060302734375, -0.082611083984375, -0.0484161376953125, -0.01422119140625, 0.0199737548828125, 0.054168701171875, 0.0883636474609375, 0.12255859375, 0.1567535400390625, 0.190948486328125, 0.2251434326171875, 0.25933837890625, 0.2935333251953125, 0.327728271484375, 0.3619232177734375, 0.3961181640625, 0.4303131103515625, 0.464508056640625, 0.4987030029296875, 0.53289794921875, 0.5670928955078125, 0.601287841796875, 0.6354827880859375, 0.669677734375, 0.7038726806640625, 0.738067626953125, 0.7722625732421875, 0.80645751953125, 0.8406524658203125, 0.874847412109375, 0.9090423583984375, 0.9432373046875, 0.9774322509765625, 1.011627197265625, 1.0458221435546875, 1.08001708984375, 1.1142120361328125, 1.148406982421875, 1.1826019287109375, 1.216796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 8.0, 10.0, 17.0, 29.0, 18.0, 49.0, 53.0, 89.0, 117.0, 228.0, 457.0, 945.0, 2823.0, 12164.0, 172265.0, 815859.0, 34933.0, 5300.0, 1639.0, 720.0, 299.0, 178.0, 103.0, 71.0, 48.0, 26.0, 24.0, 15.0, 13.0, 9.0, 7.0, 3.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-1.87890625, -1.814666748046875, -1.75042724609375, -1.686187744140625, -1.6219482421875, -1.557708740234375, -1.49346923828125, -1.429229736328125, -1.364990234375, -1.300750732421875, -1.23651123046875, -1.172271728515625, -1.1080322265625, -1.043792724609375, -0.97955322265625, -0.915313720703125, -0.85107421875, -0.786834716796875, -0.72259521484375, -0.658355712890625, -0.5941162109375, -0.529876708984375, -0.46563720703125, -0.401397705078125, -0.337158203125, -0.272918701171875, -0.20867919921875, -0.144439697265625, -0.0802001953125, -0.015960693359375, 0.04827880859375, 0.112518310546875, 0.1767578125, 0.240997314453125, 0.30523681640625, 0.369476318359375, 0.4337158203125, 0.497955322265625, 0.56219482421875, 0.626434326171875, 0.690673828125, 0.754913330078125, 0.81915283203125, 0.883392333984375, 0.9476318359375, 1.011871337890625, 1.07611083984375, 1.140350341796875, 1.20458984375, 1.268829345703125, 1.33306884765625, 1.397308349609375, 1.4615478515625, 1.525787353515625, 1.59002685546875, 1.654266357421875, 1.718505859375, 1.782745361328125, 1.84698486328125, 1.911224365234375, 1.9754638671875, 2.039703369140625, 2.10394287109375, 2.168182373046875, 2.232421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 10.0, 18.0, 22.0, 37.0, 47.0, 82.0, 143.0, 198.0, 171.0, 91.0, 60.0, 37.0, 22.0, 17.0, 9.0, 8.0, 5.0, 3.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024247169494628906, -0.0002358369529247284, -0.00022920221090316772, -0.00022256746888160706, -0.0002159327268600464, -0.00020929798483848572, -0.00020266324281692505, -0.00019602850079536438, -0.0001893937587738037, -0.00018275901675224304, -0.00017612427473068237, -0.0001694895327091217, -0.00016285479068756104, -0.00015622004866600037, -0.0001495853066444397, -0.00014295056462287903, -0.00013631582260131836, -0.0001296810805797577, -0.00012304633855819702, -0.00011641159653663635, -0.00010977685451507568, -0.00010314211249351501, -9.650737047195435e-05, -8.987262845039368e-05, -8.323788642883301e-05, -7.660314440727234e-05, -6.996840238571167e-05, -6.3333660364151e-05, -5.669891834259033e-05, -5.006417632102966e-05, -4.3429434299468994e-05, -3.6794692277908325e-05, -3.0159950256347656e-05, -2.3525208234786987e-05, -1.689046621322632e-05, -1.025572419166565e-05, -3.6209821701049805e-06, 3.0137598514556885e-06, 9.648501873016357e-06, 1.6283243894577026e-05, 2.2917985916137695e-05, 2.9552727937698364e-05, 3.618746995925903e-05, 4.28222119808197e-05, 4.945695400238037e-05, 5.609169602394104e-05, 6.272643804550171e-05, 6.936118006706238e-05, 7.599592208862305e-05, 8.263066411018372e-05, 8.926540613174438e-05, 9.590014815330505e-05, 0.00010253489017486572, 0.00010916963219642639, 0.00011580437421798706, 0.00012243911623954773, 0.0001290738582611084, 0.00013570860028266907, 0.00014234334230422974, 0.0001489780843257904, 0.00015561282634735107, 0.00016224756836891174, 0.0001688823103904724, 0.00017551705241203308, 0.00018215179443359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 19.0, 30.0, 65.0, 96.0, 162.0, 320.0, 745.0, 2156.0, 7774.0, 50880.0, 844427.0, 124782.0, 12118.0, 3052.0, 1042.0, 384.0, 209.0, 100.0, 61.0, 34.0, 14.0, 19.0, 10.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.341796875, -2.2812042236328125, -2.220611572265625, -2.1600189208984375, -2.09942626953125, -2.0388336181640625, -1.978240966796875, -1.9176483154296875, -1.8570556640625, -1.7964630126953125, -1.735870361328125, -1.6752777099609375, -1.61468505859375, -1.5540924072265625, -1.493499755859375, -1.4329071044921875, -1.372314453125, -1.3117218017578125, -1.251129150390625, -1.1905364990234375, -1.12994384765625, -1.0693511962890625, -1.008758544921875, -0.9481658935546875, -0.8875732421875, -0.8269805908203125, -0.766387939453125, -0.7057952880859375, -0.64520263671875, -0.5846099853515625, -0.524017333984375, -0.4634246826171875, -0.40283203125, -0.3422393798828125, -0.281646728515625, -0.2210540771484375, -0.16046142578125, -0.0998687744140625, -0.039276123046875, 0.0213165283203125, 0.0819091796875, 0.1425018310546875, 0.203094482421875, 0.2636871337890625, 0.32427978515625, 0.3848724365234375, 0.445465087890625, 0.5060577392578125, 0.566650390625, 0.6272430419921875, 0.687835693359375, 0.7484283447265625, 0.80902099609375, 0.8696136474609375, 0.930206298828125, 0.9907989501953125, 1.0513916015625, 1.1119842529296875, 1.172576904296875, 1.2331695556640625, 1.29376220703125, 1.3543548583984375, 1.414947509765625, 1.4755401611328125, 1.5361328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 9.0, 4.0, 9.0, 15.0, 20.0, 36.0, 46.0, 47.0, 76.0, 129.0, 105.0, 121.0, 95.0, 82.0, 51.0, 40.0, 27.0, 27.0, 9.0, 10.0, 8.0, 5.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.73974609375, -0.718505859375, -0.697265625, -0.676025390625, -0.65478515625, -0.633544921875, -0.6123046875, -0.591064453125, -0.56982421875, -0.548583984375, -0.52734375, -0.506103515625, -0.48486328125, -0.463623046875, -0.4423828125, -0.421142578125, -0.39990234375, -0.378662109375, -0.357421875, -0.336181640625, -0.31494140625, -0.293701171875, -0.2724609375, -0.251220703125, -0.22998046875, -0.208740234375, -0.1875, -0.166259765625, -0.14501953125, -0.123779296875, -0.1025390625, -0.081298828125, -0.06005859375, -0.038818359375, -0.017578125, 0.003662109375, 0.02490234375, 0.046142578125, 0.0673828125, 0.088623046875, 0.10986328125, 0.131103515625, 0.15234375, 0.173583984375, 0.19482421875, 0.216064453125, 0.2373046875, 0.258544921875, 0.27978515625, 0.301025390625, 0.322265625, 0.343505859375, 0.36474609375, 0.385986328125, 0.4072265625, 0.428466796875, 0.44970703125, 0.470947265625, 0.4921875, 0.513427734375, 0.53466796875, 0.555908203125, 0.5771484375, 0.598388671875, 0.61962890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 17.0, 33.0, 63.0, 144.0, 199.0, 242.0, 146.0, 73.0, 38.0, 21.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.205010414123535, -9.782374382019043, -9.359739303588867, -8.937103271484375, -8.5144681930542, -8.091832160949707, -7.669196605682373, -7.246561050415039, -6.823925495147705, -6.401289939880371, -5.978654384613037, -5.556018829345703, -5.133382797241211, -4.710747718811035, -4.288111686706543, -3.865476131439209, -3.442840576171875, -3.020205020904541, -2.597569465637207, -2.174933671951294, -1.75229811668396, -1.329662561416626, -0.9070267677307129, -0.4843912124633789, -0.06175565719604492, 0.36087995767593384, 0.7835155725479126, 1.2061512470245361, 1.6287868022918701, 2.051422357559204, 2.474058151245117, 2.896693706512451, 3.3193283081054688, 3.7419638633728027, 4.164599418640137, 4.587235450744629, 5.009870529174805, 5.432506561279297, 5.855142116546631, 6.277777671813965, 6.700413227081299, 7.123048782348633, 7.545684337615967, 7.968319892883301, 8.390955924987793, 8.813591003417969, 9.236227035522461, 9.658863067626953, 10.081498146057129, 10.504134178161621, 10.926769256591797, 11.349405288696289, 11.772040367126465, 12.194676399230957, 12.617311477661133, 13.039947509765625, 13.462583541870117, 13.88521957397461, 14.307854652404785, 14.730490684509277, 15.153125762939453, 15.575761795043945, 15.998397827148438, 16.421031951904297, 16.84366798400879]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 11.0, 11.0, 19.0, 18.0, 31.0, 29.0, 39.0, 42.0, 41.0, 51.0, 44.0, 51.0, 61.0, 58.0, 51.0, 47.0, 59.0, 47.0, 44.0, 32.0, 39.0, 33.0, 23.0, 24.0, 21.0, 9.0, 12.0, 7.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.999790191650391, -5.7956647872924805, -5.591538906097412, -5.387413501739502, -5.183288097381592, -4.979162216186523, -4.775036811828613, -4.570911407470703, -4.366786003112793, -4.162660598754883, -3.9585349559783936, -3.7544093132019043, -3.550283908843994, -3.346158266067505, -3.1420326232910156, -2.9379072189331055, -2.733781337738037, -2.529655694961548, -2.3255302906036377, -2.1214046478271484, -1.9172791242599487, -1.713153600692749, -1.5090279579162598, -1.30490243434906, -1.1007769107818604, -0.8966513872146606, -0.6925258040428162, -0.4884002208709717, -0.284274697303772, -0.08014917373657227, 0.12397646903991699, 0.3281019926071167, 0.5322275161743164, 0.7363530397415161, 0.9404786229133606, 1.144604206085205, 1.3487297296524048, 1.5528552532196045, 1.7569808959960938, 1.9611064195632935, 2.165231943130493, 2.3693575859069824, 2.5734829902648926, 2.777608633041382, 2.981734275817871, 3.1858596801757812, 3.3899853229522705, 3.5941109657287598, 3.79823637008667, 4.00236177444458, 4.206487655639648, 4.410613059997559, 4.614738464355469, 4.818863868713379, 5.022989749908447, 5.227115154266357, 5.431241035461426, 5.635366439819336, 5.839492321014404, 6.0436177253723145, 6.247743129730225, 6.451869010925293, 6.655994415283203, 6.860119819641113, 7.064245223999023]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 9.0, 8.0, 12.0, 37.0, 47.0, 82.0, 168.0, 346.0, 969.0, 2938.0, 12042.0, 124431.0, 4002103.0, 40983.0, 6583.0, 1827.0, 662.0, 363.0, 183.0, 113.0, 97.0, 69.0, 42.0, 33.0, 35.0, 12.0, 11.0, 17.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.5234375, -4.35784912109375, -4.1922607421875, -4.02667236328125, -3.861083984375, -3.69549560546875, -3.5299072265625, -3.36431884765625, -3.19873046875, -3.03314208984375, -2.8675537109375, -2.70196533203125, -2.536376953125, -2.37078857421875, -2.2052001953125, -2.03961181640625, -1.8740234375, -1.70843505859375, -1.5428466796875, -1.37725830078125, -1.211669921875, -1.04608154296875, -0.8804931640625, -0.71490478515625, -0.54931640625, -0.38372802734375, -0.2181396484375, -0.05255126953125, 0.113037109375, 0.27862548828125, 0.4442138671875, 0.60980224609375, 0.775390625, 0.94097900390625, 1.1065673828125, 1.27215576171875, 1.437744140625, 1.60333251953125, 1.7689208984375, 1.93450927734375, 2.10009765625, 2.26568603515625, 2.4312744140625, 2.59686279296875, 2.762451171875, 2.92803955078125, 3.0936279296875, 3.25921630859375, 3.4248046875, 3.59039306640625, 3.7559814453125, 3.92156982421875, 4.087158203125, 4.25274658203125, 4.4183349609375, 4.58392333984375, 4.74951171875, 4.91510009765625, 5.0806884765625, 5.24627685546875, 5.411865234375, 5.57745361328125, 5.7430419921875, 5.90863037109375, 6.07421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 12.0, 7.0, 5.0, 26.0, 44.0, 62.0, 85.0, 113.0, 136.0, 132.0, 98.0, 91.0, 58.0, 54.0, 31.0, 20.0, 11.0, 7.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328857421875, -0.31723785400390625, -0.3056182861328125, -0.29399871826171875, -0.282379150390625, -0.27075958251953125, -0.2591400146484375, -0.24752044677734375, -0.23590087890625, -0.22428131103515625, -0.2126617431640625, -0.20104217529296875, -0.189422607421875, -0.17780303955078125, -0.1661834716796875, -0.15456390380859375, -0.1429443359375, -0.13132476806640625, -0.1197052001953125, -0.10808563232421875, -0.096466064453125, -0.08484649658203125, -0.0732269287109375, -0.06160736083984375, -0.04998779296875, -0.03836822509765625, -0.0267486572265625, -0.01512908935546875, -0.003509521484375, 0.00811004638671875, 0.0197296142578125, 0.03134918212890625, 0.04296875, 0.05458831787109375, 0.0662078857421875, 0.07782745361328125, 0.089447021484375, 0.10106658935546875, 0.1126861572265625, 0.12430572509765625, 0.13592529296875, 0.14754486083984375, 0.1591644287109375, 0.17078399658203125, 0.182403564453125, 0.19402313232421875, 0.2056427001953125, 0.21726226806640625, 0.2288818359375, 0.24050140380859375, 0.2521209716796875, 0.26374053955078125, 0.275360107421875, 0.28697967529296875, 0.2985992431640625, 0.31021881103515625, 0.32183837890625, 0.33345794677734375, 0.3450775146484375, 0.35669708251953125, 0.368316650390625, 0.37993621826171875, 0.3915557861328125, 0.40317535400390625, 0.414794921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 13.0, 22.0, 33.0, 63.0, 108.0, 227.0, 423.0, 1206.0, 4852.0, 48228.0, 4069008.0, 62549.0, 5106.0, 1167.0, 478.0, 290.0, 170.0, 115.0, 61.0, 49.0, 36.0, 19.0, 19.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.9443359375, -5.755859375, -5.5673828125, -5.37890625, -5.1904296875, -5.001953125, -4.8134765625, -4.625, -4.4365234375, -4.248046875, -4.0595703125, -3.87109375, -3.6826171875, -3.494140625, -3.3056640625, -3.1171875, -2.9287109375, -2.740234375, -2.5517578125, -2.36328125, -2.1748046875, -1.986328125, -1.7978515625, -1.609375, -1.4208984375, -1.232421875, -1.0439453125, -0.85546875, -0.6669921875, -0.478515625, -0.2900390625, -0.1015625, 0.0869140625, 0.275390625, 0.4638671875, 0.65234375, 0.8408203125, 1.029296875, 1.2177734375, 1.40625, 1.5947265625, 1.783203125, 1.9716796875, 2.16015625, 2.3486328125, 2.537109375, 2.7255859375, 2.9140625, 3.1025390625, 3.291015625, 3.4794921875, 3.66796875, 3.8564453125, 4.044921875, 4.2333984375, 4.421875, 4.6103515625, 4.798828125, 4.9873046875, 5.17578125, 5.3642578125, 5.552734375, 5.7412109375, 5.9296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 17.0, 18.0, 25.0, 33.0, 60.0, 121.0, 311.0, 1954.0, 1023.0, 232.0, 93.0, 48.0, 35.0, 31.0, 17.0, 9.0, 14.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.421142578125, -0.3999290466308594, -0.37871551513671875, -0.3575019836425781, -0.3362884521484375, -0.3150749206542969, -0.29386138916015625, -0.2726478576660156, -0.251434326171875, -0.23022079467773438, -0.20900726318359375, -0.18779373168945312, -0.1665802001953125, -0.14536666870117188, -0.12415313720703125, -0.10293960571289062, -0.08172607421875, -0.060512542724609375, -0.03929901123046875, -0.018085479736328125, 0.0031280517578125, 0.024341583251953125, 0.04555511474609375, 0.06676864624023438, 0.087982177734375, 0.10919570922851562, 0.13040924072265625, 0.15162277221679688, 0.1728363037109375, 0.19404983520507812, 0.21526336669921875, 0.23647689819335938, 0.2576904296875, 0.2789039611816406, 0.30011749267578125, 0.3213310241699219, 0.3425445556640625, 0.3637580871582031, 0.38497161865234375, 0.4061851501464844, 0.427398681640625, 0.4486122131347656, 0.46982574462890625, 0.4910392761230469, 0.5122528076171875, 0.5334663391113281, 0.5546798706054688, 0.5758934020996094, 0.59710693359375, 0.6183204650878906, 0.6395339965820312, 0.6607475280761719, 0.6819610595703125, 0.7031745910644531, 0.7243881225585938, 0.7456016540527344, 0.766815185546875, 0.7880287170410156, 0.8092422485351562, 0.8304557800292969, 0.8516693115234375, 0.8728828430175781, 0.8940963745117188, 0.9153099060058594, 0.9365234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 17.0, 35.0, 88.0, 233.0, 335.0, 180.0, 59.0, 13.0, 9.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5915632247924805, -4.385827541351318, -4.180091381072998, -3.974355697631836, -3.7686197757720947, -3.5628838539123535, -3.3571481704711914, -3.15141224861145, -2.945676326751709, -2.7399404048919678, -2.5342044830322266, -2.3284687995910645, -2.1227328777313232, -1.916996955871582, -1.7112611532211304, -1.5055253505706787, -1.2997894287109375, -1.0940535068511963, -0.8883177042007446, -0.6825818419456482, -0.47684597969055176, -0.27111005783081055, -0.06537425518035889, 0.14036154747009277, 0.346097469329834, 0.5518333315849304, 0.7575691938400269, 0.9633050560951233, 1.1690409183502197, 1.374776840209961, 1.5805126428604126, 1.7862484455108643, 1.9919843673706055, 2.1977202892303467, 2.403456211090088, 2.60919189453125, 2.814927816390991, 3.0206637382507324, 3.2263994216918945, 3.4321353435516357, 3.637871265411377, 3.843607187271118, 4.049343109130859, 4.2550787925720215, 4.460814476013184, 4.666550636291504, 4.872286319732666, 5.078022003173828, 5.283758163452148, 5.4894938468933105, 5.695230007171631, 5.900965690612793, 6.106701850891113, 6.312437534332275, 6.5181732177734375, 6.723909378051758, 6.92964506149292, 7.135380744934082, 7.341116905212402, 7.5468525886535645, 7.752588272094727, 7.958324432373047, 8.164060592651367, 8.369795799255371, 8.575531959533691]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 17.0, 20.0, 33.0, 41.0, 54.0, 59.0, 69.0, 93.0, 102.0, 106.0, 85.0, 56.0, 59.0, 45.0, 41.0, 29.0, 20.0, 15.0, 13.0, 9.0, 8.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8537631034851074, -2.7675726413726807, -2.681381940841675, -2.595191478729248, -2.5090010166168213, -2.4228103160858154, -2.3366198539733887, -2.250429153442383, -2.164238691329956, -2.0780482292175293, -1.991857647895813, -1.9056670665740967, -1.8194764852523804, -1.733285903930664, -1.6470954418182373, -1.560904860496521, -1.4747143983840942, -1.388523817062378, -1.3023333549499512, -1.2161427736282349, -1.1299521923065186, -1.0437617301940918, -0.9575711488723755, -0.8713805675506592, -0.7851900458335876, -0.6989995241165161, -0.6128089427947998, -0.5266184210777283, -0.44042786955833435, -0.35423731803894043, -0.2680467963218689, -0.1818562150001526, -0.09566569328308105, -0.00947514921426773, 0.0767153948545456, 0.16290593147277832, 0.24909648299217224, 0.33528703451156616, 0.4214775562286377, 0.507668137550354, 0.5938586592674255, 0.6800491809844971, 0.7662397623062134, 0.8524302840232849, 0.9386208057403564, 1.0248113870620728, 1.111001968383789, 1.1971924304962158, 1.2833830118179321, 1.3695735931396484, 1.4557640552520752, 1.5419546365737915, 1.6281452178955078, 1.7143356800079346, 1.8005262613296509, 1.8867168426513672, 1.972907304763794, 2.0590977668762207, 2.1452884674072266, 2.2314789295196533, 2.31766939163208, 2.403860092163086, 2.4900505542755127, 2.5762410163879395, 2.6624317169189453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 9.0, 6.0, 15.0, 13.0, 31.0, 34.0, 56.0, 82.0, 116.0, 182.0, 327.0, 615.0, 1376.0, 3610.0, 13287.0, 94959.0, 711062.0, 193081.0, 21152.0, 5044.0, 1715.0, 742.0, 394.0, 212.0, 134.0, 94.0, 56.0, 40.0, 25.0, 21.0, 12.0, 11.0, 13.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.076171875, -2.98736572265625, -2.8985595703125, -2.80975341796875, -2.720947265625, -2.63214111328125, -2.5433349609375, -2.45452880859375, -2.36572265625, -2.27691650390625, -2.1881103515625, -2.09930419921875, -2.010498046875, -1.92169189453125, -1.8328857421875, -1.74407958984375, -1.6552734375, -1.56646728515625, -1.4776611328125, -1.38885498046875, -1.300048828125, -1.21124267578125, -1.1224365234375, -1.03363037109375, -0.94482421875, -0.85601806640625, -0.7672119140625, -0.67840576171875, -0.589599609375, -0.50079345703125, -0.4119873046875, -0.32318115234375, -0.234375, -0.14556884765625, -0.0567626953125, 0.03204345703125, 0.120849609375, 0.20965576171875, 0.2984619140625, 0.38726806640625, 0.47607421875, 0.56488037109375, 0.6536865234375, 0.74249267578125, 0.831298828125, 0.92010498046875, 1.0089111328125, 1.09771728515625, 1.1865234375, 1.27532958984375, 1.3641357421875, 1.45294189453125, 1.541748046875, 1.63055419921875, 1.7193603515625, 1.80816650390625, 1.89697265625, 1.98577880859375, 2.0745849609375, 2.16339111328125, 2.252197265625, 2.34100341796875, 2.4298095703125, 2.51861572265625, 2.607421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 16.0, 23.0, 40.0, 54.0, 79.0, 108.0, 115.0, 113.0, 106.0, 103.0, 70.0, 60.0, 36.0, 21.0, 16.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.322998046875, -0.3112945556640625, -0.299591064453125, -0.2878875732421875, -0.27618408203125, -0.2644805908203125, -0.252777099609375, -0.2410736083984375, -0.2293701171875, -0.2176666259765625, -0.205963134765625, -0.1942596435546875, -0.18255615234375, -0.1708526611328125, -0.159149169921875, -0.1474456787109375, -0.1357421875, -0.1240386962890625, -0.112335205078125, -0.1006317138671875, -0.08892822265625, -0.0772247314453125, -0.065521240234375, -0.0538177490234375, -0.0421142578125, -0.0304107666015625, -0.018707275390625, -0.0070037841796875, 0.00469970703125, 0.0164031982421875, 0.028106689453125, 0.0398101806640625, 0.051513671875, 0.0632171630859375, 0.074920654296875, 0.0866241455078125, 0.09832763671875, 0.1100311279296875, 0.121734619140625, 0.1334381103515625, 0.1451416015625, 0.1568450927734375, 0.168548583984375, 0.1802520751953125, 0.19195556640625, 0.2036590576171875, 0.215362548828125, 0.2270660400390625, 0.23876953125, 0.2504730224609375, 0.262176513671875, 0.2738800048828125, 0.28558349609375, 0.2972869873046875, 0.308990478515625, 0.3206939697265625, 0.3323974609375, 0.3441009521484375, 0.355804443359375, 0.3675079345703125, 0.37921142578125, 0.3909149169921875, 0.402618408203125, 0.4143218994140625, 0.426025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 6.0, 6.0, 12.0, 12.0, 19.0, 34.0, 41.0, 58.0, 69.0, 102.0, 199.0, 241.0, 486.0, 758.0, 1419.0, 3092.0, 7192.0, 19880.0, 60874.0, 199670.0, 416620.0, 230112.0, 70265.0, 22114.0, 8270.0, 3334.0, 1582.0, 790.0, 431.0, 287.0, 171.0, 112.0, 91.0, 59.0, 32.0, 27.0, 22.0, 19.0, 13.0, 6.0, 7.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.3056640625, -1.26556396484375, -1.2254638671875, -1.18536376953125, -1.145263671875, -1.10516357421875, -1.0650634765625, -1.02496337890625, -0.98486328125, -0.94476318359375, -0.9046630859375, -0.86456298828125, -0.824462890625, -0.78436279296875, -0.7442626953125, -0.70416259765625, -0.6640625, -0.62396240234375, -0.5838623046875, -0.54376220703125, -0.503662109375, -0.46356201171875, -0.4234619140625, -0.38336181640625, -0.34326171875, -0.30316162109375, -0.2630615234375, -0.22296142578125, -0.182861328125, -0.14276123046875, -0.1026611328125, -0.06256103515625, -0.0224609375, 0.01763916015625, 0.0577392578125, 0.09783935546875, 0.137939453125, 0.17803955078125, 0.2181396484375, 0.25823974609375, 0.29833984375, 0.33843994140625, 0.3785400390625, 0.41864013671875, 0.458740234375, 0.49884033203125, 0.5389404296875, 0.57904052734375, 0.619140625, 0.65924072265625, 0.6993408203125, 0.73944091796875, 0.779541015625, 0.81964111328125, 0.8597412109375, 0.89984130859375, 0.93994140625, 0.98004150390625, 1.0201416015625, 1.06024169921875, 1.100341796875, 1.14044189453125, 1.1805419921875, 1.22064208984375, 1.2607421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 6.0, 11.0, 10.0, 8.0, 12.0, 21.0, 25.0, 16.0, 23.0, 31.0, 27.0, 31.0, 33.0, 32.0, 42.0, 48.0, 51.0, 46.0, 37.0, 46.0, 43.0, 42.0, 31.0, 44.0, 33.0, 30.0, 25.0, 39.0, 24.0, 20.0, 22.0, 16.0, 12.0, 15.0, 6.0, 11.0, 5.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8994140625, -0.8723068237304688, -0.8451995849609375, -0.8180923461914062, -0.790985107421875, -0.7638778686523438, -0.7367706298828125, -0.7096633911132812, -0.68255615234375, -0.6554489135742188, -0.6283416748046875, -0.6012344360351562, -0.574127197265625, -0.5470199584960938, -0.5199127197265625, -0.49280548095703125, -0.4656982421875, -0.43859100341796875, -0.4114837646484375, -0.38437652587890625, -0.357269287109375, -0.33016204833984375, -0.3030548095703125, -0.27594757080078125, -0.24884033203125, -0.22173309326171875, -0.1946258544921875, -0.16751861572265625, -0.140411376953125, -0.11330413818359375, -0.0861968994140625, -0.05908966064453125, -0.031982421875, -0.00487518310546875, 0.0222320556640625, 0.04933929443359375, 0.076446533203125, 0.10355377197265625, 0.1306610107421875, 0.15776824951171875, 0.18487548828125, 0.21198272705078125, 0.2390899658203125, 0.26619720458984375, 0.293304443359375, 0.32041168212890625, 0.3475189208984375, 0.37462615966796875, 0.4017333984375, 0.42884063720703125, 0.4559478759765625, 0.48305511474609375, 0.510162353515625, 0.5372695922851562, 0.5643768310546875, 0.5914840698242188, 0.61859130859375, 0.6456985473632812, 0.6728057861328125, 0.6999130249023438, 0.727020263671875, 0.7541275024414062, 0.7812347412109375, 0.8083419799804688, 0.83544921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 9.0, 22.0, 21.0, 21.0, 34.0, 44.0, 68.0, 116.0, 188.0, 394.0, 860.0, 2171.0, 6244.0, 23669.0, 172745.0, 728892.0, 89522.0, 15862.0, 4548.0, 1624.0, 691.0, 345.0, 168.0, 79.0, 50.0, 31.0, 27.0, 23.0, 21.0, 14.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9672088623046875, -0.936370849609375, -0.9055328369140625, -0.87469482421875, -0.8438568115234375, -0.813018798828125, -0.7821807861328125, -0.7513427734375, -0.7205047607421875, -0.689666748046875, -0.6588287353515625, -0.62799072265625, -0.5971527099609375, -0.566314697265625, -0.5354766845703125, -0.504638671875, -0.4738006591796875, -0.442962646484375, -0.4121246337890625, -0.38128662109375, -0.3504486083984375, -0.319610595703125, -0.2887725830078125, -0.2579345703125, -0.2270965576171875, -0.196258544921875, -0.1654205322265625, -0.13458251953125, -0.1037445068359375, -0.072906494140625, -0.0420684814453125, -0.01123046875, 0.0196075439453125, 0.050445556640625, 0.0812835693359375, 0.11212158203125, 0.1429595947265625, 0.173797607421875, 0.2046356201171875, 0.2354736328125, 0.2663116455078125, 0.297149658203125, 0.3279876708984375, 0.35882568359375, 0.3896636962890625, 0.420501708984375, 0.4513397216796875, 0.482177734375, 0.5130157470703125, 0.543853759765625, 0.5746917724609375, 0.60552978515625, 0.6363677978515625, 0.667205810546875, 0.6980438232421875, 0.7288818359375, 0.7597198486328125, 0.790557861328125, 0.8213958740234375, 0.85223388671875, 0.8830718994140625, 0.913909912109375, 0.9447479248046875, 0.9755859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 22.0, 31.0, 36.0, 62.0, 107.0, 175.0, 186.0, 141.0, 76.0, 44.0, 22.0, 23.0, 19.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020837783813476562, -0.00020262226462364197, -0.0001968666911125183, -0.00019111111760139465, -0.000185355544090271, -0.00017959997057914734, -0.00017384439706802368, -0.00016808882355690002, -0.00016233325004577637, -0.0001565776765346527, -0.00015082210302352905, -0.0001450665295124054, -0.00013931095600128174, -0.00013355538249015808, -0.00012779980897903442, -0.00012204423546791077, -0.00011628866195678711, -0.00011053308844566345, -0.0001047775149345398, -9.902194142341614e-05, -9.326636791229248e-05, -8.751079440116882e-05, -8.175522089004517e-05, -7.599964737892151e-05, -7.024407386779785e-05, -6.44885003566742e-05, -5.873292684555054e-05, -5.297735333442688e-05, -4.722177982330322e-05, -4.1466206312179565e-05, -3.571063280105591e-05, -2.995505928993225e-05, -2.4199485778808594e-05, -1.8443912267684937e-05, -1.268833875656128e-05, -6.932765245437622e-06, -1.1771917343139648e-06, 4.578381776809692e-06, 1.033395528793335e-05, 1.6089528799057007e-05, 2.1845102310180664e-05, 2.760067582130432e-05, 3.335624933242798e-05, 3.9111822843551636e-05, 4.486739635467529e-05, 5.062296986579895e-05, 5.637854337692261e-05, 6.213411688804626e-05, 6.788969039916992e-05, 7.364526391029358e-05, 7.940083742141724e-05, 8.51564109325409e-05, 9.091198444366455e-05, 9.666755795478821e-05, 0.00010242313146591187, 0.00010817870497703552, 0.00011393427848815918, 0.00011968985199928284, 0.0001254454255104065, 0.00013120099902153015, 0.0001369565725326538, 0.00014271214604377747, 0.00014846771955490112, 0.00015422329306602478, 0.00015997886657714844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 9.0, 6.0, 12.0, 17.0, 26.0, 37.0, 44.0, 89.0, 121.0, 223.0, 392.0, 829.0, 1992.0, 5598.0, 21805.0, 151649.0, 742135.0, 98770.0, 16798.0, 4795.0, 1667.0, 707.0, 330.0, 182.0, 121.0, 50.0, 50.0, 30.0, 21.0, 12.0, 10.0, 4.0, 7.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.6913223266601562, -0.6604766845703125, -0.6296310424804688, -0.598785400390625, -0.5679397583007812, -0.5370941162109375, -0.5062484741210938, -0.47540283203125, -0.44455718994140625, -0.4137115478515625, -0.38286590576171875, -0.352020263671875, -0.32117462158203125, -0.2903289794921875, -0.25948333740234375, -0.2286376953125, -0.19779205322265625, -0.1669464111328125, -0.13610076904296875, -0.105255126953125, -0.07440948486328125, -0.0435638427734375, -0.01271820068359375, 0.01812744140625, 0.04897308349609375, 0.0798187255859375, 0.11066436767578125, 0.141510009765625, 0.17235565185546875, 0.2032012939453125, 0.23404693603515625, 0.264892578125, 0.29573822021484375, 0.3265838623046875, 0.35742950439453125, 0.388275146484375, 0.41912078857421875, 0.4499664306640625, 0.48081207275390625, 0.51165771484375, 0.5425033569335938, 0.5733489990234375, 0.6041946411132812, 0.635040283203125, 0.6658859252929688, 0.6967315673828125, 0.7275772094726562, 0.7584228515625, 0.7892684936523438, 0.8201141357421875, 0.8509597778320312, 0.881805419921875, 0.9126510620117188, 0.9434967041015625, 0.9743423461914062, 1.00518798828125, 1.0360336303710938, 1.0668792724609375, 1.0977249145507812, 1.128570556640625, 1.1594161987304688, 1.1902618408203125, 1.2211074829101562, 1.251953125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 20.0, 12.0, 26.0, 31.0, 55.0, 74.0, 115.0, 122.0, 135.0, 125.0, 77.0, 47.0, 40.0, 30.0, 21.0, 12.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.64190673828125, -0.6217041015625, -0.60150146484375, -0.581298828125, -0.56109619140625, -0.5408935546875, -0.52069091796875, -0.50048828125, -0.48028564453125, -0.4600830078125, -0.43988037109375, -0.419677734375, -0.39947509765625, -0.3792724609375, -0.35906982421875, -0.3388671875, -0.31866455078125, -0.2984619140625, -0.27825927734375, -0.258056640625, -0.23785400390625, -0.2176513671875, -0.19744873046875, -0.17724609375, -0.15704345703125, -0.1368408203125, -0.11663818359375, -0.096435546875, -0.07623291015625, -0.0560302734375, -0.03582763671875, -0.015625, 0.00457763671875, 0.0247802734375, 0.04498291015625, 0.065185546875, 0.08538818359375, 0.1055908203125, 0.12579345703125, 0.14599609375, 0.16619873046875, 0.1864013671875, 0.20660400390625, 0.226806640625, 0.24700927734375, 0.2672119140625, 0.28741455078125, 0.3076171875, 0.32781982421875, 0.3480224609375, 0.36822509765625, 0.388427734375, 0.40863037109375, 0.4288330078125, 0.44903564453125, 0.46923828125, 0.48944091796875, 0.5096435546875, 0.52984619140625, 0.550048828125, 0.57025146484375, 0.5904541015625, 0.61065673828125, 0.630859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 22.0, 35.0, 87.0, 229.0, 309.0, 189.0, 71.0, 32.0, 15.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.56186294555664, -23.955339431762695, -23.34881591796875, -22.742292404174805, -22.13576889038086, -21.529247283935547, -20.9227237701416, -20.316200256347656, -19.70967674255371, -19.103153228759766, -18.49662971496582, -17.890106201171875, -17.283584594726562, -16.677061080932617, -16.070537567138672, -15.464014053344727, -14.857490539550781, -14.250967025756836, -13.64444351196289, -13.037920951843262, -12.431397438049316, -11.824873924255371, -11.218351364135742, -10.611827850341797, -10.005304336547852, -9.398780822753906, -8.792257308959961, -8.185734748840332, -7.579211235046387, -6.972687721252441, -6.366164684295654, -5.759641647338867, -5.1531171798706055, -4.54659366607666, -3.940070629119873, -3.333547353744507, -2.7270240783691406, -2.1205008029937744, -1.5139775276184082, -0.9074544906616211, -0.3009309768676758, 0.30559229850769043, 0.9121155738830566, 1.5186388492584229, 2.125162124633789, 2.7316854000091553, 3.3382086753845215, 3.9447317123413086, 4.551255226135254, 5.157778739929199, 5.764301776885986, 6.370824813842773, 6.977348327636719, 7.583871841430664, 8.19039535522461, 8.796917915344238, 9.403441429138184, 10.009964942932129, 10.616487503051758, 11.223011016845703, 11.829534530639648, 12.436058044433594, 13.042581558227539, 13.649104118347168, 14.255627632141113]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 6.0, 16.0, 15.0, 10.0, 16.0, 21.0, 32.0, 47.0, 42.0, 38.0, 44.0, 53.0, 54.0, 47.0, 63.0, 60.0, 60.0, 60.0, 53.0, 48.0, 31.0, 23.0, 36.0, 19.0, 20.0, 14.0, 18.0, 11.0, 7.0, 10.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.05985164642334, -7.851208209991455, -7.64256477355957, -7.433920860290527, -7.225277423858643, -7.016633987426758, -6.807990074157715, -6.59934663772583, -6.390703201293945, -6.1820597648620605, -5.973416328430176, -5.764772415161133, -5.556128978729248, -5.347485542297363, -5.13884162902832, -4.9301981925964355, -4.721554756164551, -4.512911319732666, -4.304267883300781, -4.095623970031738, -3.8869805335998535, -3.6783370971679688, -3.469693422317505, -3.261049747467041, -3.0524063110351562, -2.8437628746032715, -2.6351191997528076, -2.4264755249023438, -2.217832088470459, -2.009188652038574, -1.8005449771881104, -1.591901421546936, -1.3832578659057617, -1.1746143102645874, -0.9659707546234131, -0.7573271989822388, -0.5486836433410645, -0.34004008769989014, -0.13139653205871582, 0.0772470235824585, 0.2858905792236328, 0.49453413486480713, 0.7031776905059814, 0.9118212461471558, 1.12046480178833, 1.3291083574295044, 1.5377519130706787, 1.746395468711853, 1.9550390243530273, 2.163682460784912, 2.372326135635376, 2.58096981048584, 2.7896132469177246, 2.9982566833496094, 3.2069003582000732, 3.415544033050537, 3.624187469482422, 3.8328309059143066, 4.041474342346191, 4.250118255615234, 4.458761692047119, 4.667405128479004, 4.876049041748047, 5.084692478179932, 5.293335914611816]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 12.0, 15.0, 22.0, 42.0, 60.0, 73.0, 132.0, 234.0, 475.0, 1028.0, 2776.0, 9995.0, 59699.0, 4037014.0, 67162.0, 10291.0, 2792.0, 1031.0, 468.0, 297.0, 154.0, 109.0, 99.0, 49.0, 43.0, 54.0, 28.0, 22.0, 11.0, 14.0, 23.0, 8.0, 8.0, 7.0, 3.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.797760009765625, -2.66778564453125, -2.537811279296875, -2.4078369140625, -2.277862548828125, -2.14788818359375, -2.017913818359375, -1.887939453125, -1.757965087890625, -1.62799072265625, -1.498016357421875, -1.3680419921875, -1.238067626953125, -1.10809326171875, -0.978118896484375, -0.84814453125, -0.718170166015625, -0.58819580078125, -0.458221435546875, -0.3282470703125, -0.198272705078125, -0.06829833984375, 0.061676025390625, 0.191650390625, 0.321624755859375, 0.45159912109375, 0.581573486328125, 0.7115478515625, 0.841522216796875, 0.97149658203125, 1.101470947265625, 1.2314453125, 1.361419677734375, 1.49139404296875, 1.621368408203125, 1.7513427734375, 1.881317138671875, 2.01129150390625, 2.141265869140625, 2.271240234375, 2.401214599609375, 2.53118896484375, 2.661163330078125, 2.7911376953125, 2.921112060546875, 3.05108642578125, 3.181060791015625, 3.31103515625, 3.441009521484375, 3.57098388671875, 3.700958251953125, 3.8309326171875, 3.960906982421875, 4.09088134765625, 4.220855712890625, 4.350830078125, 4.480804443359375, 4.61077880859375, 4.740753173828125, 4.8707275390625, 5.000701904296875, 5.13067626953125, 5.260650634765625, 5.390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 8.0, 15.0, 25.0, 47.0, 71.0, 90.0, 93.0, 119.0, 115.0, 91.0, 92.0, 69.0, 49.0, 36.0, 23.0, 14.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31640625, -0.3047943115234375, -0.293182373046875, -0.2815704345703125, -0.26995849609375, -0.2583465576171875, -0.246734619140625, -0.2351226806640625, -0.2235107421875, -0.2118988037109375, -0.200286865234375, -0.1886749267578125, -0.17706298828125, -0.1654510498046875, -0.153839111328125, -0.1422271728515625, -0.130615234375, -0.1190032958984375, -0.107391357421875, -0.0957794189453125, -0.08416748046875, -0.0725555419921875, -0.060943603515625, -0.0493316650390625, -0.0377197265625, -0.0261077880859375, -0.014495849609375, -0.0028839111328125, 0.00872802734375, 0.0203399658203125, 0.031951904296875, 0.0435638427734375, 0.05517578125, 0.0667877197265625, 0.078399658203125, 0.0900115966796875, 0.10162353515625, 0.1132354736328125, 0.124847412109375, 0.1364593505859375, 0.1480712890625, 0.1596832275390625, 0.171295166015625, 0.1829071044921875, 0.19451904296875, 0.2061309814453125, 0.217742919921875, 0.2293548583984375, 0.240966796875, 0.2525787353515625, 0.264190673828125, 0.2758026123046875, 0.28741455078125, 0.2990264892578125, 0.310638427734375, 0.3222503662109375, 0.3338623046875, 0.3454742431640625, 0.357086181640625, 0.3686981201171875, 0.38031005859375, 0.3919219970703125, 0.403533935546875, 0.4151458740234375, 0.4267578125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 9.0, 6.0, 10.0, 13.0, 40.0, 49.0, 100.0, 149.0, 341.0, 633.0, 1595.0, 4766.0, 21390.0, 432061.0, 3691061.0, 31908.0, 6374.0, 1964.0, 805.0, 401.0, 230.0, 128.0, 89.0, 50.0, 32.0, 30.0, 18.0, 11.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.2265625, -5.099456787109375, -4.97235107421875, -4.845245361328125, -4.7181396484375, -4.591033935546875, -4.46392822265625, -4.336822509765625, -4.209716796875, -4.082611083984375, -3.95550537109375, -3.828399658203125, -3.7012939453125, -3.574188232421875, -3.44708251953125, -3.319976806640625, -3.19287109375, -3.065765380859375, -2.93865966796875, -2.811553955078125, -2.6844482421875, -2.557342529296875, -2.43023681640625, -2.303131103515625, -2.176025390625, -2.048919677734375, -1.92181396484375, -1.794708251953125, -1.6676025390625, -1.540496826171875, -1.41339111328125, -1.286285400390625, -1.1591796875, -1.032073974609375, -0.90496826171875, -0.777862548828125, -0.6507568359375, -0.523651123046875, -0.39654541015625, -0.269439697265625, -0.142333984375, -0.015228271484375, 0.11187744140625, 0.238983154296875, 0.3660888671875, 0.493194580078125, 0.62030029296875, 0.747406005859375, 0.87451171875, 1.001617431640625, 1.12872314453125, 1.255828857421875, 1.3829345703125, 1.510040283203125, 1.63714599609375, 1.764251708984375, 1.891357421875, 2.018463134765625, 2.14556884765625, 2.272674560546875, 2.3997802734375, 2.526885986328125, 2.65399169921875, 2.781097412109375, 2.908203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 11.0, 17.0, 16.0, 22.0, 38.0, 63.0, 119.0, 388.0, 2373.0, 670.0, 168.0, 71.0, 33.0, 20.0, 16.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.48667144775390625, -0.4630889892578125, -0.43950653076171875, -0.415924072265625, -0.39234161376953125, -0.3687591552734375, -0.34517669677734375, -0.32159423828125, -0.29801177978515625, -0.2744293212890625, -0.25084686279296875, -0.227264404296875, -0.20368194580078125, -0.1800994873046875, -0.15651702880859375, -0.1329345703125, -0.10935211181640625, -0.0857696533203125, -0.06218719482421875, -0.038604736328125, -0.01502227783203125, 0.0085601806640625, 0.03214263916015625, 0.05572509765625, 0.07930755615234375, 0.1028900146484375, 0.12647247314453125, 0.150054931640625, 0.17363739013671875, 0.1972198486328125, 0.22080230712890625, 0.244384765625, 0.26796722412109375, 0.2915496826171875, 0.31513214111328125, 0.338714599609375, 0.36229705810546875, 0.3858795166015625, 0.40946197509765625, 0.43304443359375, 0.45662689208984375, 0.4802093505859375, 0.5037918090820312, 0.527374267578125, 0.5509567260742188, 0.5745391845703125, 0.5981216430664062, 0.6217041015625, 0.6452865600585938, 0.6688690185546875, 0.6924514770507812, 0.716033935546875, 0.7396163940429688, 0.7631988525390625, 0.7867813110351562, 0.81036376953125, 0.8339462280273438, 0.8575286865234375, 0.8811111450195312, 0.904693603515625, 0.9282760620117188, 0.9518585205078125, 0.9754409790039062, 0.9990234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 13.0, 43.0, 96.0, 249.0, 325.0, 174.0, 62.0, 23.0, 10.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.948447227478027, -6.703046798706055, -6.457646369934082, -6.212245941162109, -5.966845512390137, -5.721445083618164, -5.476044654846191, -5.230644226074219, -4.985243797302246, -4.739843368530273, -4.494442939758301, -4.249042510986328, -4.0036420822143555, -3.758241653442383, -3.512840986251831, -3.2674405574798584, -3.0220398902893066, -2.776639461517334, -2.5312390327453613, -2.2858386039733887, -2.040438175201416, -1.7950376272201538, -1.5496370792388916, -1.304236650466919, -1.0588362216949463, -0.8134357929229736, -0.5680353045463562, -0.32263481616973877, -0.07723438739776611, 0.16816604137420654, 0.41356658935546875, 0.6589670181274414, 0.9043674468994141, 1.1497678756713867, 1.3951683044433594, 1.6405688524246216, 1.8859692811965942, 2.1313695907592773, 2.376770257949829, 2.6221706867218018, 2.8675711154937744, 3.112971544265747, 3.3583719730377197, 3.6037726402282715, 3.849173069000244, 4.094573497772217, 4.3399739265441895, 4.585374355316162, 4.830774784088135, 5.076175212860107, 5.32157564163208, 5.566976070404053, 5.812376499176025, 6.057776927947998, 6.303177833557129, 6.548578262329102, 6.793978691101074, 7.039379119873047, 7.2847795486450195, 7.530179977416992, 7.775580406188965, 8.020980834960938, 8.26638126373291, 8.511781692504883, 8.757182121276855]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 5.0, 10.0, 13.0, 16.0, 14.0, 22.0, 28.0, 24.0, 21.0, 36.0, 43.0, 48.0, 52.0, 45.0, 44.0, 45.0, 54.0, 57.0, 33.0, 39.0, 49.0, 35.0, 26.0, 32.0, 27.0, 32.0, 23.0, 22.0, 21.0, 10.0, 17.0, 6.0, 10.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4789817333221436, -1.424920916557312, -1.3708600997924805, -1.316799283027649, -1.2627384662628174, -1.2086775302886963, -1.1546168327331543, -1.1005558967590332, -1.0464950799942017, -0.9924342632293701, -0.9383734464645386, -0.884312629699707, -0.8302517533302307, -0.7761909365653992, -0.7221301198005676, -0.6680692434310913, -0.6140084862709045, -0.559947669506073, -0.5058868527412415, -0.4518260061740875, -0.3977651596069336, -0.34370434284210205, -0.2896435260772705, -0.23558267951011658, -0.18152186274528503, -0.1274610310792923, -0.07340020686388016, -0.019339382648468018, 0.03472144901752472, 0.08878228068351746, 0.142843097448349, 0.19690394401550293, 0.2509647607803345, 0.305025577545166, 0.35908642411231995, 0.4131472408771515, 0.4672080874443054, 0.521268904209137, 0.5753297209739685, 0.6293905973434448, 0.6834514141082764, 0.7375122308731079, 0.7915730476379395, 0.845633864402771, 0.8996947407722473, 0.9537555575370789, 1.0078163146972656, 1.0618772506713867, 1.1159379482269287, 1.1699987649917603, 1.2240595817565918, 1.2781203985214233, 1.3321812152862549, 1.386242151260376, 1.440302848815918, 1.494363784790039, 1.5484246015548706, 1.6024854183197021, 1.6565462350845337, 1.7106070518493652, 1.7646678686141968, 1.8187286853790283, 1.8727896213531494, 1.926850438117981, 1.9809112548828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 11.0, 13.0, 11.0, 24.0, 33.0, 43.0, 66.0, 119.0, 200.0, 366.0, 598.0, 1482.0, 3640.0, 13257.0, 81294.0, 628492.0, 276388.0, 31248.0, 6819.0, 2339.0, 975.0, 459.0, 238.0, 150.0, 81.0, 61.0, 37.0, 34.0, 19.0, 20.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3671875, -2.275299072265625, -2.18341064453125, -2.091522216796875, -1.9996337890625, -1.907745361328125, -1.81585693359375, -1.723968505859375, -1.632080078125, -1.540191650390625, -1.44830322265625, -1.356414794921875, -1.2645263671875, -1.172637939453125, -1.08074951171875, -0.988861083984375, -0.89697265625, -0.805084228515625, -0.71319580078125, -0.621307373046875, -0.5294189453125, -0.437530517578125, -0.34564208984375, -0.253753662109375, -0.161865234375, -0.069976806640625, 0.02191162109375, 0.113800048828125, 0.2056884765625, 0.297576904296875, 0.38946533203125, 0.481353759765625, 0.5732421875, 0.665130615234375, 0.75701904296875, 0.848907470703125, 0.9407958984375, 1.032684326171875, 1.12457275390625, 1.216461181640625, 1.308349609375, 1.400238037109375, 1.49212646484375, 1.584014892578125, 1.6759033203125, 1.767791748046875, 1.85968017578125, 1.951568603515625, 2.04345703125, 2.135345458984375, 2.22723388671875, 2.319122314453125, 2.4110107421875, 2.502899169921875, 2.59478759765625, 2.686676025390625, 2.778564453125, 2.870452880859375, 2.96234130859375, 3.054229736328125, 3.1461181640625, 3.238006591796875, 3.32989501953125, 3.421783447265625, 3.513671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 8.0, 7.0, 23.0, 34.0, 46.0, 73.0, 68.0, 96.0, 108.0, 111.0, 100.0, 87.0, 58.0, 59.0, 34.0, 18.0, 19.0, 10.0, 11.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3203125, -0.3080902099609375, -0.295867919921875, -0.2836456298828125, -0.27142333984375, -0.2592010498046875, -0.246978759765625, -0.2347564697265625, -0.2225341796875, -0.2103118896484375, -0.198089599609375, -0.1858673095703125, -0.17364501953125, -0.1614227294921875, -0.149200439453125, -0.1369781494140625, -0.124755859375, -0.1125335693359375, -0.100311279296875, -0.0880889892578125, -0.07586669921875, -0.0636444091796875, -0.051422119140625, -0.0391998291015625, -0.0269775390625, -0.0147552490234375, -0.002532958984375, 0.0096893310546875, 0.02191162109375, 0.0341339111328125, 0.046356201171875, 0.0585784912109375, 0.07080078125, 0.0830230712890625, 0.095245361328125, 0.1074676513671875, 0.11968994140625, 0.1319122314453125, 0.144134521484375, 0.1563568115234375, 0.1685791015625, 0.1808013916015625, 0.193023681640625, 0.2052459716796875, 0.21746826171875, 0.2296905517578125, 0.241912841796875, 0.2541351318359375, 0.266357421875, 0.2785797119140625, 0.290802001953125, 0.3030242919921875, 0.31524658203125, 0.3274688720703125, 0.339691162109375, 0.3519134521484375, 0.3641357421875, 0.3763580322265625, 0.388580322265625, 0.4008026123046875, 0.41302490234375, 0.4252471923828125, 0.437469482421875, 0.4496917724609375, 0.4619140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 21.0, 18.0, 29.0, 61.0, 109.0, 196.0, 329.0, 614.0, 1503.0, 3931.0, 15120.0, 81796.0, 490465.0, 379661.0, 57515.0, 11380.0, 3378.0, 1196.0, 579.0, 273.0, 143.0, 88.0, 44.0, 32.0, 20.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.49609375, -2.42657470703125, -2.3570556640625, -2.28753662109375, -2.218017578125, -2.14849853515625, -2.0789794921875, -2.00946044921875, -1.93994140625, -1.87042236328125, -1.8009033203125, -1.73138427734375, -1.661865234375, -1.59234619140625, -1.5228271484375, -1.45330810546875, -1.3837890625, -1.31427001953125, -1.2447509765625, -1.17523193359375, -1.105712890625, -1.03619384765625, -0.9666748046875, -0.89715576171875, -0.82763671875, -0.75811767578125, -0.6885986328125, -0.61907958984375, -0.549560546875, -0.48004150390625, -0.4105224609375, -0.34100341796875, -0.271484375, -0.20196533203125, -0.1324462890625, -0.06292724609375, 0.006591796875, 0.07611083984375, 0.1456298828125, 0.21514892578125, 0.28466796875, 0.35418701171875, 0.4237060546875, 0.49322509765625, 0.562744140625, 0.63226318359375, 0.7017822265625, 0.77130126953125, 0.8408203125, 0.91033935546875, 0.9798583984375, 1.04937744140625, 1.118896484375, 1.18841552734375, 1.2579345703125, 1.32745361328125, 1.39697265625, 1.46649169921875, 1.5360107421875, 1.60552978515625, 1.675048828125, 1.74456787109375, 1.8140869140625, 1.88360595703125, 1.953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 6.0, 4.0, 2.0, 11.0, 11.0, 21.0, 13.0, 18.0, 20.0, 29.0, 34.0, 37.0, 38.0, 44.0, 59.0, 50.0, 53.0, 47.0, 46.0, 54.0, 48.0, 37.0, 47.0, 46.0, 29.0, 29.0, 26.0, 22.0, 22.0, 26.0, 12.0, 11.0, 7.0, 10.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.8997726440429688, -0.8654632568359375, -0.8311538696289062, -0.796844482421875, -0.7625350952148438, -0.7282257080078125, -0.6939163208007812, -0.65960693359375, -0.6252975463867188, -0.5909881591796875, -0.5566787719726562, -0.522369384765625, -0.48805999755859375, -0.4537506103515625, -0.41944122314453125, -0.3851318359375, -0.35082244873046875, -0.3165130615234375, -0.28220367431640625, -0.247894287109375, -0.21358489990234375, -0.1792755126953125, -0.14496612548828125, -0.11065673828125, -0.07634735107421875, -0.0420379638671875, -0.00772857666015625, 0.026580810546875, 0.06089019775390625, 0.0951995849609375, 0.12950897216796875, 0.163818359375, 0.19812774658203125, 0.2324371337890625, 0.26674652099609375, 0.301055908203125, 0.33536529541015625, 0.3696746826171875, 0.40398406982421875, 0.43829345703125, 0.47260284423828125, 0.5069122314453125, 0.5412216186523438, 0.575531005859375, 0.6098403930664062, 0.6441497802734375, 0.6784591674804688, 0.7127685546875, 0.7470779418945312, 0.7813873291015625, 0.8156967163085938, 0.850006103515625, 0.8843154907226562, 0.9186248779296875, 0.9529342651367188, 0.98724365234375, 1.0215530395507812, 1.0558624267578125, 1.0901718139648438, 1.124481201171875, 1.1587905883789062, 1.1930999755859375, 1.2274093627929688, 1.26171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 13.0, 6.0, 15.0, 28.0, 43.0, 54.0, 130.0, 187.0, 366.0, 985.0, 2796.0, 12259.0, 105854.0, 849691.0, 63280.0, 8988.0, 2275.0, 770.0, 337.0, 186.0, 79.0, 57.0, 38.0, 34.0, 14.0, 10.0, 14.0, 10.0, 2.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.626953125, -1.576751708984375, -1.52655029296875, -1.476348876953125, -1.4261474609375, -1.375946044921875, -1.32574462890625, -1.275543212890625, -1.225341796875, -1.175140380859375, -1.12493896484375, -1.074737548828125, -1.0245361328125, -0.974334716796875, -0.92413330078125, -0.873931884765625, -0.82373046875, -0.773529052734375, -0.72332763671875, -0.673126220703125, -0.6229248046875, -0.572723388671875, -0.52252197265625, -0.472320556640625, -0.422119140625, -0.371917724609375, -0.32171630859375, -0.271514892578125, -0.2213134765625, -0.171112060546875, -0.12091064453125, -0.070709228515625, -0.0205078125, 0.029693603515625, 0.07989501953125, 0.130096435546875, 0.1802978515625, 0.230499267578125, 0.28070068359375, 0.330902099609375, 0.381103515625, 0.431304931640625, 0.48150634765625, 0.531707763671875, 0.5819091796875, 0.632110595703125, 0.68231201171875, 0.732513427734375, 0.78271484375, 0.832916259765625, 0.88311767578125, 0.933319091796875, 0.9835205078125, 1.033721923828125, 1.08392333984375, 1.134124755859375, 1.184326171875, 1.234527587890625, 1.28472900390625, 1.334930419921875, 1.3851318359375, 1.435333251953125, 1.48553466796875, 1.535736083984375, 1.5859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 5.0, 14.0, 14.0, 28.0, 39.0, 58.0, 88.0, 146.0, 148.0, 124.0, 94.0, 68.0, 32.0, 34.0, 17.0, 9.0, 10.0, 7.0, 7.0, 5.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00021529197692871094, -0.00020903348922729492, -0.0002027750015258789, -0.0001965165138244629, -0.00019025802612304688, -0.00018399953842163086, -0.00017774105072021484, -0.00017148256301879883, -0.0001652240753173828, -0.0001589655876159668, -0.00015270709991455078, -0.00014644861221313477, -0.00014019012451171875, -0.00013393163681030273, -0.00012767314910888672, -0.0001214146614074707, -0.00011515617370605469, -0.00010889768600463867, -0.00010263919830322266, -9.638071060180664e-05, -9.012222290039062e-05, -8.386373519897461e-05, -7.76052474975586e-05, -7.134675979614258e-05, -6.508827209472656e-05, -5.882978439331055e-05, -5.257129669189453e-05, -4.6312808990478516e-05, -4.00543212890625e-05, -3.3795833587646484e-05, -2.753734588623047e-05, -2.1278858184814453e-05, -1.5020370483398438e-05, -8.761882781982422e-06, -2.5033950805664062e-06, 3.7550926208496094e-06, 1.0013580322265625e-05, 1.627206802368164e-05, 2.2530555725097656e-05, 2.8789043426513672e-05, 3.504753112792969e-05, 4.13060188293457e-05, 4.756450653076172e-05, 5.3822994232177734e-05, 6.008148193359375e-05, 6.633996963500977e-05, 7.259845733642578e-05, 7.88569450378418e-05, 8.511543273925781e-05, 9.137392044067383e-05, 9.763240814208984e-05, 0.00010389089584350586, 0.00011014938354492188, 0.00011640787124633789, 0.0001226663589477539, 0.00012892484664916992, 0.00013518333435058594, 0.00014144182205200195, 0.00014770030975341797, 0.00015395879745483398, 0.00016021728515625, 0.00016647577285766602, 0.00017273426055908203, 0.00017899274826049805, 0.00018525123596191406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 6.0, 7.0, 10.0, 12.0, 18.0, 25.0, 54.0, 88.0, 156.0, 268.0, 562.0, 1268.0, 4178.0, 25605.0, 810881.0, 188945.0, 11994.0, 2566.0, 926.0, 440.0, 238.0, 124.0, 56.0, 35.0, 31.0, 22.0, 13.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8056640625, -1.7383270263671875, -1.670989990234375, -1.6036529541015625, -1.53631591796875, -1.4689788818359375, -1.401641845703125, -1.3343048095703125, -1.2669677734375, -1.1996307373046875, -1.132293701171875, -1.0649566650390625, -0.99761962890625, -0.9302825927734375, -0.862945556640625, -0.7956085205078125, -0.728271484375, -0.6609344482421875, -0.593597412109375, -0.5262603759765625, -0.45892333984375, -0.3915863037109375, -0.324249267578125, -0.2569122314453125, -0.1895751953125, -0.1222381591796875, -0.054901123046875, 0.0124359130859375, 0.07977294921875, 0.1471099853515625, 0.214447021484375, 0.2817840576171875, 0.34912109375, 0.4164581298828125, 0.483795166015625, 0.5511322021484375, 0.61846923828125, 0.6858062744140625, 0.753143310546875, 0.8204803466796875, 0.8878173828125, 0.9551544189453125, 1.022491455078125, 1.0898284912109375, 1.15716552734375, 1.2245025634765625, 1.291839599609375, 1.3591766357421875, 1.426513671875, 1.4938507080078125, 1.561187744140625, 1.6285247802734375, 1.69586181640625, 1.7631988525390625, 1.830535888671875, 1.8978729248046875, 1.9652099609375, 2.0325469970703125, 2.099884033203125, 2.1672210693359375, 2.23455810546875, 2.3018951416015625, 2.369232177734375, 2.4365692138671875, 2.50390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 12.0, 19.0, 22.0, 34.0, 54.0, 73.0, 110.0, 180.0, 169.0, 128.0, 65.0, 36.0, 31.0, 19.0, 8.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0254898071289062, -0.9953155517578125, -0.9651412963867188, -0.934967041015625, -0.9047927856445312, -0.8746185302734375, -0.8444442749023438, -0.81427001953125, -0.7840957641601562, -0.7539215087890625, -0.7237472534179688, -0.693572998046875, -0.6633987426757812, -0.6332244873046875, -0.6030502319335938, -0.5728759765625, -0.5427017211914062, -0.5125274658203125, -0.48235321044921875, -0.452178955078125, -0.42200469970703125, -0.3918304443359375, -0.36165618896484375, -0.33148193359375, -0.30130767822265625, -0.2711334228515625, -0.24095916748046875, -0.210784912109375, -0.18061065673828125, -0.1504364013671875, -0.12026214599609375, -0.090087890625, -0.05991363525390625, -0.0297393798828125, 0.00043487548828125, 0.030609130859375, 0.06078338623046875, 0.0909576416015625, 0.12113189697265625, 0.15130615234375, 0.18148040771484375, 0.2116546630859375, 0.24182891845703125, 0.272003173828125, 0.30217742919921875, 0.3323516845703125, 0.36252593994140625, 0.3927001953125, 0.42287445068359375, 0.4530487060546875, 0.48322296142578125, 0.513397216796875, 0.5435714721679688, 0.5737457275390625, 0.6039199829101562, 0.63409423828125, 0.6642684936523438, 0.6944427490234375, 0.7246170043945312, 0.754791259765625, 0.7849655151367188, 0.8151397705078125, 0.8453140258789062, 0.87548828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 11.0, 14.0, 30.0, 51.0, 115.0, 183.0, 218.0, 175.0, 100.0, 44.0, 25.0, 22.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.00187873840332, -7.482860565185547, -6.963841915130615, -6.444823265075684, -5.92580509185791, -5.406786918640137, -4.887768268585205, -4.368749618530273, -3.8497314453125, -3.3307130336761475, -2.811694622039795, -2.2926762104034424, -1.7736577987670898, -1.2546393871307373, -0.7356209754943848, -0.21660256385803223, 0.3024158477783203, 0.8214342594146729, 1.3404526710510254, 1.859471082687378, 2.3784894943237305, 2.897507905960083, 3.4165263175964355, 3.935544729232788, 4.454563140869141, 4.973581314086914, 5.492599964141846, 6.011618614196777, 6.530636787414551, 7.049654960632324, 7.568673610687256, 8.087692260742188, 8.606710433959961, 9.125728607177734, 9.644746780395508, 10.163765907287598, 10.682784080505371, 11.201802253723145, 11.720821380615234, 12.239839553833008, 12.758857727050781, 13.277875900268555, 13.796894073486328, 14.315913200378418, 14.834931373596191, 15.353949546813965, 15.872968673706055, 16.391986846923828, 16.9110050201416, 17.430023193359375, 17.94904136657715, 18.468059539794922, 18.987079620361328, 19.5060977935791, 20.025115966796875, 20.54413414001465, 21.063152313232422, 21.582170486450195, 22.10118865966797, 22.620206832885742, 23.139225006103516, 23.658245086669922, 24.177263259887695, 24.69628143310547, 25.215299606323242]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 14.0, 10.0, 14.0, 14.0, 20.0, 20.0, 25.0, 28.0, 34.0, 52.0, 50.0, 54.0, 52.0, 66.0, 48.0, 57.0, 63.0, 43.0, 55.0, 48.0, 37.0, 35.0, 27.0, 27.0, 21.0, 18.0, 14.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04636287689209, -5.812415599822998, -5.578468322753906, -5.344521522521973, -5.110574245452881, -4.876626968383789, -4.642679691314697, -4.4087324142456055, -4.174785137176514, -3.940837860107422, -3.706890821456909, -3.4729435443878174, -3.2389962673187256, -3.005049228668213, -2.771101951599121, -2.5371546745300293, -2.3032076358795166, -2.069260358810425, -1.8353132009506226, -1.6013660430908203, -1.3674187660217285, -1.1334716081619263, -0.899524450302124, -0.6655771732330322, -0.43163001537323, -0.19768281280994415, 0.036264389753341675, 0.2702115774154663, 0.5041587948799133, 0.7381060123443604, 0.9720531702041626, 1.2060004472732544, 1.4399476051330566, 1.6738947629928589, 1.9078420400619507, 2.141789197921753, 2.3757364749908447, 2.6096835136413574, 2.843630790710449, 3.077578067779541, 3.311525344848633, 3.5454726219177246, 3.7794196605682373, 4.01336669921875, 4.247313976287842, 4.481261253356934, 4.715208530426025, 4.949155807495117, 5.183102607727051, 5.417049884796143, 5.650997161865234, 5.884943962097168, 6.11889123916626, 6.352838516235352, 6.586785793304443, 6.820733070373535, 7.054680347442627, 7.288627624511719, 7.5225749015808105, 7.756522178649902, 7.990468978881836, 8.224416732788086, 8.45836353302002, 8.692310333251953, 8.926258087158203]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 19.0, 30.0, 48.0, 98.0, 186.0, 409.0, 896.0, 2451.0, 9659.0, 66338.0, 3995051.0, 101035.0, 12961.0, 2810.0, 973.0, 439.0, 276.0, 179.0, 113.0, 71.0, 68.0, 38.0, 43.0, 23.0, 16.0, 15.0, 13.0, 4.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.268463134765625, -3.11700439453125, -2.965545654296875, -2.8140869140625, -2.662628173828125, -2.51116943359375, -2.359710693359375, -2.208251953125, -2.056793212890625, -1.90533447265625, -1.753875732421875, -1.6024169921875, -1.450958251953125, -1.29949951171875, -1.148040771484375, -0.99658203125, -0.845123291015625, -0.69366455078125, -0.542205810546875, -0.3907470703125, -0.239288330078125, -0.08782958984375, 0.063629150390625, 0.215087890625, 0.366546630859375, 0.51800537109375, 0.669464111328125, 0.8209228515625, 0.972381591796875, 1.12384033203125, 1.275299072265625, 1.4267578125, 1.578216552734375, 1.72967529296875, 1.881134033203125, 2.0325927734375, 2.184051513671875, 2.33551025390625, 2.486968994140625, 2.638427734375, 2.789886474609375, 2.94134521484375, 3.092803955078125, 3.2442626953125, 3.395721435546875, 3.54718017578125, 3.698638916015625, 3.85009765625, 4.001556396484375, 4.15301513671875, 4.304473876953125, 4.4559326171875, 4.607391357421875, 4.75885009765625, 4.910308837890625, 5.061767578125, 5.213226318359375, 5.36468505859375, 5.516143798828125, 5.6676025390625, 5.819061279296875, 5.97052001953125, 6.121978759765625, 6.2734375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 4.0, 7.0, 12.0, 30.0, 42.0, 49.0, 59.0, 84.0, 95.0, 94.0, 95.0, 90.0, 78.0, 61.0, 55.0, 37.0, 18.0, 27.0, 13.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.2740287780761719, -0.26216888427734375, -0.2503089904785156, -0.2384490966796875, -0.22658920288085938, -0.21472930908203125, -0.20286941528320312, -0.191009521484375, -0.17914962768554688, -0.16728973388671875, -0.15542984008789062, -0.1435699462890625, -0.13171005249023438, -0.11985015869140625, -0.10799026489257812, -0.09613037109375, -0.08427047729492188, -0.07241058349609375, -0.060550689697265625, -0.0486907958984375, -0.036830902099609375, -0.02497100830078125, -0.013111114501953125, -0.001251220703125, 0.010608673095703125, 0.02246856689453125, 0.034328460693359375, 0.0461883544921875, 0.058048248291015625, 0.06990814208984375, 0.08176803588867188, 0.0936279296875, 0.10548782348632812, 0.11734771728515625, 0.12920761108398438, 0.1410675048828125, 0.15292739868164062, 0.16478729248046875, 0.17664718627929688, 0.188507080078125, 0.20036697387695312, 0.21222686767578125, 0.22408676147460938, 0.2359466552734375, 0.24780654907226562, 0.25966644287109375, 0.2715263366699219, 0.28338623046875, 0.2952461242675781, 0.30710601806640625, 0.3189659118652344, 0.3308258056640625, 0.3426856994628906, 0.35454559326171875, 0.3664054870605469, 0.378265380859375, 0.3901252746582031, 0.40198516845703125, 0.4138450622558594, 0.4257049560546875, 0.4375648498535156, 0.44942474365234375, 0.4612846374511719, 0.47314453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 11.0, 15.0, 14.0, 36.0, 73.0, 107.0, 153.0, 288.0, 558.0, 1192.0, 2903.0, 9605.0, 49739.0, 3809965.0, 287198.0, 22373.0, 5702.0, 2110.0, 985.0, 499.0, 274.0, 168.0, 95.0, 53.0, 49.0, 22.0, 24.0, 17.0, 5.0, 9.0, 4.0, 4.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.609375, -5.464752197265625, -5.32012939453125, -5.175506591796875, -5.0308837890625, -4.886260986328125, -4.74163818359375, -4.597015380859375, -4.452392578125, -4.307769775390625, -4.16314697265625, -4.018524169921875, -3.8739013671875, -3.729278564453125, -3.58465576171875, -3.440032958984375, -3.29541015625, -3.150787353515625, -3.00616455078125, -2.861541748046875, -2.7169189453125, -2.572296142578125, -2.42767333984375, -2.283050537109375, -2.138427734375, -1.993804931640625, -1.84918212890625, -1.704559326171875, -1.5599365234375, -1.415313720703125, -1.27069091796875, -1.126068115234375, -0.9814453125, -0.836822509765625, -0.69219970703125, -0.547576904296875, -0.4029541015625, -0.258331298828125, -0.11370849609375, 0.030914306640625, 0.175537109375, 0.320159912109375, 0.46478271484375, 0.609405517578125, 0.7540283203125, 0.898651123046875, 1.04327392578125, 1.187896728515625, 1.33251953125, 1.477142333984375, 1.62176513671875, 1.766387939453125, 1.9110107421875, 2.055633544921875, 2.20025634765625, 2.344879150390625, 2.489501953125, 2.634124755859375, 2.77874755859375, 2.923370361328125, 3.0679931640625, 3.212615966796875, 3.35723876953125, 3.501861572265625, 3.646484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 11.0, 18.0, 14.0, 24.0, 23.0, 49.0, 89.0, 180.0, 540.0, 2022.0, 665.0, 171.0, 72.0, 52.0, 34.0, 26.0, 25.0, 7.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.994140625, -0.9593353271484375, -0.924530029296875, -0.8897247314453125, -0.85491943359375, -0.8201141357421875, -0.785308837890625, -0.7505035400390625, -0.7156982421875, -0.6808929443359375, -0.646087646484375, -0.6112823486328125, -0.57647705078125, -0.5416717529296875, -0.506866455078125, -0.4720611572265625, -0.437255859375, -0.4024505615234375, -0.367645263671875, -0.3328399658203125, -0.29803466796875, -0.2632293701171875, -0.228424072265625, -0.1936187744140625, -0.1588134765625, -0.1240081787109375, -0.089202880859375, -0.0543975830078125, -0.01959228515625, 0.0152130126953125, 0.050018310546875, 0.0848236083984375, 0.11962890625, 0.1544342041015625, 0.189239501953125, 0.2240447998046875, 0.25885009765625, 0.2936553955078125, 0.328460693359375, 0.3632659912109375, 0.3980712890625, 0.4328765869140625, 0.467681884765625, 0.5024871826171875, 0.53729248046875, 0.5720977783203125, 0.606903076171875, 0.6417083740234375, 0.676513671875, 0.7113189697265625, 0.746124267578125, 0.7809295654296875, 0.81573486328125, 0.8505401611328125, 0.885345458984375, 0.9201507568359375, 0.9549560546875, 0.9897613525390625, 1.024566650390625, 1.0593719482421875, 1.09417724609375, 1.1289825439453125, 1.163787841796875, 1.1985931396484375, 1.2333984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 12.0, 18.0, 74.0, 229.0, 434.0, 180.0, 43.0, 9.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.375373363494873, -6.826822280883789, -6.278271675109863, -5.729720592498779, -5.181169509887695, -4.6326189041137695, -4.0840678215026855, -3.5355169773101807, -2.986966133117676, -2.438415288925171, -1.8898643255233765, -1.341313362121582, -0.7927625179290771, -0.24421167373657227, 0.3043394088745117, 0.8528902530670166, 1.4014410972595215, 1.9499919414520264, 2.4985427856445312, 3.0470938682556152, 3.59564471244812, 4.144195556640625, 4.692746639251709, 5.241297721862793, 5.789848327636719, 6.338399410247803, 6.8869500160217285, 7.4355010986328125, 7.984051704406738, 8.532602310180664, 9.081153869628906, 9.629704475402832, 10.17825698852539, 10.726807594299316, 11.275359153747559, 11.823909759521484, 12.37246036529541, 12.921010971069336, 13.469562530517578, 14.018113136291504, 14.56666374206543, 15.115214347839355, 15.663765907287598, 16.212316513061523, 16.760868072509766, 17.309417724609375, 17.857969284057617, 18.40652084350586, 18.95507049560547, 19.50362205505371, 20.05217170715332, 20.600723266601562, 21.149274826049805, 21.697824478149414, 22.246376037597656, 22.7949275970459, 23.34347915649414, 23.892030715942383, 24.440580368041992, 24.989131927490234, 25.537683486938477, 26.086233139038086, 26.634784698486328, 27.18333625793457, 27.73188591003418]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 11.0, 12.0, 10.0, 15.0, 48.0, 60.0, 72.0, 82.0, 106.0, 90.0, 105.0, 88.0, 76.0, 53.0, 50.0, 31.0, 40.0, 29.0, 14.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.436782360076904, -6.256065845489502, -6.0753493309021, -5.8946332931518555, -5.713916778564453, -5.533200263977051, -5.352483749389648, -5.171767234802246, -4.991050720214844, -4.810334205627441, -4.629617691040039, -4.448901176452637, -4.268185138702393, -4.08746862411499, -3.906752109527588, -3.7260355949401855, -3.5453195571899414, -3.364603042602539, -3.183886766433716, -3.0031702518463135, -2.8224539756774902, -2.641737461090088, -2.4610209465026855, -2.280304431915283, -2.09958815574646, -1.9188717603683472, -1.7381553649902344, -1.557438850402832, -1.3767224550247192, -1.1960060596466064, -1.015289545059204, -0.8345731496810913, -0.6538572311401367, -0.47314080595970154, -0.29242438077926636, -0.11170792579650879, 0.069008469581604, 0.2497248649597168, 0.43044137954711914, 0.6111577749252319, 0.7918741703033447, 0.9725905656814575, 1.1533069610595703, 1.3340234756469727, 1.5147398710250854, 1.6954562664031982, 1.8761727809906006, 2.056889057159424, 2.237605571746826, 2.4183220863342285, 2.5990383625030518, 2.779754877090454, 2.9604711532592773, 3.1411876678466797, 3.321904182434082, 3.5026206970214844, 3.6833369731903076, 3.86405348777771, 4.044769763946533, 4.2254862785339355, 4.406202793121338, 4.586918830871582, 4.767635345458984, 4.948351860046387, 5.129068374633789]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 1.0, 6.0, 13.0, 15.0, 12.0, 16.0, 27.0, 46.0, 53.0, 99.0, 124.0, 187.0, 306.0, 526.0, 1057.0, 2356.0, 6631.0, 29248.0, 271570.0, 640698.0, 76078.0, 12449.0, 3698.0, 1515.0, 735.0, 365.0, 241.0, 144.0, 117.0, 63.0, 46.0, 28.0, 24.0, 13.0, 17.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.189453125, -3.09051513671875, -2.9915771484375, -2.89263916015625, -2.793701171875, -2.69476318359375, -2.5958251953125, -2.49688720703125, -2.39794921875, -2.29901123046875, -2.2000732421875, -2.10113525390625, -2.002197265625, -1.90325927734375, -1.8043212890625, -1.70538330078125, -1.6064453125, -1.50750732421875, -1.4085693359375, -1.30963134765625, -1.210693359375, -1.11175537109375, -1.0128173828125, -0.91387939453125, -0.81494140625, -0.71600341796875, -0.6170654296875, -0.51812744140625, -0.419189453125, -0.32025146484375, -0.2213134765625, -0.12237548828125, -0.0234375, 0.07550048828125, 0.1744384765625, 0.27337646484375, 0.372314453125, 0.47125244140625, 0.5701904296875, 0.66912841796875, 0.76806640625, 0.86700439453125, 0.9659423828125, 1.06488037109375, 1.163818359375, 1.26275634765625, 1.3616943359375, 1.46063232421875, 1.5595703125, 1.65850830078125, 1.7574462890625, 1.85638427734375, 1.955322265625, 2.05426025390625, 2.1531982421875, 2.25213623046875, 2.35107421875, 2.45001220703125, 2.5489501953125, 2.64788818359375, 2.746826171875, 2.84576416015625, 2.9447021484375, 3.04364013671875, 3.142578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 14.0, 14.0, 21.0, 35.0, 47.0, 95.0, 116.0, 122.0, 122.0, 100.0, 95.0, 82.0, 36.0, 32.0, 27.0, 14.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.463623046875, -0.447265625, -0.430908203125, -0.41455078125, -0.398193359375, -0.3818359375, -0.365478515625, -0.34912109375, -0.332763671875, -0.31640625, -0.300048828125, -0.28369140625, -0.267333984375, -0.2509765625, -0.234619140625, -0.21826171875, -0.201904296875, -0.185546875, -0.169189453125, -0.15283203125, -0.136474609375, -0.1201171875, -0.103759765625, -0.08740234375, -0.071044921875, -0.0546875, -0.038330078125, -0.02197265625, -0.005615234375, 0.0107421875, 0.027099609375, 0.04345703125, 0.059814453125, 0.076171875, 0.092529296875, 0.10888671875, 0.125244140625, 0.1416015625, 0.157958984375, 0.17431640625, 0.190673828125, 0.20703125, 0.223388671875, 0.23974609375, 0.256103515625, 0.2724609375, 0.288818359375, 0.30517578125, 0.321533203125, 0.337890625, 0.354248046875, 0.37060546875, 0.386962890625, 0.4033203125, 0.419677734375, 0.43603515625, 0.452392578125, 0.46875, 0.485107421875, 0.50146484375, 0.517822265625, 0.5341796875, 0.550537109375, 0.56689453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 12.0, 19.0, 21.0, 36.0, 36.0, 74.0, 85.0, 139.0, 185.0, 292.0, 519.0, 862.0, 1605.0, 3193.0, 6824.0, 16420.0, 42460.0, 117174.0, 295449.0, 332344.0, 143017.0, 51696.0, 19660.0, 8194.0, 3741.0, 1745.0, 1041.0, 552.0, 358.0, 231.0, 162.0, 110.0, 80.0, 54.0, 40.0, 22.0, 25.0, 11.0, 11.0, 11.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0888671875, -1.0526885986328125, -1.016510009765625, -0.9803314208984375, -0.94415283203125, -0.9079742431640625, -0.871795654296875, -0.8356170654296875, -0.7994384765625, -0.7632598876953125, -0.727081298828125, -0.6909027099609375, -0.65472412109375, -0.6185455322265625, -0.582366943359375, -0.5461883544921875, -0.510009765625, -0.4738311767578125, -0.437652587890625, -0.4014739990234375, -0.36529541015625, -0.3291168212890625, -0.292938232421875, -0.2567596435546875, -0.2205810546875, -0.1844024658203125, -0.148223876953125, -0.1120452880859375, -0.07586669921875, -0.0396881103515625, -0.003509521484375, 0.0326690673828125, 0.06884765625, 0.1050262451171875, 0.141204833984375, 0.1773834228515625, 0.21356201171875, 0.2497406005859375, 0.285919189453125, 0.3220977783203125, 0.3582763671875, 0.3944549560546875, 0.430633544921875, 0.4668121337890625, 0.50299072265625, 0.5391693115234375, 0.575347900390625, 0.6115264892578125, 0.647705078125, 0.6838836669921875, 0.720062255859375, 0.7562408447265625, 0.79241943359375, 0.8285980224609375, 0.864776611328125, 0.9009552001953125, 0.9371337890625, 0.9733123779296875, 1.009490966796875, 1.0456695556640625, 1.08184814453125, 1.1180267333984375, 1.154205322265625, 1.1903839111328125, 1.2265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 7.0, 14.0, 16.0, 9.0, 22.0, 20.0, 30.0, 34.0, 29.0, 49.0, 37.0, 43.0, 39.0, 40.0, 50.0, 55.0, 61.0, 40.0, 38.0, 41.0, 45.0, 17.0, 34.0, 33.0, 28.0, 24.0, 17.0, 15.0, 22.0, 15.0, 7.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1015625, -1.0679168701171875, -1.034271240234375, -1.0006256103515625, -0.96697998046875, -0.9333343505859375, -0.899688720703125, -0.8660430908203125, -0.8323974609375, -0.7987518310546875, -0.765106201171875, -0.7314605712890625, -0.69781494140625, -0.6641693115234375, -0.630523681640625, -0.5968780517578125, -0.563232421875, -0.5295867919921875, -0.495941162109375, -0.4622955322265625, -0.42864990234375, -0.3950042724609375, -0.361358642578125, -0.3277130126953125, -0.2940673828125, -0.2604217529296875, -0.226776123046875, -0.1931304931640625, -0.15948486328125, -0.1258392333984375, -0.092193603515625, -0.0585479736328125, -0.02490234375, 0.0087432861328125, 0.042388916015625, 0.0760345458984375, 0.10968017578125, 0.1433258056640625, 0.176971435546875, 0.2106170654296875, 0.2442626953125, 0.2779083251953125, 0.311553955078125, 0.3451995849609375, 0.37884521484375, 0.4124908447265625, 0.446136474609375, 0.4797821044921875, 0.513427734375, 0.5470733642578125, 0.580718994140625, 0.6143646240234375, 0.64801025390625, 0.6816558837890625, 0.715301513671875, 0.7489471435546875, 0.7825927734375, 0.8162384033203125, 0.849884033203125, 0.8835296630859375, 0.91717529296875, 0.9508209228515625, 0.984466552734375, 1.0181121826171875, 1.0517578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 4.0, 10.0, 12.0, 14.0, 40.0, 47.0, 70.0, 119.0, 180.0, 338.0, 627.0, 1230.0, 2664.0, 6608.0, 20800.0, 102768.0, 661638.0, 203922.0, 31487.0, 9148.0, 3544.0, 1503.0, 741.0, 392.0, 239.0, 156.0, 78.0, 47.0, 27.0, 39.0, 15.0, 7.0, 11.0, 11.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.036590576171875, -1.00384521484375, -0.971099853515625, -0.9383544921875, -0.905609130859375, -0.87286376953125, -0.840118408203125, -0.807373046875, -0.774627685546875, -0.74188232421875, -0.709136962890625, -0.6763916015625, -0.643646240234375, -0.61090087890625, -0.578155517578125, -0.54541015625, -0.512664794921875, -0.47991943359375, -0.447174072265625, -0.4144287109375, -0.381683349609375, -0.34893798828125, -0.316192626953125, -0.283447265625, -0.250701904296875, -0.21795654296875, -0.185211181640625, -0.1524658203125, -0.119720458984375, -0.08697509765625, -0.054229736328125, -0.021484375, 0.011260986328125, 0.04400634765625, 0.076751708984375, 0.1094970703125, 0.142242431640625, 0.17498779296875, 0.207733154296875, 0.240478515625, 0.273223876953125, 0.30596923828125, 0.338714599609375, 0.3714599609375, 0.404205322265625, 0.43695068359375, 0.469696044921875, 0.50244140625, 0.535186767578125, 0.56793212890625, 0.600677490234375, 0.6334228515625, 0.666168212890625, 0.69891357421875, 0.731658935546875, 0.764404296875, 0.797149658203125, 0.82989501953125, 0.862640380859375, 0.8953857421875, 0.928131103515625, 0.96087646484375, 0.993621826171875, 1.0263671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 12.0, 11.0, 21.0, 21.0, 31.0, 49.0, 69.0, 77.0, 127.0, 142.0, 101.0, 80.0, 49.0, 54.0, 25.0, 25.0, 13.0, 12.0, 14.0, 10.0, 10.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001386404037475586, -0.00013392791152000427, -0.00012921541929244995, -0.00012450292706489563, -0.00011979043483734131, -0.00011507794260978699, -0.00011036545038223267, -0.00010565295815467834, -0.00010094046592712402, -9.62279736995697e-05, -9.151548147201538e-05, -8.680298924446106e-05, -8.209049701690674e-05, -7.737800478935242e-05, -7.26655125617981e-05, -6.795302033424377e-05, -6.324052810668945e-05, -5.852803587913513e-05, -5.381554365158081e-05, -4.910305142402649e-05, -4.439055919647217e-05, -3.967806696891785e-05, -3.4965574741363525e-05, -3.0253082513809204e-05, -2.5540590286254883e-05, -2.082809805870056e-05, -1.611560583114624e-05, -1.1403113603591919e-05, -6.690621376037598e-06, -1.9781291484832764e-06, 2.734363079071045e-06, 7.446855306625366e-06, 1.2159347534179688e-05, 1.687183976173401e-05, 2.158433198928833e-05, 2.629682421684265e-05, 3.100931644439697e-05, 3.5721808671951294e-05, 4.0434300899505615e-05, 4.5146793127059937e-05, 4.985928535461426e-05, 5.457177758216858e-05, 5.92842698097229e-05, 6.399676203727722e-05, 6.870925426483154e-05, 7.342174649238586e-05, 7.813423871994019e-05, 8.284673094749451e-05, 8.755922317504883e-05, 9.227171540260315e-05, 9.698420763015747e-05, 0.00010169669985771179, 0.00010640919208526611, 0.00011112168431282043, 0.00011583417654037476, 0.00012054666876792908, 0.0001252591609954834, 0.00012997165322303772, 0.00013468414545059204, 0.00013939663767814636, 0.00014410912990570068, 0.000148821622133255, 0.00015353411436080933, 0.00015824660658836365, 0.00016295909881591797]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 15.0, 8.0, 21.0, 39.0, 68.0, 126.0, 258.0, 570.0, 1640.0, 5671.0, 30867.0, 754638.0, 233066.0, 16004.0, 3560.0, 1085.0, 457.0, 192.0, 109.0, 44.0, 43.0, 23.0, 10.0, 9.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.19677734375, -2.1318359375, -2.06689453125, -2.001953125, -1.93701171875, -1.8720703125, -1.80712890625, -1.7421875, -1.67724609375, -1.6123046875, -1.54736328125, -1.482421875, -1.41748046875, -1.3525390625, -1.28759765625, -1.22265625, -1.15771484375, -1.0927734375, -1.02783203125, -0.962890625, -0.89794921875, -0.8330078125, -0.76806640625, -0.703125, -0.63818359375, -0.5732421875, -0.50830078125, -0.443359375, -0.37841796875, -0.3134765625, -0.24853515625, -0.18359375, -0.11865234375, -0.0537109375, 0.01123046875, 0.076171875, 0.14111328125, 0.2060546875, 0.27099609375, 0.3359375, 0.40087890625, 0.4658203125, 0.53076171875, 0.595703125, 0.66064453125, 0.7255859375, 0.79052734375, 0.85546875, 0.92041015625, 0.9853515625, 1.05029296875, 1.115234375, 1.18017578125, 1.2451171875, 1.31005859375, 1.375, 1.43994140625, 1.5048828125, 1.56982421875, 1.634765625, 1.69970703125, 1.7646484375, 1.82958984375, 1.89453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 12.0, 7.0, 10.0, 15.0, 14.0, 12.0, 14.0, 29.0, 55.0, 76.0, 100.0, 127.0, 143.0, 125.0, 78.0, 47.0, 40.0, 26.0, 17.0, 16.0, 6.0, 4.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91162109375, -0.8832244873046875, -0.854827880859375, -0.8264312744140625, -0.79803466796875, -0.7696380615234375, -0.741241455078125, -0.7128448486328125, -0.6844482421875, -0.6560516357421875, -0.627655029296875, -0.5992584228515625, -0.57086181640625, -0.5424652099609375, -0.514068603515625, -0.4856719970703125, -0.457275390625, -0.4288787841796875, -0.400482177734375, -0.3720855712890625, -0.34368896484375, -0.3152923583984375, -0.286895751953125, -0.2584991455078125, -0.2301025390625, -0.2017059326171875, -0.173309326171875, -0.1449127197265625, -0.11651611328125, -0.0881195068359375, -0.059722900390625, -0.0313262939453125, -0.0029296875, 0.0254669189453125, 0.053863525390625, 0.0822601318359375, 0.11065673828125, 0.1390533447265625, 0.167449951171875, 0.1958465576171875, 0.2242431640625, 0.2526397705078125, 0.281036376953125, 0.3094329833984375, 0.33782958984375, 0.3662261962890625, 0.394622802734375, 0.4230194091796875, 0.451416015625, 0.4798126220703125, 0.508209228515625, 0.5366058349609375, 0.56500244140625, 0.5933990478515625, 0.621795654296875, 0.6501922607421875, 0.6785888671875, 0.7069854736328125, 0.735382080078125, 0.7637786865234375, 0.79217529296875, 0.8205718994140625, 0.848968505859375, 0.8773651123046875, 0.90576171875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 10.0, 23.0, 32.0, 40.0, 59.0, 113.0, 111.0, 144.0, 141.0, 117.0, 79.0, 38.0, 36.0, 20.0, 7.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.018125534057617, -12.676589012145996, -12.335051536560059, -11.993515014648438, -11.651978492736816, -11.310441970825195, -10.968904495239258, -10.627367973327637, -10.285831451416016, -9.944294929504395, -9.602757453918457, -9.261220932006836, -8.919684410095215, -8.578147888183594, -8.236610412597656, -7.895073890686035, -7.553536415100098, -7.211999416351318, -6.870462894439697, -6.528925895690918, -6.187389373779297, -5.845852375030518, -5.504315376281738, -5.162778854370117, -4.821241855621338, -4.479704856872559, -4.1381683349609375, -3.796631336212158, -3.455094575881958, -3.113557815551758, -2.7720208168029785, -2.4304840564727783, -2.0889463424682617, -1.7474095821380615, -1.4058727025985718, -1.064335823059082, -0.7227990627288818, -0.38126230239868164, -0.039725303649902344, 0.30181145668029785, 0.643348217010498, 0.984885036945343, 1.326421856880188, 1.6679587364196777, 2.009495496749878, 2.351032257080078, 2.6925692558288574, 3.0341060161590576, 3.375642776489258, 3.717179536819458, 4.058716297149658, 4.4002532958984375, 4.741789817810059, 5.083326816558838, 5.424863815307617, 5.766400337219238, 6.107937335968018, 6.449474334716797, 6.791010856628418, 7.132547855377197, 7.474084854125977, 7.815621376037598, 8.157157897949219, 8.498695373535156, 8.840231895446777]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 11.0, 13.0, 12.0, 12.0, 22.0, 17.0, 28.0, 15.0, 24.0, 16.0, 23.0, 27.0, 32.0, 31.0, 31.0, 43.0, 31.0, 35.0, 46.0, 36.0, 29.0, 48.0, 34.0, 38.0, 33.0, 40.0, 27.0, 33.0, 24.0, 32.0, 21.0, 22.0, 21.0, 13.0, 8.0, 11.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.346571445465088, -5.179823875427246, -5.013076305389404, -4.8463287353515625, -4.679581165313721, -4.512833595275879, -4.346086025238037, -4.179338455200195, -4.0125908851623535, -3.8458433151245117, -3.67909574508667, -3.512348175048828, -3.3456006050109863, -3.1788530349731445, -3.0121054649353027, -2.845357894897461, -2.678610324859619, -2.5118627548217773, -2.3451151847839355, -2.1783676147460938, -2.011620044708252, -1.8448724746704102, -1.6781249046325684, -1.5113773345947266, -1.3446297645568848, -1.177882194519043, -1.0111346244812012, -0.8443870544433594, -0.6776394844055176, -0.5108919143676758, -0.344144344329834, -0.1773967742919922, -0.010649681091308594, 0.1560978889465332, 0.322845458984375, 0.4895930290222168, 0.6563405990600586, 0.8230881690979004, 0.9898357391357422, 1.156583309173584, 1.3233308792114258, 1.4900784492492676, 1.6568260192871094, 1.8235735893249512, 1.990321159362793, 2.1570687294006348, 2.3238162994384766, 2.4905638694763184, 2.65731143951416, 2.824059009552002, 2.9908065795898438, 3.1575541496276855, 3.3243017196655273, 3.491049289703369, 3.657796859741211, 3.8245444297790527, 3.9912919998168945, 4.158039569854736, 4.324787139892578, 4.49153470993042, 4.658282279968262, 4.8250298500061035, 4.991777420043945, 5.158524990081787, 5.325272560119629]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 7.0, 8.0, 6.0, 10.0, 8.0, 22.0, 22.0, 34.0, 82.0, 138.0, 338.0, 925.0, 3384.0, 19195.0, 3827233.0, 326171.0, 12301.0, 2553.0, 831.0, 365.0, 197.0, 122.0, 83.0, 61.0, 37.0, 35.0, 26.0, 22.0, 21.0, 13.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.37109375, -5.212646484375, -5.05419921875, -4.895751953125, -4.7373046875, -4.578857421875, -4.42041015625, -4.261962890625, -4.103515625, -3.945068359375, -3.78662109375, -3.628173828125, -3.4697265625, -3.311279296875, -3.15283203125, -2.994384765625, -2.8359375, -2.677490234375, -2.51904296875, -2.360595703125, -2.2021484375, -2.043701171875, -1.88525390625, -1.726806640625, -1.568359375, -1.409912109375, -1.25146484375, -1.093017578125, -0.9345703125, -0.776123046875, -0.61767578125, -0.459228515625, -0.30078125, -0.142333984375, 0.01611328125, 0.174560546875, 0.3330078125, 0.491455078125, 0.64990234375, 0.808349609375, 0.966796875, 1.125244140625, 1.28369140625, 1.442138671875, 1.6005859375, 1.759033203125, 1.91748046875, 2.075927734375, 2.234375, 2.392822265625, 2.55126953125, 2.709716796875, 2.8681640625, 3.026611328125, 3.18505859375, 3.343505859375, 3.501953125, 3.660400390625, 3.81884765625, 3.977294921875, 4.1357421875, 4.294189453125, 4.45263671875, 4.611083984375, 4.76953125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 11.0, 29.0, 33.0, 56.0, 68.0, 89.0, 103.0, 108.0, 84.0, 112.0, 76.0, 77.0, 42.0, 37.0, 23.0, 11.0, 11.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448486328125, -0.4330406188964844, -0.41759490966796875, -0.4021492004394531, -0.3867034912109375, -0.3712577819824219, -0.35581207275390625, -0.3403663635253906, -0.324920654296875, -0.3094749450683594, -0.29402923583984375, -0.2785835266113281, -0.2631378173828125, -0.24769210815429688, -0.23224639892578125, -0.21680068969726562, -0.20135498046875, -0.18590927124023438, -0.17046356201171875, -0.15501785278320312, -0.1395721435546875, -0.12412643432617188, -0.10868072509765625, -0.09323501586914062, -0.077789306640625, -0.062343597412109375, -0.04689788818359375, -0.031452178955078125, -0.0160064697265625, -0.000560760498046875, 0.01488494873046875, 0.030330657958984375, 0.0457763671875, 0.061222076416015625, 0.07666778564453125, 0.09211349487304688, 0.1075592041015625, 0.12300491333007812, 0.13845062255859375, 0.15389633178710938, 0.169342041015625, 0.18478775024414062, 0.20023345947265625, 0.21567916870117188, 0.2311248779296875, 0.24657058715820312, 0.26201629638671875, 0.2774620056152344, 0.29290771484375, 0.3083534240722656, 0.32379913330078125, 0.3392448425292969, 0.3546905517578125, 0.3701362609863281, 0.38558197021484375, 0.4010276794433594, 0.416473388671875, 0.4319190979003906, 0.44736480712890625, 0.4628105163574219, 0.4782562255859375, 0.4937019348144531, 0.5091476440429688, 0.5245933532714844, 0.5400390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 13.0, 27.0, 44.0, 59.0, 124.0, 236.0, 410.0, 772.0, 1561.0, 3212.0, 7509.0, 21593.0, 123156.0, 3807792.0, 186433.0, 25979.0, 8326.0, 3542.0, 1641.0, 801.0, 424.0, 258.0, 137.0, 71.0, 47.0, 32.0, 28.0, 7.0, 12.0, 7.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4921875, -2.42010498046875, -2.3480224609375, -2.27593994140625, -2.203857421875, -2.13177490234375, -2.0596923828125, -1.98760986328125, -1.91552734375, -1.84344482421875, -1.7713623046875, -1.69927978515625, -1.627197265625, -1.55511474609375, -1.4830322265625, -1.41094970703125, -1.3388671875, -1.26678466796875, -1.1947021484375, -1.12261962890625, -1.050537109375, -0.97845458984375, -0.9063720703125, -0.83428955078125, -0.76220703125, -0.69012451171875, -0.6180419921875, -0.54595947265625, -0.473876953125, -0.40179443359375, -0.3297119140625, -0.25762939453125, -0.185546875, -0.11346435546875, -0.0413818359375, 0.03070068359375, 0.102783203125, 0.17486572265625, 0.2469482421875, 0.31903076171875, 0.39111328125, 0.46319580078125, 0.5352783203125, 0.60736083984375, 0.679443359375, 0.75152587890625, 0.8236083984375, 0.89569091796875, 0.9677734375, 1.03985595703125, 1.1119384765625, 1.18402099609375, 1.256103515625, 1.32818603515625, 1.4002685546875, 1.47235107421875, 1.54443359375, 1.61651611328125, 1.6885986328125, 1.76068115234375, 1.832763671875, 1.90484619140625, 1.9769287109375, 2.04901123046875, 2.12109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 3.0, 5.0, 7.0, 5.0, 5.0, 12.0, 10.0, 19.0, 18.0, 24.0, 46.0, 77.0, 135.0, 290.0, 1064.0, 1585.0, 337.0, 168.0, 92.0, 47.0, 23.0, 22.0, 14.0, 8.0, 8.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.57568359375, -0.5565567016601562, -0.5374298095703125, -0.5183029174804688, -0.499176025390625, -0.48004913330078125, -0.4609222412109375, -0.44179534912109375, -0.42266845703125, -0.40354156494140625, -0.3844146728515625, -0.36528778076171875, -0.346160888671875, -0.32703399658203125, -0.3079071044921875, -0.28878021240234375, -0.2696533203125, -0.25052642822265625, -0.2313995361328125, -0.21227264404296875, -0.193145751953125, -0.17401885986328125, -0.1548919677734375, -0.13576507568359375, -0.11663818359375, -0.09751129150390625, -0.0783843994140625, -0.05925750732421875, -0.040130615234375, -0.02100372314453125, -0.0018768310546875, 0.01725006103515625, 0.036376953125, 0.05550384521484375, 0.0746307373046875, 0.09375762939453125, 0.112884521484375, 0.13201141357421875, 0.1511383056640625, 0.17026519775390625, 0.18939208984375, 0.20851898193359375, 0.2276458740234375, 0.24677276611328125, 0.265899658203125, 0.28502655029296875, 0.3041534423828125, 0.32328033447265625, 0.3424072265625, 0.36153411865234375, 0.3806610107421875, 0.39978790283203125, 0.418914794921875, 0.43804168701171875, 0.4571685791015625, 0.47629547119140625, 0.49542236328125, 0.5145492553710938, 0.5336761474609375, 0.5528030395507812, 0.571929931640625, 0.5910568237304688, 0.6101837158203125, 0.6293106079101562, 0.6484375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 7.0, 9.0, 13.0, 36.0, 50.0, 95.0, 179.0, 203.0, 186.0, 102.0, 52.0, 35.0, 12.0, 8.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484475612640381, -6.312633991241455, -6.140791893005371, -5.968950271606445, -5.7971086502075195, -5.6252665519714355, -5.45342493057251, -5.281582832336426, -5.1097412109375, -4.937899589538574, -4.76605749130249, -4.5942158699035645, -4.4223737716674805, -4.250532150268555, -4.078690528869629, -3.906848669052124, -3.735006809234619, -3.5631649494171143, -3.3913230895996094, -3.2194814682006836, -3.0476396083831787, -2.875797748565674, -2.703956127166748, -2.532114267349243, -2.3602724075317383, -2.1884305477142334, -2.0165886878967285, -1.8447470664978027, -1.6729052066802979, -1.501063346862793, -1.3292216062545776, -1.1573798656463623, -0.9855375289916992, -0.8136957287788391, -0.641853928565979, -0.4700121283531189, -0.2981703281402588, -0.12632852792739868, 0.045513272285461426, 0.21735501289367676, 0.38919687271118164, 0.5610386729240417, 0.7328804731369019, 0.904722273349762, 1.076564073562622, 1.248405933380127, 1.4202476739883423, 1.5920894145965576, 1.7639312744140625, 1.9357731342315674, 2.1076149940490723, 2.279456615447998, 2.451298475265503, 2.623140335083008, 2.7949819564819336, 2.9668238162994385, 3.1386656761169434, 3.3105075359344482, 3.482349395751953, 3.654191017150879, 3.826032876968384, 3.9978747367858887, 4.1697163581848145, 4.341558456420898, 4.513400077819824]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 10.0, 13.0, 9.0, 16.0, 20.0, 25.0, 27.0, 38.0, 33.0, 48.0, 40.0, 40.0, 51.0, 45.0, 42.0, 54.0, 56.0, 49.0, 57.0, 52.0, 53.0, 40.0, 20.0, 27.0, 20.0, 20.0, 13.0, 14.0, 14.0, 15.0, 14.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7820212841033936, -2.7063207626342773, -2.6306204795837402, -2.554919958114624, -2.479219675064087, -2.4035191535949707, -2.3278188705444336, -2.2521183490753174, -2.176417827606201, -2.100717306137085, -2.025017023086548, -1.9493165016174316, -1.873616099357605, -1.7979156970977783, -1.7222152948379517, -1.646514892578125, -1.5708144903182983, -1.4951140880584717, -1.419413685798645, -1.3437132835388184, -1.2680127620697021, -1.1923123598098755, -1.1166119575500488, -1.0409114360809326, -0.9652110934257507, -0.8895106911659241, -0.8138102293014526, -0.738109827041626, -0.6624094247817993, -0.5867089629173279, -0.5110085606575012, -0.4353080987930298, -0.3596076965332031, -0.2839072644710541, -0.20820684731006622, -0.13250643014907837, -0.05680599808692932, 0.018894433975219727, 0.09459483623504639, 0.17029529809951782, 0.24599570035934448, 0.32169613242149353, 0.3973965644836426, 0.47309696674346924, 0.5487973690032959, 0.6244978308677673, 0.700198233127594, 0.7758986949920654, 0.8515990972518921, 0.9272994995117188, 1.0029999017715454, 1.078700304031372, 1.1544008255004883, 1.230101227760315, 1.3058016300201416, 1.3815021514892578, 1.457202434539795, 1.5329028367996216, 1.6086032390594482, 1.6843037605285645, 1.7600041627883911, 1.8357045650482178, 1.9114049673080444, 1.987105369567871, 2.0628058910369873]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 18.0, 20.0, 18.0, 25.0, 43.0, 68.0, 122.0, 159.0, 283.0, 485.0, 1002.0, 2080.0, 5410.0, 18791.0, 119398.0, 629306.0, 227381.0, 31164.0, 7452.0, 2675.0, 1209.0, 552.0, 316.0, 176.0, 106.0, 89.0, 53.0, 27.0, 32.0, 15.0, 18.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.681060791015625, -2.59063720703125, -2.500213623046875, -2.4097900390625, -2.319366455078125, -2.22894287109375, -2.138519287109375, -2.048095703125, -1.957672119140625, -1.86724853515625, -1.776824951171875, -1.6864013671875, -1.595977783203125, -1.50555419921875, -1.415130615234375, -1.32470703125, -1.234283447265625, -1.14385986328125, -1.053436279296875, -0.9630126953125, -0.872589111328125, -0.78216552734375, -0.691741943359375, -0.601318359375, -0.510894775390625, -0.42047119140625, -0.330047607421875, -0.2396240234375, -0.149200439453125, -0.05877685546875, 0.031646728515625, 0.1220703125, 0.212493896484375, 0.30291748046875, 0.393341064453125, 0.4837646484375, 0.574188232421875, 0.66461181640625, 0.755035400390625, 0.845458984375, 0.935882568359375, 1.02630615234375, 1.116729736328125, 1.2071533203125, 1.297576904296875, 1.38800048828125, 1.478424072265625, 1.56884765625, 1.659271240234375, 1.74969482421875, 1.840118408203125, 1.9305419921875, 2.020965576171875, 2.11138916015625, 2.201812744140625, 2.292236328125, 2.382659912109375, 2.47308349609375, 2.563507080078125, 2.6539306640625, 2.744354248046875, 2.83477783203125, 2.925201416015625, 3.015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 15.0, 13.0, 32.0, 34.0, 53.0, 73.0, 82.0, 90.0, 101.0, 98.0, 105.0, 79.0, 67.0, 57.0, 35.0, 21.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.4423789978027344, -0.42650604248046875, -0.4106330871582031, -0.3947601318359375, -0.3788871765136719, -0.36301422119140625, -0.3471412658691406, -0.331268310546875, -0.3153953552246094, -0.29952239990234375, -0.2836494445800781, -0.2677764892578125, -0.2519035339355469, -0.23603057861328125, -0.22015762329101562, -0.20428466796875, -0.18841171264648438, -0.17253875732421875, -0.15666580200195312, -0.1407928466796875, -0.12491989135742188, -0.10904693603515625, -0.09317398071289062, -0.077301025390625, -0.061428070068359375, -0.04555511474609375, -0.029682159423828125, -0.0138092041015625, 0.002063751220703125, 0.01793670654296875, 0.033809661865234375, 0.0496826171875, 0.06555557250976562, 0.08142852783203125, 0.09730148315429688, 0.1131744384765625, 0.12904739379882812, 0.14492034912109375, 0.16079330444335938, 0.176666259765625, 0.19253921508789062, 0.20841217041015625, 0.22428512573242188, 0.2401580810546875, 0.2560310363769531, 0.27190399169921875, 0.2877769470214844, 0.30364990234375, 0.3195228576660156, 0.33539581298828125, 0.3512687683105469, 0.3671417236328125, 0.3830146789550781, 0.39888763427734375, 0.4147605895996094, 0.430633544921875, 0.4465065002441406, 0.46237945556640625, 0.4782524108886719, 0.4941253662109375, 0.5099983215332031, 0.5258712768554688, 0.5417442321777344, 0.5576171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 11.0, 17.0, 16.0, 17.0, 27.0, 42.0, 50.0, 63.0, 109.0, 161.0, 256.0, 459.0, 713.0, 1310.0, 2663.0, 5906.0, 14786.0, 40392.0, 120400.0, 317846.0, 336441.0, 133286.0, 44544.0, 16207.0, 6586.0, 2943.0, 1338.0, 739.0, 403.0, 259.0, 167.0, 97.0, 90.0, 54.0, 35.0, 36.0, 17.0, 21.0, 11.0, 6.0, 6.0, 5.0, 3.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1842193603515625, -1.144805908203125, -1.1053924560546875, -1.06597900390625, -1.0265655517578125, -0.987152099609375, -0.9477386474609375, -0.9083251953125, -0.8689117431640625, -0.829498291015625, -0.7900848388671875, -0.75067138671875, -0.7112579345703125, -0.671844482421875, -0.6324310302734375, -0.593017578125, -0.5536041259765625, -0.514190673828125, -0.4747772216796875, -0.43536376953125, -0.3959503173828125, -0.356536865234375, -0.3171234130859375, -0.2777099609375, -0.2382965087890625, -0.198883056640625, -0.1594696044921875, -0.12005615234375, -0.0806427001953125, -0.041229248046875, -0.0018157958984375, 0.03759765625, 0.0770111083984375, 0.116424560546875, 0.1558380126953125, 0.19525146484375, 0.2346649169921875, 0.274078369140625, 0.3134918212890625, 0.3529052734375, 0.3923187255859375, 0.431732177734375, 0.4711456298828125, 0.51055908203125, 0.5499725341796875, 0.589385986328125, 0.6287994384765625, 0.668212890625, 0.7076263427734375, 0.747039794921875, 0.7864532470703125, 0.82586669921875, 0.8652801513671875, 0.904693603515625, 0.9441070556640625, 0.9835205078125, 1.0229339599609375, 1.062347412109375, 1.1017608642578125, 1.14117431640625, 1.1805877685546875, 1.220001220703125, 1.2594146728515625, 1.298828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 9.0, 10.0, 8.0, 12.0, 14.0, 15.0, 20.0, 26.0, 33.0, 40.0, 37.0, 34.0, 36.0, 46.0, 48.0, 46.0, 51.0, 37.0, 52.0, 41.0, 45.0, 46.0, 44.0, 47.0, 22.0, 29.0, 30.0, 27.0, 18.0, 18.0, 8.0, 7.0, 12.0, 9.0, 6.0, 5.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.2169036865234375, -1.178924560546875, -1.1409454345703125, -1.10296630859375, -1.0649871826171875, -1.027008056640625, -0.9890289306640625, -0.9510498046875, -0.9130706787109375, -0.875091552734375, -0.8371124267578125, -0.79913330078125, -0.7611541748046875, -0.723175048828125, -0.6851959228515625, -0.647216796875, -0.6092376708984375, -0.571258544921875, -0.5332794189453125, -0.49530029296875, -0.4573211669921875, -0.419342041015625, -0.3813629150390625, -0.3433837890625, -0.3054046630859375, -0.267425537109375, -0.2294464111328125, -0.19146728515625, -0.1534881591796875, -0.115509033203125, -0.0775299072265625, -0.03955078125, -0.0015716552734375, 0.036407470703125, 0.0743865966796875, 0.11236572265625, 0.1503448486328125, 0.188323974609375, 0.2263031005859375, 0.2642822265625, 0.3022613525390625, 0.340240478515625, 0.3782196044921875, 0.41619873046875, 0.4541778564453125, 0.492156982421875, 0.5301361083984375, 0.568115234375, 0.6060943603515625, 0.644073486328125, 0.6820526123046875, 0.72003173828125, 0.7580108642578125, 0.795989990234375, 0.8339691162109375, 0.8719482421875, 0.9099273681640625, 0.947906494140625, 0.9858856201171875, 1.02386474609375, 1.0618438720703125, 1.099822998046875, 1.1378021240234375, 1.17578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 17.0, 37.0, 47.0, 88.0, 181.0, 313.0, 857.0, 3091.0, 20045.0, 341728.0, 640843.0, 34733.0, 4606.0, 1085.0, 396.0, 197.0, 101.0, 73.0, 40.0, 22.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.85546875, -1.80548095703125, -1.7554931640625, -1.70550537109375, -1.655517578125, -1.60552978515625, -1.5555419921875, -1.50555419921875, -1.45556640625, -1.40557861328125, -1.3555908203125, -1.30560302734375, -1.255615234375, -1.20562744140625, -1.1556396484375, -1.10565185546875, -1.0556640625, -1.00567626953125, -0.9556884765625, -0.90570068359375, -0.855712890625, -0.80572509765625, -0.7557373046875, -0.70574951171875, -0.65576171875, -0.60577392578125, -0.5557861328125, -0.50579833984375, -0.455810546875, -0.40582275390625, -0.3558349609375, -0.30584716796875, -0.255859375, -0.20587158203125, -0.1558837890625, -0.10589599609375, -0.055908203125, -0.00592041015625, 0.0440673828125, 0.09405517578125, 0.14404296875, 0.19403076171875, 0.2440185546875, 0.29400634765625, 0.343994140625, 0.39398193359375, 0.4439697265625, 0.49395751953125, 0.5439453125, 0.59393310546875, 0.6439208984375, 0.69390869140625, 0.743896484375, 0.79388427734375, 0.8438720703125, 0.89385986328125, 0.94384765625, 0.99383544921875, 1.0438232421875, 1.09381103515625, 1.143798828125, 1.19378662109375, 1.2437744140625, 1.29376220703125, 1.34375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 12.0, 16.0, 31.0, 47.0, 76.0, 96.0, 131.0, 160.0, 136.0, 93.0, 60.0, 41.0, 24.0, 12.0, 9.0, 7.0, 5.0, 7.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019216537475585938, -0.00018562376499176025, -0.00017908215522766113, -0.000172540545463562, -0.0001659989356994629, -0.00015945732593536377, -0.00015291571617126465, -0.00014637410640716553, -0.0001398324966430664, -0.00013329088687896729, -0.00012674927711486816, -0.00012020766735076904, -0.00011366605758666992, -0.0001071244478225708, -0.00010058283805847168, -9.404122829437256e-05, -8.749961853027344e-05, -8.095800876617432e-05, -7.44163990020752e-05, -6.787478923797607e-05, -6.133317947387695e-05, -5.479156970977783e-05, -4.824995994567871e-05, -4.170835018157959e-05, -3.516674041748047e-05, -2.8625130653381348e-05, -2.2083520889282227e-05, -1.5541911125183105e-05, -9.000301361083984e-06, -2.4586915969848633e-06, 4.082918167114258e-06, 1.0624527931213379e-05, 1.71661376953125e-05, 2.370774745941162e-05, 3.0249357223510742e-05, 3.679096698760986e-05, 4.3332576751708984e-05, 4.9874186515808105e-05, 5.6415796279907227e-05, 6.295740604400635e-05, 6.949901580810547e-05, 7.604062557220459e-05, 8.258223533630371e-05, 8.912384510040283e-05, 9.566545486450195e-05, 0.00010220706462860107, 0.0001087486743927002, 0.00011529028415679932, 0.00012183189392089844, 0.00012837350368499756, 0.00013491511344909668, 0.0001414567232131958, 0.00014799833297729492, 0.00015453994274139404, 0.00016108155250549316, 0.00016762316226959229, 0.0001741647720336914, 0.00018070638179779053, 0.00018724799156188965, 0.00019378960132598877, 0.0002003312110900879, 0.000206872820854187, 0.00021341443061828613, 0.00021995604038238525, 0.00022649765014648438]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 10.0, 9.0, 24.0, 46.0, 48.0, 98.0, 175.0, 471.0, 1610.0, 8752.0, 113499.0, 855823.0, 60008.0, 6007.0, 1202.0, 365.0, 178.0, 95.0, 46.0, 30.0, 18.0, 17.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.465728759765625, -1.40802001953125, -1.350311279296875, -1.2926025390625, -1.234893798828125, -1.17718505859375, -1.119476318359375, -1.061767578125, -1.004058837890625, -0.94635009765625, -0.888641357421875, -0.8309326171875, -0.773223876953125, -0.71551513671875, -0.657806396484375, -0.60009765625, -0.542388916015625, -0.48468017578125, -0.426971435546875, -0.3692626953125, -0.311553955078125, -0.25384521484375, -0.196136474609375, -0.138427734375, -0.080718994140625, -0.02301025390625, 0.034698486328125, 0.0924072265625, 0.150115966796875, 0.20782470703125, 0.265533447265625, 0.3232421875, 0.380950927734375, 0.43865966796875, 0.496368408203125, 0.5540771484375, 0.611785888671875, 0.66949462890625, 0.727203369140625, 0.784912109375, 0.842620849609375, 0.90032958984375, 0.958038330078125, 1.0157470703125, 1.073455810546875, 1.13116455078125, 1.188873291015625, 1.24658203125, 1.304290771484375, 1.36199951171875, 1.419708251953125, 1.4774169921875, 1.535125732421875, 1.59283447265625, 1.650543212890625, 1.708251953125, 1.765960693359375, 1.82366943359375, 1.881378173828125, 1.9390869140625, 1.996795654296875, 2.05450439453125, 2.112213134765625, 2.169921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 9.0, 12.0, 20.0, 27.0, 41.0, 51.0, 85.0, 111.0, 113.0, 140.0, 133.0, 81.0, 58.0, 39.0, 32.0, 20.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5354843139648438, -0.5060272216796875, -0.47657012939453125, -0.447113037109375, -0.41765594482421875, -0.3881988525390625, -0.35874176025390625, -0.32928466796875, -0.29982757568359375, -0.2703704833984375, -0.24091339111328125, -0.211456298828125, -0.18199920654296875, -0.1525421142578125, -0.12308502197265625, -0.0936279296875, -0.06417083740234375, -0.0347137451171875, -0.00525665283203125, 0.024200439453125, 0.05365753173828125, 0.0831146240234375, 0.11257171630859375, 0.14202880859375, 0.17148590087890625, 0.2009429931640625, 0.23040008544921875, 0.259857177734375, 0.28931427001953125, 0.3187713623046875, 0.34822845458984375, 0.377685546875, 0.40714263916015625, 0.4365997314453125, 0.46605682373046875, 0.495513916015625, 0.5249710083007812, 0.5544281005859375, 0.5838851928710938, 0.61334228515625, 0.6427993774414062, 0.6722564697265625, 0.7017135620117188, 0.731170654296875, 0.7606277465820312, 0.7900848388671875, 0.8195419311523438, 0.8489990234375, 0.8784561157226562, 0.9079132080078125, 0.9373703002929688, 0.966827392578125, 0.9962844848632812, 1.0257415771484375, 1.0551986694335938, 1.08465576171875, 1.1141128540039062, 1.1435699462890625, 1.1730270385742188, 1.202484130859375, 1.2319412231445312, 1.2613983154296875, 1.2908554077148438, 1.3203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 17.0, 40.0, 111.0, 216.0, 321.0, 174.0, 76.0, 32.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.068765640258789, -11.287035942077637, -10.505306243896484, -9.723577499389648, -8.941847801208496, -8.160118103027344, -7.37838888168335, -6.5966596603393555, -5.814929962158203, -5.033200263977051, -4.251471042633057, -3.4697415828704834, -2.68801212310791, -1.906282663345337, -1.1245532035827637, -0.34282398223876953, 0.4389057159423828, 1.220635175704956, 2.0023646354675293, 2.7840940952301025, 3.565823554992676, 4.347553253173828, 5.129282474517822, 5.911011695861816, 6.692741394042969, 7.474471092224121, 8.256200790405273, 9.03792953491211, 9.819659233093262, 10.601388931274414, 11.38311767578125, 12.164847373962402, 12.946578979492188, 13.72830867767334, 14.510038375854492, 15.291767120361328, 16.073497772216797, 16.855226516723633, 17.63695526123047, 18.418685913085938, 19.200414657592773, 19.98214340209961, 20.763874053955078, 21.545602798461914, 22.32733154296875, 23.10906219482422, 23.890790939331055, 24.67251968383789, 25.45425033569336, 26.235979080200195, 27.017709732055664, 27.7994384765625, 28.58116912841797, 29.362897872924805, 30.14462661743164, 30.92635726928711, 31.708086013793945, 32.48981475830078, 33.27154541015625, 34.05327606201172, 34.83500289916992, 35.61673355102539, 36.39846420288086, 37.18019104003906, 37.96192169189453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 6.0, 13.0, 19.0, 13.0, 17.0, 19.0, 20.0, 28.0, 20.0, 29.0, 38.0, 39.0, 30.0, 41.0, 45.0, 38.0, 51.0, 32.0, 46.0, 40.0, 39.0, 46.0, 28.0, 42.0, 32.0, 23.0, 24.0, 23.0, 27.0, 17.0, 21.0, 12.0, 11.0, 9.0, 7.0, 9.0, 2.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.174185752868652, -5.975380897521973, -5.776576519012451, -5.5777716636657715, -5.37896728515625, -5.18016242980957, -4.981357574462891, -4.782553195953369, -4.583748817443848, -4.384943962097168, -4.1861395835876465, -3.987334728240967, -3.7885303497314453, -3.5897254943847656, -3.390920877456665, -3.1921162605285645, -2.9933114051818848, -2.794506788253784, -2.5957021713256836, -2.396897315979004, -2.1980929374694824, -1.9992882013320923, -1.8004834651947021, -1.6016788482666016, -1.402874231338501, -1.2040696144104004, -1.0052649974822998, -0.8064602613449097, -0.6076556444168091, -0.4088510274887085, -0.21004629135131836, -0.011241674423217773, 0.18756341934204102, 0.386368066072464, 0.585172712802887, 0.7839773893356323, 0.9827820062637329, 1.1815866231918335, 1.3803913593292236, 1.5791959762573242, 1.7780005931854248, 1.9768052101135254, 2.175609827041626, 2.3744144439697266, 2.5732192993164062, 2.7720236778259277, 2.9708285331726074, 3.169633150100708, 3.3684377670288086, 3.567242383956909, 3.7660470008850098, 3.9648518562316895, 4.163656234741211, 4.362461090087891, 4.56126594543457, 4.760070323944092, 4.958874702453613, 5.157679557800293, 5.3564839363098145, 5.555288791656494, 5.754093170166016, 5.952898025512695, 6.151702880859375, 6.3505072593688965, 6.549312114715576]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 9.0, 11.0, 24.0, 36.0, 52.0, 80.0, 132.0, 239.0, 461.0, 1318.0, 4155.0, 18081.0, 452383.0, 3683279.0, 25534.0, 5238.0, 1654.0, 637.0, 308.0, 188.0, 113.0, 84.0, 58.0, 39.0, 30.0, 19.0, 23.0, 22.0, 9.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.69921875, -4.5614013671875, -4.423583984375, -4.2857666015625, -4.14794921875, -4.0101318359375, -3.872314453125, -3.7344970703125, -3.5966796875, -3.4588623046875, -3.321044921875, -3.1832275390625, -3.04541015625, -2.9075927734375, -2.769775390625, -2.6319580078125, -2.494140625, -2.3563232421875, -2.218505859375, -2.0806884765625, -1.94287109375, -1.8050537109375, -1.667236328125, -1.5294189453125, -1.3916015625, -1.2537841796875, -1.115966796875, -0.9781494140625, -0.84033203125, -0.7025146484375, -0.564697265625, -0.4268798828125, -0.2890625, -0.1512451171875, -0.013427734375, 0.1243896484375, 0.26220703125, 0.4000244140625, 0.537841796875, 0.6756591796875, 0.8134765625, 0.9512939453125, 1.089111328125, 1.2269287109375, 1.36474609375, 1.5025634765625, 1.640380859375, 1.7781982421875, 1.916015625, 2.0538330078125, 2.191650390625, 2.3294677734375, 2.46728515625, 2.6051025390625, 2.742919921875, 2.8807373046875, 3.0185546875, 3.1563720703125, 3.294189453125, 3.4320068359375, 3.56982421875, 3.7076416015625, 3.845458984375, 3.9832763671875, 4.12109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 15.0, 13.0, 21.0, 25.0, 40.0, 45.0, 68.0, 69.0, 87.0, 86.0, 86.0, 72.0, 85.0, 64.0, 61.0, 47.0, 34.0, 22.0, 9.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4397926330566406, -0.42475128173828125, -0.4097099304199219, -0.3946685791015625, -0.3796272277832031, -0.36458587646484375, -0.3495445251464844, -0.334503173828125, -0.3194618225097656, -0.30442047119140625, -0.2893791198730469, -0.2743377685546875, -0.2592964172363281, -0.24425506591796875, -0.22921371459960938, -0.21417236328125, -0.19913101196289062, -0.18408966064453125, -0.16904830932617188, -0.1540069580078125, -0.13896560668945312, -0.12392425537109375, -0.10888290405273438, -0.093841552734375, -0.07880020141601562, -0.06375885009765625, -0.048717498779296875, -0.0336761474609375, -0.018634796142578125, -0.00359344482421875, 0.011447906494140625, 0.0264892578125, 0.041530609130859375, 0.05657196044921875, 0.07161331176757812, 0.0866546630859375, 0.10169601440429688, 0.11673736572265625, 0.13177871704101562, 0.146820068359375, 0.16186141967773438, 0.17690277099609375, 0.19194412231445312, 0.2069854736328125, 0.22202682495117188, 0.23706817626953125, 0.2521095275878906, 0.26715087890625, 0.2821922302246094, 0.29723358154296875, 0.3122749328613281, 0.3273162841796875, 0.3423576354980469, 0.35739898681640625, 0.3724403381347656, 0.387481689453125, 0.4025230407714844, 0.41756439208984375, 0.4326057434082031, 0.4476470947265625, 0.4626884460449219, 0.47772979736328125, 0.4927711486816406, 0.5078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 11.0, 20.0, 36.0, 45.0, 72.0, 118.0, 198.0, 320.0, 545.0, 892.0, 1615.0, 3346.0, 7419.0, 19648.0, 70440.0, 1489584.0, 2484813.0, 77961.0, 21003.0, 8015.0, 3686.0, 1916.0, 1016.0, 551.0, 363.0, 199.0, 133.0, 102.0, 63.0, 41.0, 28.0, 13.0, 13.0, 10.0, 4.0, 2.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0], "bins": [-2.365234375, -2.30303955078125, -2.2408447265625, -2.17864990234375, -2.116455078125, -2.05426025390625, -1.9920654296875, -1.92987060546875, -1.86767578125, -1.80548095703125, -1.7432861328125, -1.68109130859375, -1.618896484375, -1.55670166015625, -1.4945068359375, -1.43231201171875, -1.3701171875, -1.30792236328125, -1.2457275390625, -1.18353271484375, -1.121337890625, -1.05914306640625, -0.9969482421875, -0.93475341796875, -0.87255859375, -0.81036376953125, -0.7481689453125, -0.68597412109375, -0.623779296875, -0.56158447265625, -0.4993896484375, -0.43719482421875, -0.375, -0.31280517578125, -0.2506103515625, -0.18841552734375, -0.126220703125, -0.06402587890625, -0.0018310546875, 0.06036376953125, 0.12255859375, 0.18475341796875, 0.2469482421875, 0.30914306640625, 0.371337890625, 0.43353271484375, 0.4957275390625, 0.55792236328125, 0.6201171875, 0.68231201171875, 0.7445068359375, 0.80670166015625, 0.868896484375, 0.93109130859375, 0.9932861328125, 1.05548095703125, 1.11767578125, 1.17987060546875, 1.2420654296875, 1.30426025390625, 1.366455078125, 1.42864990234375, 1.4908447265625, 1.55303955078125, 1.615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 15.0, 10.0, 21.0, 40.0, 35.0, 68.0, 183.0, 468.0, 2085.0, 686.0, 180.0, 97.0, 46.0, 35.0, 20.0, 14.0, 13.0, 9.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9089431762695312, -0.8759918212890625, -0.8430404663085938, -0.810089111328125, -0.7771377563476562, -0.7441864013671875, -0.7112350463867188, -0.67828369140625, -0.6453323364257812, -0.6123809814453125, -0.5794296264648438, -0.546478271484375, -0.5135269165039062, -0.4805755615234375, -0.44762420654296875, -0.4146728515625, -0.38172149658203125, -0.3487701416015625, -0.31581878662109375, -0.282867431640625, -0.24991607666015625, -0.2169647216796875, -0.18401336669921875, -0.15106201171875, -0.11811065673828125, -0.0851593017578125, -0.05220794677734375, -0.019256591796875, 0.01369476318359375, 0.0466461181640625, 0.07959747314453125, 0.112548828125, 0.14550018310546875, 0.1784515380859375, 0.21140289306640625, 0.244354248046875, 0.27730560302734375, 0.3102569580078125, 0.34320831298828125, 0.37615966796875, 0.40911102294921875, 0.4420623779296875, 0.47501373291015625, 0.507965087890625, 0.5409164428710938, 0.5738677978515625, 0.6068191528320312, 0.6397705078125, 0.6727218627929688, 0.7056732177734375, 0.7386245727539062, 0.771575927734375, 0.8045272827148438, 0.8374786376953125, 0.8704299926757812, 0.90338134765625, 0.9363327026367188, 0.9692840576171875, 1.0022354125976562, 1.035186767578125, 1.0681381225585938, 1.1010894775390625, 1.1340408325195312, 1.1669921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 36.0, 106.0, 288.0, 328.0, 148.0, 54.0, 23.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.847047805786133, -11.43986701965332, -11.032686233520508, -10.625505447387695, -10.2183256149292, -9.811144828796387, -9.403964042663574, -8.996783256530762, -8.589603424072266, -8.182422637939453, -7.775242328643799, -7.368061542510986, -6.960881233215332, -6.5537004470825195, -6.146519660949707, -5.7393388748168945, -5.332158088684082, -4.9249773025512695, -4.517796993255615, -4.110616207122803, -3.7034356594085693, -3.296255111694336, -2.8890743255615234, -2.48189377784729, -2.0747132301330566, -1.6675326824188232, -1.2603520154953003, -0.8531713485717773, -0.44599080085754395, -0.03881025314331055, 0.36837053298950195, 0.7755510807037354, 1.1827316284179688, 1.5899121761322021, 1.997092843055725, 2.404273509979248, 2.8114540576934814, 3.218634605407715, 3.6258153915405273, 4.03299617767334, 4.440176486968994, 4.847357273101807, 5.254537582397461, 5.661718368530273, 6.068899154663086, 6.47607946395874, 6.883260250091553, 7.290440559387207, 7.6976213455200195, 8.104802131652832, 8.511982917785645, 8.91916275024414, 9.326343536376953, 9.733524322509766, 10.140705108642578, 10.54788589477539, 10.955066680908203, 11.362247467041016, 11.769428253173828, 12.17660903930664, 12.583788871765137, 12.99096965789795, 13.398150444030762, 13.805331230163574, 14.21251106262207]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 11.0, 10.0, 17.0, 16.0, 14.0, 13.0, 17.0, 33.0, 32.0, 49.0, 33.0, 48.0, 56.0, 58.0, 57.0, 49.0, 41.0, 59.0, 54.0, 51.0, 41.0, 37.0, 43.0, 32.0, 21.0, 28.0, 22.0, 20.0, 14.0, 5.0, 8.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.402423858642578, -3.296762228012085, -3.191100597381592, -3.0854389667510986, -2.9797773361206055, -2.874115467071533, -2.76845383644104, -2.662792205810547, -2.5571305751800537, -2.4514689445495605, -2.3458073139190674, -2.240145683288574, -2.134483814239502, -2.028822422027588, -1.9231605529785156, -1.8174989223480225, -1.7118372917175293, -1.6061756610870361, -1.500514030456543, -1.3948522806167603, -1.289190649986267, -1.183529019355774, -1.0778672695159912, -0.972205638885498, -0.8665440082550049, -0.7608823776245117, -0.6552206873893738, -0.5495589971542358, -0.4438973665237427, -0.3382357358932495, -0.23257404565811157, -0.12691235542297363, -0.02125072479248047, 0.08441093564033508, 0.19007259607315063, 0.2957342565059662, 0.40139591693878174, 0.5070575475692749, 0.6127192378044128, 0.7183809280395508, 0.824042558670044, 0.9297041893005371, 1.0353658199310303, 1.141027569770813, 1.2466892004013062, 1.3523508310317993, 1.458012580871582, 1.5636742115020752, 1.6693358421325684, 1.7749974727630615, 1.8806591033935547, 1.9863208532333374, 2.091982364654541, 2.1976442337036133, 2.3033058643341064, 2.4089674949645996, 2.5146291255950928, 2.620290756225586, 2.725952386856079, 2.8316140174865723, 2.9372758865356445, 3.0429372787475586, 3.148599147796631, 3.254260778427124, 3.359922409057617]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 3.0, 15.0, 12.0, 11.0, 20.0, 56.0, 58.0, 80.0, 164.0, 288.0, 617.0, 1353.0, 3865.0, 15188.0, 117427.0, 792467.0, 97288.0, 13539.0, 3518.0, 1237.0, 575.0, 292.0, 167.0, 101.0, 56.0, 52.0, 37.0, 18.0, 9.0, 12.0, 9.0, 5.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.75390625, -3.638275146484375, -3.52264404296875, -3.407012939453125, -3.2913818359375, -3.175750732421875, -3.06011962890625, -2.944488525390625, -2.828857421875, -2.713226318359375, -2.59759521484375, -2.481964111328125, -2.3663330078125, -2.250701904296875, -2.13507080078125, -2.019439697265625, -1.90380859375, -1.788177490234375, -1.67254638671875, -1.556915283203125, -1.4412841796875, -1.325653076171875, -1.21002197265625, -1.094390869140625, -0.978759765625, -0.863128662109375, -0.74749755859375, -0.631866455078125, -0.5162353515625, -0.400604248046875, -0.28497314453125, -0.169342041015625, -0.0537109375, 0.061920166015625, 0.17755126953125, 0.293182373046875, 0.4088134765625, 0.524444580078125, 0.64007568359375, 0.755706787109375, 0.871337890625, 0.986968994140625, 1.10260009765625, 1.218231201171875, 1.3338623046875, 1.449493408203125, 1.56512451171875, 1.680755615234375, 1.79638671875, 1.912017822265625, 2.02764892578125, 2.143280029296875, 2.2589111328125, 2.374542236328125, 2.49017333984375, 2.605804443359375, 2.721435546875, 2.837066650390625, 2.95269775390625, 3.068328857421875, 3.1839599609375, 3.299591064453125, 3.41522216796875, 3.530853271484375, 3.646484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 8.0, 19.0, 17.0, 28.0, 40.0, 58.0, 70.0, 74.0, 100.0, 86.0, 92.0, 81.0, 75.0, 74.0, 50.0, 29.0, 27.0, 19.0, 16.0, 12.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44677734375, -0.43021392822265625, -0.4136505126953125, -0.39708709716796875, -0.380523681640625, -0.36396026611328125, -0.3473968505859375, -0.33083343505859375, -0.31427001953125, -0.29770660400390625, -0.2811431884765625, -0.26457977294921875, -0.248016357421875, -0.23145294189453125, -0.2148895263671875, -0.19832611083984375, -0.1817626953125, -0.16519927978515625, -0.1486358642578125, -0.13207244873046875, -0.115509033203125, -0.09894561767578125, -0.0823822021484375, -0.06581878662109375, -0.04925537109375, -0.03269195556640625, -0.0161285400390625, 0.00043487548828125, 0.016998291015625, 0.03356170654296875, 0.0501251220703125, 0.06668853759765625, 0.083251953125, 0.09981536865234375, 0.1163787841796875, 0.13294219970703125, 0.149505615234375, 0.16606903076171875, 0.1826324462890625, 0.19919586181640625, 0.21575927734375, 0.23232269287109375, 0.2488861083984375, 0.26544952392578125, 0.282012939453125, 0.29857635498046875, 0.3151397705078125, 0.33170318603515625, 0.3482666015625, 0.36483001708984375, 0.3813934326171875, 0.39795684814453125, 0.414520263671875, 0.43108367919921875, 0.4476470947265625, 0.46421051025390625, 0.48077392578125, 0.49733734130859375, 0.5139007568359375, 0.5304641723632812, 0.547027587890625, 0.5635910034179688, 0.5801544189453125, 0.5967178344726562, 0.61328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 11.0, 9.0, 8.0, 23.0, 24.0, 37.0, 65.0, 107.0, 152.0, 264.0, 549.0, 1125.0, 2496.0, 6729.0, 21732.0, 95293.0, 522385.0, 320087.0, 54820.0, 14188.0, 4674.0, 1865.0, 856.0, 440.0, 222.0, 124.0, 87.0, 51.0, 28.0, 26.0, 21.0, 10.0, 8.0, 4.0, 8.0, 1.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.73828125, -1.6800079345703125, -1.621734619140625, -1.5634613037109375, -1.50518798828125, -1.4469146728515625, -1.388641357421875, -1.3303680419921875, -1.2720947265625, -1.2138214111328125, -1.155548095703125, -1.0972747802734375, -1.03900146484375, -0.9807281494140625, -0.922454833984375, -0.8641815185546875, -0.805908203125, -0.7476348876953125, -0.689361572265625, -0.6310882568359375, -0.57281494140625, -0.5145416259765625, -0.456268310546875, -0.3979949951171875, -0.3397216796875, -0.2814483642578125, -0.223175048828125, -0.1649017333984375, -0.10662841796875, -0.0483551025390625, 0.009918212890625, 0.0681915283203125, 0.12646484375, 0.1847381591796875, 0.243011474609375, 0.3012847900390625, 0.35955810546875, 0.4178314208984375, 0.476104736328125, 0.5343780517578125, 0.5926513671875, 0.6509246826171875, 0.709197998046875, 0.7674713134765625, 0.82574462890625, 0.8840179443359375, 0.942291259765625, 1.0005645751953125, 1.058837890625, 1.1171112060546875, 1.175384521484375, 1.2336578369140625, 1.29193115234375, 1.3502044677734375, 1.408477783203125, 1.4667510986328125, 1.5250244140625, 1.5832977294921875, 1.641571044921875, 1.6998443603515625, 1.75811767578125, 1.8163909912109375, 1.874664306640625, 1.9329376220703125, 1.9912109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 4.0, 5.0, 12.0, 7.0, 9.0, 17.0, 17.0, 16.0, 17.0, 16.0, 23.0, 32.0, 36.0, 38.0, 41.0, 48.0, 49.0, 42.0, 53.0, 41.0, 40.0, 43.0, 36.0, 38.0, 44.0, 44.0, 43.0, 29.0, 31.0, 19.0, 18.0, 13.0, 15.0, 13.0, 8.0, 14.0, 5.0, 7.0, 6.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2428131103515625, -1.203399658203125, -1.1639862060546875, -1.12457275390625, -1.0851593017578125, -1.045745849609375, -1.0063323974609375, -0.9669189453125, -0.9275054931640625, -0.888092041015625, -0.8486785888671875, -0.80926513671875, -0.7698516845703125, -0.730438232421875, -0.6910247802734375, -0.651611328125, -0.6121978759765625, -0.572784423828125, -0.5333709716796875, -0.49395751953125, -0.4545440673828125, -0.415130615234375, -0.3757171630859375, -0.3363037109375, -0.2968902587890625, -0.257476806640625, -0.2180633544921875, -0.17864990234375, -0.1392364501953125, -0.099822998046875, -0.0604095458984375, -0.02099609375, 0.0184173583984375, 0.057830810546875, 0.0972442626953125, 0.13665771484375, 0.1760711669921875, 0.215484619140625, 0.2548980712890625, 0.2943115234375, 0.3337249755859375, 0.373138427734375, 0.4125518798828125, 0.45196533203125, 0.4913787841796875, 0.530792236328125, 0.5702056884765625, 0.609619140625, 0.6490325927734375, 0.688446044921875, 0.7278594970703125, 0.76727294921875, 0.8066864013671875, 0.846099853515625, 0.8855133056640625, 0.9249267578125, 0.9643402099609375, 1.003753662109375, 1.0431671142578125, 1.08258056640625, 1.1219940185546875, 1.161407470703125, 1.2008209228515625, 1.240234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 12.0, 19.0, 15.0, 33.0, 55.0, 105.0, 228.0, 479.0, 1321.0, 4566.0, 24387.0, 355895.0, 616515.0, 35929.0, 6216.0, 1642.0, 530.0, 241.0, 125.0, 69.0, 34.0, 31.0, 20.0, 17.0, 13.0, 8.0, 4.0, 8.0, 2.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.0322265625, -0.9967498779296875, -0.961273193359375, -0.9257965087890625, -0.89031982421875, -0.8548431396484375, -0.819366455078125, -0.7838897705078125, -0.7484130859375, -0.7129364013671875, -0.677459716796875, -0.6419830322265625, -0.60650634765625, -0.5710296630859375, -0.535552978515625, -0.5000762939453125, -0.464599609375, -0.4291229248046875, -0.393646240234375, -0.3581695556640625, -0.32269287109375, -0.2872161865234375, -0.251739501953125, -0.2162628173828125, -0.1807861328125, -0.1453094482421875, -0.109832763671875, -0.0743560791015625, -0.03887939453125, -0.0034027099609375, 0.032073974609375, 0.0675506591796875, 0.10302734375, 0.1385040283203125, 0.173980712890625, 0.2094573974609375, 0.24493408203125, 0.2804107666015625, 0.315887451171875, 0.3513641357421875, 0.3868408203125, 0.4223175048828125, 0.457794189453125, 0.4932708740234375, 0.52874755859375, 0.5642242431640625, 0.599700927734375, 0.6351776123046875, 0.670654296875, 0.7061309814453125, 0.741607666015625, 0.7770843505859375, 0.81256103515625, 0.8480377197265625, 0.883514404296875, 0.9189910888671875, 0.9544677734375, 0.9899444580078125, 1.025421142578125, 1.0608978271484375, 1.09637451171875, 1.1318511962890625, 1.167327880859375, 1.2028045654296875, 1.23828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 12.0, 13.0, 20.0, 21.0, 32.0, 72.0, 111.0, 209.0, 182.0, 114.0, 70.0, 46.0, 22.0, 21.0, 14.0, 11.0, 12.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015091896057128906, -0.00014552287757396698, -0.0001401267945766449, -0.00013473071157932281, -0.00012933462858200073, -0.00012393854558467865, -0.00011854246258735657, -0.00011314637959003448, -0.0001077502965927124, -0.00010235421359539032, -9.695813059806824e-05, -9.156204760074615e-05, -8.616596460342407e-05, -8.076988160610199e-05, -7.537379860877991e-05, -6.997771561145782e-05, -6.458163261413574e-05, -5.918554961681366e-05, -5.378946661949158e-05, -4.8393383622169495e-05, -4.299730062484741e-05, -3.760121762752533e-05, -3.220513463020325e-05, -2.6809051632881165e-05, -2.1412968635559082e-05, -1.6016885638237e-05, -1.0620802640914917e-05, -5.2247196435928345e-06, 1.7136335372924805e-07, 5.5674463510513306e-06, 1.0963529348373413e-05, 1.6359612345695496e-05, 2.1755695343017578e-05, 2.715177834033966e-05, 3.254786133766174e-05, 3.7943944334983826e-05, 4.334002733230591e-05, 4.873611032962799e-05, 5.413219332695007e-05, 5.9528276324272156e-05, 6.492435932159424e-05, 7.032044231891632e-05, 7.57165253162384e-05, 8.111260831356049e-05, 8.650869131088257e-05, 9.190477430820465e-05, 9.730085730552673e-05, 0.00010269694030284882, 0.0001080930233001709, 0.00011348910629749298, 0.00011888518929481506, 0.00012428127229213715, 0.00012967735528945923, 0.0001350734382867813, 0.0001404695212841034, 0.00014586560428142548, 0.00015126168727874756, 0.00015665777027606964, 0.00016205385327339172, 0.0001674499362707138, 0.0001728460192680359, 0.00017824210226535797, 0.00018363818526268005, 0.00018903426826000214, 0.00019443035125732422]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 7.0, 6.0, 10.0, 28.0, 24.0, 60.0, 73.0, 99.0, 193.0, 423.0, 929.0, 2782.0, 13661.0, 185350.0, 800559.0, 36331.0, 5241.0, 1496.0, 607.0, 259.0, 143.0, 96.0, 54.0, 53.0, 21.0, 15.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.225494384765625, -1.18048095703125, -1.135467529296875, -1.0904541015625, -1.045440673828125, -1.00042724609375, -0.955413818359375, -0.910400390625, -0.865386962890625, -0.82037353515625, -0.775360107421875, -0.7303466796875, -0.685333251953125, -0.64031982421875, -0.595306396484375, -0.55029296875, -0.505279541015625, -0.46026611328125, -0.415252685546875, -0.3702392578125, -0.325225830078125, -0.28021240234375, -0.235198974609375, -0.190185546875, -0.145172119140625, -0.10015869140625, -0.055145263671875, -0.0101318359375, 0.034881591796875, 0.07989501953125, 0.124908447265625, 0.169921875, 0.214935302734375, 0.25994873046875, 0.304962158203125, 0.3499755859375, 0.394989013671875, 0.44000244140625, 0.485015869140625, 0.530029296875, 0.575042724609375, 0.62005615234375, 0.665069580078125, 0.7100830078125, 0.755096435546875, 0.80010986328125, 0.845123291015625, 0.89013671875, 0.935150146484375, 0.98016357421875, 1.025177001953125, 1.0701904296875, 1.115203857421875, 1.16021728515625, 1.205230712890625, 1.250244140625, 1.295257568359375, 1.34027099609375, 1.385284423828125, 1.4302978515625, 1.475311279296875, 1.52032470703125, 1.565338134765625, 1.6103515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 13.0, 18.0, 22.0, 42.0, 42.0, 93.0, 151.0, 190.0, 159.0, 97.0, 40.0, 31.0, 22.0, 21.0, 19.0, 11.0, 3.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.8878860473632812, -0.8597564697265625, -0.8316268920898438, -0.803497314453125, -0.7753677368164062, -0.7472381591796875, -0.7191085815429688, -0.69097900390625, -0.6628494262695312, -0.6347198486328125, -0.6065902709960938, -0.578460693359375, -0.5503311157226562, -0.5222015380859375, -0.49407196044921875, -0.4659423828125, -0.43781280517578125, -0.4096832275390625, -0.38155364990234375, -0.353424072265625, -0.32529449462890625, -0.2971649169921875, -0.26903533935546875, -0.24090576171875, -0.21277618408203125, -0.1846466064453125, -0.15651702880859375, -0.128387451171875, -0.10025787353515625, -0.0721282958984375, -0.04399871826171875, -0.015869140625, 0.01226043701171875, 0.0403900146484375, 0.06851959228515625, 0.096649169921875, 0.12477874755859375, 0.1529083251953125, 0.18103790283203125, 0.20916748046875, 0.23729705810546875, 0.2654266357421875, 0.29355621337890625, 0.321685791015625, 0.34981536865234375, 0.3779449462890625, 0.40607452392578125, 0.4342041015625, 0.46233367919921875, 0.4904632568359375, 0.5185928344726562, 0.546722412109375, 0.5748519897460938, 0.6029815673828125, 0.6311111450195312, 0.65924072265625, 0.6873703002929688, 0.7154998779296875, 0.7436294555664062, 0.771759033203125, 0.7998886108398438, 0.8280181884765625, 0.8561477661132812, 0.88427734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 9.0, 34.0, 51.0, 89.0, 128.0, 167.0, 192.0, 143.0, 93.0, 49.0, 18.0, 13.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.13174057006836, -21.66269874572754, -21.19365692138672, -20.7246150970459, -20.255573272705078, -19.786529541015625, -19.317487716674805, -18.848445892333984, -18.379404067993164, -17.910362243652344, -17.441320419311523, -16.972278594970703, -16.503236770629883, -16.034194946289062, -15.565152168273926, -15.096109390258789, -14.627067565917969, -14.158025741577148, -13.688983917236328, -13.219941139221191, -12.750899314880371, -12.28185749053955, -11.81281566619873, -11.343772888183594, -10.87473201751709, -10.40569019317627, -9.93664836883545, -9.467605590820312, -8.998563766479492, -8.529521942138672, -8.060480117797852, -7.591437816619873, -7.1223955154418945, -6.653353691101074, -6.184311389923096, -5.715269565582275, -5.246227264404297, -4.777185440063477, -4.308143615722656, -3.8391013145446777, -3.3700592517852783, -2.901017189025879, -2.4319751262664795, -1.9629331827163696, -1.4938911199569702, -1.0248491764068604, -0.5558071136474609, -0.08676505088806152, 0.3822770118713379, 0.8513190746307373, 1.3203611373901367, 1.7894030809402466, 2.2584452629089355, 2.727487087249756, 3.1965291500091553, 3.6655712127685547, 4.134613037109375, 4.603654861450195, 5.072697162628174, 5.541738986968994, 6.010781288146973, 6.479823112487793, 6.948864936828613, 7.417907238006592, 7.88694953918457]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 12.0, 10.0, 15.0, 14.0, 13.0, 15.0, 21.0, 23.0, 27.0, 29.0, 19.0, 35.0, 30.0, 35.0, 33.0, 35.0, 45.0, 40.0, 43.0, 31.0, 35.0, 31.0, 29.0, 38.0, 46.0, 41.0, 30.0, 33.0, 32.0, 24.0, 15.0, 18.0, 11.0, 21.0, 5.0, 10.0, 11.0, 6.0, 10.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.049078941345215, -4.876288890838623, -4.703498363494873, -4.530708312988281, -4.357917785644531, -4.1851277351379395, -4.012337684631348, -3.8395471572875977, -3.666757106781006, -3.493966817855835, -3.321176528930664, -3.1483864784240723, -2.9755961894989014, -2.8028059005737305, -2.6300156116485596, -2.4572253227233887, -2.2844350337982178, -2.111644744873047, -1.9388545751571655, -1.7660642862319946, -1.5932741165161133, -1.4204838275909424, -1.2476935386657715, -1.0749033689498901, -0.9021130800247192, -0.7293228507041931, -0.556532621383667, -0.3837423324584961, -0.21095210313796997, -0.03816187381744385, 0.13462841510772705, 0.3074185848236084, 0.4802088737487793, 0.6529991030693054, 0.8257893323898315, 0.9985796213150024, 1.1713697910308838, 1.3441600799560547, 1.5169503688812256, 1.689740538597107, 1.8625308275222778, 2.035320997238159, 2.20811128616333, 2.380901575088501, 2.553691864013672, 2.7264819145202637, 2.8992724418640137, 3.0720624923706055, 3.2448527812957764, 3.4176430702209473, 3.590433359146118, 3.763223648071289, 3.936013698577881, 4.108803749084473, 4.281594276428223, 4.4543843269348145, 4.6271748542785645, 4.799964904785156, 4.972755432128906, 5.145545482635498, 5.318336009979248, 5.49112606048584, 5.66391658782959, 5.836706638336182, 6.009496688842773]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 12.0, 3.0, 9.0, 11.0, 13.0, 27.0, 30.0, 41.0, 75.0, 139.0, 256.0, 586.0, 1617.0, 5729.0, 37030.0, 4058061.0, 78360.0, 8462.0, 2237.0, 757.0, 307.0, 178.0, 96.0, 55.0, 50.0, 24.0, 27.0, 10.0, 26.0, 10.0, 9.0, 9.0, 8.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.609375, -4.463623046875, -4.31787109375, -4.172119140625, -4.0263671875, -3.880615234375, -3.73486328125, -3.589111328125, -3.443359375, -3.297607421875, -3.15185546875, -3.006103515625, -2.8603515625, -2.714599609375, -2.56884765625, -2.423095703125, -2.27734375, -2.131591796875, -1.98583984375, -1.840087890625, -1.6943359375, -1.548583984375, -1.40283203125, -1.257080078125, -1.111328125, -0.965576171875, -0.81982421875, -0.674072265625, -0.5283203125, -0.382568359375, -0.23681640625, -0.091064453125, 0.0546875, 0.200439453125, 0.34619140625, 0.491943359375, 0.6376953125, 0.783447265625, 0.92919921875, 1.074951171875, 1.220703125, 1.366455078125, 1.51220703125, 1.657958984375, 1.8037109375, 1.949462890625, 2.09521484375, 2.240966796875, 2.38671875, 2.532470703125, 2.67822265625, 2.823974609375, 2.9697265625, 3.115478515625, 3.26123046875, 3.406982421875, 3.552734375, 3.698486328125, 3.84423828125, 3.989990234375, 4.1357421875, 4.281494140625, 4.42724609375, 4.572998046875, 4.71875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 4.0, 9.0, 19.0, 15.0, 20.0, 33.0, 51.0, 67.0, 68.0, 77.0, 100.0, 82.0, 89.0, 102.0, 65.0, 56.0, 47.0, 24.0, 20.0, 15.0, 18.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447021484375, -0.4301261901855469, -0.41323089599609375, -0.3963356018066406, -0.3794403076171875, -0.3625450134277344, -0.34564971923828125, -0.3287544250488281, -0.311859130859375, -0.2949638366699219, -0.27806854248046875, -0.2611732482910156, -0.2442779541015625, -0.22738265991210938, -0.21048736572265625, -0.19359207153320312, -0.17669677734375, -0.15980148315429688, -0.14290618896484375, -0.12601089477539062, -0.1091156005859375, -0.09222030639648438, -0.07532501220703125, -0.058429718017578125, -0.041534423828125, -0.024639129638671875, -0.00774383544921875, 0.009151458740234375, 0.0260467529296875, 0.042942047119140625, 0.05983734130859375, 0.07673263549804688, 0.0936279296875, 0.11052322387695312, 0.12741851806640625, 0.14431381225585938, 0.1612091064453125, 0.17810440063476562, 0.19499969482421875, 0.21189498901367188, 0.228790283203125, 0.24568557739257812, 0.26258087158203125, 0.2794761657714844, 0.2963714599609375, 0.3132667541503906, 0.33016204833984375, 0.3470573425292969, 0.36395263671875, 0.3808479309082031, 0.39774322509765625, 0.4146385192871094, 0.4315338134765625, 0.4484291076660156, 0.46532440185546875, 0.4822196960449219, 0.499114990234375, 0.5160102844238281, 0.5329055786132812, 0.5498008728027344, 0.5666961669921875, 0.5835914611816406, 0.6004867553710938, 0.6173820495605469, 0.63427734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 13.0, 17.0, 18.0, 25.0, 55.0, 92.0, 134.0, 233.0, 383.0, 758.0, 1512.0, 3327.0, 9038.0, 39792.0, 3343764.0, 749819.0, 31198.0, 7914.0, 3072.0, 1394.0, 703.0, 382.0, 229.0, 140.0, 97.0, 60.0, 37.0, 25.0, 9.0, 12.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.5750732421875, -3.478271484375, -3.3814697265625, -3.28466796875, -3.1878662109375, -3.091064453125, -2.9942626953125, -2.8974609375, -2.8006591796875, -2.703857421875, -2.6070556640625, -2.51025390625, -2.4134521484375, -2.316650390625, -2.2198486328125, -2.123046875, -2.0262451171875, -1.929443359375, -1.8326416015625, -1.73583984375, -1.6390380859375, -1.542236328125, -1.4454345703125, -1.3486328125, -1.2518310546875, -1.155029296875, -1.0582275390625, -0.96142578125, -0.8646240234375, -0.767822265625, -0.6710205078125, -0.57421875, -0.4774169921875, -0.380615234375, -0.2838134765625, -0.18701171875, -0.0902099609375, 0.006591796875, 0.1033935546875, 0.2001953125, 0.2969970703125, 0.393798828125, 0.4906005859375, 0.58740234375, 0.6842041015625, 0.781005859375, 0.8778076171875, 0.974609375, 1.0714111328125, 1.168212890625, 1.2650146484375, 1.36181640625, 1.4586181640625, 1.555419921875, 1.6522216796875, 1.7490234375, 1.8458251953125, 1.942626953125, 2.0394287109375, 2.13623046875, 2.2330322265625, 2.329833984375, 2.4266357421875, 2.5234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 20.0, 18.0, 27.0, 56.0, 118.0, 524.0, 2745.0, 307.0, 96.0, 48.0, 30.0, 17.0, 13.0, 8.0, 8.0, 6.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1408233642578125, -1.101959228515625, -1.0630950927734375, -1.02423095703125, -0.9853668212890625, -0.946502685546875, -0.9076385498046875, -0.8687744140625, -0.8299102783203125, -0.791046142578125, -0.7521820068359375, -0.71331787109375, -0.6744537353515625, -0.635589599609375, -0.5967254638671875, -0.557861328125, -0.5189971923828125, -0.480133056640625, -0.4412689208984375, -0.40240478515625, -0.3635406494140625, -0.324676513671875, -0.2858123779296875, -0.2469482421875, -0.2080841064453125, -0.169219970703125, -0.1303558349609375, -0.09149169921875, -0.0526275634765625, -0.013763427734375, 0.0251007080078125, 0.06396484375, 0.1028289794921875, 0.141693115234375, 0.1805572509765625, 0.21942138671875, 0.2582855224609375, 0.297149658203125, 0.3360137939453125, 0.3748779296875, 0.4137420654296875, 0.452606201171875, 0.4914703369140625, 0.53033447265625, 0.5691986083984375, 0.608062744140625, 0.6469268798828125, 0.685791015625, 0.7246551513671875, 0.763519287109375, 0.8023834228515625, 0.84124755859375, 0.8801116943359375, 0.918975830078125, 0.9578399658203125, 0.9967041015625, 1.0355682373046875, 1.074432373046875, 1.1132965087890625, 1.15216064453125, 1.1910247802734375, 1.229888916015625, 1.2687530517578125, 1.3076171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 9.0, 21.0, 35.0, 74.0, 131.0, 218.0, 223.0, 121.0, 71.0, 33.0, 21.0, 14.0, 12.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.330661773681641, -5.115939140319824, -4.901216506958008, -4.686493396759033, -4.471770763397217, -4.2570481300354, -4.042325019836426, -3.8276023864746094, -3.612879753112793, -3.3981571197509766, -3.183434247970581, -2.9687113761901855, -2.753988742828369, -2.5392661094665527, -2.3245432376861572, -2.1098203659057617, -1.8950977325439453, -1.6803749799728394, -1.4656522274017334, -1.2509294748306274, -1.0362067222595215, -0.8214839696884155, -0.6067612171173096, -0.3920384645462036, -0.17731571197509766, 0.0374070405960083, 0.25212979316711426, 0.4668525457382202, 0.6815752983093262, 0.8962980508804321, 1.111020803451538, 1.325743556022644, 1.54046630859375, 1.755189061164856, 1.969911813735962, 2.1846346855163574, 2.399357318878174, 2.6140799522399902, 2.8288028240203857, 3.0435256958007812, 3.2582483291625977, 3.472970962524414, 3.6876938343048096, 3.902416706085205, 4.1171393394470215, 4.331861972808838, 4.5465850830078125, 4.761307716369629, 4.976030349731445, 5.190752983093262, 5.405475616455078, 5.620198726654053, 5.834921360015869, 6.0496439933776855, 6.26436710357666, 6.479089736938477, 6.693812370300293, 6.908535003662109, 7.123257637023926, 7.3379807472229, 7.552703380584717, 7.767426013946533, 7.982149124145508, 8.196871757507324, 8.41159439086914]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 5.0, 10.0, 7.0, 10.0, 9.0, 7.0, 15.0, 12.0, 19.0, 22.0, 44.0, 35.0, 36.0, 43.0, 31.0, 47.0, 50.0, 52.0, 53.0, 51.0, 53.0, 52.0, 42.0, 39.0, 48.0, 23.0, 32.0, 21.0, 22.0, 25.0, 11.0, 12.0, 19.0, 5.0, 8.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.448403835296631, -2.3606741428375244, -2.272944450378418, -2.1852149963378906, -2.097485303878784, -2.0097556114196777, -1.9220259189605713, -1.8342962265014648, -1.746566653251648, -1.6588369607925415, -1.5711073875427246, -1.4833776950836182, -1.3956480026245117, -1.3079184293746948, -1.2201887369155884, -1.1324591636657715, -1.044729471206665, -0.9569998383522034, -0.8692702054977417, -0.7815405130386353, -0.6938108801841736, -0.6060812473297119, -0.5183515548706055, -0.4306219220161438, -0.34289228916168213, -0.25516265630722046, -0.1674329936504364, -0.07970333099365234, 0.008026301860809326, 0.095755934715271, 0.18348562717437744, 0.2712152600288391, 0.3589451313018799, 0.44667476415634155, 0.5344043970108032, 0.6221340894699097, 0.7098637223243713, 0.797593355178833, 0.8853230476379395, 0.9730526804924011, 1.0607823133468628, 1.1485120058059692, 1.2362415790557861, 1.3239712715148926, 1.411700963973999, 1.499430537223816, 1.5871602296829224, 1.6748898029327393, 1.7626194953918457, 1.8503491878509521, 1.938078761100769, 2.025808334350586, 2.1135380268096924, 2.201267719268799, 2.2889974117279053, 2.3767271041870117, 2.464456558227539, 2.5521862506866455, 2.639915943145752, 2.7276453971862793, 2.8153750896453857, 2.903104782104492, 2.9908344745635986, 3.078564167022705, 3.1662938594818115]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 11.0, 12.0, 19.0, 19.0, 22.0, 43.0, 61.0, 85.0, 170.0, 296.0, 540.0, 1234.0, 3015.0, 9783.0, 50418.0, 548556.0, 384013.0, 37128.0, 8178.0, 2621.0, 1059.0, 527.0, 262.0, 158.0, 96.0, 54.0, 37.0, 42.0, 18.0, 20.0, 13.0, 6.0, 8.0, 4.0, 2.0, 0.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.080078125, -2.977142333984375, -2.87420654296875, -2.771270751953125, -2.6683349609375, -2.565399169921875, -2.46246337890625, -2.359527587890625, -2.256591796875, -2.153656005859375, -2.05072021484375, -1.947784423828125, -1.8448486328125, -1.741912841796875, -1.63897705078125, -1.536041259765625, -1.43310546875, -1.330169677734375, -1.22723388671875, -1.124298095703125, -1.0213623046875, -0.918426513671875, -0.81549072265625, -0.712554931640625, -0.609619140625, -0.506683349609375, -0.40374755859375, -0.300811767578125, -0.1978759765625, -0.094940185546875, 0.00799560546875, 0.110931396484375, 0.2138671875, 0.316802978515625, 0.41973876953125, 0.522674560546875, 0.6256103515625, 0.728546142578125, 0.83148193359375, 0.934417724609375, 1.037353515625, 1.140289306640625, 1.24322509765625, 1.346160888671875, 1.4490966796875, 1.552032470703125, 1.65496826171875, 1.757904052734375, 1.86083984375, 1.963775634765625, 2.06671142578125, 2.169647216796875, 2.2725830078125, 2.375518798828125, 2.47845458984375, 2.581390380859375, 2.684326171875, 2.787261962890625, 2.89019775390625, 2.993133544921875, 3.0960693359375, 3.199005126953125, 3.30194091796875, 3.404876708984375, 3.5078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 9.0, 17.0, 28.0, 39.0, 39.0, 41.0, 60.0, 79.0, 82.0, 80.0, 89.0, 88.0, 77.0, 70.0, 58.0, 42.0, 29.0, 22.0, 8.0, 14.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.48040008544921875, -0.4627532958984375, -0.44510650634765625, -0.427459716796875, -0.40981292724609375, -0.3921661376953125, -0.37451934814453125, -0.35687255859375, -0.33922576904296875, -0.3215789794921875, -0.30393218994140625, -0.286285400390625, -0.26863861083984375, -0.2509918212890625, -0.23334503173828125, -0.2156982421875, -0.19805145263671875, -0.1804046630859375, -0.16275787353515625, -0.145111083984375, -0.12746429443359375, -0.1098175048828125, -0.09217071533203125, -0.07452392578125, -0.05687713623046875, -0.0392303466796875, -0.02158355712890625, -0.003936767578125, 0.01371002197265625, 0.0313568115234375, 0.04900360107421875, 0.066650390625, 0.08429718017578125, 0.1019439697265625, 0.11959075927734375, 0.137237548828125, 0.15488433837890625, 0.1725311279296875, 0.19017791748046875, 0.20782470703125, 0.22547149658203125, 0.2431182861328125, 0.26076507568359375, 0.278411865234375, 0.29605865478515625, 0.3137054443359375, 0.33135223388671875, 0.3489990234375, 0.36664581298828125, 0.3842926025390625, 0.40193939208984375, 0.419586181640625, 0.43723297119140625, 0.4548797607421875, 0.47252655029296875, 0.49017333984375, 0.5078201293945312, 0.5254669189453125, 0.5431137084960938, 0.560760498046875, 0.5784072875976562, 0.5960540771484375, 0.6137008666992188, 0.63134765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 5.0, 2.0, 6.0, 9.0, 12.0, 17.0, 19.0, 26.0, 47.0, 69.0, 130.0, 251.0, 400.0, 880.0, 1791.0, 4183.0, 11441.0, 38003.0, 164196.0, 537513.0, 217914.0, 48738.0, 13768.0, 4958.0, 2127.0, 944.0, 481.0, 213.0, 150.0, 77.0, 42.0, 42.0, 21.0, 15.0, 6.0, 16.0, 8.0, 3.0, 8.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.69140625, -1.6378631591796875, -1.584320068359375, -1.5307769775390625, -1.47723388671875, -1.4236907958984375, -1.370147705078125, -1.3166046142578125, -1.2630615234375, -1.2095184326171875, -1.155975341796875, -1.1024322509765625, -1.04888916015625, -0.9953460693359375, -0.941802978515625, -0.8882598876953125, -0.834716796875, -0.7811737060546875, -0.727630615234375, -0.6740875244140625, -0.62054443359375, -0.5670013427734375, -0.513458251953125, -0.4599151611328125, -0.4063720703125, -0.3528289794921875, -0.299285888671875, -0.2457427978515625, -0.19219970703125, -0.1386566162109375, -0.085113525390625, -0.0315704345703125, 0.02197265625, 0.0755157470703125, 0.129058837890625, 0.1826019287109375, 0.23614501953125, 0.2896881103515625, 0.343231201171875, 0.3967742919921875, 0.4503173828125, 0.5038604736328125, 0.557403564453125, 0.6109466552734375, 0.66448974609375, 0.7180328369140625, 0.771575927734375, 0.8251190185546875, 0.878662109375, 0.9322052001953125, 0.985748291015625, 1.0392913818359375, 1.09283447265625, 1.1463775634765625, 1.199920654296875, 1.2534637451171875, 1.3070068359375, 1.3605499267578125, 1.414093017578125, 1.4676361083984375, 1.52117919921875, 1.5747222900390625, 1.628265380859375, 1.6818084716796875, 1.7353515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 16.0, 7.0, 15.0, 20.0, 17.0, 13.0, 22.0, 22.0, 31.0, 27.0, 30.0, 40.0, 43.0, 39.0, 44.0, 51.0, 45.0, 42.0, 33.0, 43.0, 32.0, 45.0, 36.0, 30.0, 31.0, 22.0, 27.0, 24.0, 15.0, 22.0, 19.0, 17.0, 9.0, 9.0, 10.0, 12.0, 4.0, 5.0, 4.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.24609375, -1.2064361572265625, -1.166778564453125, -1.1271209716796875, -1.08746337890625, -1.0478057861328125, -1.008148193359375, -0.9684906005859375, -0.9288330078125, -0.8891754150390625, -0.849517822265625, -0.8098602294921875, -0.77020263671875, -0.7305450439453125, -0.690887451171875, -0.6512298583984375, -0.611572265625, -0.5719146728515625, -0.532257080078125, -0.4925994873046875, -0.45294189453125, -0.4132843017578125, -0.373626708984375, -0.3339691162109375, -0.2943115234375, -0.2546539306640625, -0.214996337890625, -0.1753387451171875, -0.13568115234375, -0.0960235595703125, -0.056365966796875, -0.0167083740234375, 0.02294921875, 0.0626068115234375, 0.102264404296875, 0.1419219970703125, 0.18157958984375, 0.2212371826171875, 0.260894775390625, 0.3005523681640625, 0.3402099609375, 0.3798675537109375, 0.419525146484375, 0.4591827392578125, 0.49884033203125, 0.5384979248046875, 0.578155517578125, 0.6178131103515625, 0.657470703125, 0.6971282958984375, 0.736785888671875, 0.7764434814453125, 0.81610107421875, 0.8557586669921875, 0.895416259765625, 0.9350738525390625, 0.9747314453125, 1.0143890380859375, 1.054046630859375, 1.0937042236328125, 1.13336181640625, 1.1730194091796875, 1.212677001953125, 1.2523345947265625, 1.2919921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 6.0, 10.0, 21.0, 25.0, 41.0, 65.0, 116.0, 237.0, 494.0, 1063.0, 2875.0, 9265.0, 42361.0, 347531.0, 556359.0, 68435.0, 13137.0, 3902.0, 1361.0, 558.0, 292.0, 139.0, 95.0, 44.0, 36.0, 17.0, 17.0, 8.0, 7.0, 6.0, 0.0, 3.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7158203125, -0.6942138671875, -0.672607421875, -0.6510009765625, -0.62939453125, -0.6077880859375, -0.586181640625, -0.5645751953125, -0.54296875, -0.5213623046875, -0.499755859375, -0.4781494140625, -0.45654296875, -0.4349365234375, -0.413330078125, -0.3917236328125, -0.3701171875, -0.3485107421875, -0.326904296875, -0.3052978515625, -0.28369140625, -0.2620849609375, -0.240478515625, -0.2188720703125, -0.197265625, -0.1756591796875, -0.154052734375, -0.1324462890625, -0.11083984375, -0.0892333984375, -0.067626953125, -0.0460205078125, -0.0244140625, -0.0028076171875, 0.018798828125, 0.0404052734375, 0.06201171875, 0.0836181640625, 0.105224609375, 0.1268310546875, 0.1484375, 0.1700439453125, 0.191650390625, 0.2132568359375, 0.23486328125, 0.2564697265625, 0.278076171875, 0.2996826171875, 0.3212890625, 0.3428955078125, 0.364501953125, 0.3861083984375, 0.40771484375, 0.4293212890625, 0.450927734375, 0.4725341796875, 0.494140625, 0.5157470703125, 0.537353515625, 0.5589599609375, 0.58056640625, 0.6021728515625, 0.623779296875, 0.6453857421875, 0.6669921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 2.0, 7.0, 10.0, 5.0, 14.0, 27.0, 30.0, 42.0, 86.0, 128.0, 171.0, 146.0, 114.0, 73.0, 33.0, 24.0, 25.0, 9.0, 12.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001500844955444336, -0.00014537759125232697, -0.00014067068696022034, -0.0001359637826681137, -0.00013125687837600708, -0.00012654997408390045, -0.00012184306979179382, -0.0001171361654996872, -0.00011242926120758057, -0.00010772235691547394, -0.00010301545262336731, -9.830854833126068e-05, -9.360164403915405e-05, -8.889473974704742e-05, -8.41878354549408e-05, -7.948093116283417e-05, -7.477402687072754e-05, -7.006712257862091e-05, -6.536021828651428e-05, -6.0653313994407654e-05, -5.5946409702301025e-05, -5.12395054101944e-05, -4.653260111808777e-05, -4.182569682598114e-05, -3.711879253387451e-05, -3.241188824176788e-05, -2.7704983949661255e-05, -2.2998079657554626e-05, -1.8291175365447998e-05, -1.358427107334137e-05, -8.877366781234741e-06, -4.170462489128113e-06, 5.364418029785156e-07, 5.243346095085144e-06, 9.950250387191772e-06, 1.4657154679298401e-05, 1.936405897140503e-05, 2.4070963263511658e-05, 2.8777867555618286e-05, 3.3484771847724915e-05, 3.819167613983154e-05, 4.289858043193817e-05, 4.76054847240448e-05, 5.231238901615143e-05, 5.701929330825806e-05, 6.172619760036469e-05, 6.643310189247131e-05, 7.114000618457794e-05, 7.584691047668457e-05, 8.05538147687912e-05, 8.526071906089783e-05, 8.996762335300446e-05, 9.467452764511108e-05, 9.938143193721771e-05, 0.00010408833622932434, 0.00010879524052143097, 0.0001135021448135376, 0.00011820904910564423, 0.00012291595339775085, 0.00012762285768985748, 0.0001323297619819641, 0.00013703666627407074, 0.00014174357056617737, 0.000146450474858284, 0.00015115737915039062]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 10.0, 10.0, 14.0, 16.0, 30.0, 44.0, 59.0, 116.0, 205.0, 405.0, 941.0, 2590.0, 9051.0, 46025.0, 494516.0, 440027.0, 41778.0, 8391.0, 2452.0, 947.0, 404.0, 213.0, 111.0, 68.0, 37.0, 31.0, 13.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.654815673828125, -0.63140869140625, -0.608001708984375, -0.5845947265625, -0.561187744140625, -0.53778076171875, -0.514373779296875, -0.490966796875, -0.467559814453125, -0.44415283203125, -0.420745849609375, -0.3973388671875, -0.373931884765625, -0.35052490234375, -0.327117919921875, -0.3037109375, -0.280303955078125, -0.25689697265625, -0.233489990234375, -0.2100830078125, -0.186676025390625, -0.16326904296875, -0.139862060546875, -0.116455078125, -0.093048095703125, -0.06964111328125, -0.046234130859375, -0.0228271484375, 0.000579833984375, 0.02398681640625, 0.047393798828125, 0.07080078125, 0.094207763671875, 0.11761474609375, 0.141021728515625, 0.1644287109375, 0.187835693359375, 0.21124267578125, 0.234649658203125, 0.258056640625, 0.281463623046875, 0.30487060546875, 0.328277587890625, 0.3516845703125, 0.375091552734375, 0.39849853515625, 0.421905517578125, 0.4453125, 0.468719482421875, 0.49212646484375, 0.515533447265625, 0.5389404296875, 0.562347412109375, 0.58575439453125, 0.609161376953125, 0.632568359375, 0.655975341796875, 0.67938232421875, 0.702789306640625, 0.7261962890625, 0.749603271484375, 0.77301025390625, 0.796417236328125, 0.81982421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 8.0, 6.0, 6.0, 10.0, 11.0, 13.0, 8.0, 30.0, 22.0, 37.0, 68.0, 93.0, 98.0, 117.0, 82.0, 96.0, 85.0, 55.0, 36.0, 28.0, 25.0, 15.0, 8.0, 15.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487548828125, -0.47306060791015625, -0.4585723876953125, -0.44408416748046875, -0.429595947265625, -0.41510772705078125, -0.4006195068359375, -0.38613128662109375, -0.37164306640625, -0.35715484619140625, -0.3426666259765625, -0.32817840576171875, -0.313690185546875, -0.29920196533203125, -0.2847137451171875, -0.27022552490234375, -0.2557373046875, -0.24124908447265625, -0.2267608642578125, -0.21227264404296875, -0.197784423828125, -0.18329620361328125, -0.1688079833984375, -0.15431976318359375, -0.13983154296875, -0.12534332275390625, -0.1108551025390625, -0.09636688232421875, -0.081878662109375, -0.06739044189453125, -0.0529022216796875, -0.03841400146484375, -0.02392578125, -0.00943756103515625, 0.0050506591796875, 0.01953887939453125, 0.034027099609375, 0.04851531982421875, 0.0630035400390625, 0.07749176025390625, 0.09197998046875, 0.10646820068359375, 0.1209564208984375, 0.13544464111328125, 0.149932861328125, 0.16442108154296875, 0.1789093017578125, 0.19339752197265625, 0.2078857421875, 0.22237396240234375, 0.2368621826171875, 0.25135040283203125, 0.265838623046875, 0.28032684326171875, 0.2948150634765625, 0.30930328369140625, 0.32379150390625, 0.33827972412109375, 0.3527679443359375, 0.36725616455078125, 0.381744384765625, 0.39623260498046875, 0.4107208251953125, 0.42520904541015625, 0.439697265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 15.0, 16.0, 33.0, 54.0, 99.0, 140.0, 179.0, 183.0, 117.0, 70.0, 52.0, 23.0, 14.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.855772018432617, -15.42529582977295, -14.994818687438965, -14.564342498779297, -14.133865356445312, -13.703389167785645, -13.27291202545166, -12.842435836791992, -12.411958694458008, -11.98148250579834, -11.551005363464355, -11.120529174804688, -10.690052032470703, -10.259575843811035, -9.82909870147705, -9.398622512817383, -8.968145370483398, -8.53766918182373, -8.107192039489746, -7.67671537399292, -7.246238708496094, -6.815762519836426, -6.385285377502441, -5.954809188842773, -5.5243330001831055, -5.093856334686279, -4.663379669189453, -4.232903003692627, -3.802426338195801, -3.3719499111175537, -2.9414732456207275, -2.5109965801239014, -2.080519676208496, -1.65004301071167, -1.2195663452148438, -0.7890897989273071, -0.35861313343048096, 0.07186341285705566, 0.5023400783538818, 0.932816743850708, 1.3632934093475342, 1.7937700748443604, 2.2242467403411865, 2.6547231674194336, 3.0851998329162598, 3.515676498413086, 3.946153163909912, 4.376629829406738, 4.8071064949035645, 5.237583160400391, 5.668059825897217, 6.098536491394043, 6.529013156890869, 6.959489822387695, 7.389966011047363, 7.820443153381348, 8.250919342041016, 8.681395530700684, 9.111872673034668, 9.542348861694336, 9.97282600402832, 10.403302192687988, 10.833779335021973, 11.26425552368164, 11.694732666015625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 1.0, 2.0, 6.0, 4.0, 12.0, 9.0, 9.0, 15.0, 13.0, 14.0, 20.0, 23.0, 19.0, 30.0, 26.0, 34.0, 36.0, 37.0, 45.0, 44.0, 56.0, 38.0, 51.0, 40.0, 39.0, 42.0, 43.0, 41.0, 40.0, 33.0, 27.0, 20.0, 34.0, 19.0, 14.0, 14.0, 14.0, 7.0, 6.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.959950923919678, -5.761819362640381, -5.563688278198242, -5.365556716918945, -5.167425155639648, -4.969293594360352, -4.771162509918213, -4.573030948638916, -4.374899864196777, -4.1767683029174805, -3.9786369800567627, -3.780505657196045, -3.582374095916748, -3.3842427730560303, -3.1861114501953125, -2.9879798889160156, -2.7898483276367188, -2.591717004776001, -2.393585443496704, -2.1954541206359863, -1.997322678565979, -1.7991912364959717, -1.601059913635254, -1.4029284715652466, -1.2047970294952393, -1.006665587425232, -0.8085342049598694, -0.6104028224945068, -0.4122713804244995, -0.2141399383544922, -0.016008615493774414, 0.1821228265762329, 0.38025474548339844, 0.5783861875534058, 0.7765175700187683, 0.9746489524841309, 1.1727803945541382, 1.3709118366241455, 1.5690431594848633, 1.7671746015548706, 1.965306043624878, 2.1634373664855957, 2.3615689277648926, 2.5597002506256104, 2.757831573486328, 2.955963134765625, 3.1540944576263428, 3.3522257804870605, 3.5503573417663574, 3.748488664627075, 3.946620225906372, 4.14475154876709, 4.342883110046387, 4.541014671325684, 4.739145755767822, 4.937277317047119, 5.135408401489258, 5.333539962768555, 5.531671047210693, 5.72980260848999, 5.927934169769287, 6.126065254211426, 6.324196815490723, 6.5223283767700195, 6.720459938049316]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 10.0, 17.0, 19.0, 13.0, 29.0, 60.0, 77.0, 160.0, 292.0, 633.0, 1548.0, 4461.0, 16604.0, 187481.0, 3927645.0, 42074.0, 8124.0, 2648.0, 1094.0, 527.0, 287.0, 148.0, 90.0, 51.0, 40.0, 28.0, 35.0, 19.0, 11.0, 10.0, 4.0, 7.0, 4.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.375, -4.2393798828125, -4.103759765625, -3.9681396484375, -3.83251953125, -3.6968994140625, -3.561279296875, -3.4256591796875, -3.2900390625, -3.1544189453125, -3.018798828125, -2.8831787109375, -2.74755859375, -2.6119384765625, -2.476318359375, -2.3406982421875, -2.205078125, -2.0694580078125, -1.933837890625, -1.7982177734375, -1.66259765625, -1.5269775390625, -1.391357421875, -1.2557373046875, -1.1201171875, -0.9844970703125, -0.848876953125, -0.7132568359375, -0.57763671875, -0.4420166015625, -0.306396484375, -0.1707763671875, -0.03515625, 0.1004638671875, 0.236083984375, 0.3717041015625, 0.50732421875, 0.6429443359375, 0.778564453125, 0.9141845703125, 1.0498046875, 1.1854248046875, 1.321044921875, 1.4566650390625, 1.59228515625, 1.7279052734375, 1.863525390625, 1.9991455078125, 2.134765625, 2.2703857421875, 2.406005859375, 2.5416259765625, 2.67724609375, 2.8128662109375, 2.948486328125, 3.0841064453125, 3.2197265625, 3.3553466796875, 3.490966796875, 3.6265869140625, 3.76220703125, 3.8978271484375, 4.033447265625, 4.1690673828125, 4.3046875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 15.0, 32.0, 23.0, 45.0, 63.0, 65.0, 68.0, 82.0, 83.0, 74.0, 87.0, 84.0, 60.0, 58.0, 37.0, 28.0, 23.0, 16.0, 13.0, 7.0, 4.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5078125, -0.49040985107421875, -0.4730072021484375, -0.45560455322265625, -0.438201904296875, -0.42079925537109375, -0.4033966064453125, -0.38599395751953125, -0.36859130859375, -0.35118865966796875, -0.3337860107421875, -0.31638336181640625, -0.298980712890625, -0.28157806396484375, -0.2641754150390625, -0.24677276611328125, -0.2293701171875, -0.21196746826171875, -0.1945648193359375, -0.17716217041015625, -0.159759521484375, -0.14235687255859375, -0.1249542236328125, -0.10755157470703125, -0.09014892578125, -0.07274627685546875, -0.0553436279296875, -0.03794097900390625, -0.020538330078125, -0.00313568115234375, 0.0142669677734375, 0.03166961669921875, 0.049072265625, 0.06647491455078125, 0.0838775634765625, 0.10128021240234375, 0.118682861328125, 0.13608551025390625, 0.1534881591796875, 0.17089080810546875, 0.18829345703125, 0.20569610595703125, 0.2230987548828125, 0.24050140380859375, 0.257904052734375, 0.27530670166015625, 0.2927093505859375, 0.31011199951171875, 0.3275146484375, 0.34491729736328125, 0.3623199462890625, 0.37972259521484375, 0.397125244140625, 0.41452789306640625, 0.4319305419921875, 0.44933319091796875, 0.46673583984375, 0.48413848876953125, 0.5015411376953125, 0.5189437866210938, 0.536346435546875, 0.5537490844726562, 0.5711517333984375, 0.5885543823242188, 0.60595703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 9.0, 17.0, 21.0, 41.0, 64.0, 84.0, 147.0, 245.0, 403.0, 645.0, 1226.0, 2224.0, 4301.0, 9600.0, 24731.0, 98217.0, 3522723.0, 448675.0, 51024.0, 16115.0, 6707.0, 3149.0, 1653.0, 901.0, 534.0, 292.0, 191.0, 124.0, 72.0, 48.0, 31.0, 35.0, 12.0, 6.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.72265625, -2.6506195068359375, -2.578582763671875, -2.5065460205078125, -2.43450927734375, -2.3624725341796875, -2.290435791015625, -2.2183990478515625, -2.1463623046875, -2.0743255615234375, -2.002288818359375, -1.9302520751953125, -1.85821533203125, -1.7861785888671875, -1.714141845703125, -1.6421051025390625, -1.570068359375, -1.4980316162109375, -1.425994873046875, -1.3539581298828125, -1.28192138671875, -1.2098846435546875, -1.137847900390625, -1.0658111572265625, -0.9937744140625, -0.9217376708984375, -0.849700927734375, -0.7776641845703125, -0.70562744140625, -0.6335906982421875, -0.561553955078125, -0.4895172119140625, -0.41748046875, -0.3454437255859375, -0.273406982421875, -0.2013702392578125, -0.12933349609375, -0.0572967529296875, 0.014739990234375, 0.0867767333984375, 0.1588134765625, 0.2308502197265625, 0.302886962890625, 0.3749237060546875, 0.44696044921875, 0.5189971923828125, 0.591033935546875, 0.6630706787109375, 0.735107421875, 0.8071441650390625, 0.879180908203125, 0.9512176513671875, 1.02325439453125, 1.0952911376953125, 1.167327880859375, 1.2393646240234375, 1.3114013671875, 1.3834381103515625, 1.455474853515625, 1.5275115966796875, 1.59954833984375, 1.6715850830078125, 1.743621826171875, 1.8156585693359375, 1.8876953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 2.0, 6.0, 6.0, 12.0, 7.0, 19.0, 22.0, 30.0, 59.0, 62.0, 123.0, 341.0, 2366.0, 577.0, 174.0, 92.0, 44.0, 35.0, 21.0, 14.0, 10.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0146484375, -0.9853744506835938, -0.9561004638671875, -0.9268264770507812, -0.897552490234375, -0.8682785034179688, -0.8390045166015625, -0.8097305297851562, -0.78045654296875, -0.7511825561523438, -0.7219085693359375, -0.6926345825195312, -0.663360595703125, -0.6340866088867188, -0.6048126220703125, -0.5755386352539062, -0.5462646484375, -0.5169906616210938, -0.4877166748046875, -0.45844268798828125, -0.429168701171875, -0.39989471435546875, -0.3706207275390625, -0.34134674072265625, -0.31207275390625, -0.28279876708984375, -0.2535247802734375, -0.22425079345703125, -0.194976806640625, -0.16570281982421875, -0.1364288330078125, -0.10715484619140625, -0.077880859375, -0.04860687255859375, -0.0193328857421875, 0.00994110107421875, 0.039215087890625, 0.06848907470703125, 0.0977630615234375, 0.12703704833984375, 0.15631103515625, 0.18558502197265625, 0.2148590087890625, 0.24413299560546875, 0.273406982421875, 0.30268096923828125, 0.3319549560546875, 0.36122894287109375, 0.3905029296875, 0.41977691650390625, 0.4490509033203125, 0.47832489013671875, 0.507598876953125, 0.5368728637695312, 0.5661468505859375, 0.5954208374023438, 0.62469482421875, 0.6539688110351562, 0.6832427978515625, 0.7125167846679688, 0.741790771484375, 0.7710647583007812, 0.8003387451171875, 0.8296127319335938, 0.85888671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 2.0, 13.0, 20.0, 82.0, 165.0, 305.0, 260.0, 85.0, 44.0, 16.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4218854904174805, -6.096843242645264, -5.771800994873047, -5.44675874710083, -5.121716499328613, -4.7966742515563965, -4.47163200378418, -4.146589756011963, -3.821547508239746, -3.4965052604675293, -3.1714630126953125, -2.8464207649230957, -2.521378517150879, -2.196336269378662, -1.8712940216064453, -1.5462517738342285, -1.2212095260620117, -0.8961672782897949, -0.5711250305175781, -0.24608278274536133, 0.07895946502685547, 0.40400171279907227, 0.7290439605712891, 1.0540862083435059, 1.3791284561157227, 1.7041707038879395, 2.0292129516601562, 2.354255199432373, 2.67929744720459, 3.0043396949768066, 3.3293819427490234, 3.6544241905212402, 3.9794654846191406, 4.304507732391357, 4.629549980163574, 4.954592227935791, 5.279634475708008, 5.604676723480225, 5.929718971252441, 6.254761219024658, 6.579803466796875, 6.904845714569092, 7.229887962341309, 7.554930210113525, 7.879972457885742, 8.205015182495117, 8.530056953430176, 8.855098724365234, 9.18014144897461, 9.505184173583984, 9.830225944519043, 10.155267715454102, 10.480310440063477, 10.805353164672852, 11.13039493560791, 11.455436706542969, 11.780479431152344, 12.105522155761719, 12.430563926696777, 12.755605697631836, 13.080648422241211, 13.405691146850586, 13.730732917785645, 14.055774688720703, 14.380817413330078]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 8.0, 9.0, 6.0, 8.0, 19.0, 18.0, 21.0, 18.0, 25.0, 32.0, 20.0, 41.0, 25.0, 44.0, 35.0, 34.0, 39.0, 39.0, 50.0, 45.0, 46.0, 35.0, 53.0, 45.0, 31.0, 27.0, 30.0, 36.0, 17.0, 28.0, 16.0, 14.0, 11.0, 17.0, 16.0, 6.0, 10.0, 8.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.838697671890259, -2.761110782623291, -2.6835241317749023, -2.6059372425079346, -2.528350591659546, -2.450763702392578, -2.3731770515441895, -2.2955901622772217, -2.218003273010254, -2.140416383743286, -2.0628297328948975, -1.9852429628372192, -1.907656192779541, -1.8300693035125732, -1.752482533454895, -1.6748957633972168, -1.5973091125488281, -1.51972234249115, -1.4421355724334717, -1.3645488023757935, -1.2869620323181152, -1.2093751430511475, -1.1317883729934692, -1.054201602935791, -0.9766148328781128, -0.8990280628204346, -0.8214412927627563, -0.7438544631004333, -0.6662676930427551, -0.5886809229850769, -0.5110940933227539, -0.4335073232650757, -0.35592055320739746, -0.27833378314971924, -0.20074698328971863, -0.12316019833087921, -0.045573413372039795, 0.03201335668563843, 0.10960015654563904, 0.18718695640563965, 0.26477372646331787, 0.3423604965209961, 0.4199472963809967, 0.4975340962409973, 0.5751208662986755, 0.6527076363563538, 0.7302944660186768, 0.807881236076355, 0.8854680061340332, 0.9630547761917114, 1.0406415462493896, 1.1182283163070679, 1.195815086364746, 1.2734019756317139, 1.350988745689392, 1.4285755157470703, 1.5061622858047485, 1.5837490558624268, 1.661335825920105, 1.7389225959777832, 1.816509485244751, 1.8940961360931396, 1.9716830253601074, 2.049269676208496, 2.126856565475464]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 11.0, 33.0, 49.0, 44.0, 88.0, 104.0, 167.0, 263.0, 445.0, 805.0, 1630.0, 3900.0, 11052.0, 43049.0, 229758.0, 566465.0, 146725.0, 29580.0, 8113.0, 3093.0, 1405.0, 685.0, 382.0, 244.0, 148.0, 92.0, 58.0, 50.0, 32.0, 21.0, 13.0, 12.0, 4.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.844451904296875, -2.75921630859375, -2.673980712890625, -2.5887451171875, -2.503509521484375, -2.41827392578125, -2.333038330078125, -2.247802734375, -2.162567138671875, -2.07733154296875, -1.992095947265625, -1.9068603515625, -1.821624755859375, -1.73638916015625, -1.651153564453125, -1.56591796875, -1.480682373046875, -1.39544677734375, -1.310211181640625, -1.2249755859375, -1.139739990234375, -1.05450439453125, -0.969268798828125, -0.884033203125, -0.798797607421875, -0.71356201171875, -0.628326416015625, -0.5430908203125, -0.457855224609375, -0.37261962890625, -0.287384033203125, -0.2021484375, -0.116912841796875, -0.03167724609375, 0.053558349609375, 0.1387939453125, 0.224029541015625, 0.30926513671875, 0.394500732421875, 0.479736328125, 0.564971923828125, 0.65020751953125, 0.735443115234375, 0.8206787109375, 0.905914306640625, 0.99114990234375, 1.076385498046875, 1.16162109375, 1.246856689453125, 1.33209228515625, 1.417327880859375, 1.5025634765625, 1.587799072265625, 1.67303466796875, 1.758270263671875, 1.843505859375, 1.928741455078125, 2.01397705078125, 2.099212646484375, 2.1844482421875, 2.269683837890625, 2.35491943359375, 2.440155029296875, 2.525390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 12.0, 9.0, 9.0, 20.0, 28.0, 36.0, 51.0, 51.0, 64.0, 58.0, 67.0, 89.0, 79.0, 64.0, 65.0, 55.0, 57.0, 48.0, 32.0, 24.0, 19.0, 22.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5283203125, -0.51129150390625, -0.4942626953125, -0.47723388671875, -0.460205078125, -0.44317626953125, -0.4261474609375, -0.40911865234375, -0.39208984375, -0.37506103515625, -0.3580322265625, -0.34100341796875, -0.323974609375, -0.30694580078125, -0.2899169921875, -0.27288818359375, -0.255859375, -0.23883056640625, -0.2218017578125, -0.20477294921875, -0.187744140625, -0.17071533203125, -0.1536865234375, -0.13665771484375, -0.11962890625, -0.10260009765625, -0.0855712890625, -0.06854248046875, -0.051513671875, -0.03448486328125, -0.0174560546875, -0.00042724609375, 0.0166015625, 0.03363037109375, 0.0506591796875, 0.06768798828125, 0.084716796875, 0.10174560546875, 0.1187744140625, 0.13580322265625, 0.15283203125, 0.16986083984375, 0.1868896484375, 0.20391845703125, 0.220947265625, 0.23797607421875, 0.2550048828125, 0.27203369140625, 0.2890625, 0.30609130859375, 0.3231201171875, 0.34014892578125, 0.357177734375, 0.37420654296875, 0.3912353515625, 0.40826416015625, 0.42529296875, 0.44232177734375, 0.4593505859375, 0.47637939453125, 0.493408203125, 0.51043701171875, 0.5274658203125, 0.54449462890625, 0.5615234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 9.0, 20.0, 21.0, 27.0, 31.0, 48.0, 92.0, 122.0, 197.0, 238.0, 428.0, 667.0, 1175.0, 2054.0, 3973.0, 8227.0, 18135.0, 42032.0, 107004.0, 266111.0, 335961.0, 154835.0, 60106.0, 24725.0, 10814.0, 5128.0, 2685.0, 1375.0, 847.0, 490.0, 312.0, 199.0, 137.0, 78.0, 61.0, 51.0, 30.0, 22.0, 15.0, 14.0, 9.0, 11.0, 9.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1434478759765625, -1.104278564453125, -1.0651092529296875, -1.02593994140625, -0.9867706298828125, -0.947601318359375, -0.9084320068359375, -0.8692626953125, -0.8300933837890625, -0.790924072265625, -0.7517547607421875, -0.71258544921875, -0.6734161376953125, -0.634246826171875, -0.5950775146484375, -0.555908203125, -0.5167388916015625, -0.477569580078125, -0.4384002685546875, -0.39923095703125, -0.3600616455078125, -0.320892333984375, -0.2817230224609375, -0.2425537109375, -0.2033843994140625, -0.164215087890625, -0.1250457763671875, -0.08587646484375, -0.0467071533203125, -0.007537841796875, 0.0316314697265625, 0.07080078125, 0.1099700927734375, 0.149139404296875, 0.1883087158203125, 0.22747802734375, 0.2666473388671875, 0.305816650390625, 0.3449859619140625, 0.3841552734375, 0.4233245849609375, 0.462493896484375, 0.5016632080078125, 0.54083251953125, 0.5800018310546875, 0.619171142578125, 0.6583404541015625, 0.697509765625, 0.7366790771484375, 0.775848388671875, 0.8150177001953125, 0.85418701171875, 0.8933563232421875, 0.932525634765625, 0.9716949462890625, 1.0108642578125, 1.0500335693359375, 1.089202880859375, 1.1283721923828125, 1.16754150390625, 1.2067108154296875, 1.245880126953125, 1.2850494384765625, 1.32421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 11.0, 12.0, 12.0, 13.0, 18.0, 25.0, 16.0, 27.0, 30.0, 30.0, 37.0, 42.0, 37.0, 47.0, 50.0, 57.0, 38.0, 56.0, 52.0, 46.0, 44.0, 47.0, 31.0, 30.0, 26.0, 17.0, 24.0, 19.0, 20.0, 24.0, 16.0, 12.0, 6.0, 2.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6351470947265625, -1.579864501953125, -1.5245819091796875, -1.46929931640625, -1.4140167236328125, -1.358734130859375, -1.3034515380859375, -1.2481689453125, -1.1928863525390625, -1.137603759765625, -1.0823211669921875, -1.02703857421875, -0.9717559814453125, -0.916473388671875, -0.8611907958984375, -0.805908203125, -0.7506256103515625, -0.695343017578125, -0.6400604248046875, -0.58477783203125, -0.5294952392578125, -0.474212646484375, -0.4189300537109375, -0.3636474609375, -0.3083648681640625, -0.253082275390625, -0.1977996826171875, -0.14251708984375, -0.0872344970703125, -0.031951904296875, 0.0233306884765625, 0.07861328125, 0.1338958740234375, 0.189178466796875, 0.2444610595703125, 0.29974365234375, 0.3550262451171875, 0.410308837890625, 0.4655914306640625, 0.5208740234375, 0.5761566162109375, 0.631439208984375, 0.6867218017578125, 0.74200439453125, 0.7972869873046875, 0.852569580078125, 0.9078521728515625, 0.963134765625, 1.0184173583984375, 1.073699951171875, 1.1289825439453125, 1.18426513671875, 1.2395477294921875, 1.294830322265625, 1.3501129150390625, 1.4053955078125, 1.4606781005859375, 1.515960693359375, 1.5712432861328125, 1.62652587890625, 1.6818084716796875, 1.737091064453125, 1.7923736572265625, 1.84765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 7.0, 11.0, 10.0, 20.0, 35.0, 68.0, 101.0, 174.0, 265.0, 495.0, 956.0, 1999.0, 5078.0, 17794.0, 106133.0, 694279.0, 183555.0, 26045.0, 6649.0, 2360.0, 1136.0, 555.0, 337.0, 185.0, 102.0, 67.0, 45.0, 35.0, 21.0, 10.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.23828125, -1.2044677734375, -1.170654296875, -1.1368408203125, -1.10302734375, -1.0692138671875, -1.035400390625, -1.0015869140625, -0.9677734375, -0.9339599609375, -0.900146484375, -0.8663330078125, -0.83251953125, -0.7987060546875, -0.764892578125, -0.7310791015625, -0.697265625, -0.6634521484375, -0.629638671875, -0.5958251953125, -0.56201171875, -0.5281982421875, -0.494384765625, -0.4605712890625, -0.4267578125, -0.3929443359375, -0.359130859375, -0.3253173828125, -0.29150390625, -0.2576904296875, -0.223876953125, -0.1900634765625, -0.15625, -0.1224365234375, -0.088623046875, -0.0548095703125, -0.02099609375, 0.0128173828125, 0.046630859375, 0.0804443359375, 0.1142578125, 0.1480712890625, 0.181884765625, 0.2156982421875, 0.24951171875, 0.2833251953125, 0.317138671875, 0.3509521484375, 0.384765625, 0.4185791015625, 0.452392578125, 0.4862060546875, 0.52001953125, 0.5538330078125, 0.587646484375, 0.6214599609375, 0.6552734375, 0.6890869140625, 0.722900390625, 0.7567138671875, 0.79052734375, 0.8243408203125, 0.858154296875, 0.8919677734375, 0.92578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 15.0, 16.0, 31.0, 32.0, 37.0, 50.0, 79.0, 93.0, 115.0, 122.0, 83.0, 81.0, 50.0, 41.0, 32.0, 23.0, 22.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011920928955078125, -0.000115223228931427, -0.00011123716831207275, -0.0001072511076927185, -0.00010326504707336426, -9.927898645401001e-05, -9.529292583465576e-05, -9.130686521530151e-05, -8.732080459594727e-05, -8.333474397659302e-05, -7.934868335723877e-05, -7.536262273788452e-05, -7.137656211853027e-05, -6.739050149917603e-05, -6.340444087982178e-05, -5.941838026046753e-05, -5.543231964111328e-05, -5.144625902175903e-05, -4.7460198402404785e-05, -4.347413778305054e-05, -3.948807716369629e-05, -3.550201654434204e-05, -3.151595592498779e-05, -2.7529895305633545e-05, -2.3543834686279297e-05, -1.955777406692505e-05, -1.55717134475708e-05, -1.1585652828216553e-05, -7.599592208862305e-06, -3.6135315895080566e-06, 3.725290298461914e-07, 4.3585896492004395e-06, 8.344650268554688e-06, 1.2330710887908936e-05, 1.6316771507263184e-05, 2.030283212661743e-05, 2.428889274597168e-05, 2.8274953365325928e-05, 3.2261013984680176e-05, 3.6247074604034424e-05, 4.023313522338867e-05, 4.421919584274292e-05, 4.820525646209717e-05, 5.2191317081451416e-05, 5.6177377700805664e-05, 6.016343832015991e-05, 6.414949893951416e-05, 6.813555955886841e-05, 7.212162017822266e-05, 7.61076807975769e-05, 8.009374141693115e-05, 8.40798020362854e-05, 8.806586265563965e-05, 9.20519232749939e-05, 9.603798389434814e-05, 0.00010002404451370239, 0.00010401010513305664, 0.00010799616575241089, 0.00011198222637176514, 0.00011596828699111938, 0.00011995434761047363, 0.00012394040822982788, 0.00012792646884918213, 0.00013191252946853638, 0.00013589859008789062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 11.0, 20.0, 22.0, 34.0, 50.0, 82.0, 155.0, 208.0, 462.0, 1000.0, 2785.0, 10472.0, 65227.0, 735368.0, 204023.0, 20978.0, 4669.0, 1549.0, 655.0, 297.0, 166.0, 89.0, 64.0, 47.0, 32.0, 17.0, 14.0, 7.0, 5.0, 6.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.72265625, -1.6744232177734375, -1.626190185546875, -1.5779571533203125, -1.52972412109375, -1.4814910888671875, -1.433258056640625, -1.3850250244140625, -1.3367919921875, -1.2885589599609375, -1.240325927734375, -1.1920928955078125, -1.14385986328125, -1.0956268310546875, -1.047393798828125, -0.9991607666015625, -0.950927734375, -0.9026947021484375, -0.854461669921875, -0.8062286376953125, -0.75799560546875, -0.7097625732421875, -0.661529541015625, -0.6132965087890625, -0.5650634765625, -0.5168304443359375, -0.468597412109375, -0.4203643798828125, -0.37213134765625, -0.3238983154296875, -0.275665283203125, -0.2274322509765625, -0.17919921875, -0.1309661865234375, -0.082733154296875, -0.0345001220703125, 0.01373291015625, 0.0619659423828125, 0.110198974609375, 0.1584320068359375, 0.2066650390625, 0.2548980712890625, 0.303131103515625, 0.3513641357421875, 0.39959716796875, 0.4478302001953125, 0.496063232421875, 0.5442962646484375, 0.592529296875, 0.6407623291015625, 0.688995361328125, 0.7372283935546875, 0.78546142578125, 0.8336944580078125, 0.881927490234375, 0.9301605224609375, 0.9783935546875, 1.0266265869140625, 1.074859619140625, 1.1230926513671875, 1.17132568359375, 1.2195587158203125, 1.267791748046875, 1.3160247802734375, 1.3642578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 3.0, 10.0, 14.0, 12.0, 11.0, 29.0, 32.0, 64.0, 69.0, 134.0, 116.0, 138.0, 106.0, 66.0, 53.0, 40.0, 19.0, 22.0, 18.0, 10.0, 5.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.7579193115234375, -0.721893310546875, -0.6858673095703125, -0.64984130859375, -0.6138153076171875, -0.577789306640625, -0.5417633056640625, -0.5057373046875, -0.4697113037109375, -0.433685302734375, -0.3976593017578125, -0.36163330078125, -0.3256072998046875, -0.289581298828125, -0.2535552978515625, -0.217529296875, -0.1815032958984375, -0.145477294921875, -0.1094512939453125, -0.07342529296875, -0.0373992919921875, -0.001373291015625, 0.0346527099609375, 0.0706787109375, 0.1067047119140625, 0.142730712890625, 0.1787567138671875, 0.21478271484375, 0.2508087158203125, 0.286834716796875, 0.3228607177734375, 0.35888671875, 0.3949127197265625, 0.430938720703125, 0.4669647216796875, 0.50299072265625, 0.5390167236328125, 0.575042724609375, 0.6110687255859375, 0.6470947265625, 0.6831207275390625, 0.719146728515625, 0.7551727294921875, 0.79119873046875, 0.8272247314453125, 0.863250732421875, 0.8992767333984375, 0.935302734375, 0.9713287353515625, 1.007354736328125, 1.0433807373046875, 1.07940673828125, 1.1154327392578125, 1.151458740234375, 1.1874847412109375, 1.2235107421875, 1.2595367431640625, 1.295562744140625, 1.3315887451171875, 1.36761474609375, 1.4036407470703125, 1.439666748046875, 1.4756927490234375, 1.51171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 13.0, 41.0, 73.0, 171.0, 248.0, 202.0, 123.0, 67.0, 28.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.453231811523438, -12.651277542114258, -11.849323272705078, -11.047369956970215, -10.245415687561035, -9.443461418151855, -8.641508102416992, -7.8395538330078125, -7.037599563598633, -6.235645294189453, -5.433691501617432, -4.63173770904541, -3.8297834396362305, -3.027829170227051, -2.2258753776550293, -1.4239215850830078, -0.6219673156738281, 0.17998671531677246, 0.981940746307373, 1.7838947772979736, 2.585848808288574, 3.387803077697754, 4.189756870269775, 4.991710662841797, 5.793664932250977, 6.595619201660156, 7.397572994232178, 8.1995267868042, 9.001481056213379, 9.803435325622559, 10.605388641357422, 11.407342910766602, 12.209297180175781, 13.011251449584961, 13.81320571899414, 14.615159034729004, 15.417113304138184, 16.219066619873047, 17.021020889282227, 17.822975158691406, 18.624929428100586, 19.426883697509766, 20.228837966918945, 21.030792236328125, 21.832744598388672, 22.634700775146484, 23.43665313720703, 24.23860740661621, 25.04056167602539, 25.84251594543457, 26.64447021484375, 27.44642448425293, 28.24837875366211, 29.050331115722656, 29.852285385131836, 30.654239654541016, 31.456193923950195, 32.258148193359375, 33.06010055541992, 33.862056732177734, 34.66400909423828, 35.465965270996094, 36.26791763305664, 37.06986999511719, 37.871826171875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 11.0, 4.0, 4.0, 2.0, 13.0, 4.0, 12.0, 12.0, 11.0, 20.0, 22.0, 22.0, 23.0, 25.0, 24.0, 28.0, 41.0, 34.0, 38.0, 34.0, 38.0, 33.0, 33.0, 39.0, 41.0, 34.0, 39.0, 46.0, 35.0, 29.0, 29.0, 34.0, 26.0, 19.0, 20.0, 20.0, 18.0, 11.0, 12.0, 13.0, 10.0, 6.0, 6.0, 6.0, 9.0, 5.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.649946212768555, -8.391485214233398, -8.133024215698242, -7.874563694000244, -7.616103172302246, -7.35764217376709, -7.099181175231934, -6.840720176696777, -6.582259654998779, -6.323798656463623, -6.065338134765625, -5.806877136230469, -5.5484161376953125, -5.2899556159973145, -5.031494617462158, -4.77303409576416, -4.514573097229004, -4.256112098693848, -3.9976515769958496, -3.7391905784606934, -3.480729818344116, -3.222269058227539, -2.963808059692383, -2.7053472995758057, -2.4468865394592285, -2.1884257793426514, -1.9299649000167847, -1.671504020690918, -1.4130432605743408, -1.1545825004577637, -0.896121621131897, -0.6376607418060303, -0.3791999816894531, -0.1207391619682312, 0.13772165775299072, 0.39618247747421265, 0.6546432971954346, 0.9131040573120117, 1.1715649366378784, 1.4300258159637451, 1.6884865760803223, 1.9469473361968994, 2.2054080963134766, 2.463869094848633, 2.72232985496521, 2.980790615081787, 3.2392516136169434, 3.4977123737335205, 3.7561731338500977, 4.014634132385254, 4.273094654083252, 4.531555652618408, 4.790016174316406, 5.0484771728515625, 5.306938171386719, 5.565399169921875, 5.823859691619873, 6.082320690155029, 6.340781211853027, 6.599242210388184, 6.85770320892334, 7.116163730621338, 7.374624729156494, 7.633085250854492, 7.891546249389648]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 18.0, 23.0, 26.0, 40.0, 69.0, 135.0, 221.0, 466.0, 996.0, 2392.0, 6302.0, 20065.0, 126046.0, 3900478.0, 108570.0, 18398.0, 5692.0, 2255.0, 942.0, 466.0, 248.0, 110.0, 83.0, 55.0, 44.0, 32.0, 15.0, 17.0, 15.0, 10.0, 7.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.140625, -4.0205078125, -3.900390625, -3.7802734375, -3.66015625, -3.5400390625, -3.419921875, -3.2998046875, -3.1796875, -3.0595703125, -2.939453125, -2.8193359375, -2.69921875, -2.5791015625, -2.458984375, -2.3388671875, -2.21875, -2.0986328125, -1.978515625, -1.8583984375, -1.73828125, -1.6181640625, -1.498046875, -1.3779296875, -1.2578125, -1.1376953125, -1.017578125, -0.8974609375, -0.77734375, -0.6572265625, -0.537109375, -0.4169921875, -0.296875, -0.1767578125, -0.056640625, 0.0634765625, 0.18359375, 0.3037109375, 0.423828125, 0.5439453125, 0.6640625, 0.7841796875, 0.904296875, 1.0244140625, 1.14453125, 1.2646484375, 1.384765625, 1.5048828125, 1.625, 1.7451171875, 1.865234375, 1.9853515625, 2.10546875, 2.2255859375, 2.345703125, 2.4658203125, 2.5859375, 2.7060546875, 2.826171875, 2.9462890625, 3.06640625, 3.1865234375, 3.306640625, 3.4267578125, 3.546875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 9.0, 17.0, 17.0, 15.0, 17.0, 26.0, 37.0, 26.0, 51.0, 54.0, 64.0, 52.0, 69.0, 79.0, 71.0, 53.0, 50.0, 43.0, 44.0, 45.0, 41.0, 29.0, 22.0, 22.0, 11.0, 10.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.53662109375, -0.5196609497070312, -0.5027008056640625, -0.48574066162109375, -0.468780517578125, -0.45182037353515625, -0.4348602294921875, -0.41790008544921875, -0.40093994140625, -0.38397979736328125, -0.3670196533203125, -0.35005950927734375, -0.333099365234375, -0.31613922119140625, -0.2991790771484375, -0.28221893310546875, -0.2652587890625, -0.24829864501953125, -0.2313385009765625, -0.21437835693359375, -0.197418212890625, -0.18045806884765625, -0.1634979248046875, -0.14653778076171875, -0.12957763671875, -0.11261749267578125, -0.0956573486328125, -0.07869720458984375, -0.061737060546875, -0.04477691650390625, -0.0278167724609375, -0.01085662841796875, 0.006103515625, 0.02306365966796875, 0.0400238037109375, 0.05698394775390625, 0.073944091796875, 0.09090423583984375, 0.1078643798828125, 0.12482452392578125, 0.14178466796875, 0.15874481201171875, 0.1757049560546875, 0.19266510009765625, 0.209625244140625, 0.22658538818359375, 0.2435455322265625, 0.26050567626953125, 0.2774658203125, 0.29442596435546875, 0.3113861083984375, 0.32834625244140625, 0.345306396484375, 0.36226654052734375, 0.3792266845703125, 0.39618682861328125, 0.41314697265625, 0.43010711669921875, 0.4470672607421875, 0.46402740478515625, 0.480987548828125, 0.49794769287109375, 0.5149078369140625, 0.5318679809570312, 0.548828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 18.0, 20.0, 31.0, 46.0, 72.0, 134.0, 207.0, 381.0, 685.0, 1373.0, 2818.0, 6995.0, 21173.0, 96751.0, 3620301.0, 379282.0, 43344.0, 12034.0, 4462.0, 1920.0, 991.0, 540.0, 260.0, 156.0, 100.0, 60.0, 41.0, 23.0, 25.0, 9.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.474273681640625, -3.37432861328125, -3.274383544921875, -3.1744384765625, -3.074493408203125, -2.97454833984375, -2.874603271484375, -2.774658203125, -2.674713134765625, -2.57476806640625, -2.474822998046875, -2.3748779296875, -2.274932861328125, -2.17498779296875, -2.075042724609375, -1.97509765625, -1.875152587890625, -1.77520751953125, -1.675262451171875, -1.5753173828125, -1.475372314453125, -1.37542724609375, -1.275482177734375, -1.175537109375, -1.075592041015625, -0.97564697265625, -0.875701904296875, -0.7757568359375, -0.675811767578125, -0.57586669921875, -0.475921630859375, -0.3759765625, -0.276031494140625, -0.17608642578125, -0.076141357421875, 0.0238037109375, 0.123748779296875, 0.22369384765625, 0.323638916015625, 0.423583984375, 0.523529052734375, 0.62347412109375, 0.723419189453125, 0.8233642578125, 0.923309326171875, 1.02325439453125, 1.123199462890625, 1.22314453125, 1.323089599609375, 1.42303466796875, 1.522979736328125, 1.6229248046875, 1.722869873046875, 1.82281494140625, 1.922760009765625, 2.022705078125, 2.122650146484375, 2.22259521484375, 2.322540283203125, 2.4224853515625, 2.522430419921875, 2.62237548828125, 2.722320556640625, 2.822265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 5.0, 7.0, 12.0, 14.0, 17.0, 24.0, 43.0, 48.0, 97.0, 193.0, 598.0, 2221.0, 374.0, 134.0, 79.0, 49.0, 30.0, 27.0, 20.0, 16.0, 7.0, 9.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.142578125, -1.1022491455078125, -1.061920166015625, -1.0215911865234375, -0.98126220703125, -0.9409332275390625, -0.900604248046875, -0.8602752685546875, -0.8199462890625, -0.7796173095703125, -0.739288330078125, -0.6989593505859375, -0.65863037109375, -0.6183013916015625, -0.577972412109375, -0.5376434326171875, -0.497314453125, -0.4569854736328125, -0.416656494140625, -0.3763275146484375, -0.33599853515625, -0.2956695556640625, -0.255340576171875, -0.2150115966796875, -0.1746826171875, -0.1343536376953125, -0.094024658203125, -0.0536956787109375, -0.01336669921875, 0.0269622802734375, 0.067291259765625, 0.1076202392578125, 0.14794921875, 0.1882781982421875, 0.228607177734375, 0.2689361572265625, 0.30926513671875, 0.3495941162109375, 0.389923095703125, 0.4302520751953125, 0.4705810546875, 0.5109100341796875, 0.551239013671875, 0.5915679931640625, 0.63189697265625, 0.6722259521484375, 0.712554931640625, 0.7528839111328125, 0.793212890625, 0.8335418701171875, 0.873870849609375, 0.9141998291015625, 0.95452880859375, 0.9948577880859375, 1.035186767578125, 1.0755157470703125, 1.1158447265625, 1.1561737060546875, 1.196502685546875, 1.2368316650390625, 1.27716064453125, 1.3174896240234375, 1.357818603515625, 1.3981475830078125, 1.4384765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 15.0, 6.0, 33.0, 78.0, 180.0, 257.0, 222.0, 123.0, 50.0, 15.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.920326232910156, -14.491230010986328, -14.062132835388184, -13.633036613464355, -13.203940391540527, -12.774843215942383, -12.345746994018555, -11.916650772094727, -11.487554550170898, -11.05845832824707, -10.629361152648926, -10.200264930725098, -9.77116870880127, -9.342071533203125, -8.912975311279297, -8.483879089355469, -8.054781913757324, -7.625685214996338, -7.19658899307251, -6.767492294311523, -6.338396072387695, -5.909299373626709, -5.480202674865723, -5.0511064529418945, -4.622009754180908, -4.192913055419922, -3.7638168334960938, -3.3347201347351074, -2.9056236743927, -2.476527214050293, -2.0474305152893066, -1.6183340549468994, -1.1892375946044922, -0.7601410746574402, -0.3310445547103882, 0.0980520248413086, 0.5271484851837158, 0.956244945526123, 1.3853416442871094, 1.8144381046295166, 2.243534564971924, 2.672631025314331, 3.1017274856567383, 3.5308241844177246, 3.959920644760132, 4.389017105102539, 4.818113803863525, 5.247210502624512, 5.67630672454834, 6.105403423309326, 6.534499645233154, 6.963596343994141, 7.392692565917969, 7.821789264678955, 8.250885963439941, 8.67998218536377, 9.109079360961914, 9.538175582885742, 9.967272758483887, 10.396368980407715, 10.825465202331543, 11.254562377929688, 11.683658599853516, 12.112754821777344, 12.541851043701172]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 8.0, 17.0, 6.0, 12.0, 21.0, 14.0, 15.0, 18.0, 21.0, 32.0, 25.0, 43.0, 38.0, 38.0, 26.0, 41.0, 47.0, 26.0, 38.0, 44.0, 37.0, 29.0, 47.0, 29.0, 47.0, 32.0, 28.0, 27.0, 28.0, 21.0, 13.0, 14.0, 19.0, 10.0, 10.0, 15.0, 9.0, 4.0, 7.0, 5.0, 5.0, 1.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-3.4667015075683594, -3.363508939743042, -3.2603163719177246, -3.157123565673828, -3.0539309978485107, -2.9507384300231934, -2.847545862197876, -2.7443532943725586, -2.641160726547241, -2.537968158721924, -2.4347755908966064, -2.331583023071289, -2.2283902168273926, -2.125197649002075, -2.022005081176758, -1.9188125133514404, -1.8156198263168335, -1.7124272584915161, -1.6092345714569092, -1.5060420036315918, -1.4028494358062744, -1.299656867980957, -1.19646418094635, -1.0932716131210327, -0.9900789856910706, -0.8868863582611084, -0.783693790435791, -0.6805011630058289, -0.5773085355758667, -0.4741159677505493, -0.37092334032058716, -0.2677307724952698, -0.16453814506530762, -0.06134553998708725, 0.04184706509113312, 0.14503967761993408, 0.24823227524757385, 0.3514248728752136, 0.4546175003051758, 0.5578100681304932, 0.6610026955604553, 0.7641953229904175, 0.8673878908157349, 0.970580518245697, 1.0737731456756592, 1.1769657135009766, 1.280158281326294, 1.3833508491516113, 1.4865435361862183, 1.5897361040115356, 1.6929287910461426, 1.79612135887146, 1.8993139266967773, 2.0025064945220947, 2.105699062347412, 2.2088918685913086, 2.312084436416626, 2.4152770042419434, 2.5184695720672607, 2.621662139892578, 2.7248549461364746, 2.828047513961792, 2.9312400817871094, 3.0344326496124268, 3.137625217437744]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 10.0, 6.0, 18.0, 24.0, 20.0, 33.0, 71.0, 101.0, 135.0, 207.0, 343.0, 539.0, 897.0, 1849.0, 4229.0, 11004.0, 33464.0, 116797.0, 377571.0, 349159.0, 104442.0, 29820.0, 9929.0, 3844.0, 1810.0, 878.0, 449.0, 299.0, 197.0, 118.0, 88.0, 58.0, 49.0, 25.0, 22.0, 13.0, 13.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.68359375, -2.599609375, -2.515625, -2.431640625, -2.34765625, -2.263671875, -2.1796875, -2.095703125, -2.01171875, -1.927734375, -1.84375, -1.759765625, -1.67578125, -1.591796875, -1.5078125, -1.423828125, -1.33984375, -1.255859375, -1.171875, -1.087890625, -1.00390625, -0.919921875, -0.8359375, -0.751953125, -0.66796875, -0.583984375, -0.5, -0.416015625, -0.33203125, -0.248046875, -0.1640625, -0.080078125, 0.00390625, 0.087890625, 0.171875, 0.255859375, 0.33984375, 0.423828125, 0.5078125, 0.591796875, 0.67578125, 0.759765625, 0.84375, 0.927734375, 1.01171875, 1.095703125, 1.1796875, 1.263671875, 1.34765625, 1.431640625, 1.515625, 1.599609375, 1.68359375, 1.767578125, 1.8515625, 1.935546875, 2.01953125, 2.103515625, 2.1875, 2.271484375, 2.35546875, 2.439453125, 2.5234375, 2.607421875, 2.69140625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 11.0, 12.0, 26.0, 29.0, 30.0, 49.0, 36.0, 49.0, 53.0, 56.0, 60.0, 59.0, 65.0, 58.0, 48.0, 63.0, 58.0, 40.0, 34.0, 33.0, 19.0, 23.0, 23.0, 15.0, 10.0, 10.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.54345703125, -0.5260696411132812, -0.5086822509765625, -0.49129486083984375, -0.473907470703125, -0.45652008056640625, -0.4391326904296875, -0.42174530029296875, -0.40435791015625, -0.38697052001953125, -0.3695831298828125, -0.35219573974609375, -0.334808349609375, -0.31742095947265625, -0.3000335693359375, -0.28264617919921875, -0.2652587890625, -0.24787139892578125, -0.2304840087890625, -0.21309661865234375, -0.195709228515625, -0.17832183837890625, -0.1609344482421875, -0.14354705810546875, -0.12615966796875, -0.10877227783203125, -0.0913848876953125, -0.07399749755859375, -0.056610107421875, -0.03922271728515625, -0.0218353271484375, -0.00444793701171875, 0.012939453125, 0.03032684326171875, 0.0477142333984375, 0.06510162353515625, 0.082489013671875, 0.09987640380859375, 0.1172637939453125, 0.13465118408203125, 0.15203857421875, 0.16942596435546875, 0.1868133544921875, 0.20420074462890625, 0.221588134765625, 0.23897552490234375, 0.2563629150390625, 0.27375030517578125, 0.2911376953125, 0.30852508544921875, 0.3259124755859375, 0.34329986572265625, 0.360687255859375, 0.37807464599609375, 0.3954620361328125, 0.41284942626953125, 0.43023681640625, 0.44762420654296875, 0.4650115966796875, 0.48239898681640625, 0.499786376953125, 0.5171737670898438, 0.5345611572265625, 0.5519485473632812, 0.5693359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 4.0, 6.0, 23.0, 24.0, 41.0, 49.0, 88.0, 155.0, 247.0, 498.0, 956.0, 2147.0, 5759.0, 16654.0, 55956.0, 218752.0, 492267.0, 183621.0, 47905.0, 14372.0, 5103.0, 1951.0, 923.0, 445.0, 253.0, 117.0, 97.0, 48.0, 35.0, 19.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.177337646484375, -2.10076904296875, -2.024200439453125, -1.9476318359375, -1.871063232421875, -1.79449462890625, -1.717926025390625, -1.641357421875, -1.564788818359375, -1.48822021484375, -1.411651611328125, -1.3350830078125, -1.258514404296875, -1.18194580078125, -1.105377197265625, -1.02880859375, -0.952239990234375, -0.87567138671875, -0.799102783203125, -0.7225341796875, -0.645965576171875, -0.56939697265625, -0.492828369140625, -0.416259765625, -0.339691162109375, -0.26312255859375, -0.186553955078125, -0.1099853515625, -0.033416748046875, 0.04315185546875, 0.119720458984375, 0.1962890625, 0.272857666015625, 0.34942626953125, 0.425994873046875, 0.5025634765625, 0.579132080078125, 0.65570068359375, 0.732269287109375, 0.808837890625, 0.885406494140625, 0.96197509765625, 1.038543701171875, 1.1151123046875, 1.191680908203125, 1.26824951171875, 1.344818115234375, 1.42138671875, 1.497955322265625, 1.57452392578125, 1.651092529296875, 1.7276611328125, 1.804229736328125, 1.88079833984375, 1.957366943359375, 2.033935546875, 2.110504150390625, 2.18707275390625, 2.263641357421875, 2.3402099609375, 2.416778564453125, 2.49334716796875, 2.569915771484375, 2.646484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 6.0, 8.0, 12.0, 13.0, 15.0, 15.0, 13.0, 27.0, 27.0, 33.0, 31.0, 37.0, 23.0, 49.0, 47.0, 46.0, 52.0, 47.0, 53.0, 49.0, 46.0, 40.0, 45.0, 37.0, 31.0, 25.0, 19.0, 21.0, 26.0, 16.0, 22.0, 9.0, 11.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.7626953125, -1.6974334716796875, -1.632171630859375, -1.5669097900390625, -1.50164794921875, -1.4363861083984375, -1.371124267578125, -1.3058624267578125, -1.2406005859375, -1.1753387451171875, -1.110076904296875, -1.0448150634765625, -0.97955322265625, -0.9142913818359375, -0.849029541015625, -0.7837677001953125, -0.718505859375, -0.6532440185546875, -0.587982177734375, -0.5227203369140625, -0.45745849609375, -0.3921966552734375, -0.326934814453125, -0.2616729736328125, -0.1964111328125, -0.1311492919921875, -0.065887451171875, -0.0006256103515625, 0.06463623046875, 0.1298980712890625, 0.195159912109375, 0.2604217529296875, 0.32568359375, 0.3909454345703125, 0.456207275390625, 0.5214691162109375, 0.58673095703125, 0.6519927978515625, 0.717254638671875, 0.7825164794921875, 0.8477783203125, 0.9130401611328125, 0.978302001953125, 1.0435638427734375, 1.10882568359375, 1.1740875244140625, 1.239349365234375, 1.3046112060546875, 1.369873046875, 1.4351348876953125, 1.500396728515625, 1.5656585693359375, 1.63092041015625, 1.6961822509765625, 1.761444091796875, 1.8267059326171875, 1.8919677734375, 1.9572296142578125, 2.022491455078125, 2.0877532958984375, 2.15301513671875, 2.2182769775390625, 2.283538818359375, 2.3488006591796875, 2.4140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 3.0, 10.0, 21.0, 36.0, 55.0, 125.0, 232.0, 497.0, 998.0, 2678.0, 8101.0, 35122.0, 248874.0, 622199.0, 103412.0, 18013.0, 4964.0, 1719.0, 748.0, 367.0, 178.0, 80.0, 41.0, 30.0, 17.0, 7.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.5178985595703125, -1.469390869140625, -1.4208831787109375, -1.37237548828125, -1.3238677978515625, -1.275360107421875, -1.2268524169921875, -1.1783447265625, -1.1298370361328125, -1.081329345703125, -1.0328216552734375, -0.98431396484375, -0.9358062744140625, -0.887298583984375, -0.8387908935546875, -0.790283203125, -0.7417755126953125, -0.693267822265625, -0.6447601318359375, -0.59625244140625, -0.5477447509765625, -0.499237060546875, -0.4507293701171875, -0.4022216796875, -0.3537139892578125, -0.305206298828125, -0.2566986083984375, -0.20819091796875, -0.1596832275390625, -0.111175537109375, -0.0626678466796875, -0.01416015625, 0.0343475341796875, 0.082855224609375, 0.1313629150390625, 0.17987060546875, 0.2283782958984375, 0.276885986328125, 0.3253936767578125, 0.3739013671875, 0.4224090576171875, 0.470916748046875, 0.5194244384765625, 0.56793212890625, 0.6164398193359375, 0.664947509765625, 0.7134552001953125, 0.761962890625, 0.8104705810546875, 0.858978271484375, 0.9074859619140625, 0.95599365234375, 1.0045013427734375, 1.053009033203125, 1.1015167236328125, 1.1500244140625, 1.1985321044921875, 1.247039794921875, 1.2955474853515625, 1.34405517578125, 1.3925628662109375, 1.441070556640625, 1.4895782470703125, 1.5380859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 12.0, 13.0, 16.0, 30.0, 29.0, 51.0, 57.0, 88.0, 129.0, 155.0, 122.0, 88.0, 61.0, 38.0, 27.0, 24.0, 17.0, 16.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002906322479248047, -0.00028218701481819153, -0.00027374178171157837, -0.0002652965486049652, -0.00025685131549835205, -0.0002484060823917389, -0.00023996084928512573, -0.00023151561617851257, -0.00022307038307189941, -0.00021462514996528625, -0.0002061799168586731, -0.00019773468375205994, -0.00018928945064544678, -0.00018084421753883362, -0.00017239898443222046, -0.0001639537513256073, -0.00015550851821899414, -0.00014706328511238098, -0.00013861805200576782, -0.00013017281889915466, -0.0001217275857925415, -0.00011328235268592834, -0.00010483711957931519, -9.639188647270203e-05, -8.794665336608887e-05, -7.950142025947571e-05, -7.105618715286255e-05, -6.261095404624939e-05, -5.416572093963623e-05, -4.572048783302307e-05, -3.727525472640991e-05, -2.8830021619796753e-05, -2.0384788513183594e-05, -1.1939555406570435e-05, -3.4943222999572754e-06, 4.950910806655884e-06, 1.3396143913269043e-05, 2.1841377019882202e-05, 3.028661012649536e-05, 3.873184323310852e-05, 4.717707633972168e-05, 5.562230944633484e-05, 6.4067542552948e-05, 7.251277565956116e-05, 8.095800876617432e-05, 8.940324187278748e-05, 9.784847497940063e-05, 0.0001062937080860138, 0.00011473894119262695, 0.0001231841742992401, 0.00013162940740585327, 0.00014007464051246643, 0.0001485198736190796, 0.00015696510672569275, 0.0001654103398323059, 0.00017385557293891907, 0.00018230080604553223, 0.00019074603915214539, 0.00019919127225875854, 0.0002076365053653717, 0.00021608173847198486, 0.00022452697157859802, 0.00023297220468521118, 0.00024141743779182434, 0.0002498626708984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 15.0, 11.0, 26.0, 36.0, 64.0, 132.0, 192.0, 312.0, 628.0, 1597.0, 4679.0, 20202.0, 159130.0, 708228.0, 128674.0, 17655.0, 4138.0, 1448.0, 658.0, 297.0, 146.0, 95.0, 52.0, 38.0, 23.0, 21.0, 12.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.181640625, -2.124908447265625, -2.06817626953125, -2.011444091796875, -1.9547119140625, -1.897979736328125, -1.84124755859375, -1.784515380859375, -1.727783203125, -1.671051025390625, -1.61431884765625, -1.557586669921875, -1.5008544921875, -1.444122314453125, -1.38739013671875, -1.330657958984375, -1.27392578125, -1.217193603515625, -1.16046142578125, -1.103729248046875, -1.0469970703125, -0.990264892578125, -0.93353271484375, -0.876800537109375, -0.820068359375, -0.763336181640625, -0.70660400390625, -0.649871826171875, -0.5931396484375, -0.536407470703125, -0.47967529296875, -0.422943115234375, -0.3662109375, -0.309478759765625, -0.25274658203125, -0.196014404296875, -0.1392822265625, -0.082550048828125, -0.02581787109375, 0.030914306640625, 0.087646484375, 0.144378662109375, 0.20111083984375, 0.257843017578125, 0.3145751953125, 0.371307373046875, 0.42803955078125, 0.484771728515625, 0.54150390625, 0.598236083984375, 0.65496826171875, 0.711700439453125, 0.7684326171875, 0.825164794921875, 0.88189697265625, 0.938629150390625, 0.995361328125, 1.052093505859375, 1.10882568359375, 1.165557861328125, 1.2222900390625, 1.279022216796875, 1.33575439453125, 1.392486572265625, 1.44921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 6.0, 11.0, 15.0, 15.0, 25.0, 35.0, 56.0, 62.0, 86.0, 107.0, 121.0, 87.0, 87.0, 69.0, 38.0, 50.0, 30.0, 11.0, 19.0, 17.0, 11.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1088104248046875, -1.063323974609375, -1.0178375244140625, -0.97235107421875, -0.9268646240234375, -0.881378173828125, -0.8358917236328125, -0.7904052734375, -0.7449188232421875, -0.699432373046875, -0.6539459228515625, -0.60845947265625, -0.5629730224609375, -0.517486572265625, -0.4720001220703125, -0.426513671875, -0.3810272216796875, -0.335540771484375, -0.2900543212890625, -0.24456787109375, -0.1990814208984375, -0.153594970703125, -0.1081085205078125, -0.0626220703125, -0.0171356201171875, 0.028350830078125, 0.0738372802734375, 0.11932373046875, 0.1648101806640625, 0.210296630859375, 0.2557830810546875, 0.30126953125, 0.3467559814453125, 0.392242431640625, 0.4377288818359375, 0.48321533203125, 0.5287017822265625, 0.574188232421875, 0.6196746826171875, 0.6651611328125, 0.7106475830078125, 0.756134033203125, 0.8016204833984375, 0.84710693359375, 0.8925933837890625, 0.938079833984375, 0.9835662841796875, 1.029052734375, 1.0745391845703125, 1.120025634765625, 1.1655120849609375, 1.21099853515625, 1.2564849853515625, 1.301971435546875, 1.3474578857421875, 1.3929443359375, 1.4384307861328125, 1.483917236328125, 1.5294036865234375, 1.57489013671875, 1.6203765869140625, 1.665863037109375, 1.7113494873046875, 1.7568359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 21.0, 13.0, 16.0, 39.0, 62.0, 71.0, 101.0, 108.0, 111.0, 103.0, 96.0, 80.0, 54.0, 33.0, 23.0, 12.0, 13.0, 11.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.366525650024414, -12.869441032409668, -12.372356414794922, -11.87527084350586, -11.378186225891113, -10.881101608276367, -10.384016036987305, -9.886931419372559, -9.389846801757812, -8.892762184143066, -8.39567756652832, -7.898591995239258, -7.401507377624512, -6.904422760009766, -6.407337665557861, -5.910252571105957, -5.413167953491211, -4.916083335876465, -4.4189982414245605, -3.9219133853912354, -3.42482852935791, -2.927743673324585, -2.4306588172912598, -1.9335739612579346, -1.4364891052246094, -0.9394042491912842, -0.442319393157959, 0.05476546287536621, 0.5518503189086914, 1.0489351749420166, 1.5460200309753418, 2.043104887008667, 2.540189743041992, 3.0372745990753174, 3.5343594551086426, 4.031444549560547, 4.528529167175293, 5.025613784790039, 5.522698879241943, 6.019783973693848, 6.516868591308594, 7.01395320892334, 7.511038303375244, 8.008123397827148, 8.505208015441895, 9.00229263305664, 9.499378204345703, 9.99646282196045, 10.493547439575195, 10.990632057189941, 11.487716674804688, 11.98480224609375, 12.481886863708496, 12.978971481323242, 13.476057052612305, 13.97314167022705, 14.470226287841797, 14.967310905456543, 15.464395523071289, 15.961481094360352, 16.45856475830078, 16.955650329589844, 17.452735900878906, 17.949819564819336, 18.4469051361084]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 13.0, 14.0, 10.0, 17.0, 8.0, 15.0, 26.0, 27.0, 31.0, 23.0, 40.0, 42.0, 42.0, 59.0, 43.0, 50.0, 61.0, 40.0, 48.0, 51.0, 32.0, 34.0, 37.0, 42.0, 20.0, 20.0, 23.0, 20.0, 17.0, 15.0, 11.0, 16.0, 6.0, 4.0, 7.0, 9.0, 4.0, 7.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.76424789428711, -9.410740852355957, -9.057234764099121, -8.703727722167969, -8.350220680236816, -7.996714115142822, -7.643207550048828, -7.289700508117676, -6.936193943023682, -6.5826873779296875, -6.229180335998535, -5.875673770904541, -5.522167205810547, -5.1686601638793945, -4.8151535987854, -4.461647033691406, -4.108139991760254, -3.7546331882476807, -3.4011263847351074, -3.0476198196411133, -2.69411301612854, -2.340606212615967, -1.9870996475219727, -1.6335928440093994, -1.2800860404968262, -0.9265792965888977, -0.5730725526809692, -0.21956586837768555, 0.1339409351348877, 0.48744773864746094, 0.8409543037414551, 1.1944611072540283, 1.5479679107666016, 1.9014747142791748, 2.254981517791748, 2.608488082885742, 2.9619948863983154, 3.3155016899108887, 3.669008255004883, 4.022515296936035, 4.376021862030029, 4.729528427124023, 5.083035469055176, 5.43654203414917, 5.790048599243164, 6.143555641174316, 6.4970622062683105, 6.850568771362305, 7.204075813293457, 7.557582378387451, 7.9110894203186035, 8.264595985412598, 8.61810302734375, 8.971609115600586, 9.325116157531738, 9.67862319946289, 10.032129287719727, 10.385636329650879, 10.739142417907715, 11.092649459838867, 11.44615650177002, 11.799663543701172, 12.153169631958008, 12.50667667388916, 12.860183715820312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 22.0, 58.0, 93.0, 135.0, 299.0, 578.0, 1294.0, 3091.0, 10447.0, 141955.0, 4011523.0, 17491.0, 4191.0, 1595.0, 711.0, 335.0, 184.0, 95.0, 66.0, 30.0, 27.0, 18.0, 12.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.24432373046875, -5.0511474609375, -4.85797119140625, -4.664794921875, -4.47161865234375, -4.2784423828125, -4.08526611328125, -3.89208984375, -3.69891357421875, -3.5057373046875, -3.31256103515625, -3.119384765625, -2.92620849609375, -2.7330322265625, -2.53985595703125, -2.3466796875, -2.15350341796875, -1.9603271484375, -1.76715087890625, -1.573974609375, -1.38079833984375, -1.1876220703125, -0.99444580078125, -0.80126953125, -0.60809326171875, -0.4149169921875, -0.22174072265625, -0.028564453125, 0.16461181640625, 0.3577880859375, 0.55096435546875, 0.744140625, 0.93731689453125, 1.1304931640625, 1.32366943359375, 1.516845703125, 1.71002197265625, 1.9031982421875, 2.09637451171875, 2.28955078125, 2.48272705078125, 2.6759033203125, 2.86907958984375, 3.062255859375, 3.25543212890625, 3.4486083984375, 3.64178466796875, 3.8349609375, 4.02813720703125, 4.2213134765625, 4.41448974609375, 4.607666015625, 4.80084228515625, 4.9940185546875, 5.18719482421875, 5.38037109375, 5.57354736328125, 5.7667236328125, 5.95989990234375, 6.153076171875, 6.34625244140625, 6.5394287109375, 6.73260498046875, 6.92578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 11.0, 11.0, 20.0, 18.0, 32.0, 32.0, 33.0, 38.0, 53.0, 34.0, 53.0, 58.0, 47.0, 58.0, 51.0, 63.0, 53.0, 45.0, 47.0, 27.0, 32.0, 29.0, 26.0, 30.0, 18.0, 18.0, 10.0, 11.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5556640625, -0.537628173828125, -0.51959228515625, -0.501556396484375, -0.4835205078125, -0.465484619140625, -0.44744873046875, -0.429412841796875, -0.411376953125, -0.393341064453125, -0.37530517578125, -0.357269287109375, -0.3392333984375, -0.321197509765625, -0.30316162109375, -0.285125732421875, -0.26708984375, -0.249053955078125, -0.23101806640625, -0.212982177734375, -0.1949462890625, -0.176910400390625, -0.15887451171875, -0.140838623046875, -0.122802734375, -0.104766845703125, -0.08673095703125, -0.068695068359375, -0.0506591796875, -0.032623291015625, -0.01458740234375, 0.003448486328125, 0.021484375, 0.039520263671875, 0.05755615234375, 0.075592041015625, 0.0936279296875, 0.111663818359375, 0.12969970703125, 0.147735595703125, 0.165771484375, 0.183807373046875, 0.20184326171875, 0.219879150390625, 0.2379150390625, 0.255950927734375, 0.27398681640625, 0.292022705078125, 0.31005859375, 0.328094482421875, 0.34613037109375, 0.364166259765625, 0.3822021484375, 0.400238037109375, 0.41827392578125, 0.436309814453125, 0.454345703125, 0.472381591796875, 0.49041748046875, 0.508453369140625, 0.5264892578125, 0.544525146484375, 0.56256103515625, 0.580596923828125, 0.5986328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 8.0, 16.0, 23.0, 32.0, 51.0, 74.0, 102.0, 152.0, 212.0, 322.0, 474.0, 772.0, 1144.0, 1957.0, 3675.0, 7920.0, 22343.0, 132063.0, 3928085.0, 65237.0, 15395.0, 6282.0, 3067.0, 1752.0, 1030.0, 671.0, 444.0, 307.0, 199.0, 147.0, 104.0, 75.0, 44.0, 29.0, 22.0, 20.0, 10.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.91375732421875, -2.8177490234375, -2.72174072265625, -2.625732421875, -2.52972412109375, -2.4337158203125, -2.33770751953125, -2.24169921875, -2.14569091796875, -2.0496826171875, -1.95367431640625, -1.857666015625, -1.76165771484375, -1.6656494140625, -1.56964111328125, -1.4736328125, -1.37762451171875, -1.2816162109375, -1.18560791015625, -1.089599609375, -0.99359130859375, -0.8975830078125, -0.80157470703125, -0.70556640625, -0.60955810546875, -0.5135498046875, -0.41754150390625, -0.321533203125, -0.22552490234375, -0.1295166015625, -0.03350830078125, 0.0625, 0.15850830078125, 0.2545166015625, 0.35052490234375, 0.446533203125, 0.54254150390625, 0.6385498046875, 0.73455810546875, 0.83056640625, 0.92657470703125, 1.0225830078125, 1.11859130859375, 1.214599609375, 1.31060791015625, 1.4066162109375, 1.50262451171875, 1.5986328125, 1.69464111328125, 1.7906494140625, 1.88665771484375, 1.982666015625, 2.07867431640625, 2.1746826171875, 2.27069091796875, 2.36669921875, 2.46270751953125, 2.5587158203125, 2.65472412109375, 2.750732421875, 2.84674072265625, 2.9427490234375, 3.03875732421875, 3.134765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 4.0, 11.0, 15.0, 19.0, 41.0, 60.0, 146.0, 3015.0, 497.0, 99.0, 43.0, 34.0, 17.0, 12.0, 8.0, 4.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5432052612304688, -0.5243988037109375, -0.5055923461914062, -0.486785888671875, -0.46797943115234375, -0.4491729736328125, -0.43036651611328125, -0.41156005859375, -0.39275360107421875, -0.3739471435546875, -0.35514068603515625, -0.336334228515625, -0.31752777099609375, -0.2987213134765625, -0.27991485595703125, -0.2611083984375, -0.24230194091796875, -0.2234954833984375, -0.20468902587890625, -0.185882568359375, -0.16707611083984375, -0.1482696533203125, -0.12946319580078125, -0.11065673828125, -0.09185028076171875, -0.0730438232421875, -0.05423736572265625, -0.035430908203125, -0.01662445068359375, 0.0021820068359375, 0.02098846435546875, 0.039794921875, 0.05860137939453125, 0.0774078369140625, 0.09621429443359375, 0.115020751953125, 0.13382720947265625, 0.1526336669921875, 0.17144012451171875, 0.19024658203125, 0.20905303955078125, 0.2278594970703125, 0.24666595458984375, 0.265472412109375, 0.28427886962890625, 0.3030853271484375, 0.32189178466796875, 0.3406982421875, 0.35950469970703125, 0.3783111572265625, 0.39711761474609375, 0.415924072265625, 0.43473052978515625, 0.4535369873046875, 0.47234344482421875, 0.49114990234375, 0.5099563598632812, 0.5287628173828125, 0.5475692749023438, 0.566375732421875, 0.5851821899414062, 0.6039886474609375, 0.6227951049804688, 0.6416015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 10.0, 14.0, 24.0, 39.0, 72.0, 101.0, 138.0, 140.0, 122.0, 104.0, 82.0, 56.0, 34.0, 25.0, 16.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5385429859161377, -3.4232499599456787, -3.3079566955566406, -3.1926636695861816, -3.0773706436157227, -2.9620776176452637, -2.8467845916748047, -2.7314913272857666, -2.6161983013153076, -2.5009052753448486, -2.3856120109558105, -2.2703189849853516, -2.1550259590148926, -2.0397329330444336, -1.924439787864685, -1.8091466426849365, -1.6938536167144775, -1.5785605907440186, -1.46326744556427, -1.3479743003845215, -1.2326812744140625, -1.1173882484436035, -1.002095103263855, -0.8868020176887512, -0.7715089321136475, -0.6562158465385437, -0.5409227609634399, -0.4256296753883362, -0.3103365898132324, -0.19504350423812866, -0.0797504186630249, 0.03554266691207886, 0.15083599090576172, 0.2661290764808655, 0.38142216205596924, 0.496715247631073, 0.6120083332061768, 0.7273014187812805, 0.8425945043563843, 0.957887589931488, 1.0731806755065918, 1.1884737014770508, 1.3037668466567993, 1.4190599918365479, 1.5343530178070068, 1.6496460437774658, 1.7649391889572144, 1.880232334136963, 1.9955253601074219, 2.110818386077881, 2.22611141204834, 2.341404676437378, 2.456697702407837, 2.571990728378296, 2.687283992767334, 2.802577018737793, 2.917870044708252, 3.033163070678711, 3.14845609664917, 3.263749361038208, 3.379042387008667, 3.494335412979126, 3.609628677368164, 3.724921703338623, 3.840214729309082]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 10.0, 14.0, 7.0, 10.0, 20.0, 21.0, 23.0, 22.0, 16.0, 28.0, 31.0, 36.0, 41.0, 33.0, 31.0, 50.0, 33.0, 38.0, 53.0, 46.0, 39.0, 22.0, 43.0, 34.0, 42.0, 34.0, 27.0, 25.0, 26.0, 26.0, 16.0, 19.0, 15.0, 13.0, 10.0, 7.0, 9.0, 4.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.326143503189087, -1.2843542098999023, -1.2425650358200073, -1.2007757425308228, -1.1589865684509277, -1.1171972751617432, -1.0754081010818481, -1.0336188077926636, -0.9918296337127686, -0.9500404000282288, -0.908251166343689, -0.8664619326591492, -0.8246726989746094, -0.7828834652900696, -0.7410942316055298, -0.6993049383163452, -0.6575157046318054, -0.6157264709472656, -0.5739372372627258, -0.532148003578186, -0.49035876989364624, -0.44856953620910645, -0.40678027272224426, -0.36499103903770447, -0.3232018053531647, -0.2814125716686249, -0.23962333798408508, -0.1978340893983841, -0.1560448557138443, -0.1142556220293045, -0.07246637344360352, -0.03067713975906372, 0.011112093925476074, 0.05290133133530617, 0.09469056874513626, 0.13647980988025665, 0.17826904356479645, 0.22005827724933624, 0.26184752583503723, 0.303636759519577, 0.3454259932041168, 0.3872152268886566, 0.4290044605731964, 0.4707937240600586, 0.5125829577445984, 0.5543721914291382, 0.596161425113678, 0.6379506587982178, 0.6797398924827576, 0.7215291261672974, 0.7633183598518372, 0.805107593536377, 0.8468968272209167, 0.8886860609054565, 0.9304753541946411, 0.9722645282745361, 1.0140538215637207, 1.0558431148529053, 1.0976322889328003, 1.1394215822219849, 1.1812107563018799, 1.2230000495910645, 1.2647892236709595, 1.306578516960144, 1.348367691040039]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 4.0, 6.0, 3.0, 7.0, 7.0, 17.0, 24.0, 28.0, 46.0, 64.0, 97.0, 123.0, 183.0, 287.0, 494.0, 747.0, 1404.0, 2528.0, 4816.0, 9699.0, 21099.0, 47029.0, 107881.0, 215145.0, 279670.0, 191212.0, 90952.0, 39527.0, 17562.0, 8350.0, 4192.0, 2195.0, 1218.0, 705.0, 421.0, 276.0, 162.0, 107.0, 76.0, 54.0, 32.0, 33.0, 17.0, 17.0, 11.0, 12.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0], "bins": [-2.09765625, -2.0366668701171875, -1.975677490234375, -1.9146881103515625, -1.85369873046875, -1.7927093505859375, -1.731719970703125, -1.6707305908203125, -1.6097412109375, -1.5487518310546875, -1.487762451171875, -1.4267730712890625, -1.36578369140625, -1.3047943115234375, -1.243804931640625, -1.1828155517578125, -1.121826171875, -1.0608367919921875, -0.999847412109375, -0.9388580322265625, -0.87786865234375, -0.8168792724609375, -0.755889892578125, -0.6949005126953125, -0.6339111328125, -0.5729217529296875, -0.511932373046875, -0.4509429931640625, -0.38995361328125, -0.3289642333984375, -0.267974853515625, -0.2069854736328125, -0.14599609375, -0.0850067138671875, -0.024017333984375, 0.0369720458984375, 0.09796142578125, 0.1589508056640625, 0.219940185546875, 0.2809295654296875, 0.3419189453125, 0.4029083251953125, 0.463897705078125, 0.5248870849609375, 0.58587646484375, 0.6468658447265625, 0.707855224609375, 0.7688446044921875, 0.829833984375, 0.8908233642578125, 0.951812744140625, 1.0128021240234375, 1.07379150390625, 1.1347808837890625, 1.195770263671875, 1.2567596435546875, 1.3177490234375, 1.3787384033203125, 1.439727783203125, 1.5007171630859375, 1.56170654296875, 1.6226959228515625, 1.683685302734375, 1.7446746826171875, 1.8056640625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 9.0, 11.0, 8.0, 18.0, 13.0, 26.0, 21.0, 35.0, 36.0, 31.0, 32.0, 41.0, 44.0, 56.0, 35.0, 45.0, 58.0, 48.0, 44.0, 56.0, 47.0, 49.0, 32.0, 33.0, 33.0, 21.0, 19.0, 23.0, 17.0, 15.0, 8.0, 12.0, 5.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5556640625, -0.5374526977539062, -0.5192413330078125, -0.5010299682617188, -0.482818603515625, -0.46460723876953125, -0.4463958740234375, -0.42818450927734375, -0.40997314453125, -0.39176177978515625, -0.3735504150390625, -0.35533905029296875, -0.337127685546875, -0.31891632080078125, -0.3007049560546875, -0.28249359130859375, -0.2642822265625, -0.24607086181640625, -0.2278594970703125, -0.20964813232421875, -0.191436767578125, -0.17322540283203125, -0.1550140380859375, -0.13680267333984375, -0.11859130859375, -0.10037994384765625, -0.0821685791015625, -0.06395721435546875, -0.045745849609375, -0.02753448486328125, -0.0093231201171875, 0.00888824462890625, 0.027099609375, 0.04531097412109375, 0.0635223388671875, 0.08173370361328125, 0.099945068359375, 0.11815643310546875, 0.1363677978515625, 0.15457916259765625, 0.17279052734375, 0.19100189208984375, 0.2092132568359375, 0.22742462158203125, 0.245635986328125, 0.26384735107421875, 0.2820587158203125, 0.30027008056640625, 0.3184814453125, 0.33669281005859375, 0.3549041748046875, 0.37311553955078125, 0.391326904296875, 0.40953826904296875, 0.4277496337890625, 0.44596099853515625, 0.46417236328125, 0.48238372802734375, 0.5005950927734375, 0.5188064575195312, 0.537017822265625, 0.5552291870117188, 0.5734405517578125, 0.5916519165039062, 0.60986328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 4.0, 4.0, 8.0, 9.0, 17.0, 19.0, 27.0, 48.0, 74.0, 129.0, 228.0, 486.0, 1101.0, 2948.0, 8414.0, 29370.0, 124487.0, 479158.0, 305398.0, 69884.0, 17785.0, 5361.0, 1898.0, 822.0, 353.0, 189.0, 116.0, 78.0, 45.0, 27.0, 19.0, 14.0, 7.0, 6.0, 7.0, 8.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.76910400390625, -2.6729736328125, -2.57684326171875, -2.480712890625, -2.38458251953125, -2.2884521484375, -2.19232177734375, -2.09619140625, -2.00006103515625, -1.9039306640625, -1.80780029296875, -1.711669921875, -1.61553955078125, -1.5194091796875, -1.42327880859375, -1.3271484375, -1.23101806640625, -1.1348876953125, -1.03875732421875, -0.942626953125, -0.84649658203125, -0.7503662109375, -0.65423583984375, -0.55810546875, -0.46197509765625, -0.3658447265625, -0.26971435546875, -0.173583984375, -0.07745361328125, 0.0186767578125, 0.11480712890625, 0.2109375, 0.30706787109375, 0.4031982421875, 0.49932861328125, 0.595458984375, 0.69158935546875, 0.7877197265625, 0.88385009765625, 0.97998046875, 1.07611083984375, 1.1722412109375, 1.26837158203125, 1.364501953125, 1.46063232421875, 1.5567626953125, 1.65289306640625, 1.7490234375, 1.84515380859375, 1.9412841796875, 2.03741455078125, 2.133544921875, 2.22967529296875, 2.3258056640625, 2.42193603515625, 2.51806640625, 2.61419677734375, 2.7103271484375, 2.80645751953125, 2.902587890625, 2.99871826171875, 3.0948486328125, 3.19097900390625, 3.287109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 13.0, 10.0, 17.0, 21.0, 19.0, 30.0, 34.0, 40.0, 52.0, 50.0, 55.0, 70.0, 63.0, 57.0, 60.0, 64.0, 54.0, 54.0, 46.0, 36.0, 31.0, 26.0, 21.0, 15.0, 14.0, 13.0, 14.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.69140625, -4.574737548828125, -4.45806884765625, -4.341400146484375, -4.2247314453125, -4.108062744140625, -3.99139404296875, -3.874725341796875, -3.758056640625, -3.641387939453125, -3.52471923828125, -3.408050537109375, -3.2913818359375, -3.174713134765625, -3.05804443359375, -2.941375732421875, -2.82470703125, -2.708038330078125, -2.59136962890625, -2.474700927734375, -2.3580322265625, -2.241363525390625, -2.12469482421875, -2.008026123046875, -1.891357421875, -1.774688720703125, -1.65802001953125, -1.541351318359375, -1.4246826171875, -1.308013916015625, -1.19134521484375, -1.074676513671875, -0.9580078125, -0.841339111328125, -0.72467041015625, -0.608001708984375, -0.4913330078125, -0.374664306640625, -0.25799560546875, -0.141326904296875, -0.024658203125, 0.092010498046875, 0.20867919921875, 0.325347900390625, 0.4420166015625, 0.558685302734375, 0.67535400390625, 0.792022705078125, 0.90869140625, 1.025360107421875, 1.14202880859375, 1.258697509765625, 1.3753662109375, 1.492034912109375, 1.60870361328125, 1.725372314453125, 1.842041015625, 1.958709716796875, 2.07537841796875, 2.192047119140625, 2.3087158203125, 2.425384521484375, 2.54205322265625, 2.658721923828125, 2.775390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 5.0, 9.0, 23.0, 21.0, 35.0, 53.0, 83.0, 168.0, 273.0, 695.0, 1768.0, 6403.0, 37264.0, 591485.0, 374327.0, 27920.0, 5268.0, 1462.0, 628.0, 260.0, 153.0, 69.0, 46.0, 26.0, 27.0, 20.0, 10.0, 9.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.146484375, -3.053741455078125, -2.96099853515625, -2.868255615234375, -2.7755126953125, -2.682769775390625, -2.59002685546875, -2.497283935546875, -2.404541015625, -2.311798095703125, -2.21905517578125, -2.126312255859375, -2.0335693359375, -1.940826416015625, -1.84808349609375, -1.755340576171875, -1.66259765625, -1.569854736328125, -1.47711181640625, -1.384368896484375, -1.2916259765625, -1.198883056640625, -1.10614013671875, -1.013397216796875, -0.920654296875, -0.827911376953125, -0.73516845703125, -0.642425537109375, -0.5496826171875, -0.456939697265625, -0.36419677734375, -0.271453857421875, -0.1787109375, -0.085968017578125, 0.00677490234375, 0.099517822265625, 0.1922607421875, 0.285003662109375, 0.37774658203125, 0.470489501953125, 0.563232421875, 0.655975341796875, 0.74871826171875, 0.841461181640625, 0.9342041015625, 1.026947021484375, 1.11968994140625, 1.212432861328125, 1.30517578125, 1.397918701171875, 1.49066162109375, 1.583404541015625, 1.6761474609375, 1.768890380859375, 1.86163330078125, 1.954376220703125, 2.047119140625, 2.139862060546875, 2.23260498046875, 2.325347900390625, 2.4180908203125, 2.510833740234375, 2.60357666015625, 2.696319580078125, 2.7890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 15.0, 13.0, 9.0, 21.0, 22.0, 29.0, 30.0, 47.0, 58.0, 68.0, 87.0, 81.0, 93.0, 85.0, 66.0, 57.0, 44.0, 30.0, 29.0, 26.0, 18.0, 9.0, 8.0, 10.0, 7.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.00023317337036132812, -0.00022704154253005981, -0.0002209097146987915, -0.0002147778868675232, -0.00020864605903625488, -0.00020251423120498657, -0.00019638240337371826, -0.00019025057554244995, -0.00018411874771118164, -0.00017798691987991333, -0.00017185509204864502, -0.0001657232642173767, -0.0001595914363861084, -0.0001534596085548401, -0.00014732778072357178, -0.00014119595289230347, -0.00013506412506103516, -0.00012893229722976685, -0.00012280046939849854, -0.00011666864156723022, -0.00011053681373596191, -0.0001044049859046936, -9.827315807342529e-05, -9.214133024215698e-05, -8.600950241088867e-05, -7.987767457962036e-05, -7.374584674835205e-05, -6.761401891708374e-05, -6.148219108581543e-05, -5.535036325454712e-05, -4.921853542327881e-05, -4.30867075920105e-05, -3.695487976074219e-05, -3.082305192947388e-05, -2.4691224098205566e-05, -1.8559396266937256e-05, -1.2427568435668945e-05, -6.295740604400635e-06, -1.6391277313232422e-07, 5.967915058135986e-06, 1.2099742889404297e-05, 1.8231570720672607e-05, 2.4363398551940918e-05, 3.049522638320923e-05, 3.662705421447754e-05, 4.275888204574585e-05, 4.889070987701416e-05, 5.502253770828247e-05, 6.115436553955078e-05, 6.728619337081909e-05, 7.34180212020874e-05, 7.954984903335571e-05, 8.568167686462402e-05, 9.181350469589233e-05, 9.794533252716064e-05, 0.00010407716035842896, 0.00011020898818969727, 0.00011634081602096558, 0.0001224726438522339, 0.0001286044716835022, 0.0001347362995147705, 0.00014086812734603882, 0.00014699995517730713, 0.00015313178300857544, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 17.0, 21.0, 30.0, 61.0, 78.0, 161.0, 296.0, 561.0, 1535.0, 4394.0, 18272.0, 124366.0, 732299.0, 138926.0, 19771.0, 4890.0, 1493.0, 628.0, 316.0, 181.0, 96.0, 57.0, 28.0, 15.0, 16.0, 17.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.328125, -2.2542724609375, -2.180419921875, -2.1065673828125, -2.03271484375, -1.9588623046875, -1.885009765625, -1.8111572265625, -1.7373046875, -1.6634521484375, -1.589599609375, -1.5157470703125, -1.44189453125, -1.3680419921875, -1.294189453125, -1.2203369140625, -1.146484375, -1.0726318359375, -0.998779296875, -0.9249267578125, -0.85107421875, -0.7772216796875, -0.703369140625, -0.6295166015625, -0.5556640625, -0.4818115234375, -0.407958984375, -0.3341064453125, -0.26025390625, -0.1864013671875, -0.112548828125, -0.0386962890625, 0.03515625, 0.1090087890625, 0.182861328125, 0.2567138671875, 0.33056640625, 0.4044189453125, 0.478271484375, 0.5521240234375, 0.6259765625, 0.6998291015625, 0.773681640625, 0.8475341796875, 0.92138671875, 0.9952392578125, 1.069091796875, 1.1429443359375, 1.216796875, 1.2906494140625, 1.364501953125, 1.4383544921875, 1.51220703125, 1.5860595703125, 1.659912109375, 1.7337646484375, 1.8076171875, 1.8814697265625, 1.955322265625, 2.0291748046875, 2.10302734375, 2.1768798828125, 2.250732421875, 2.3245849609375, 2.3984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 7.0, 9.0, 5.0, 11.0, 13.0, 9.0, 21.0, 24.0, 31.0, 47.0, 61.0, 104.0, 139.0, 138.0, 108.0, 66.0, 67.0, 36.0, 30.0, 23.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.29827880859375, -3.2117919921875, -3.12530517578125, -3.038818359375, -2.95233154296875, -2.8658447265625, -2.77935791015625, -2.69287109375, -2.60638427734375, -2.5198974609375, -2.43341064453125, -2.346923828125, -2.26043701171875, -2.1739501953125, -2.08746337890625, -2.0009765625, -1.91448974609375, -1.8280029296875, -1.74151611328125, -1.655029296875, -1.56854248046875, -1.4820556640625, -1.39556884765625, -1.30908203125, -1.22259521484375, -1.1361083984375, -1.04962158203125, -0.963134765625, -0.87664794921875, -0.7901611328125, -0.70367431640625, -0.6171875, -0.53070068359375, -0.4442138671875, -0.35772705078125, -0.271240234375, -0.18475341796875, -0.0982666015625, -0.01177978515625, 0.07470703125, 0.16119384765625, 0.2476806640625, 0.33416748046875, 0.420654296875, 0.50714111328125, 0.5936279296875, 0.68011474609375, 0.7666015625, 0.85308837890625, 0.9395751953125, 1.02606201171875, 1.112548828125, 1.19903564453125, 1.2855224609375, 1.37200927734375, 1.45849609375, 1.54498291015625, 1.6314697265625, 1.71795654296875, 1.804443359375, 1.89093017578125, 1.9774169921875, 2.06390380859375, 2.150390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 7.0, 11.0, 18.0, 46.0, 50.0, 126.0, 160.0, 172.0, 153.0, 119.0, 66.0, 40.0, 23.0, 10.0, 4.0, 2.0, 3.0], "bins": [-68.13705444335938, -66.88511657714844, -65.63318634033203, -64.3812484741211, -63.12931442260742, -61.87738037109375, -60.62544250488281, -59.37350845336914, -58.12157440185547, -56.8696403503418, -55.617706298828125, -54.36576843261719, -53.113834381103516, -51.861900329589844, -50.609962463378906, -49.358028411865234, -48.10609436035156, -46.85416030883789, -45.60222625732422, -44.35028839111328, -43.09835433959961, -41.84642028808594, -40.594482421875, -39.34254837036133, -38.090614318847656, -36.838680267333984, -35.58674621582031, -34.334808349609375, -33.0828742980957, -31.83094024658203, -30.579004287719727, -29.327068328857422, -28.075136184692383, -26.823200225830078, -25.571266174316406, -24.319332122802734, -23.06739616394043, -21.815460205078125, -20.563526153564453, -19.31159210205078, -18.059656143188477, -16.807720184326172, -15.5557861328125, -14.303851127624512, -13.051916122436523, -11.799981117248535, -10.548046112060547, -9.296111106872559, -8.04417610168457, -6.792241096496582, -5.540306091308594, -4.2883710861206055, -3.036436080932617, -1.784501075744629, -0.5325660705566406, 0.7193689346313477, 1.971303939819336, 3.223238945007324, 4.4751739501953125, 5.727108955383301, 6.979043960571289, 8.230978965759277, 9.482913970947266, 10.734848976135254, 11.986783981323242]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 1.0, 5.0, 3.0, 3.0, 3.0, 9.0, 13.0, 12.0, 23.0, 20.0, 35.0, 34.0, 23.0, 40.0, 46.0, 38.0, 58.0, 64.0, 58.0, 64.0, 68.0, 58.0, 47.0, 45.0, 32.0, 38.0, 25.0, 22.0, 26.0, 14.0, 14.0, 14.0, 9.0, 9.0, 5.0, 13.0, 4.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.822039604187012, -15.275516510009766, -14.728992462158203, -14.182469367980957, -13.635946273803711, -13.089422225952148, -12.542899131774902, -11.996376037597656, -11.449851989746094, -10.903328895568848, -10.356804847717285, -9.810281753540039, -9.263758659362793, -8.717235565185547, -8.170711517333984, -7.624188423156738, -7.077665328979492, -6.531141757965088, -5.984618663787842, -5.4380950927734375, -4.891571998596191, -4.345048427581787, -3.798524856567383, -3.2520015239715576, -2.7054781913757324, -2.1589548587799072, -1.6124314069747925, -1.0659079551696777, -0.5193846225738525, 0.027138710021972656, 0.573662281036377, 1.1201856136322021, 1.666707992553711, 2.213231325149536, 2.7597546577453613, 3.3062782287597656, 3.852801561355591, 4.399324893951416, 4.94584846496582, 5.492371559143066, 6.038895130157471, 6.585418701171875, 7.131941795349121, 7.678465366363525, 8.22498893737793, 8.771512031555176, 9.318035125732422, 9.864559173583984, 10.41108226776123, 10.957605361938477, 11.504129409790039, 12.050652503967285, 12.597175598144531, 13.143699645996094, 13.69022274017334, 14.236745834350586, 14.783269882202148, 15.329792976379395, 15.876317024230957, 16.422840118408203, 16.969364166259766, 17.515886306762695, 18.062410354614258, 18.60893440246582, 19.15545654296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 13.0, 23.0, 39.0, 74.0, 149.0, 397.0, 956.0, 2531.0, 10113.0, 152855.0, 4003942.0, 17367.0, 3673.0, 1172.0, 504.0, 183.0, 116.0, 62.0, 40.0, 16.0, 13.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.671875, -9.43682861328125, -9.2017822265625, -8.96673583984375, -8.731689453125, -8.49664306640625, -8.2615966796875, -8.02655029296875, -7.79150390625, -7.55645751953125, -7.3214111328125, -7.08636474609375, -6.851318359375, -6.61627197265625, -6.3812255859375, -6.14617919921875, -5.9111328125, -5.67608642578125, -5.4410400390625, -5.20599365234375, -4.970947265625, -4.73590087890625, -4.5008544921875, -4.26580810546875, -4.03076171875, -3.79571533203125, -3.5606689453125, -3.32562255859375, -3.090576171875, -2.85552978515625, -2.6204833984375, -2.38543701171875, -2.150390625, -1.91534423828125, -1.6802978515625, -1.44525146484375, -1.210205078125, -0.97515869140625, -0.7401123046875, -0.50506591796875, -0.27001953125, -0.03497314453125, 0.2000732421875, 0.43511962890625, 0.670166015625, 0.90521240234375, 1.1402587890625, 1.37530517578125, 1.6103515625, 1.84539794921875, 2.0804443359375, 2.31549072265625, 2.550537109375, 2.78558349609375, 3.0206298828125, 3.25567626953125, 3.49072265625, 3.72576904296875, 3.9608154296875, 4.19586181640625, 4.430908203125, 4.66595458984375, 4.9010009765625, 5.13604736328125, 5.37109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 0.0, 1.0, 5.0, 9.0, 8.0, 7.0, 7.0, 9.0, 20.0, 23.0, 21.0, 44.0, 39.0, 53.0, 64.0, 68.0, 59.0, 72.0, 73.0, 69.0, 67.0, 45.0, 47.0, 45.0, 29.0, 34.0, 21.0, 14.0, 18.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5556640625, -0.5292205810546875, -0.502777099609375, -0.4763336181640625, -0.44989013671875, -0.4234466552734375, -0.397003173828125, -0.3705596923828125, -0.3441162109375, -0.3176727294921875, -0.291229248046875, -0.2647857666015625, -0.23834228515625, -0.2118988037109375, -0.185455322265625, -0.1590118408203125, -0.132568359375, -0.1061248779296875, -0.079681396484375, -0.0532379150390625, -0.02679443359375, -0.0003509521484375, 0.026092529296875, 0.0525360107421875, 0.0789794921875, 0.1054229736328125, 0.131866455078125, 0.1583099365234375, 0.18475341796875, 0.2111968994140625, 0.237640380859375, 0.2640838623046875, 0.29052734375, 0.3169708251953125, 0.343414306640625, 0.3698577880859375, 0.39630126953125, 0.4227447509765625, 0.449188232421875, 0.4756317138671875, 0.5020751953125, 0.5285186767578125, 0.554962158203125, 0.5814056396484375, 0.60784912109375, 0.6342926025390625, 0.660736083984375, 0.6871795654296875, 0.713623046875, 0.7400665283203125, 0.766510009765625, 0.7929534912109375, 0.81939697265625, 0.8458404541015625, 0.872283935546875, 0.8987274169921875, 0.9251708984375, 0.9516143798828125, 0.978057861328125, 1.0045013427734375, 1.03094482421875, 1.0573883056640625, 1.083831787109375, 1.1102752685546875, 1.13671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 16.0, 28.0, 30.0, 51.0, 67.0, 110.0, 163.0, 225.0, 364.0, 506.0, 859.0, 1360.0, 2054.0, 3743.0, 7524.0, 17184.0, 54924.0, 3519421.0, 509083.0, 45460.0, 15385.0, 6782.0, 3474.0, 1962.0, 1215.0, 746.0, 487.0, 326.0, 242.0, 152.0, 98.0, 74.0, 43.0, 44.0, 28.0, 11.0, 10.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.95843505859375, -2.8348388671875, -2.71124267578125, -2.587646484375, -2.46405029296875, -2.3404541015625, -2.21685791015625, -2.09326171875, -1.96966552734375, -1.8460693359375, -1.72247314453125, -1.598876953125, -1.47528076171875, -1.3516845703125, -1.22808837890625, -1.1044921875, -0.98089599609375, -0.8572998046875, -0.73370361328125, -0.610107421875, -0.48651123046875, -0.3629150390625, -0.23931884765625, -0.11572265625, 0.00787353515625, 0.1314697265625, 0.25506591796875, 0.378662109375, 0.50225830078125, 0.6258544921875, 0.74945068359375, 0.873046875, 0.99664306640625, 1.1202392578125, 1.24383544921875, 1.367431640625, 1.49102783203125, 1.6146240234375, 1.73822021484375, 1.86181640625, 1.98541259765625, 2.1090087890625, 2.23260498046875, 2.356201171875, 2.47979736328125, 2.6033935546875, 2.72698974609375, 2.8505859375, 2.97418212890625, 3.0977783203125, 3.22137451171875, 3.344970703125, 3.46856689453125, 3.5921630859375, 3.71575927734375, 3.83935546875, 3.96295166015625, 4.0865478515625, 4.21014404296875, 4.333740234375, 4.45733642578125, 4.5809326171875, 4.70452880859375, 4.828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 8.0, 7.0, 18.0, 15.0, 26.0, 37.0, 85.0, 230.0, 3097.0, 273.0, 102.0, 49.0, 21.0, 31.0, 13.0, 14.0, 5.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9961090087890625, -0.959991455078125, -0.9238739013671875, -0.88775634765625, -0.8516387939453125, -0.815521240234375, -0.7794036865234375, -0.7432861328125, -0.7071685791015625, -0.671051025390625, -0.6349334716796875, -0.59881591796875, -0.5626983642578125, -0.526580810546875, -0.4904632568359375, -0.454345703125, -0.4182281494140625, -0.382110595703125, -0.3459930419921875, -0.30987548828125, -0.2737579345703125, -0.237640380859375, -0.2015228271484375, -0.1654052734375, -0.1292877197265625, -0.093170166015625, -0.0570526123046875, -0.02093505859375, 0.0151824951171875, 0.051300048828125, 0.0874176025390625, 0.12353515625, 0.1596527099609375, 0.195770263671875, 0.2318878173828125, 0.26800537109375, 0.3041229248046875, 0.340240478515625, 0.3763580322265625, 0.4124755859375, 0.4485931396484375, 0.484710693359375, 0.5208282470703125, 0.55694580078125, 0.5930633544921875, 0.629180908203125, 0.6652984619140625, 0.701416015625, 0.7375335693359375, 0.773651123046875, 0.8097686767578125, 0.84588623046875, 0.8820037841796875, 0.918121337890625, 0.9542388916015625, 0.9903564453125, 1.0264739990234375, 1.062591552734375, 1.0987091064453125, 1.13482666015625, 1.1709442138671875, 1.207061767578125, 1.2431793212890625, 1.279296875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 7.0, 18.0, 29.0, 29.0, 56.0, 90.0, 137.0, 149.0, 137.0, 110.0, 80.0, 66.0, 24.0, 19.0, 22.0, 12.0, 3.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.178412437438965, -3.970205783843994, -3.7619991302490234, -3.5537924766540527, -3.345585823059082, -3.1373791694641113, -2.9291725158691406, -2.72096586227417, -2.512759208679199, -2.3045525550842285, -2.096345901489258, -1.888139247894287, -1.6799325942993164, -1.4717258214950562, -1.2635191679000854, -1.0553125143051147, -0.8471057415008545, -0.6388990879058838, -0.4306924045085907, -0.2224857211112976, -0.014279067516326904, 0.19392764568328857, 0.4021342992782593, 0.61034095287323, 0.8185476064682007, 1.0267542600631714, 1.234960913658142, 1.4431676864624023, 1.651374340057373, 1.8595809936523438, 2.0677876472473145, 2.275994300842285, 2.484200954437256, 2.6924076080322266, 2.9006142616271973, 3.108820915222168, 3.3170275688171387, 3.5252342224121094, 3.73344087600708, 3.941647529602051, 4.1498541831970215, 4.358060836791992, 4.566267490386963, 4.774474143981934, 4.982680797576904, 5.190887451171875, 5.399094104766846, 5.607300758361816, 5.815507888793945, 6.023714542388916, 6.231921195983887, 6.440127849578857, 6.648334503173828, 6.856541156768799, 7.0647478103637695, 7.27295446395874, 7.481161117553711, 7.689367771148682, 7.897574424743652, 8.105781555175781, 8.313987731933594, 8.522194862365723, 8.730401039123535, 8.938608169555664, 9.146814346313477]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 18.0, 16.0, 19.0, 24.0, 33.0, 31.0, 26.0, 26.0, 48.0, 36.0, 30.0, 36.0, 52.0, 43.0, 41.0, 39.0, 34.0, 39.0, 35.0, 34.0, 43.0, 31.0, 29.0, 34.0, 27.0, 31.0, 22.0, 20.0, 9.0, 10.0, 10.0, 10.0, 5.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.6049296855926514, -3.502578020095825, -3.400226354598999, -3.297874689102173, -3.1955230236053467, -3.0931713581085205, -2.9908194541931152, -2.888467788696289, -2.786116123199463, -2.6837644577026367, -2.5814127922058105, -2.4790611267089844, -2.376709461212158, -2.274357795715332, -2.172006130218506, -2.0696544647216797, -1.9673027992248535, -1.8649511337280273, -1.7625994682312012, -1.660247802734375, -1.5578961372375488, -1.4555444717407227, -1.353192687034607, -1.2508410215377808, -1.1484893560409546, -1.0461376905441284, -0.9437860250473022, -0.8414342999458313, -0.7390826344490051, -0.636730968952179, -0.534379243850708, -0.43202757835388184, -0.32967591285705566, -0.2273242324590683, -0.12497255206108093, -0.022620856761932373, 0.0797308087348938, 0.18208247423171997, 0.2844341993331909, 0.3867858648300171, 0.48913753032684326, 0.5914891958236694, 0.6938408613204956, 0.7961925864219666, 0.8985442519187927, 1.0008959770202637, 1.1032476425170898, 1.205599308013916, 1.3079509735107422, 1.4103026390075684, 1.5126543045043945, 1.6150059700012207, 1.7173576354980469, 1.819709300994873, 1.9220610857009888, 2.0244126319885254, 2.1267642974853516, 2.2291159629821777, 2.331467628479004, 2.43381929397583, 2.5361709594726562, 2.6385226249694824, 2.7408742904663086, 2.8432259559631348, 2.94557785987854]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 14.0, 13.0, 18.0, 41.0, 57.0, 67.0, 91.0, 127.0, 233.0, 332.0, 558.0, 952.0, 1720.0, 3135.0, 6007.0, 12197.0, 26250.0, 57703.0, 126920.0, 241633.0, 270604.0, 160139.0, 74361.0, 33581.0, 15563.0, 7271.0, 3905.0, 2064.0, 1159.0, 633.0, 399.0, 262.0, 173.0, 113.0, 79.0, 50.0, 32.0, 30.0, 15.0, 9.0, 4.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.9404296875, -1.8836212158203125, -1.826812744140625, -1.7700042724609375, -1.71319580078125, -1.6563873291015625, -1.599578857421875, -1.5427703857421875, -1.4859619140625, -1.4291534423828125, -1.372344970703125, -1.3155364990234375, -1.25872802734375, -1.2019195556640625, -1.145111083984375, -1.0883026123046875, -1.031494140625, -0.9746856689453125, -0.917877197265625, -0.8610687255859375, -0.80426025390625, -0.7474517822265625, -0.690643310546875, -0.6338348388671875, -0.5770263671875, -0.5202178955078125, -0.463409423828125, -0.4066009521484375, -0.34979248046875, -0.2929840087890625, -0.236175537109375, -0.1793670654296875, -0.12255859375, -0.0657501220703125, -0.008941650390625, 0.0478668212890625, 0.10467529296875, 0.1614837646484375, 0.218292236328125, 0.2751007080078125, 0.3319091796875, 0.3887176513671875, 0.445526123046875, 0.5023345947265625, 0.55914306640625, 0.6159515380859375, 0.672760009765625, 0.7295684814453125, 0.786376953125, 0.8431854248046875, 0.899993896484375, 0.9568023681640625, 1.01361083984375, 1.0704193115234375, 1.127227783203125, 1.1840362548828125, 1.2408447265625, 1.2976531982421875, 1.354461669921875, 1.4112701416015625, 1.46807861328125, 1.5248870849609375, 1.581695556640625, 1.6385040283203125, 1.6953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 8.0, 9.0, 13.0, 16.0, 21.0, 12.0, 25.0, 31.0, 43.0, 47.0, 49.0, 42.0, 62.0, 66.0, 68.0, 64.0, 67.0, 56.0, 57.0, 42.0, 38.0, 34.0, 23.0, 21.0, 22.0, 22.0, 13.0, 6.0, 6.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.758056640625, -0.72607421875, -0.694091796875, -0.662109375, -0.630126953125, -0.59814453125, -0.566162109375, -0.5341796875, -0.502197265625, -0.47021484375, -0.438232421875, -0.40625, -0.374267578125, -0.34228515625, -0.310302734375, -0.2783203125, -0.246337890625, -0.21435546875, -0.182373046875, -0.150390625, -0.118408203125, -0.08642578125, -0.054443359375, -0.0224609375, 0.009521484375, 0.04150390625, 0.073486328125, 0.10546875, 0.137451171875, 0.16943359375, 0.201416015625, 0.2333984375, 0.265380859375, 0.29736328125, 0.329345703125, 0.361328125, 0.393310546875, 0.42529296875, 0.457275390625, 0.4892578125, 0.521240234375, 0.55322265625, 0.585205078125, 0.6171875, 0.649169921875, 0.68115234375, 0.713134765625, 0.7451171875, 0.777099609375, 0.80908203125, 0.841064453125, 0.873046875, 0.905029296875, 0.93701171875, 0.968994140625, 1.0009765625, 1.032958984375, 1.06494140625, 1.096923828125, 1.12890625, 1.160888671875, 1.19287109375, 1.224853515625, 1.2568359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 16.0, 15.0, 21.0, 35.0, 71.0, 123.0, 288.0, 687.0, 2061.0, 8697.0, 58974.0, 639457.0, 303170.0, 27640.0, 5041.0, 1366.0, 448.0, 187.0, 120.0, 53.0, 40.0, 16.0, 15.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.51348876953125, -7.3199462890625, -7.12640380859375, -6.932861328125, -6.73931884765625, -6.5457763671875, -6.35223388671875, -6.15869140625, -5.96514892578125, -5.7716064453125, -5.57806396484375, -5.384521484375, -5.19097900390625, -4.9974365234375, -4.80389404296875, -4.6103515625, -4.41680908203125, -4.2232666015625, -4.02972412109375, -3.836181640625, -3.64263916015625, -3.4490966796875, -3.25555419921875, -3.06201171875, -2.86846923828125, -2.6749267578125, -2.48138427734375, -2.287841796875, -2.09429931640625, -1.9007568359375, -1.70721435546875, -1.513671875, -1.32012939453125, -1.1265869140625, -0.93304443359375, -0.739501953125, -0.54595947265625, -0.3524169921875, -0.15887451171875, 0.03466796875, 0.22821044921875, 0.4217529296875, 0.61529541015625, 0.808837890625, 1.00238037109375, 1.1959228515625, 1.38946533203125, 1.5830078125, 1.77655029296875, 1.9700927734375, 2.16363525390625, 2.357177734375, 2.55072021484375, 2.7442626953125, 2.93780517578125, 3.13134765625, 3.32489013671875, 3.5184326171875, 3.71197509765625, 3.905517578125, 4.09906005859375, 4.2926025390625, 4.48614501953125, 4.6796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 15.0, 12.0, 12.0, 24.0, 24.0, 24.0, 31.0, 44.0, 58.0, 59.0, 60.0, 61.0, 75.0, 61.0, 48.0, 61.0, 47.0, 43.0, 48.0, 38.0, 25.0, 22.0, 18.0, 15.0, 12.0, 4.0, 12.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.1280517578125, -5.955322265625, -5.7825927734375, -5.60986328125, -5.4371337890625, -5.264404296875, -5.0916748046875, -4.9189453125, -4.7462158203125, -4.573486328125, -4.4007568359375, -4.22802734375, -4.0552978515625, -3.882568359375, -3.7098388671875, -3.537109375, -3.3643798828125, -3.191650390625, -3.0189208984375, -2.84619140625, -2.6734619140625, -2.500732421875, -2.3280029296875, -2.1552734375, -1.9825439453125, -1.809814453125, -1.6370849609375, -1.46435546875, -1.2916259765625, -1.118896484375, -0.9461669921875, -0.7734375, -0.6007080078125, -0.427978515625, -0.2552490234375, -0.08251953125, 0.0902099609375, 0.262939453125, 0.4356689453125, 0.6083984375, 0.7811279296875, 0.953857421875, 1.1265869140625, 1.29931640625, 1.4720458984375, 1.644775390625, 1.8175048828125, 1.990234375, 2.1629638671875, 2.335693359375, 2.5084228515625, 2.68115234375, 2.8538818359375, 3.026611328125, 3.1993408203125, 3.3720703125, 3.5447998046875, 3.717529296875, 3.8902587890625, 4.06298828125, 4.2357177734375, 4.408447265625, 4.5811767578125, 4.75390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 8.0, 19.0, 34.0, 54.0, 121.0, 181.0, 488.0, 1262.0, 5231.0, 51124.0, 856430.0, 122118.0, 8663.0, 1749.0, 538.0, 239.0, 113.0, 75.0, 32.0, 22.0, 17.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.07403564453125, -3.9410400390625, -3.80804443359375, -3.675048828125, -3.54205322265625, -3.4090576171875, -3.27606201171875, -3.14306640625, -3.01007080078125, -2.8770751953125, -2.74407958984375, -2.611083984375, -2.47808837890625, -2.3450927734375, -2.21209716796875, -2.0791015625, -1.94610595703125, -1.8131103515625, -1.68011474609375, -1.547119140625, -1.41412353515625, -1.2811279296875, -1.14813232421875, -1.01513671875, -0.88214111328125, -0.7491455078125, -0.61614990234375, -0.483154296875, -0.35015869140625, -0.2171630859375, -0.08416748046875, 0.048828125, 0.18182373046875, 0.3148193359375, 0.44781494140625, 0.580810546875, 0.71380615234375, 0.8468017578125, 0.97979736328125, 1.11279296875, 1.24578857421875, 1.3787841796875, 1.51177978515625, 1.644775390625, 1.77777099609375, 1.9107666015625, 2.04376220703125, 2.1767578125, 2.30975341796875, 2.4427490234375, 2.57574462890625, 2.708740234375, 2.84173583984375, 2.9747314453125, 3.10772705078125, 3.24072265625, 3.37371826171875, 3.5067138671875, 3.63970947265625, 3.772705078125, 3.90570068359375, 4.0386962890625, 4.17169189453125, 4.3046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 6.0, 14.0, 9.0, 26.0, 28.0, 40.0, 51.0, 86.0, 119.0, 126.0, 125.0, 111.0, 110.0, 44.0, 38.0, 24.0, 18.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.0005655288696289062, -0.0005529113113880157, -0.0005402937531471252, -0.0005276761949062347, -0.0005150586366653442, -0.0005024410784244537, -0.0004898235201835632, -0.00047720596194267273, -0.0004645884037017822, -0.0004519708454608917, -0.0004393532872200012, -0.0004267357289791107, -0.0004141181707382202, -0.0004015006124973297, -0.0003888830542564392, -0.0003762654960155487, -0.0003636479377746582, -0.0003510303795337677, -0.0003384128212928772, -0.0003257952630519867, -0.0003131777048110962, -0.0003005601465702057, -0.0002879425883293152, -0.0002753250300884247, -0.0002627074718475342, -0.0002500899136066437, -0.00023747235536575317, -0.00022485479712486267, -0.00021223723888397217, -0.00019961968064308167, -0.00018700212240219116, -0.00017438456416130066, -0.00016176700592041016, -0.00014914944767951965, -0.00013653188943862915, -0.00012391433119773865, -0.00011129677295684814, -9.867921471595764e-05, -8.606165647506714e-05, -7.344409823417664e-05, -6.082653999328613e-05, -4.820898175239563e-05, -3.559142351150513e-05, -2.2973865270614624e-05, -1.0356307029724121e-05, 2.261251211166382e-06, 1.4878809452056885e-05, 2.7496367692947388e-05, 4.011392593383789e-05, 5.2731484174728394e-05, 6.53490424156189e-05, 7.79666006565094e-05, 9.05841588973999e-05, 0.0001032017171382904, 0.00011581927537918091, 0.0001284368336200714, 0.00014105439186096191, 0.00015367195010185242, 0.00016628950834274292, 0.00017890706658363342, 0.00019152462482452393, 0.00020414218306541443, 0.00021675974130630493, 0.00022937729954719543, 0.00024199485778808594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 14.0, 18.0, 26.0, 45.0, 92.0, 210.0, 480.0, 1962.0, 29210.0, 974053.0, 39279.0, 2181.0, 530.0, 206.0, 107.0, 49.0, 31.0, 20.0, 11.0, 8.0, 5.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.4503173828125, -8.236572265625, -8.0228271484375, -7.80908203125, -7.5953369140625, -7.381591796875, -7.1678466796875, -6.9541015625, -6.7403564453125, -6.526611328125, -6.3128662109375, -6.09912109375, -5.8853759765625, -5.671630859375, -5.4578857421875, -5.244140625, -5.0303955078125, -4.816650390625, -4.6029052734375, -4.38916015625, -4.1754150390625, -3.961669921875, -3.7479248046875, -3.5341796875, -3.3204345703125, -3.106689453125, -2.8929443359375, -2.67919921875, -2.4654541015625, -2.251708984375, -2.0379638671875, -1.82421875, -1.6104736328125, -1.396728515625, -1.1829833984375, -0.96923828125, -0.7554931640625, -0.541748046875, -0.3280029296875, -0.1142578125, 0.0994873046875, 0.313232421875, 0.5269775390625, 0.74072265625, 0.9544677734375, 1.168212890625, 1.3819580078125, 1.595703125, 1.8094482421875, 2.023193359375, 2.2369384765625, 2.45068359375, 2.6644287109375, 2.878173828125, 3.0919189453125, 3.3056640625, 3.5194091796875, 3.733154296875, 3.9468994140625, 4.16064453125, 4.3743896484375, 4.588134765625, 4.8018798828125, 5.015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 17.0, 27.0, 69.0, 173.0, 306.0, 235.0, 109.0, 32.0, 21.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.662567138671875, -10.43450927734375, -10.206451416015625, -9.9783935546875, -9.750335693359375, -9.52227783203125, -9.294219970703125, -9.066162109375, -8.838104248046875, -8.61004638671875, -8.381988525390625, -8.1539306640625, -7.925872802734375, -7.69781494140625, -7.469757080078125, -7.24169921875, -7.013641357421875, -6.78558349609375, -6.557525634765625, -6.3294677734375, -6.101409912109375, -5.87335205078125, -5.645294189453125, -5.417236328125, -5.189178466796875, -4.96112060546875, -4.733062744140625, -4.5050048828125, -4.276947021484375, -4.04888916015625, -3.820831298828125, -3.5927734375, -3.364715576171875, -3.13665771484375, -2.908599853515625, -2.6805419921875, -2.452484130859375, -2.22442626953125, -1.996368408203125, -1.768310546875, -1.540252685546875, -1.31219482421875, -1.084136962890625, -0.8560791015625, -0.628021240234375, -0.39996337890625, -0.171905517578125, 0.05615234375, 0.284210205078125, 0.51226806640625, 0.740325927734375, 0.9683837890625, 1.196441650390625, 1.42449951171875, 1.652557373046875, 1.880615234375, 2.108673095703125, 2.33673095703125, 2.564788818359375, 2.7928466796875, 3.020904541015625, 3.24896240234375, 3.477020263671875, 3.705078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 11.0, 27.0, 116.0, 362.0, 359.0, 121.0, 13.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.034568786621094, -43.15842819213867, -39.282283782958984, -35.40614318847656, -31.530000686645508, -27.653858184814453, -23.77771759033203, -19.901575088500977, -16.025432586669922, -12.149290084838867, -8.273148536682129, -4.397006988525391, -0.5208644866943359, 3.3552780151367188, 7.231418609619141, 11.107561111450195, 14.98370361328125, 18.859846115112305, 22.73598861694336, 26.61212921142578, 30.488271713256836, 34.36441421508789, 38.24055480957031, 42.11669921875, 45.99283981323242, 49.868980407714844, 53.74512481689453, 57.62126541137695, 61.497406005859375, 65.37355041503906, 69.24969482421875, 73.1258316040039, 77.00196838378906, 80.87811279296875, 84.7542495727539, 88.6303939819336, 92.50653839111328, 96.38267517089844, 100.25881958007812, 104.13496398925781, 108.0111083984375, 111.88725280761719, 115.76338958740234, 119.63953399658203, 123.51567840576172, 127.39181518554688, 131.26795959472656, 135.14410400390625, 139.02023315429688, 142.89637756347656, 146.77252197265625, 150.64865112304688, 154.52479553222656, 158.40093994140625, 162.27708435058594, 166.15322875976562, 170.0293731689453, 173.905517578125, 177.7816619873047, 181.65780639648438, 185.533935546875, 189.4100799560547, 193.28622436523438, 197.16236877441406, 201.03851318359375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 2.0, 9.0, 9.0, 17.0, 10.0, 16.0, 22.0, 19.0, 26.0, 29.0, 39.0, 36.0, 52.0, 44.0, 38.0, 60.0, 44.0, 77.0, 55.0, 52.0, 47.0, 37.0, 37.0, 34.0, 30.0, 25.0, 24.0, 21.0, 15.0, 10.0, 8.0, 17.0, 5.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.857677459716797, -22.127111434936523, -21.39654541015625, -20.665979385375977, -19.935413360595703, -19.20484733581543, -18.474281311035156, -17.743715286254883, -17.01314926147461, -16.282583236694336, -15.552017211914062, -14.821451187133789, -14.090885162353516, -13.360319137573242, -12.629753112792969, -11.899187088012695, -11.168621063232422, -10.438055038452148, -9.707489013671875, -8.976922988891602, -8.246356964111328, -7.515790939331055, -6.785224914550781, -6.054658889770508, -5.324092864990234, -4.593526840209961, -3.8629608154296875, -3.132394790649414, -2.4018287658691406, -1.6712627410888672, -0.9406967163085938, -0.2101306915283203, 0.5204334259033203, 1.2509994506835938, 1.9815654754638672, 2.7121315002441406, 3.442697525024414, 4.1732635498046875, 4.903829574584961, 5.634395599365234, 6.364961624145508, 7.095527648925781, 7.826093673706055, 8.556659698486328, 9.287225723266602, 10.017791748046875, 10.748357772827148, 11.478923797607422, 12.209489822387695, 12.940055847167969, 13.670621871948242, 14.401187896728516, 15.131753921508789, 15.862319946289062, 16.592885971069336, 17.32345199584961, 18.054018020629883, 18.784584045410156, 19.51515007019043, 20.245716094970703, 20.976282119750977, 21.70684814453125, 22.437414169311523, 23.167980194091797, 23.89854621887207]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 2.0, 5.0, 9.0, 16.0, 23.0, 30.0, 58.0, 103.0, 202.0, 397.0, 794.0, 1750.0, 5336.0, 42106.0, 4122099.0, 15591.0, 3337.0, 1195.0, 566.0, 254.0, 163.0, 85.0, 51.0, 31.0, 15.0, 12.0, 13.0, 7.0, 11.0, 2.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8046875, -8.5322265625, -8.259765625, -7.9873046875, -7.71484375, -7.4423828125, -7.169921875, -6.8974609375, -6.625, -6.3525390625, -6.080078125, -5.8076171875, -5.53515625, -5.2626953125, -4.990234375, -4.7177734375, -4.4453125, -4.1728515625, -3.900390625, -3.6279296875, -3.35546875, -3.0830078125, -2.810546875, -2.5380859375, -2.265625, -1.9931640625, -1.720703125, -1.4482421875, -1.17578125, -0.9033203125, -0.630859375, -0.3583984375, -0.0859375, 0.1865234375, 0.458984375, 0.7314453125, 1.00390625, 1.2763671875, 1.548828125, 1.8212890625, 2.09375, 2.3662109375, 2.638671875, 2.9111328125, 3.18359375, 3.4560546875, 3.728515625, 4.0009765625, 4.2734375, 4.5458984375, 4.818359375, 5.0908203125, 5.36328125, 5.6357421875, 5.908203125, 6.1806640625, 6.453125, 6.7255859375, 6.998046875, 7.2705078125, 7.54296875, 7.8154296875, 8.087890625, 8.3603515625, 8.6328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 11.0, 18.0, 30.0, 31.0, 39.0, 43.0, 58.0, 72.0, 84.0, 87.0, 87.0, 93.0, 79.0, 54.0, 56.0, 33.0, 25.0, 28.0, 16.0, 12.0, 12.0, 5.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.1131591796875, -1.065185546875, -1.0172119140625, -0.96923828125, -0.9212646484375, -0.873291015625, -0.8253173828125, -0.77734375, -0.7293701171875, -0.681396484375, -0.6334228515625, -0.58544921875, -0.5374755859375, -0.489501953125, -0.4415283203125, -0.3935546875, -0.3455810546875, -0.297607421875, -0.2496337890625, -0.20166015625, -0.1536865234375, -0.105712890625, -0.0577392578125, -0.009765625, 0.0382080078125, 0.086181640625, 0.1341552734375, 0.18212890625, 0.2301025390625, 0.278076171875, 0.3260498046875, 0.3740234375, 0.4219970703125, 0.469970703125, 0.5179443359375, 0.56591796875, 0.6138916015625, 0.661865234375, 0.7098388671875, 0.7578125, 0.8057861328125, 0.853759765625, 0.9017333984375, 0.94970703125, 0.9976806640625, 1.045654296875, 1.0936279296875, 1.1416015625, 1.1895751953125, 1.237548828125, 1.2855224609375, 1.33349609375, 1.3814697265625, 1.429443359375, 1.4774169921875, 1.525390625, 1.5733642578125, 1.621337890625, 1.6693115234375, 1.71728515625, 1.7652587890625, 1.813232421875, 1.8612060546875, 1.9091796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 16.0, 12.0, 25.0, 27.0, 27.0, 76.0, 92.0, 158.0, 273.0, 360.0, 573.0, 1011.0, 1859.0, 3846.0, 9980.0, 48790.0, 4070440.0, 39832.0, 9016.0, 3551.0, 1744.0, 994.0, 514.0, 346.0, 244.0, 141.0, 81.0, 66.0, 55.0, 40.0, 31.0, 13.0, 13.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.17669677734375, -5.9432373046875, -5.70977783203125, -5.476318359375, -5.24285888671875, -5.0093994140625, -4.77593994140625, -4.54248046875, -4.30902099609375, -4.0755615234375, -3.84210205078125, -3.608642578125, -3.37518310546875, -3.1417236328125, -2.90826416015625, -2.6748046875, -2.44134521484375, -2.2078857421875, -1.97442626953125, -1.740966796875, -1.50750732421875, -1.2740478515625, -1.04058837890625, -0.80712890625, -0.57366943359375, -0.3402099609375, -0.10675048828125, 0.126708984375, 0.36016845703125, 0.5936279296875, 0.82708740234375, 1.060546875, 1.29400634765625, 1.5274658203125, 1.76092529296875, 1.994384765625, 2.22784423828125, 2.4613037109375, 2.69476318359375, 2.92822265625, 3.16168212890625, 3.3951416015625, 3.62860107421875, 3.862060546875, 4.09552001953125, 4.3289794921875, 4.56243896484375, 4.7958984375, 5.02935791015625, 5.2628173828125, 5.49627685546875, 5.729736328125, 5.96319580078125, 6.1966552734375, 6.43011474609375, 6.66357421875, 6.89703369140625, 7.1304931640625, 7.36395263671875, 7.597412109375, 7.83087158203125, 8.0643310546875, 8.29779052734375, 8.53125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 11.0, 22.0, 37.0, 76.0, 3630.0, 167.0, 52.0, 19.0, 10.0, 6.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41796875, -1.3607177734375, -1.303466796875, -1.2462158203125, -1.18896484375, -1.1317138671875, -1.074462890625, -1.0172119140625, -0.9599609375, -0.9027099609375, -0.845458984375, -0.7882080078125, -0.73095703125, -0.6737060546875, -0.616455078125, -0.5592041015625, -0.501953125, -0.4447021484375, -0.387451171875, -0.3302001953125, -0.27294921875, -0.2156982421875, -0.158447265625, -0.1011962890625, -0.0439453125, 0.0133056640625, 0.070556640625, 0.1278076171875, 0.18505859375, 0.2423095703125, 0.299560546875, 0.3568115234375, 0.4140625, 0.4713134765625, 0.528564453125, 0.5858154296875, 0.64306640625, 0.7003173828125, 0.757568359375, 0.8148193359375, 0.8720703125, 0.9293212890625, 0.986572265625, 1.0438232421875, 1.10107421875, 1.1583251953125, 1.215576171875, 1.2728271484375, 1.330078125, 1.3873291015625, 1.444580078125, 1.5018310546875, 1.55908203125, 1.6163330078125, 1.673583984375, 1.7308349609375, 1.7880859375, 1.8453369140625, 1.902587890625, 1.9598388671875, 2.01708984375, 2.0743408203125, 2.131591796875, 2.1888427734375, 2.24609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 15.0, 28.0, 45.0, 84.0, 119.0, 137.0, 148.0, 116.0, 105.0, 55.0, 42.0, 33.0, 20.0, 10.0, 4.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.686426162719727, -6.486286640167236, -6.286147117614746, -6.086007118225098, -5.885867595672607, -5.685728073120117, -5.485588550567627, -5.285449028015137, -5.085309028625488, -4.885169506072998, -4.685029983520508, -4.484889984130859, -4.284750461578369, -4.084610939025879, -3.8844714164733887, -3.6843318939208984, -3.484192371368408, -3.284052848815918, -3.0839130878448486, -2.8837735652923584, -2.683633804321289, -2.483494281768799, -2.2833547592163086, -2.0832152366638184, -1.883075475692749, -1.6829358339309692, -1.4827961921691895, -1.2826566696166992, -1.0825170278549194, -0.8823773860931396, -0.6822378635406494, -0.48209822177886963, -0.28195905685424805, -0.08181944489479065, 0.11832016706466675, 0.31845974922180176, 0.5185993909835815, 0.7187390327453613, 0.9188785552978516, 1.1190181970596313, 1.3191578388214111, 1.519297480583191, 1.7194371223449707, 1.919576644897461, 2.119716167449951, 2.3198559284210205, 2.5199954509735107, 2.72013521194458, 2.9202747344970703, 3.1204142570495605, 3.32055401802063, 3.52069354057312, 3.7208333015441895, 3.9209728240966797, 4.12111234664917, 4.32125186920166, 4.521391868591309, 4.721531391143799, 4.921670913696289, 5.1218109130859375, 5.321950435638428, 5.522089958190918, 5.722229480743408, 5.922369003295898, 6.122508525848389]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 7.0, 6.0, 10.0, 17.0, 9.0, 7.0, 18.0, 17.0, 23.0, 20.0, 17.0, 28.0, 33.0, 40.0, 45.0, 39.0, 49.0, 46.0, 40.0, 43.0, 38.0, 40.0, 35.0, 47.0, 51.0, 24.0, 37.0, 30.0, 23.0, 27.0, 19.0, 25.0, 19.0, 19.0, 15.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822389602661133, -2.73347806930542, -2.644566297531128, -2.555654764175415, -2.466742992401123, -2.37783145904541, -2.2889199256896973, -2.2000083923339844, -2.1110966205596924, -2.0221850872039795, -1.9332733154296875, -1.8443617820739746, -1.7554501295089722, -1.6665384769439697, -1.5776269435882568, -1.4887152910232544, -1.399803638458252, -1.3108919858932495, -1.221980333328247, -1.1330687999725342, -1.0441571474075317, -0.9552454948425293, -0.8663339018821716, -0.777422308921814, -0.6885106563568115, -0.5995990037918091, -0.5106874108314514, -0.42177578806877136, -0.3328641653060913, -0.24395254254341125, -0.1550409197807312, -0.06612932682037354, 0.022782325744628906, 0.11169394850730896, 0.200605571269989, 0.28951719403266907, 0.3784288167953491, 0.4673404395580292, 0.5562520623207092, 0.6451636552810669, 0.7340753078460693, 0.8229869604110718, 0.9118985533714294, 1.000810146331787, 1.0897217988967896, 1.178633451461792, 1.2675449848175049, 1.3564566373825073, 1.4453682899475098, 1.5342799425125122, 1.6231915950775146, 1.7121031284332275, 1.80101478099823, 1.8899264335632324, 1.9788379669189453, 2.067749500274658, 2.15666127204895, 2.245572805404663, 2.334484577178955, 2.423396110534668, 2.512307643890381, 2.601219415664673, 2.6901309490203857, 2.7790427207946777, 2.8679542541503906]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 11.0, 9.0, 8.0, 16.0, 18.0, 40.0, 43.0, 61.0, 108.0, 121.0, 262.0, 409.0, 746.0, 1490.0, 3424.0, 8094.0, 21670.0, 65901.0, 210980.0, 427685.0, 207354.0, 63953.0, 21452.0, 7999.0, 3320.0, 1518.0, 756.0, 433.0, 200.0, 148.0, 93.0, 62.0, 48.0, 35.0, 26.0, 19.0, 11.0, 3.0, 5.0, 6.0, 3.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.83984375, -2.749664306640625, -2.65948486328125, -2.569305419921875, -2.4791259765625, -2.388946533203125, -2.29876708984375, -2.208587646484375, -2.118408203125, -2.028228759765625, -1.93804931640625, -1.847869873046875, -1.7576904296875, -1.667510986328125, -1.57733154296875, -1.487152099609375, -1.39697265625, -1.306793212890625, -1.21661376953125, -1.126434326171875, -1.0362548828125, -0.946075439453125, -0.85589599609375, -0.765716552734375, -0.675537109375, -0.585357666015625, -0.49517822265625, -0.404998779296875, -0.3148193359375, -0.224639892578125, -0.13446044921875, -0.044281005859375, 0.0458984375, 0.136077880859375, 0.22625732421875, 0.316436767578125, 0.4066162109375, 0.496795654296875, 0.58697509765625, 0.677154541015625, 0.767333984375, 0.857513427734375, 0.94769287109375, 1.037872314453125, 1.1280517578125, 1.218231201171875, 1.30841064453125, 1.398590087890625, 1.48876953125, 1.578948974609375, 1.66912841796875, 1.759307861328125, 1.8494873046875, 1.939666748046875, 2.02984619140625, 2.120025634765625, 2.210205078125, 2.300384521484375, 2.39056396484375, 2.480743408203125, 2.5709228515625, 2.661102294921875, 2.75128173828125, 2.841461181640625, 2.931640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 10.0, 11.0, 11.0, 18.0, 24.0, 38.0, 42.0, 49.0, 56.0, 65.0, 71.0, 51.0, 71.0, 77.0, 64.0, 52.0, 67.0, 40.0, 40.0, 38.0, 31.0, 15.0, 15.0, 14.0, 6.0, 5.0, 2.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3461456298828125, -1.300689697265625, -1.2552337646484375, -1.20977783203125, -1.1643218994140625, -1.118865966796875, -1.0734100341796875, -1.0279541015625, -0.9824981689453125, -0.937042236328125, -0.8915863037109375, -0.84613037109375, -0.8006744384765625, -0.755218505859375, -0.7097625732421875, -0.664306640625, -0.6188507080078125, -0.573394775390625, -0.5279388427734375, -0.48248291015625, -0.4370269775390625, -0.391571044921875, -0.3461151123046875, -0.3006591796875, -0.2552032470703125, -0.209747314453125, -0.1642913818359375, -0.11883544921875, -0.0733795166015625, -0.027923583984375, 0.0175323486328125, 0.06298828125, 0.1084442138671875, 0.153900146484375, 0.1993560791015625, 0.24481201171875, 0.2902679443359375, 0.335723876953125, 0.3811798095703125, 0.4266357421875, 0.4720916748046875, 0.517547607421875, 0.5630035400390625, 0.60845947265625, 0.6539154052734375, 0.699371337890625, 0.7448272705078125, 0.790283203125, 0.8357391357421875, 0.881195068359375, 0.9266510009765625, 0.97210693359375, 1.0175628662109375, 1.063018798828125, 1.1084747314453125, 1.1539306640625, 1.1993865966796875, 1.244842529296875, 1.2902984619140625, 1.33575439453125, 1.3812103271484375, 1.426666259765625, 1.4721221923828125, 1.517578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 15.0, 22.0, 42.0, 59.0, 92.0, 178.0, 355.0, 670.0, 1750.0, 6183.0, 34155.0, 306668.0, 612162.0, 70813.0, 10818.0, 2679.0, 924.0, 396.0, 215.0, 115.0, 66.0, 47.0, 27.0, 24.0, 21.0, 10.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.2078857421875, -4.040771484375, -3.8736572265625, -3.70654296875, -3.5394287109375, -3.372314453125, -3.2052001953125, -3.0380859375, -2.8709716796875, -2.703857421875, -2.5367431640625, -2.36962890625, -2.2025146484375, -2.035400390625, -1.8682861328125, -1.701171875, -1.5340576171875, -1.366943359375, -1.1998291015625, -1.03271484375, -0.8656005859375, -0.698486328125, -0.5313720703125, -0.3642578125, -0.1971435546875, -0.030029296875, 0.1370849609375, 0.30419921875, 0.4713134765625, 0.638427734375, 0.8055419921875, 0.97265625, 1.1397705078125, 1.306884765625, 1.4739990234375, 1.64111328125, 1.8082275390625, 1.975341796875, 2.1424560546875, 2.3095703125, 2.4766845703125, 2.643798828125, 2.8109130859375, 2.97802734375, 3.1451416015625, 3.312255859375, 3.4793701171875, 3.646484375, 3.8135986328125, 3.980712890625, 4.1478271484375, 4.31494140625, 4.4820556640625, 4.649169921875, 4.8162841796875, 4.9833984375, 5.1505126953125, 5.317626953125, 5.4847412109375, 5.65185546875, 5.8189697265625, 5.986083984375, 6.1531982421875, 6.3203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 12.0, 11.0, 19.0, 14.0, 20.0, 26.0, 25.0, 23.0, 38.0, 33.0, 40.0, 59.0, 50.0, 61.0, 54.0, 58.0, 51.0, 51.0, 52.0, 42.0, 45.0, 50.0, 29.0, 22.0, 20.0, 19.0, 11.0, 9.0, 14.0, 8.0, 5.0, 7.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.27874755859375, -5.0887451171875, -4.89874267578125, -4.708740234375, -4.51873779296875, -4.3287353515625, -4.13873291015625, -3.94873046875, -3.75872802734375, -3.5687255859375, -3.37872314453125, -3.188720703125, -2.99871826171875, -2.8087158203125, -2.61871337890625, -2.4287109375, -2.23870849609375, -2.0487060546875, -1.85870361328125, -1.668701171875, -1.47869873046875, -1.2886962890625, -1.09869384765625, -0.90869140625, -0.71868896484375, -0.5286865234375, -0.33868408203125, -0.148681640625, 0.04132080078125, 0.2313232421875, 0.42132568359375, 0.611328125, 0.80133056640625, 0.9913330078125, 1.18133544921875, 1.371337890625, 1.56134033203125, 1.7513427734375, 1.94134521484375, 2.13134765625, 2.32135009765625, 2.5113525390625, 2.70135498046875, 2.891357421875, 3.08135986328125, 3.2713623046875, 3.46136474609375, 3.6513671875, 3.84136962890625, 4.0313720703125, 4.22137451171875, 4.411376953125, 4.60137939453125, 4.7913818359375, 4.98138427734375, 5.17138671875, 5.36138916015625, 5.5513916015625, 5.74139404296875, 5.931396484375, 6.12139892578125, 6.3114013671875, 6.50140380859375, 6.69140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 7.0, 18.0, 22.0, 38.0, 29.0, 68.0, 95.0, 190.0, 307.0, 622.0, 1484.0, 4594.0, 23470.0, 407671.0, 571666.0, 29920.0, 5190.0, 1644.0, 633.0, 315.0, 214.0, 124.0, 70.0, 36.0, 32.0, 23.0, 15.0, 10.0, 9.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.923828125, -2.8265380859375, -2.729248046875, -2.6319580078125, -2.53466796875, -2.4373779296875, -2.340087890625, -2.2427978515625, -2.1455078125, -2.0482177734375, -1.950927734375, -1.8536376953125, -1.75634765625, -1.6590576171875, -1.561767578125, -1.4644775390625, -1.3671875, -1.2698974609375, -1.172607421875, -1.0753173828125, -0.97802734375, -0.8807373046875, -0.783447265625, -0.6861572265625, -0.5888671875, -0.4915771484375, -0.394287109375, -0.2969970703125, -0.19970703125, -0.1024169921875, -0.005126953125, 0.0921630859375, 0.189453125, 0.2867431640625, 0.384033203125, 0.4813232421875, 0.57861328125, 0.6759033203125, 0.773193359375, 0.8704833984375, 0.9677734375, 1.0650634765625, 1.162353515625, 1.2596435546875, 1.35693359375, 1.4542236328125, 1.551513671875, 1.6488037109375, 1.74609375, 1.8433837890625, 1.940673828125, 2.0379638671875, 2.13525390625, 2.2325439453125, 2.329833984375, 2.4271240234375, 2.5244140625, 2.6217041015625, 2.718994140625, 2.8162841796875, 2.91357421875, 3.0108642578125, 3.108154296875, 3.2054443359375, 3.302734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 8.0, 13.0, 25.0, 36.0, 52.0, 72.0, 76.0, 127.0, 128.0, 146.0, 115.0, 59.0, 57.0, 38.0, 20.0, 16.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00024629756808280945, -0.00023295730352401733, -0.00021961703896522522, -0.0002062767744064331, -0.000192936509847641, -0.00017959624528884888, -0.00016625598073005676, -0.00015291571617126465, -0.00013957545161247253, -0.00012623518705368042, -0.0001128949224948883, -9.955465793609619e-05, -8.621439337730408e-05, -7.287412881851196e-05, -5.953386425971985e-05, -4.6193599700927734e-05, -3.285333514213562e-05, -1.9513070583343506e-05, -6.172806024551392e-06, 7.167458534240723e-06, 2.0507723093032837e-05, 3.384798765182495e-05, 4.7188252210617065e-05, 6.052851676940918e-05, 7.38687813282013e-05, 8.720904588699341e-05, 0.00010054931044578552, 0.00011388957500457764, 0.00012722983956336975, 0.00014057010412216187, 0.00015391036868095398, 0.0001672506332397461, 0.0001805908977985382, 0.00019393116235733032, 0.00020727142691612244, 0.00022061169147491455, 0.00023395195603370667, 0.0002472922205924988, 0.0002606324851512909, 0.000273972749710083, 0.0002873130142688751, 0.00030065327882766724, 0.00031399354338645935, 0.00032733380794525146, 0.0003406740725040436, 0.0003540143370628357, 0.0003673546016216278, 0.0003806948661804199, 0.00039403513073921204, 0.00040737539529800415, 0.00042071565985679626, 0.0004340559244155884, 0.0004473961889743805, 0.0004607364535331726, 0.0004740767180919647, 0.00048741698265075684, 0.000500757247209549, 0.0005140975117683411, 0.0005274377763271332, 0.0005407780408859253, 0.0005541183054447174, 0.0005674585700035095, 0.0005807988345623016, 0.0005941390991210938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 11.0, 5.0, 10.0, 18.0, 17.0, 34.0, 56.0, 99.0, 258.0, 593.0, 1712.0, 6597.0, 59015.0, 884947.0, 84156.0, 7934.0, 1934.0, 659.0, 243.0, 109.0, 54.0, 28.0, 24.0, 12.0, 12.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.0093994140625, -3.878173828125, -3.7469482421875, -3.61572265625, -3.4844970703125, -3.353271484375, -3.2220458984375, -3.0908203125, -2.9595947265625, -2.828369140625, -2.6971435546875, -2.56591796875, -2.4346923828125, -2.303466796875, -2.1722412109375, -2.041015625, -1.9097900390625, -1.778564453125, -1.6473388671875, -1.51611328125, -1.3848876953125, -1.253662109375, -1.1224365234375, -0.9912109375, -0.8599853515625, -0.728759765625, -0.5975341796875, -0.46630859375, -0.3350830078125, -0.203857421875, -0.0726318359375, 0.05859375, 0.1898193359375, 0.321044921875, 0.4522705078125, 0.58349609375, 0.7147216796875, 0.845947265625, 0.9771728515625, 1.1083984375, 1.2396240234375, 1.370849609375, 1.5020751953125, 1.63330078125, 1.7645263671875, 1.895751953125, 2.0269775390625, 2.158203125, 2.2894287109375, 2.420654296875, 2.5518798828125, 2.68310546875, 2.8143310546875, 2.945556640625, 3.0767822265625, 3.2080078125, 3.3392333984375, 3.470458984375, 3.6016845703125, 3.73291015625, 3.8641357421875, 3.995361328125, 4.1265869140625, 4.2578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 18.0, 26.0, 34.0, 53.0, 73.0, 94.0, 116.0, 116.0, 109.0, 72.0, 80.0, 54.0, 38.0, 23.0, 13.0, 14.0, 4.0, 6.0, 5.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.275848388671875, -2.18646240234375, -2.097076416015625, -2.0076904296875, -1.918304443359375, -1.82891845703125, -1.739532470703125, -1.650146484375, -1.560760498046875, -1.47137451171875, -1.381988525390625, -1.2926025390625, -1.203216552734375, -1.11383056640625, -1.024444580078125, -0.93505859375, -0.845672607421875, -0.75628662109375, -0.666900634765625, -0.5775146484375, -0.488128662109375, -0.39874267578125, -0.309356689453125, -0.219970703125, -0.130584716796875, -0.04119873046875, 0.048187255859375, 0.1375732421875, 0.226959228515625, 0.31634521484375, 0.405731201171875, 0.4951171875, 0.584503173828125, 0.67388916015625, 0.763275146484375, 0.8526611328125, 0.942047119140625, 1.03143310546875, 1.120819091796875, 1.210205078125, 1.299591064453125, 1.38897705078125, 1.478363037109375, 1.5677490234375, 1.657135009765625, 1.74652099609375, 1.835906982421875, 1.92529296875, 2.014678955078125, 2.10406494140625, 2.193450927734375, 2.2828369140625, 2.372222900390625, 2.46160888671875, 2.550994873046875, 2.640380859375, 2.729766845703125, 2.81915283203125, 2.908538818359375, 2.9979248046875, 3.087310791015625, 3.17669677734375, 3.266082763671875, 3.35546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 11.0, 100.0, 370.0, 407.0, 93.0, 25.0, 3.0, 1.0, 1.0, 1.0], "bins": [-240.26705932617188, -236.05662536621094, -231.84619140625, -227.63575744628906, -223.42532348632812, -219.21487426757812, -215.00445556640625, -210.79400634765625, -206.5835723876953, -202.37313842773438, -198.16270446777344, -193.9522705078125, -189.74183654785156, -185.53140258789062, -181.32095336914062, -177.1105194091797, -172.90008544921875, -168.6896514892578, -164.47921752929688, -160.26878356933594, -156.058349609375, -151.847900390625, -147.63748168945312, -143.42703247070312, -139.21661376953125, -135.0061798095703, -130.79574584960938, -126.58531188964844, -122.37487030029297, -118.16443634033203, -113.9540023803711, -109.74356842041016, -105.53313446044922, -101.32270050048828, -97.11226654052734, -92.90182495117188, -88.69139099121094, -84.48095703125, -80.27052307128906, -76.06008911132812, -71.84964752197266, -67.63921356201172, -63.428775787353516, -59.21834182739258, -55.007904052734375, -50.79747009277344, -46.5870361328125, -42.37660217285156, -38.166168212890625, -33.95573425292969, -29.745296478271484, -25.534862518310547, -21.324426651000977, -17.113990783691406, -12.903556823730469, -8.693120956420898, -4.482683181762695, -0.2722477912902832, 3.938187599182129, 8.148622512817383, 12.359058380126953, 16.569494247436523, 20.77992820739746, 24.99036407470703, 29.2007999420166]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 2.0, 6.0, 7.0, 12.0, 17.0, 14.0, 24.0, 28.0, 34.0, 47.0, 54.0, 43.0, 59.0, 46.0, 89.0, 60.0, 71.0, 51.0, 51.0, 57.0, 50.0, 44.0, 26.0, 20.0, 24.0, 19.0, 13.0, 10.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.46742248535156, -37.43059539794922, -36.393768310546875, -35.35694122314453, -34.32011413574219, -33.28328323364258, -32.246456146240234, -31.20962905883789, -30.172801971435547, -29.135974884033203, -28.09914779663086, -27.062318801879883, -26.02549171447754, -24.988664627075195, -23.95183563232422, -22.915008544921875, -21.87818145751953, -20.841354370117188, -19.804527282714844, -18.767698287963867, -17.730871200561523, -16.69404411315918, -15.65721607208252, -14.62038803100586, -13.583560943603516, -12.546733856201172, -11.509905815124512, -10.473077774047852, -9.436250686645508, -8.399423599243164, -7.362595558166504, -6.325767993927002, -5.288944244384766, -4.252116680145264, -3.2152891159057617, -2.1784615516662598, -1.1416339874267578, -0.10480642318725586, 0.9320211410522461, 1.968848705291748, 3.00567626953125, 4.042503833770752, 5.079331398010254, 6.116158962249756, 7.152986526489258, 8.189813613891602, 9.226641654968262, 10.263469696044922, 11.300296783447266, 12.33712387084961, 13.37395191192627, 14.41077995300293, 15.447607040405273, 16.484434127807617, 17.521263122558594, 18.558090209960938, 19.59491729736328, 20.631744384765625, 21.66857147216797, 22.705400466918945, 23.74222755432129, 24.779054641723633, 25.81588363647461, 26.852710723876953, 27.889537811279297]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 13.0, 6.0, 18.0, 26.0, 37.0, 57.0, 86.0, 155.0, 243.0, 516.0, 1195.0, 2982.0, 9567.0, 95161.0, 4050680.0, 25130.0, 5237.0, 1707.0, 698.0, 349.0, 163.0, 89.0, 59.0, 44.0, 21.0, 10.0, 10.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.80206298828125, -4.6041259765625, -4.40618896484375, -4.208251953125, -4.01031494140625, -3.8123779296875, -3.61444091796875, -3.41650390625, -3.21856689453125, -3.0206298828125, -2.82269287109375, -2.624755859375, -2.42681884765625, -2.2288818359375, -2.03094482421875, -1.8330078125, -1.63507080078125, -1.4371337890625, -1.23919677734375, -1.041259765625, -0.84332275390625, -0.6453857421875, -0.44744873046875, -0.24951171875, -0.05157470703125, 0.1463623046875, 0.34429931640625, 0.542236328125, 0.74017333984375, 0.9381103515625, 1.13604736328125, 1.333984375, 1.53192138671875, 1.7298583984375, 1.92779541015625, 2.125732421875, 2.32366943359375, 2.5216064453125, 2.71954345703125, 2.91748046875, 3.11541748046875, 3.3133544921875, 3.51129150390625, 3.709228515625, 3.90716552734375, 4.1051025390625, 4.30303955078125, 4.5009765625, 4.69891357421875, 4.8968505859375, 5.09478759765625, 5.292724609375, 5.49066162109375, 5.6885986328125, 5.88653564453125, 6.08447265625, 6.28240966796875, 6.4803466796875, 6.67828369140625, 6.876220703125, 7.07415771484375, 7.2720947265625, 7.47003173828125, 7.66796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 9.0, 24.0, 38.0, 49.0, 61.0, 71.0, 101.0, 99.0, 121.0, 110.0, 84.0, 69.0, 48.0, 37.0, 20.0, 11.0, 11.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.416015625, -2.3471832275390625, -2.278350830078125, -2.2095184326171875, -2.14068603515625, -2.0718536376953125, -2.003021240234375, -1.9341888427734375, -1.8653564453125, -1.7965240478515625, -1.727691650390625, -1.6588592529296875, -1.59002685546875, -1.5211944580078125, -1.452362060546875, -1.3835296630859375, -1.314697265625, -1.2458648681640625, -1.177032470703125, -1.1082000732421875, -1.03936767578125, -0.9705352783203125, -0.901702880859375, -0.8328704833984375, -0.7640380859375, -0.6952056884765625, -0.626373291015625, -0.5575408935546875, -0.48870849609375, -0.4198760986328125, -0.351043701171875, -0.2822113037109375, -0.21337890625, -0.1445465087890625, -0.075714111328125, -0.0068817138671875, 0.06195068359375, 0.1307830810546875, 0.199615478515625, 0.2684478759765625, 0.3372802734375, 0.4061126708984375, 0.474945068359375, 0.5437774658203125, 0.61260986328125, 0.6814422607421875, 0.750274658203125, 0.8191070556640625, 0.887939453125, 0.9567718505859375, 1.025604248046875, 1.0944366455078125, 1.16326904296875, 1.2321014404296875, 1.300933837890625, 1.3697662353515625, 1.4385986328125, 1.5074310302734375, 1.576263427734375, 1.6450958251953125, 1.71392822265625, 1.7827606201171875, 1.851593017578125, 1.9204254150390625, 1.9892578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 16.0, 20.0, 31.0, 30.0, 50.0, 53.0, 90.0, 120.0, 197.0, 284.0, 478.0, 789.0, 1373.0, 2659.0, 6049.0, 16002.0, 63934.0, 3877381.0, 179110.0, 28108.0, 9113.0, 3822.0, 1893.0, 1012.0, 563.0, 346.0, 241.0, 167.0, 115.0, 67.0, 41.0, 40.0, 23.0, 17.0, 13.0, 12.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5, -3.36395263671875, -3.2279052734375, -3.09185791015625, -2.955810546875, -2.81976318359375, -2.6837158203125, -2.54766845703125, -2.41162109375, -2.27557373046875, -2.1395263671875, -2.00347900390625, -1.867431640625, -1.73138427734375, -1.5953369140625, -1.45928955078125, -1.3232421875, -1.18719482421875, -1.0511474609375, -0.91510009765625, -0.779052734375, -0.64300537109375, -0.5069580078125, -0.37091064453125, -0.23486328125, -0.09881591796875, 0.0372314453125, 0.17327880859375, 0.309326171875, 0.44537353515625, 0.5814208984375, 0.71746826171875, 0.853515625, 0.98956298828125, 1.1256103515625, 1.26165771484375, 1.397705078125, 1.53375244140625, 1.6697998046875, 1.80584716796875, 1.94189453125, 2.07794189453125, 2.2139892578125, 2.35003662109375, 2.486083984375, 2.62213134765625, 2.7581787109375, 2.89422607421875, 3.0302734375, 3.16632080078125, 3.3023681640625, 3.43841552734375, 3.574462890625, 3.71051025390625, 3.8465576171875, 3.98260498046875, 4.11865234375, 4.25469970703125, 4.3907470703125, 4.52679443359375, 4.662841796875, 4.79888916015625, 4.9349365234375, 5.07098388671875, 5.20703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 9.0, 10.0, 5.0, 18.0, 23.0, 35.0, 53.0, 96.0, 252.0, 3183.0, 170.0, 63.0, 41.0, 32.0, 21.0, 14.0, 8.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.779144287109375, -1.71649169921875, -1.653839111328125, -1.5911865234375, -1.528533935546875, -1.46588134765625, -1.403228759765625, -1.340576171875, -1.277923583984375, -1.21527099609375, -1.152618408203125, -1.0899658203125, -1.027313232421875, -0.96466064453125, -0.902008056640625, -0.83935546875, -0.776702880859375, -0.71405029296875, -0.651397705078125, -0.5887451171875, -0.526092529296875, -0.46343994140625, -0.400787353515625, -0.338134765625, -0.275482177734375, -0.21282958984375, -0.150177001953125, -0.0875244140625, -0.024871826171875, 0.03778076171875, 0.100433349609375, 0.1630859375, 0.225738525390625, 0.28839111328125, 0.351043701171875, 0.4136962890625, 0.476348876953125, 0.53900146484375, 0.601654052734375, 0.664306640625, 0.726959228515625, 0.78961181640625, 0.852264404296875, 0.9149169921875, 0.977569580078125, 1.04022216796875, 1.102874755859375, 1.16552734375, 1.228179931640625, 1.29083251953125, 1.353485107421875, 1.4161376953125, 1.478790283203125, 1.54144287109375, 1.604095458984375, 1.666748046875, 1.729400634765625, 1.79205322265625, 1.854705810546875, 1.9173583984375, 1.980010986328125, 2.04266357421875, 2.105316162109375, 2.16796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 4.0, 17.0, 25.0, 67.0, 126.0, 199.0, 229.0, 166.0, 94.0, 39.0, 15.0, 8.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.184077262878418, -13.732525825500488, -13.280973434448242, -12.829421997070312, -12.377870559692383, -11.926318168640137, -11.474766731262207, -11.023214340209961, -10.571662902832031, -10.120111465454102, -9.668559074401855, -9.217007637023926, -8.76545524597168, -8.31390380859375, -7.86235237121582, -7.410800457000732, -6.9592485427856445, -6.507696628570557, -6.056144714355469, -5.604593276977539, -5.153041362762451, -4.701489448547363, -4.249938011169434, -3.7983860969543457, -3.346834182739258, -2.89528226852417, -2.443730592727661, -1.9921787977218628, -1.5406270027160645, -1.0890750885009766, -0.6375234127044678, -0.18597173690795898, 0.2655811309814453, 0.7171329259872437, 1.168684720993042, 1.6202365159988403, 2.0717883110046387, 2.5233402252197266, 2.9748919010162354, 3.426443576812744, 3.877995491027832, 4.32954740524292, 4.781099319458008, 5.2326507568359375, 5.684202671051025, 6.135754585266113, 6.587306022644043, 7.038857936859131, 7.490409851074219, 7.941961765289307, 8.393513679504395, 8.845065116882324, 9.29661750793457, 9.7481689453125, 10.19972038269043, 10.65127182006836, 11.102824211120605, 11.554375648498535, 12.005928039550781, 12.457479476928711, 12.90903091430664, 13.360583305358887, 13.812134742736816, 14.263687133789062, 14.715238571166992]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 8.0, 10.0, 6.0, 15.0, 21.0, 25.0, 25.0, 26.0, 27.0, 39.0, 36.0, 37.0, 33.0, 35.0, 46.0, 55.0, 46.0, 48.0, 38.0, 34.0, 48.0, 41.0, 32.0, 46.0, 39.0, 24.0, 28.0, 22.0, 18.0, 19.0, 11.0, 14.0, 13.0, 5.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.659075736999512, -4.512619972229004, -4.366164207458496, -4.219708442687988, -4.0732526779174805, -3.9267966747283936, -3.7803406715393066, -3.633884906768799, -3.487429141998291, -3.340973377227783, -3.1945176124572754, -3.0480616092681885, -2.9016058444976807, -2.755150079727173, -2.608694076538086, -2.462238311767578, -2.3157825469970703, -2.1693267822265625, -2.0228710174560547, -1.8764150142669678, -1.72995924949646, -1.5835034847259521, -1.4370476007461548, -1.2905917167663574, -1.1441359519958496, -0.997680127620697, -0.8512243032455444, -0.7047684788703918, -0.5583126544952393, -0.41185683012008667, -0.2654010057449341, -0.11894512176513672, 0.027510643005371094, 0.17396646738052368, 0.32042229175567627, 0.46687811613082886, 0.6133339405059814, 0.759789764881134, 0.9062455892562866, 1.052701473236084, 1.1991572380065918, 1.3456130027770996, 1.492068886756897, 1.6385247707366943, 1.7849805355072021, 1.93143630027771, 2.077892303466797, 2.2243480682373047, 2.3708038330078125, 2.5172595977783203, 2.663715362548828, 2.810171365737915, 2.956627130508423, 3.1030828952789307, 3.2495388984680176, 3.3959946632385254, 3.542450428009033, 3.688906192779541, 3.835361957550049, 3.9818179607391357, 4.128273963928223, 4.2747297286987305, 4.421185493469238, 4.567641258239746, 4.714097023010254]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 9.0, 12.0, 31.0, 72.0, 120.0, 332.0, 984.0, 3573.0, 21613.0, 241951.0, 680691.0, 86226.0, 9810.0, 2085.0, 603.0, 213.0, 114.0, 47.0, 30.0, 17.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.657958984375, -7.45263671875, -7.247314453125, -7.0419921875, -6.836669921875, -6.63134765625, -6.426025390625, -6.220703125, -6.015380859375, -5.81005859375, -5.604736328125, -5.3994140625, -5.194091796875, -4.98876953125, -4.783447265625, -4.578125, -4.372802734375, -4.16748046875, -3.962158203125, -3.7568359375, -3.551513671875, -3.34619140625, -3.140869140625, -2.935546875, -2.730224609375, -2.52490234375, -2.319580078125, -2.1142578125, -1.908935546875, -1.70361328125, -1.498291015625, -1.29296875, -1.087646484375, -0.88232421875, -0.677001953125, -0.4716796875, -0.266357421875, -0.06103515625, 0.144287109375, 0.349609375, 0.554931640625, 0.76025390625, 0.965576171875, 1.1708984375, 1.376220703125, 1.58154296875, 1.786865234375, 1.9921875, 2.197509765625, 2.40283203125, 2.608154296875, 2.8134765625, 3.018798828125, 3.22412109375, 3.429443359375, 3.634765625, 3.840087890625, 4.04541015625, 4.250732421875, 4.4560546875, 4.661376953125, 4.86669921875, 5.072021484375, 5.27734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 3.0, 9.0, 15.0, 13.0, 36.0, 41.0, 56.0, 76.0, 93.0, 97.0, 110.0, 102.0, 98.0, 75.0, 56.0, 37.0, 22.0, 19.0, 19.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.62109375, -2.5492401123046875, -2.477386474609375, -2.4055328369140625, -2.33367919921875, -2.2618255615234375, -2.189971923828125, -2.1181182861328125, -2.0462646484375, -1.9744110107421875, -1.902557373046875, -1.8307037353515625, -1.75885009765625, -1.6869964599609375, -1.615142822265625, -1.5432891845703125, -1.471435546875, -1.3995819091796875, -1.327728271484375, -1.2558746337890625, -1.18402099609375, -1.1121673583984375, -1.040313720703125, -0.9684600830078125, -0.8966064453125, -0.8247528076171875, -0.752899169921875, -0.6810455322265625, -0.60919189453125, -0.5373382568359375, -0.465484619140625, -0.3936309814453125, -0.32177734375, -0.2499237060546875, -0.178070068359375, -0.1062164306640625, -0.03436279296875, 0.0374908447265625, 0.109344482421875, 0.1811981201171875, 0.2530517578125, 0.3249053955078125, 0.396759033203125, 0.4686126708984375, 0.54046630859375, 0.6123199462890625, 0.684173583984375, 0.7560272216796875, 0.827880859375, 0.8997344970703125, 0.971588134765625, 1.0434417724609375, 1.11529541015625, 1.1871490478515625, 1.259002685546875, 1.3308563232421875, 1.4027099609375, 1.4745635986328125, 1.546417236328125, 1.6182708740234375, 1.69012451171875, 1.7619781494140625, 1.833831787109375, 1.9056854248046875, 1.9775390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 8.0, 19.0, 23.0, 27.0, 48.0, 82.0, 118.0, 174.0, 335.0, 621.0, 1312.0, 3346.0, 10667.0, 49647.0, 328849.0, 538967.0, 89430.0, 16803.0, 4545.0, 1697.0, 762.0, 404.0, 240.0, 129.0, 89.0, 54.0, 48.0, 35.0, 19.0, 15.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.77056884765625, -4.6348876953125, -4.49920654296875, -4.363525390625, -4.22784423828125, -4.0921630859375, -3.95648193359375, -3.82080078125, -3.68511962890625, -3.5494384765625, -3.41375732421875, -3.278076171875, -3.14239501953125, -3.0067138671875, -2.87103271484375, -2.7353515625, -2.59967041015625, -2.4639892578125, -2.32830810546875, -2.192626953125, -2.05694580078125, -1.9212646484375, -1.78558349609375, -1.64990234375, -1.51422119140625, -1.3785400390625, -1.24285888671875, -1.107177734375, -0.97149658203125, -0.8358154296875, -0.70013427734375, -0.564453125, -0.42877197265625, -0.2930908203125, -0.15740966796875, -0.021728515625, 0.11395263671875, 0.2496337890625, 0.38531494140625, 0.52099609375, 0.65667724609375, 0.7923583984375, 0.92803955078125, 1.063720703125, 1.19940185546875, 1.3350830078125, 1.47076416015625, 1.6064453125, 1.74212646484375, 1.8778076171875, 2.01348876953125, 2.149169921875, 2.28485107421875, 2.4205322265625, 2.55621337890625, 2.69189453125, 2.82757568359375, 2.9632568359375, 3.09893798828125, 3.234619140625, 3.37030029296875, 3.5059814453125, 3.64166259765625, 3.77734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 6.0, 9.0, 11.0, 10.0, 17.0, 13.0, 27.0, 24.0, 34.0, 29.0, 39.0, 45.0, 54.0, 42.0, 56.0, 55.0, 48.0, 59.0, 46.0, 57.0, 42.0, 45.0, 34.0, 30.0, 24.0, 22.0, 16.0, 10.0, 17.0, 22.0, 11.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.4912109375, -5.326171875, -5.1611328125, -4.99609375, -4.8310546875, -4.666015625, -4.5009765625, -4.3359375, -4.1708984375, -4.005859375, -3.8408203125, -3.67578125, -3.5107421875, -3.345703125, -3.1806640625, -3.015625, -2.8505859375, -2.685546875, -2.5205078125, -2.35546875, -2.1904296875, -2.025390625, -1.8603515625, -1.6953125, -1.5302734375, -1.365234375, -1.2001953125, -1.03515625, -0.8701171875, -0.705078125, -0.5400390625, -0.375, -0.2099609375, -0.044921875, 0.1201171875, 0.28515625, 0.4501953125, 0.615234375, 0.7802734375, 0.9453125, 1.1103515625, 1.275390625, 1.4404296875, 1.60546875, 1.7705078125, 1.935546875, 2.1005859375, 2.265625, 2.4306640625, 2.595703125, 2.7607421875, 2.92578125, 3.0908203125, 3.255859375, 3.4208984375, 3.5859375, 3.7509765625, 3.916015625, 4.0810546875, 4.24609375, 4.4111328125, 4.576171875, 4.7412109375, 4.90625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 9.0, 9.0, 10.0, 22.0, 19.0, 28.0, 92.0, 175.0, 413.0, 989.0, 4112.0, 30756.0, 665431.0, 325858.0, 16437.0, 2750.0, 779.0, 325.0, 142.0, 60.0, 56.0, 28.0, 16.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.71484375, -2.6450042724609375, -2.575164794921875, -2.5053253173828125, -2.43548583984375, -2.3656463623046875, -2.295806884765625, -2.2259674072265625, -2.1561279296875, -2.0862884521484375, -2.016448974609375, -1.9466094970703125, -1.87677001953125, -1.8069305419921875, -1.737091064453125, -1.6672515869140625, -1.597412109375, -1.5275726318359375, -1.457733154296875, -1.3878936767578125, -1.31805419921875, -1.2482147216796875, -1.178375244140625, -1.1085357666015625, -1.0386962890625, -0.9688568115234375, -0.899017333984375, -0.8291778564453125, -0.75933837890625, -0.6894989013671875, -0.619659423828125, -0.5498199462890625, -0.47998046875, -0.4101409912109375, -0.340301513671875, -0.2704620361328125, -0.20062255859375, -0.1307830810546875, -0.060943603515625, 0.0088958740234375, 0.0787353515625, 0.1485748291015625, 0.218414306640625, 0.2882537841796875, 0.35809326171875, 0.4279327392578125, 0.497772216796875, 0.5676116943359375, 0.637451171875, 0.7072906494140625, 0.777130126953125, 0.8469696044921875, 0.91680908203125, 0.9866485595703125, 1.056488037109375, 1.1263275146484375, 1.1961669921875, 1.2660064697265625, 1.335845947265625, 1.4056854248046875, 1.47552490234375, 1.5453643798828125, 1.615203857421875, 1.6850433349609375, 1.7548828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 12.0, 8.0, 17.0, 24.0, 25.0, 30.0, 31.0, 37.0, 58.0, 72.0, 56.0, 74.0, 78.0, 96.0, 71.0, 77.0, 48.0, 37.0, 37.0, 24.0, 9.0, 8.0, 15.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002162456512451172, -0.00020909495651721954, -0.0002019442617893219, -0.00019479356706142426, -0.0001876428723335266, -0.00018049217760562897, -0.00017334148287773132, -0.00016619078814983368, -0.00015904009342193604, -0.0001518893986940384, -0.00014473870396614075, -0.0001375880092382431, -0.00013043731451034546, -0.00012328661978244781, -0.00011613592505455017, -0.00010898523032665253, -0.00010183453559875488, -9.468384087085724e-05, -8.75331461429596e-05, -8.038245141506195e-05, -7.32317566871643e-05, -6.608106195926666e-05, -5.893036723136902e-05, -5.1779672503471375e-05, -4.462897777557373e-05, -3.7478283047676086e-05, -3.0327588319778442e-05, -2.31768935918808e-05, -1.6026198863983154e-05, -8.87550413608551e-06, -1.7248094081878662e-06, 5.425885319709778e-06, 1.2576580047607422e-05, 1.9727274775505066e-05, 2.687796950340271e-05, 3.4028664231300354e-05, 4.1179358959198e-05, 4.833005368709564e-05, 5.5480748414993286e-05, 6.263144314289093e-05, 6.978213787078857e-05, 7.693283259868622e-05, 8.408352732658386e-05, 9.12342220544815e-05, 9.838491678237915e-05, 0.0001055356115102768, 0.00011268630623817444, 0.00011983700096607208, 0.00012698769569396973, 0.00013413839042186737, 0.00014128908514976501, 0.00014843977987766266, 0.0001555904746055603, 0.00016274116933345795, 0.0001698918640613556, 0.00017704255878925323, 0.00018419325351715088, 0.00019134394824504852, 0.00019849464297294617, 0.0002056453377008438, 0.00021279603242874146, 0.0002199467271566391, 0.00022709742188453674, 0.0002342481166124344, 0.00024139881134033203]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 12.0, 10.0, 22.0, 46.0, 55.0, 145.0, 282.0, 623.0, 1870.0, 9430.0, 177368.0, 811795.0, 40487.0, 4369.0, 1161.0, 422.0, 210.0, 95.0, 49.0, 33.0, 19.0, 24.0, 6.0, 0.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.245819091796875, -2.16351318359375, -2.081207275390625, -1.9989013671875, -1.916595458984375, -1.83428955078125, -1.751983642578125, -1.669677734375, -1.587371826171875, -1.50506591796875, -1.422760009765625, -1.3404541015625, -1.258148193359375, -1.17584228515625, -1.093536376953125, -1.01123046875, -0.928924560546875, -0.84661865234375, -0.764312744140625, -0.6820068359375, -0.599700927734375, -0.51739501953125, -0.435089111328125, -0.352783203125, -0.270477294921875, -0.18817138671875, -0.105865478515625, -0.0235595703125, 0.058746337890625, 0.14105224609375, 0.223358154296875, 0.3056640625, 0.387969970703125, 0.47027587890625, 0.552581787109375, 0.6348876953125, 0.717193603515625, 0.79949951171875, 0.881805419921875, 0.964111328125, 1.046417236328125, 1.12872314453125, 1.211029052734375, 1.2933349609375, 1.375640869140625, 1.45794677734375, 1.540252685546875, 1.62255859375, 1.704864501953125, 1.78717041015625, 1.869476318359375, 1.9517822265625, 2.034088134765625, 2.11639404296875, 2.198699951171875, 2.281005859375, 2.363311767578125, 2.44561767578125, 2.527923583984375, 2.6102294921875, 2.692535400390625, 2.77484130859375, 2.857147216796875, 2.939453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 11.0, 15.0, 19.0, 34.0, 36.0, 51.0, 67.0, 71.0, 90.0, 88.0, 101.0, 85.0, 71.0, 68.0, 49.0, 44.0, 25.0, 21.0, 16.0, 9.0, 13.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -0.9887847900390625, -0.939483642578125, -0.8901824951171875, -0.84088134765625, -0.7915802001953125, -0.742279052734375, -0.6929779052734375, -0.6436767578125, -0.5943756103515625, -0.545074462890625, -0.4957733154296875, -0.44647216796875, -0.3971710205078125, -0.347869873046875, -0.2985687255859375, -0.249267578125, -0.1999664306640625, -0.150665283203125, -0.1013641357421875, -0.05206298828125, -0.0027618408203125, 0.046539306640625, 0.0958404541015625, 0.1451416015625, 0.1944427490234375, 0.243743896484375, 0.2930450439453125, 0.34234619140625, 0.3916473388671875, 0.440948486328125, 0.4902496337890625, 0.53955078125, 0.5888519287109375, 0.638153076171875, 0.6874542236328125, 0.73675537109375, 0.7860565185546875, 0.835357666015625, 0.8846588134765625, 0.9339599609375, 0.9832611083984375, 1.032562255859375, 1.0818634033203125, 1.13116455078125, 1.1804656982421875, 1.229766845703125, 1.2790679931640625, 1.328369140625, 1.3776702880859375, 1.426971435546875, 1.4762725830078125, 1.52557373046875, 1.5748748779296875, 1.624176025390625, 1.6734771728515625, 1.7227783203125, 1.7720794677734375, 1.821380615234375, 1.8706817626953125, 1.91998291015625, 1.9692840576171875, 2.018585205078125, 2.0678863525390625, 2.1171875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 13.0, 27.0, 71.0, 132.0, 197.0, 243.0, 166.0, 77.0, 45.0, 16.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.57719802856445, -38.83559799194336, -37.09400177001953, -35.35240173339844, -33.610801696777344, -31.869205474853516, -30.127605438232422, -28.38600730895996, -26.6444091796875, -24.90281105041504, -23.161212921142578, -21.419612884521484, -19.678014755249023, -17.936416625976562, -16.19481658935547, -14.453218460083008, -12.711620330810547, -10.970022201538086, -9.228423118591309, -7.4868245124816895, -5.74522590637207, -4.003627777099609, -2.262028694152832, -0.5204296112060547, 1.2211685180664062, 2.9627671241760254, 4.7043657302856445, 6.445964336395264, 8.187562942504883, 9.929161071777344, 11.670760154724121, 13.412359237670898, 15.153953552246094, 16.895551681518555, 18.637149810791016, 20.37874984741211, 22.12034797668457, 23.86194610595703, 25.603546142578125, 27.345144271850586, 29.086742401123047, 30.828340530395508, 32.56993865966797, 34.31153869628906, 36.053138732910156, 37.794734954833984, 39.53633499145508, 41.277931213378906, 43.01953125, 44.761131286621094, 46.50272750854492, 48.244327545166016, 49.985923767089844, 51.72752380371094, 53.46912384033203, 55.210723876953125, 56.95232009887695, 58.69392013549805, 60.435516357421875, 62.17711639404297, 63.91871643066406, 65.66030883789062, 67.40190887451172, 69.14350891113281, 70.8851089477539]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 7.0, 17.0, 16.0, 20.0, 29.0, 31.0, 44.0, 41.0, 50.0, 59.0, 79.0, 69.0, 74.0, 62.0, 86.0, 46.0, 49.0, 36.0, 36.0, 27.0, 21.0, 17.0, 22.0, 13.0, 13.0, 7.0, 6.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.024574279785156, -30.084320068359375, -29.144065856933594, -28.203811645507812, -27.26355743408203, -26.32330322265625, -25.3830509185791, -24.44279670715332, -23.50254249572754, -22.562288284301758, -21.622034072875977, -20.681779861450195, -19.741527557373047, -18.801273345947266, -17.861019134521484, -16.920764923095703, -15.980510711669922, -15.04025650024414, -14.10000228881836, -13.159749031066895, -12.219494819641113, -11.279240608215332, -10.338987350463867, -9.398733139038086, -8.458478927612305, -7.518224716186523, -6.5779709815979, -5.637717247009277, -4.697463035583496, -3.757208824157715, -2.816955089569092, -1.8767013549804688, -0.9364471435546875, 0.0038068294525146484, 0.9440608024597168, 1.884314775466919, 2.824568748474121, 3.7648229598999023, 4.705076694488525, 5.645330429077148, 6.58558464050293, 7.525838851928711, 8.466093063354492, 9.406346321105957, 10.346600532531738, 11.28685474395752, 12.227108001708984, 13.167362213134766, 14.107616424560547, 15.047870635986328, 15.98812484741211, 16.92837905883789, 17.868633270263672, 18.808887481689453, 19.7491397857666, 20.689393997192383, 21.629648208618164, 22.569902420043945, 23.510156631469727, 24.450410842895508, 25.390663146972656, 26.330917358398438, 27.27117156982422, 28.21142578125, 29.15167999267578]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 13.0, 29.0, 58.0, 136.0, 223.0, 470.0, 1214.0, 3637.0, 16445.0, 136630.0, 3826631.0, 183923.0, 18504.0, 4048.0, 1276.0, 530.0, 214.0, 115.0, 62.0, 43.0, 17.0, 16.0, 14.0, 7.0, 8.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.75390625, -5.61199951171875, -5.4700927734375, -5.32818603515625, -5.186279296875, -5.04437255859375, -4.9024658203125, -4.76055908203125, -4.61865234375, -4.47674560546875, -4.3348388671875, -4.19293212890625, -4.051025390625, -3.90911865234375, -3.7672119140625, -3.62530517578125, -3.4833984375, -3.34149169921875, -3.1995849609375, -3.05767822265625, -2.915771484375, -2.77386474609375, -2.6319580078125, -2.49005126953125, -2.34814453125, -2.20623779296875, -2.0643310546875, -1.92242431640625, -1.780517578125, -1.63861083984375, -1.4967041015625, -1.35479736328125, -1.212890625, -1.07098388671875, -0.9290771484375, -0.78717041015625, -0.645263671875, -0.50335693359375, -0.3614501953125, -0.21954345703125, -0.07763671875, 0.06427001953125, 0.2061767578125, 0.34808349609375, 0.489990234375, 0.63189697265625, 0.7738037109375, 0.91571044921875, 1.0576171875, 1.19952392578125, 1.3414306640625, 1.48333740234375, 1.625244140625, 1.76715087890625, 1.9090576171875, 2.05096435546875, 2.19287109375, 2.33477783203125, 2.4766845703125, 2.61859130859375, 2.760498046875, 2.90240478515625, 3.0443115234375, 3.18621826171875, 3.328125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 12.0, 10.0, 12.0, 15.0, 18.0, 24.0, 26.0, 32.0, 29.0, 36.0, 36.0, 41.0, 58.0, 52.0, 49.0, 64.0, 58.0, 51.0, 51.0, 55.0, 53.0, 43.0, 33.0, 24.0, 23.0, 17.0, 11.0, 14.0, 18.0, 9.0, 7.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7853927612304688, -0.7519378662109375, -0.7184829711914062, -0.685028076171875, -0.6515731811523438, -0.6181182861328125, -0.5846633911132812, -0.55120849609375, -0.5177536010742188, -0.4842987060546875, -0.45084381103515625, -0.417388916015625, -0.38393402099609375, -0.3504791259765625, -0.31702423095703125, -0.2835693359375, -0.25011444091796875, -0.2166595458984375, -0.18320465087890625, -0.149749755859375, -0.11629486083984375, -0.0828399658203125, -0.04938507080078125, -0.01593017578125, 0.01752471923828125, 0.0509796142578125, 0.08443450927734375, 0.117889404296875, 0.15134429931640625, 0.1847991943359375, 0.21825408935546875, 0.251708984375, 0.28516387939453125, 0.3186187744140625, 0.35207366943359375, 0.385528564453125, 0.41898345947265625, 0.4524383544921875, 0.48589324951171875, 0.51934814453125, 0.5528030395507812, 0.5862579345703125, 0.6197128295898438, 0.653167724609375, 0.6866226196289062, 0.7200775146484375, 0.7535324096679688, 0.7869873046875, 0.8204421997070312, 0.8538970947265625, 0.8873519897460938, 0.920806884765625, 0.9542617797851562, 0.9877166748046875, 1.0211715698242188, 1.05462646484375, 1.0880813598632812, 1.1215362548828125, 1.1549911499023438, 1.188446044921875, 1.2219009399414062, 1.2553558349609375, 1.2888107299804688, 1.322265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 4.0, 4.0, 11.0, 13.0, 32.0, 53.0, 85.0, 213.0, 603.0, 1720.0, 6592.0, 37055.0, 1020777.0, 3061310.0, 53612.0, 8680.0, 2248.0, 687.0, 288.0, 142.0, 57.0, 31.0, 15.0, 17.0, 9.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.94464111328125, -5.7799072265625, -5.61517333984375, -5.450439453125, -5.28570556640625, -5.1209716796875, -4.95623779296875, -4.79150390625, -4.62677001953125, -4.4620361328125, -4.29730224609375, -4.132568359375, -3.96783447265625, -3.8031005859375, -3.63836669921875, -3.4736328125, -3.30889892578125, -3.1441650390625, -2.97943115234375, -2.814697265625, -2.64996337890625, -2.4852294921875, -2.32049560546875, -2.15576171875, -1.99102783203125, -1.8262939453125, -1.66156005859375, -1.496826171875, -1.33209228515625, -1.1673583984375, -1.00262451171875, -0.837890625, -0.67315673828125, -0.5084228515625, -0.34368896484375, -0.178955078125, -0.01422119140625, 0.1505126953125, 0.31524658203125, 0.47998046875, 0.64471435546875, 0.8094482421875, 0.97418212890625, 1.138916015625, 1.30364990234375, 1.4683837890625, 1.63311767578125, 1.7978515625, 1.96258544921875, 2.1273193359375, 2.29205322265625, 2.456787109375, 2.62152099609375, 2.7862548828125, 2.95098876953125, 3.11572265625, 3.28045654296875, 3.4451904296875, 3.60992431640625, 3.774658203125, 3.93939208984375, 4.1041259765625, 4.26885986328125, 4.43359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 13.0, 7.0, 6.0, 11.0, 16.0, 28.0, 32.0, 41.0, 79.0, 124.0, 225.0, 416.0, 861.0, 1002.0, 494.0, 256.0, 119.0, 103.0, 54.0, 47.0, 30.0, 17.0, 12.0, 15.0, 12.0, 9.0, 11.0, 8.0, 3.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-3.62890625, -3.528472900390625, -3.42803955078125, -3.327606201171875, -3.2271728515625, -3.126739501953125, -3.02630615234375, -2.925872802734375, -2.825439453125, -2.725006103515625, -2.62457275390625, -2.524139404296875, -2.4237060546875, -2.323272705078125, -2.22283935546875, -2.122406005859375, -2.02197265625, -1.921539306640625, -1.82110595703125, -1.720672607421875, -1.6202392578125, -1.519805908203125, -1.41937255859375, -1.318939208984375, -1.218505859375, -1.118072509765625, -1.01763916015625, -0.917205810546875, -0.8167724609375, -0.716339111328125, -0.61590576171875, -0.515472412109375, -0.4150390625, -0.314605712890625, -0.21417236328125, -0.113739013671875, -0.0133056640625, 0.087127685546875, 0.18756103515625, 0.287994384765625, 0.388427734375, 0.488861083984375, 0.58929443359375, 0.689727783203125, 0.7901611328125, 0.890594482421875, 0.99102783203125, 1.091461181640625, 1.19189453125, 1.292327880859375, 1.39276123046875, 1.493194580078125, 1.5936279296875, 1.694061279296875, 1.79449462890625, 1.894927978515625, 1.995361328125, 2.095794677734375, 2.19622802734375, 2.296661376953125, 2.3970947265625, 2.497528076171875, 2.59796142578125, 2.698394775390625, 2.798828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 9.0, 12.0, 23.0, 42.0, 87.0, 137.0, 183.0, 166.0, 120.0, 76.0, 44.0, 29.0, 22.0, 11.0, 4.0, 6.0, 2.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.98832893371582, -21.048076629638672, -20.107824325561523, -19.167572021484375, -18.227319717407227, -17.287067413330078, -16.346813201904297, -15.406561851501465, -14.466309547424316, -13.526057243347168, -12.58580493927002, -11.645551681518555, -10.705299377441406, -9.765047073364258, -8.82479476928711, -7.884542465209961, -6.9442901611328125, -6.004037857055664, -5.063785552978516, -4.123532772064209, -3.1832804679870605, -2.243028163909912, -1.3027753829956055, -0.36252307891845703, 0.5777292251586914, 1.5179816484451294, 2.4582340717315674, 3.398486614227295, 4.338738918304443, 5.278991222381592, 6.219244003295898, 7.159496307373047, 8.099750518798828, 9.040002822875977, 9.980255126953125, 10.920507431030273, 11.860759735107422, 12.80101203918457, 13.741265296936035, 14.681517601013184, 15.621769905090332, 16.562023162841797, 17.502275466918945, 18.442527770996094, 19.382780075073242, 20.32303237915039, 21.26328468322754, 22.203536987304688, 23.143789291381836, 24.084041595458984, 25.024293899536133, 25.96454620361328, 26.90479850769043, 27.845050811767578, 28.78530502319336, 29.725555419921875, 30.665809631347656, 31.606061935424805, 32.54631423950195, 33.486568450927734, 34.42681884765625, 35.36707305908203, 36.30732345581055, 37.24757766723633, 38.187828063964844]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 13.0, 8.0, 14.0, 19.0, 20.0, 24.0, 19.0, 41.0, 32.0, 46.0, 39.0, 47.0, 48.0, 41.0, 49.0, 51.0, 43.0, 50.0, 49.0, 40.0, 44.0, 45.0, 34.0, 28.0, 31.0, 21.0, 24.0, 19.0, 17.0, 12.0, 8.0, 6.0, 8.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75447654724121, -17.229167938232422, -16.703859329223633, -16.178550720214844, -15.653243064880371, -15.127934455871582, -14.60262680053711, -14.07731819152832, -13.552009582519531, -13.026700973510742, -12.501392364501953, -11.97608470916748, -11.450776100158691, -10.925467491149902, -10.40015983581543, -9.87485122680664, -9.349542617797852, -8.824234008789062, -8.298925399780273, -7.773617744445801, -7.248309135437012, -6.723000526428223, -6.197692394256592, -5.672384262084961, -5.147075653076172, -4.621767044067383, -4.096458911895752, -3.571150541305542, -3.045842170715332, -2.520533800125122, -1.995225429534912, -1.4699170589447021, -0.9446067810058594, -0.4192984104156494, 0.10600996017456055, 0.6313183307647705, 1.1566267013549805, 1.6819350719451904, 2.2072434425354004, 2.7325518131256104, 3.2578601837158203, 3.7831685543060303, 4.30847692489624, 4.833785057067871, 5.35909366607666, 5.884402275085449, 6.40971040725708, 6.935018539428711, 7.4603271484375, 7.985635757446289, 8.510944366455078, 9.03625202178955, 9.56156063079834, 10.086869239807129, 10.612176895141602, 11.13748550415039, 11.66279411315918, 12.188102722167969, 12.713411331176758, 13.23871898651123, 13.76402759552002, 14.289336204528809, 14.814643859863281, 15.33995246887207, 15.86526107788086]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 12.0, 11.0, 17.0, 27.0, 43.0, 63.0, 95.0, 182.0, 277.0, 488.0, 924.0, 1767.0, 3445.0, 7497.0, 17993.0, 46448.0, 131397.0, 332543.0, 312439.0, 119821.0, 42857.0, 16419.0, 6857.0, 3243.0, 1642.0, 891.0, 470.0, 263.0, 169.0, 91.0, 65.0, 40.0, 16.0, 24.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265625, -2.1873779296875, -2.109130859375, -2.0308837890625, -1.95263671875, -1.8743896484375, -1.796142578125, -1.7178955078125, -1.6396484375, -1.5614013671875, -1.483154296875, -1.4049072265625, -1.32666015625, -1.2484130859375, -1.170166015625, -1.0919189453125, -1.013671875, -0.9354248046875, -0.857177734375, -0.7789306640625, -0.70068359375, -0.6224365234375, -0.544189453125, -0.4659423828125, -0.3876953125, -0.3094482421875, -0.231201171875, -0.1529541015625, -0.07470703125, 0.0035400390625, 0.081787109375, 0.1600341796875, 0.23828125, 0.3165283203125, 0.394775390625, 0.4730224609375, 0.55126953125, 0.6295166015625, 0.707763671875, 0.7860107421875, 0.8642578125, 0.9425048828125, 1.020751953125, 1.0989990234375, 1.17724609375, 1.2554931640625, 1.333740234375, 1.4119873046875, 1.490234375, 1.5684814453125, 1.646728515625, 1.7249755859375, 1.80322265625, 1.8814697265625, 1.959716796875, 2.0379638671875, 2.1162109375, 2.1944580078125, 2.272705078125, 2.3509521484375, 2.42919921875, 2.5074462890625, 2.585693359375, 2.6639404296875, 2.7421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 7.0, 11.0, 10.0, 13.0, 21.0, 22.0, 22.0, 15.0, 39.0, 35.0, 29.0, 32.0, 44.0, 46.0, 53.0, 46.0, 56.0, 60.0, 47.0, 45.0, 43.0, 41.0, 30.0, 31.0, 27.0, 21.0, 23.0, 24.0, 18.0, 15.0, 16.0, 8.0, 9.0, 2.0, 0.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.75054931640625, -0.7198486328125, -0.68914794921875, -0.658447265625, -0.62774658203125, -0.5970458984375, -0.56634521484375, -0.53564453125, -0.50494384765625, -0.4742431640625, -0.44354248046875, -0.412841796875, -0.38214111328125, -0.3514404296875, -0.32073974609375, -0.2900390625, -0.25933837890625, -0.2286376953125, -0.19793701171875, -0.167236328125, -0.13653564453125, -0.1058349609375, -0.07513427734375, -0.04443359375, -0.01373291015625, 0.0169677734375, 0.04766845703125, 0.078369140625, 0.10906982421875, 0.1397705078125, 0.17047119140625, 0.201171875, 0.23187255859375, 0.2625732421875, 0.29327392578125, 0.323974609375, 0.35467529296875, 0.3853759765625, 0.41607666015625, 0.44677734375, 0.47747802734375, 0.5081787109375, 0.53887939453125, 0.569580078125, 0.60028076171875, 0.6309814453125, 0.66168212890625, 0.6923828125, 0.72308349609375, 0.7537841796875, 0.78448486328125, 0.815185546875, 0.84588623046875, 0.8765869140625, 0.90728759765625, 0.93798828125, 0.96868896484375, 0.9993896484375, 1.03009033203125, 1.060791015625, 1.09149169921875, 1.1221923828125, 1.15289306640625, 1.18359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 5.0, 9.0, 16.0, 13.0, 21.0, 29.0, 36.0, 52.0, 67.0, 102.0, 159.0, 245.0, 429.0, 639.0, 1159.0, 2183.0, 4659.0, 13489.0, 54155.0, 292327.0, 542365.0, 100901.0, 22124.0, 6851.0, 2867.0, 1453.0, 830.0, 487.0, 284.0, 193.0, 120.0, 77.0, 60.0, 37.0, 34.0, 15.0, 14.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.13446044921875, -3.0306396484375, -2.92681884765625, -2.822998046875, -2.71917724609375, -2.6153564453125, -2.51153564453125, -2.40771484375, -2.30389404296875, -2.2000732421875, -2.09625244140625, -1.992431640625, -1.88861083984375, -1.7847900390625, -1.68096923828125, -1.5771484375, -1.47332763671875, -1.3695068359375, -1.26568603515625, -1.161865234375, -1.05804443359375, -0.9542236328125, -0.85040283203125, -0.74658203125, -0.64276123046875, -0.5389404296875, -0.43511962890625, -0.331298828125, -0.22747802734375, -0.1236572265625, -0.01983642578125, 0.083984375, 0.18780517578125, 0.2916259765625, 0.39544677734375, 0.499267578125, 0.60308837890625, 0.7069091796875, 0.81072998046875, 0.91455078125, 1.01837158203125, 1.1221923828125, 1.22601318359375, 1.329833984375, 1.43365478515625, 1.5374755859375, 1.64129638671875, 1.7451171875, 1.84893798828125, 1.9527587890625, 2.05657958984375, 2.160400390625, 2.26422119140625, 2.3680419921875, 2.47186279296875, 2.57568359375, 2.67950439453125, 2.7833251953125, 2.88714599609375, 2.990966796875, 3.09478759765625, 3.1986083984375, 3.30242919921875, 3.40625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 7.0, 9.0, 9.0, 14.0, 19.0, 17.0, 30.0, 29.0, 29.0, 44.0, 44.0, 40.0, 49.0, 54.0, 41.0, 50.0, 49.0, 51.0, 62.0, 63.0, 54.0, 44.0, 33.0, 32.0, 21.0, 29.0, 13.0, 13.0, 12.0, 4.0, 12.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.63079833984375, -5.4725341796875, -5.31427001953125, -5.156005859375, -4.99774169921875, -4.8394775390625, -4.68121337890625, -4.52294921875, -4.36468505859375, -4.2064208984375, -4.04815673828125, -3.889892578125, -3.73162841796875, -3.5733642578125, -3.41510009765625, -3.2568359375, -3.09857177734375, -2.9403076171875, -2.78204345703125, -2.623779296875, -2.46551513671875, -2.3072509765625, -2.14898681640625, -1.99072265625, -1.83245849609375, -1.6741943359375, -1.51593017578125, -1.357666015625, -1.19940185546875, -1.0411376953125, -0.88287353515625, -0.724609375, -0.56634521484375, -0.4080810546875, -0.24981689453125, -0.091552734375, 0.06671142578125, 0.2249755859375, 0.38323974609375, 0.54150390625, 0.69976806640625, 0.8580322265625, 1.01629638671875, 1.174560546875, 1.33282470703125, 1.4910888671875, 1.64935302734375, 1.8076171875, 1.96588134765625, 2.1241455078125, 2.28240966796875, 2.440673828125, 2.59893798828125, 2.7572021484375, 2.91546630859375, 3.07373046875, 3.23199462890625, 3.3902587890625, 3.54852294921875, 3.706787109375, 3.86505126953125, 4.0233154296875, 4.18157958984375, 4.33984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 10.0, 12.0, 11.0, 21.0, 26.0, 38.0, 77.0, 110.0, 185.0, 386.0, 854.0, 2508.0, 11663.0, 136747.0, 823484.0, 61907.0, 7191.0, 1853.0, 683.0, 305.0, 159.0, 96.0, 75.0, 41.0, 26.0, 24.0, 14.0, 15.0, 4.0, 3.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.59283447265625, -1.5274658203125, -1.46209716796875, -1.396728515625, -1.33135986328125, -1.2659912109375, -1.20062255859375, -1.13525390625, -1.06988525390625, -1.0045166015625, -0.93914794921875, -0.873779296875, -0.80841064453125, -0.7430419921875, -0.67767333984375, -0.6123046875, -0.54693603515625, -0.4815673828125, -0.41619873046875, -0.350830078125, -0.28546142578125, -0.2200927734375, -0.15472412109375, -0.08935546875, -0.02398681640625, 0.0413818359375, 0.10675048828125, 0.172119140625, 0.23748779296875, 0.3028564453125, 0.36822509765625, 0.43359375, 0.49896240234375, 0.5643310546875, 0.62969970703125, 0.695068359375, 0.76043701171875, 0.8258056640625, 0.89117431640625, 0.95654296875, 1.02191162109375, 1.0872802734375, 1.15264892578125, 1.218017578125, 1.28338623046875, 1.3487548828125, 1.41412353515625, 1.4794921875, 1.54486083984375, 1.6102294921875, 1.67559814453125, 1.740966796875, 1.80633544921875, 1.8717041015625, 1.93707275390625, 2.00244140625, 2.06781005859375, 2.1331787109375, 2.19854736328125, 2.263916015625, 2.32928466796875, 2.3946533203125, 2.46002197265625, 2.525390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 15.0, 14.0, 27.0, 22.0, 40.0, 39.0, 58.0, 78.0, 72.0, 118.0, 109.0, 91.0, 57.0, 55.0, 41.0, 39.0, 25.0, 19.0, 22.0, 9.0, 11.0, 5.0, 3.0, 2.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00032973289489746094, -0.00032123737037181854, -0.00031274184584617615, -0.00030424632132053375, -0.00029575079679489136, -0.00028725527226924896, -0.00027875974774360657, -0.00027026422321796417, -0.0002617686986923218, -0.0002532731741666794, -0.000244777649641037, -0.0002362821251153946, -0.0002277866005897522, -0.0002192910760641098, -0.0002107955515384674, -0.000202300027012825, -0.00019380450248718262, -0.00018530897796154022, -0.00017681345343589783, -0.00016831792891025543, -0.00015982240438461304, -0.00015132687985897064, -0.00014283135533332825, -0.00013433583080768585, -0.00012584030628204346, -0.00011734478175640106, -0.00010884925723075867, -0.00010035373270511627, -9.185820817947388e-05, -8.336268365383148e-05, -7.486715912818909e-05, -6.637163460254669e-05, -5.78761100769043e-05, -4.93805855512619e-05, -4.088506102561951e-05, -3.238953649997711e-05, -2.3894011974334717e-05, -1.5398487448692322e-05, -6.902962923049927e-06, 1.5925616025924683e-06, 1.0088086128234863e-05, 1.8583610653877258e-05, 2.7079135179519653e-05, 3.557465970516205e-05, 4.407018423080444e-05, 5.256570875644684e-05, 6.106123328208923e-05, 6.955675780773163e-05, 7.805228233337402e-05, 8.654780685901642e-05, 9.504333138465881e-05, 0.00010353885591030121, 0.0001120343804359436, 0.000120529904961586, 0.0001290254294872284, 0.0001375209540128708, 0.00014601647853851318, 0.00015451200306415558, 0.00016300752758979797, 0.00017150305211544037, 0.00017999857664108276, 0.00018849410116672516, 0.00019698962569236755, 0.00020548515021800995, 0.00021398067474365234]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 11.0, 4.0, 9.0, 9.0, 16.0, 26.0, 29.0, 42.0, 49.0, 72.0, 115.0, 219.0, 346.0, 693.0, 1547.0, 4079.0, 15089.0, 104815.0, 733908.0, 159110.0, 19838.0, 4876.0, 1885.0, 718.0, 389.0, 221.0, 149.0, 81.0, 56.0, 44.0, 25.0, 24.0, 22.0, 12.0, 6.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7620086669921875, -1.712493896484375, -1.6629791259765625, -1.61346435546875, -1.5639495849609375, -1.514434814453125, -1.4649200439453125, -1.4154052734375, -1.3658905029296875, -1.316375732421875, -1.2668609619140625, -1.21734619140625, -1.1678314208984375, -1.118316650390625, -1.0688018798828125, -1.019287109375, -0.9697723388671875, -0.920257568359375, -0.8707427978515625, -0.82122802734375, -0.7717132568359375, -0.722198486328125, -0.6726837158203125, -0.6231689453125, -0.5736541748046875, -0.524139404296875, -0.4746246337890625, -0.42510986328125, -0.3755950927734375, -0.326080322265625, -0.2765655517578125, -0.22705078125, -0.1775360107421875, -0.128021240234375, -0.0785064697265625, -0.02899169921875, 0.0205230712890625, 0.070037841796875, 0.1195526123046875, 0.1690673828125, 0.2185821533203125, 0.268096923828125, 0.3176116943359375, 0.36712646484375, 0.4166412353515625, 0.466156005859375, 0.5156707763671875, 0.565185546875, 0.6147003173828125, 0.664215087890625, 0.7137298583984375, 0.76324462890625, 0.8127593994140625, 0.862274169921875, 0.9117889404296875, 0.9613037109375, 1.0108184814453125, 1.060333251953125, 1.1098480224609375, 1.15936279296875, 1.2088775634765625, 1.258392333984375, 1.3079071044921875, 1.357421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 12.0, 24.0, 23.0, 21.0, 34.0, 39.0, 56.0, 63.0, 81.0, 84.0, 83.0, 76.0, 75.0, 70.0, 59.0, 41.0, 33.0, 32.0, 21.0, 13.0, 7.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5927734375, -1.545074462890625, -1.49737548828125, -1.449676513671875, -1.4019775390625, -1.354278564453125, -1.30657958984375, -1.258880615234375, -1.211181640625, -1.163482666015625, -1.11578369140625, -1.068084716796875, -1.0203857421875, -0.972686767578125, -0.92498779296875, -0.877288818359375, -0.82958984375, -0.781890869140625, -0.73419189453125, -0.686492919921875, -0.6387939453125, -0.591094970703125, -0.54339599609375, -0.495697021484375, -0.447998046875, -0.400299072265625, -0.35260009765625, -0.304901123046875, -0.2572021484375, -0.209503173828125, -0.16180419921875, -0.114105224609375, -0.06640625, -0.018707275390625, 0.02899169921875, 0.076690673828125, 0.1243896484375, 0.172088623046875, 0.21978759765625, 0.267486572265625, 0.315185546875, 0.362884521484375, 0.41058349609375, 0.458282470703125, 0.5059814453125, 0.553680419921875, 0.60137939453125, 0.649078369140625, 0.69677734375, 0.744476318359375, 0.79217529296875, 0.839874267578125, 0.8875732421875, 0.935272216796875, 0.98297119140625, 1.030670166015625, 1.078369140625, 1.126068115234375, 1.17376708984375, 1.221466064453125, 1.2691650390625, 1.316864013671875, 1.36456298828125, 1.412261962890625, 1.4599609375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 6.0, 16.0, 29.0, 56.0, 87.0, 139.0, 177.0, 198.0, 119.0, 70.0, 36.0, 20.0, 18.0, 12.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.88990020751953, -36.91172790527344, -35.93355941772461, -34.955387115478516, -33.97721481323242, -32.999046325683594, -32.0208740234375, -31.04270362854004, -30.064533233642578, -29.086362838745117, -28.108190536499023, -27.130020141601562, -26.1518497467041, -25.17367935180664, -24.195507049560547, -23.217336654663086, -22.239164352416992, -21.26099395751953, -20.282821655273438, -19.304651260375977, -18.326480865478516, -17.348308563232422, -16.37013816833496, -15.3919677734375, -14.413796424865723, -13.435625076293945, -12.457454681396484, -11.479283332824707, -10.50111198425293, -9.522941589355469, -8.544770240783691, -7.566599369049072, -6.588428497314453, -5.610257625579834, -4.632086753845215, -3.6539154052734375, -2.6757445335388184, -1.6975736618041992, -0.7194023132324219, 0.25876855850219727, 1.2369394302368164, 2.2151103019714355, 3.193281412124634, 4.171452522277832, 5.149623394012451, 6.12779426574707, 7.105965614318848, 8.084136962890625, 9.062307357788086, 10.040478706359863, 11.018649101257324, 11.996820449829102, 12.974990844726562, 13.95316219329834, 14.931333541870117, 15.909503936767578, 16.887676239013672, 17.865846633911133, 18.844018936157227, 19.822189331054688, 20.80035972595215, 21.77853012084961, 22.756702423095703, 23.734872817993164, 24.713043212890625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 9.0, 4.0, 7.0, 11.0, 13.0, 13.0, 17.0, 16.0, 21.0, 24.0, 35.0, 29.0, 27.0, 30.0, 35.0, 42.0, 43.0, 58.0, 45.0, 55.0, 44.0, 54.0, 39.0, 42.0, 31.0, 26.0, 27.0, 34.0, 18.0, 23.0, 18.0, 17.0, 17.0, 14.0, 9.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-17.36117935180664, -16.849042892456055, -16.33690643310547, -15.824769973754883, -15.312633514404297, -14.800497055053711, -14.288360595703125, -13.776224136352539, -13.264087677001953, -12.751951217651367, -12.239814758300781, -11.727678298950195, -11.21554183959961, -10.703405380249023, -10.191268920898438, -9.679132461547852, -9.166996002197266, -8.65485954284668, -8.142723083496094, -7.630586624145508, -7.118450164794922, -6.606313705444336, -6.09417724609375, -5.582040786743164, -5.069904327392578, -4.557767868041992, -4.045631408691406, -3.5334949493408203, -3.0213584899902344, -2.5092220306396484, -1.9970855712890625, -1.4849491119384766, -0.9728145599365234, -0.4606781005859375, 0.05145835876464844, 0.5635948181152344, 1.0757312774658203, 1.5878677368164062, 2.100004196166992, 2.612140655517578, 3.124277114868164, 3.63641357421875, 4.148550033569336, 4.660686492919922, 5.172822952270508, 5.684959411621094, 6.19709587097168, 6.709232330322266, 7.221368789672852, 7.7335052490234375, 8.245641708374023, 8.75777816772461, 9.269914627075195, 9.782051086425781, 10.294187545776367, 10.806324005126953, 11.318460464477539, 11.830596923828125, 12.342733383178711, 12.854869842529297, 13.367006301879883, 13.879142761230469, 14.391279220581055, 14.90341567993164, 15.415552139282227]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 24.0, 31.0, 35.0, 96.0, 182.0, 444.0, 1672.0, 13722.0, 3916003.0, 254689.0, 5755.0, 1017.0, 284.0, 135.0, 68.0, 35.0, 20.0, 15.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.70367431640625, -8.4464111328125, -8.18914794921875, -7.931884765625, -7.67462158203125, -7.4173583984375, -7.16009521484375, -6.90283203125, -6.64556884765625, -6.3883056640625, -6.13104248046875, -5.873779296875, -5.61651611328125, -5.3592529296875, -5.10198974609375, -4.8447265625, -4.58746337890625, -4.3302001953125, -4.07293701171875, -3.815673828125, -3.55841064453125, -3.3011474609375, -3.04388427734375, -2.78662109375, -2.52935791015625, -2.2720947265625, -2.01483154296875, -1.757568359375, -1.50030517578125, -1.2430419921875, -0.98577880859375, -0.728515625, -0.47125244140625, -0.2139892578125, 0.04327392578125, 0.300537109375, 0.55780029296875, 0.8150634765625, 1.07232666015625, 1.32958984375, 1.58685302734375, 1.8441162109375, 2.10137939453125, 2.358642578125, 2.61590576171875, 2.8731689453125, 3.13043212890625, 3.3876953125, 3.64495849609375, 3.9022216796875, 4.15948486328125, 4.416748046875, 4.67401123046875, 4.9312744140625, 5.18853759765625, 5.44580078125, 5.70306396484375, 5.9603271484375, 6.21759033203125, 6.474853515625, 6.73211669921875, 6.9893798828125, 7.24664306640625, 7.50390625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 15.0, 20.0, 21.0, 31.0, 35.0, 45.0, 59.0, 64.0, 76.0, 68.0, 88.0, 75.0, 82.0, 68.0, 50.0, 44.0, 36.0, 28.0, 35.0, 14.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.5057525634765625, -1.457794189453125, -1.4098358154296875, -1.36187744140625, -1.3139190673828125, -1.265960693359375, -1.2180023193359375, -1.1700439453125, -1.1220855712890625, -1.074127197265625, -1.0261688232421875, -0.97821044921875, -0.9302520751953125, -0.882293701171875, -0.8343353271484375, -0.786376953125, -0.7384185791015625, -0.690460205078125, -0.6425018310546875, -0.59454345703125, -0.5465850830078125, -0.498626708984375, -0.4506683349609375, -0.4027099609375, -0.3547515869140625, -0.306793212890625, -0.2588348388671875, -0.21087646484375, -0.1629180908203125, -0.114959716796875, -0.0670013427734375, -0.01904296875, 0.0289154052734375, 0.076873779296875, 0.1248321533203125, 0.17279052734375, 0.2207489013671875, 0.268707275390625, 0.3166656494140625, 0.3646240234375, 0.4125823974609375, 0.460540771484375, 0.5084991455078125, 0.55645751953125, 0.6044158935546875, 0.652374267578125, 0.7003326416015625, 0.748291015625, 0.7962493896484375, 0.844207763671875, 0.8921661376953125, 0.94012451171875, 0.9880828857421875, 1.036041259765625, 1.0839996337890625, 1.1319580078125, 1.1799163818359375, 1.227874755859375, 1.2758331298828125, 1.32379150390625, 1.3717498779296875, 1.419708251953125, 1.4676666259765625, 1.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 22.0, 42.0, 48.0, 77.0, 116.0, 191.0, 320.0, 510.0, 869.0, 1517.0, 2981.0, 6069.0, 15004.0, 47028.0, 309536.0, 3457861.0, 280138.0, 44739.0, 14621.0, 6167.0, 2765.0, 1587.0, 842.0, 461.0, 290.0, 171.0, 94.0, 62.0, 41.0, 26.0, 19.0, 9.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.94140625, -2.86077880859375, -2.7801513671875, -2.69952392578125, -2.618896484375, -2.53826904296875, -2.4576416015625, -2.37701416015625, -2.29638671875, -2.21575927734375, -2.1351318359375, -2.05450439453125, -1.973876953125, -1.89324951171875, -1.8126220703125, -1.73199462890625, -1.6513671875, -1.57073974609375, -1.4901123046875, -1.40948486328125, -1.328857421875, -1.24822998046875, -1.1676025390625, -1.08697509765625, -1.00634765625, -0.92572021484375, -0.8450927734375, -0.76446533203125, -0.683837890625, -0.60321044921875, -0.5225830078125, -0.44195556640625, -0.361328125, -0.28070068359375, -0.2000732421875, -0.11944580078125, -0.038818359375, 0.04180908203125, 0.1224365234375, 0.20306396484375, 0.28369140625, 0.36431884765625, 0.4449462890625, 0.52557373046875, 0.606201171875, 0.68682861328125, 0.7674560546875, 0.84808349609375, 0.9287109375, 1.00933837890625, 1.0899658203125, 1.17059326171875, 1.251220703125, 1.33184814453125, 1.4124755859375, 1.49310302734375, 1.57373046875, 1.65435791015625, 1.7349853515625, 1.81561279296875, 1.896240234375, 1.97686767578125, 2.0574951171875, 2.13812255859375, 2.21875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 8.0, 13.0, 13.0, 27.0, 24.0, 54.0, 91.0, 174.0, 374.0, 1095.0, 1256.0, 484.0, 204.0, 90.0, 43.0, 33.0, 16.0, 15.0, 10.0, 7.0, 5.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.14453125, -4.03265380859375, -3.9207763671875, -3.80889892578125, -3.697021484375, -3.58514404296875, -3.4732666015625, -3.36138916015625, -3.24951171875, -3.13763427734375, -3.0257568359375, -2.91387939453125, -2.802001953125, -2.69012451171875, -2.5782470703125, -2.46636962890625, -2.3544921875, -2.24261474609375, -2.1307373046875, -2.01885986328125, -1.906982421875, -1.79510498046875, -1.6832275390625, -1.57135009765625, -1.45947265625, -1.34759521484375, -1.2357177734375, -1.12384033203125, -1.011962890625, -0.90008544921875, -0.7882080078125, -0.67633056640625, -0.564453125, -0.45257568359375, -0.3406982421875, -0.22882080078125, -0.116943359375, -0.00506591796875, 0.1068115234375, 0.21868896484375, 0.33056640625, 0.44244384765625, 0.5543212890625, 0.66619873046875, 0.778076171875, 0.88995361328125, 1.0018310546875, 1.11370849609375, 1.2255859375, 1.33746337890625, 1.4493408203125, 1.56121826171875, 1.673095703125, 1.78497314453125, 1.8968505859375, 2.00872802734375, 2.12060546875, 2.23248291015625, 2.3443603515625, 2.45623779296875, 2.568115234375, 2.67999267578125, 2.7918701171875, 2.90374755859375, 3.015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 20.0, 46.0, 133.0, 301.0, 301.0, 116.0, 34.0, 17.0, 6.0, 2.0, 6.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.278968811035156, -52.9849739074707, -51.690975189208984, -50.39698028564453, -49.10298156738281, -47.80898666381836, -46.514991760253906, -45.22099304199219, -43.926998138427734, -42.63300323486328, -41.33900451660156, -40.04500961303711, -38.751014709472656, -37.45701599121094, -36.163021087646484, -34.86902618408203, -33.57502746582031, -32.28103256225586, -30.98703384399414, -29.693038940429688, -28.3990421295166, -27.105045318603516, -25.811050415039062, -24.517053604125977, -23.22305679321289, -21.929059982299805, -20.63506317138672, -19.341068267822266, -18.04707145690918, -16.753074645996094, -15.459078788757324, -14.165082931518555, -12.871086120605469, -11.577089309692383, -10.283093452453613, -8.989097595214844, -7.695100784301758, -6.40110445022583, -5.107108116149902, -3.813112258911133, -2.519115447998047, -1.2251191139221191, 0.0688772201538086, 1.3628735542297363, 2.656869888305664, 3.950866222381592, 5.2448625564575195, 6.538858413696289, 7.832855224609375, 9.126852035522461, 10.42084789276123, 11.71484375, 13.008840560913086, 14.302837371826172, 15.596833229064941, 16.89082908630371, 18.184825897216797, 19.478822708129883, 20.77281951904297, 22.066814422607422, 23.360811233520508, 24.654808044433594, 25.948802947998047, 27.242799758911133, 28.53679656982422]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 9.0, 6.0, 10.0, 12.0, 11.0, 15.0, 22.0, 30.0, 27.0, 29.0, 34.0, 43.0, 50.0, 47.0, 51.0, 57.0, 50.0, 53.0, 58.0, 36.0, 43.0, 51.0, 45.0, 36.0, 35.0, 25.0, 31.0, 14.0, 15.0, 17.0, 7.0, 6.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.61648941040039, -13.207945823669434, -12.799402236938477, -12.390857696533203, -11.982314109802246, -11.573770523071289, -11.165226936340332, -10.756683349609375, -10.348138809204102, -9.939595222473145, -9.531051635742188, -9.122507095336914, -8.713963508605957, -8.305419921875, -7.896876335144043, -7.488332271575928, -7.079788684844971, -6.671245098114014, -6.262701034545898, -5.854157447814941, -5.445613384246826, -5.037069797515869, -4.628525733947754, -4.219982147216797, -3.8114383220672607, -3.4028944969177246, -2.9943506717681885, -2.5858068466186523, -2.1772632598876953, -1.7687194347381592, -1.360175609588623, -0.9516317844390869, -0.5430879592895508, -0.13454416394233704, 0.2739996314048767, 0.6825433969497681, 1.0910872220993042, 1.4996309280395508, 1.908174753189087, 2.316718578338623, 2.725262403488159, 3.1338062286376953, 3.5423500537872314, 3.9508938789367676, 4.359437465667725, 4.76798152923584, 5.176525115966797, 5.585068702697754, 5.993612766265869, 6.402156352996826, 6.810700416564941, 7.219244003295898, 7.627788066864014, 8.036331176757812, 8.444875717163086, 8.853419303894043, 9.261962890625, 9.670506477355957, 10.079050064086914, 10.487594604492188, 10.896138191223145, 11.304681777954102, 11.713225364685059, 12.121768951416016, 12.530313491821289]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 13.0, 12.0, 20.0, 28.0, 40.0, 64.0, 109.0, 149.0, 257.0, 480.0, 833.0, 1505.0, 3100.0, 6720.0, 15431.0, 39453.0, 108448.0, 309147.0, 354240.0, 129062.0, 46449.0, 18021.0, 7418.0, 3594.0, 1789.0, 899.0, 518.0, 287.0, 184.0, 92.0, 58.0, 44.0, 23.0, 18.0, 16.0, 14.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.113372802734375, -2.03533935546875, -1.957305908203125, -1.8792724609375, -1.801239013671875, -1.72320556640625, -1.645172119140625, -1.567138671875, -1.489105224609375, -1.41107177734375, -1.333038330078125, -1.2550048828125, -1.176971435546875, -1.09893798828125, -1.020904541015625, -0.94287109375, -0.864837646484375, -0.78680419921875, -0.708770751953125, -0.6307373046875, -0.552703857421875, -0.47467041015625, -0.396636962890625, -0.318603515625, -0.240570068359375, -0.16253662109375, -0.084503173828125, -0.0064697265625, 0.071563720703125, 0.14959716796875, 0.227630615234375, 0.3056640625, 0.383697509765625, 0.46173095703125, 0.539764404296875, 0.6177978515625, 0.695831298828125, 0.77386474609375, 0.851898193359375, 0.929931640625, 1.007965087890625, 1.08599853515625, 1.164031982421875, 1.2420654296875, 1.320098876953125, 1.39813232421875, 1.476165771484375, 1.55419921875, 1.632232666015625, 1.71026611328125, 1.788299560546875, 1.8663330078125, 1.944366455078125, 2.02239990234375, 2.100433349609375, 2.178466796875, 2.256500244140625, 2.33453369140625, 2.412567138671875, 2.4906005859375, 2.568634033203125, 2.64666748046875, 2.724700927734375, 2.802734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 9.0, 14.0, 13.0, 15.0, 27.0, 27.0, 20.0, 32.0, 42.0, 41.0, 44.0, 56.0, 49.0, 45.0, 66.0, 50.0, 61.0, 59.0, 48.0, 48.0, 44.0, 32.0, 26.0, 21.0, 22.0, 21.0, 17.0, 11.0, 13.0, 6.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4892578125, -1.4535446166992188, -1.4178314208984375, -1.3821182250976562, -1.346405029296875, -1.3106918334960938, -1.2749786376953125, -1.2392654418945312, -1.20355224609375, -1.1678390502929688, -1.1321258544921875, -1.0964126586914062, -1.060699462890625, -1.0249862670898438, -0.9892730712890625, -0.9535598754882812, -0.9178466796875, -0.8821334838867188, -0.8464202880859375, -0.8107070922851562, -0.774993896484375, -0.7392807006835938, -0.7035675048828125, -0.6678543090820312, -0.63214111328125, -0.5964279174804688, -0.5607147216796875, -0.5250015258789062, -0.489288330078125, -0.45357513427734375, -0.4178619384765625, -0.38214874267578125, -0.346435546875, -0.31072235107421875, -0.2750091552734375, -0.23929595947265625, -0.203582763671875, -0.16786956787109375, -0.1321563720703125, -0.09644317626953125, -0.06072998046875, -0.02501678466796875, 0.0106964111328125, 0.04640960693359375, 0.082122802734375, 0.11783599853515625, 0.1535491943359375, 0.18926239013671875, 0.2249755859375, 0.26068878173828125, 0.2964019775390625, 0.33211517333984375, 0.367828369140625, 0.40354156494140625, 0.4392547607421875, 0.47496795654296875, 0.51068115234375, 0.5463943481445312, 0.5821075439453125, 0.6178207397460938, 0.653533935546875, 0.6892471313476562, 0.7249603271484375, 0.7606735229492188, 0.79638671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 8.0, 10.0, 12.0, 32.0, 34.0, 37.0, 71.0, 116.0, 145.0, 242.0, 440.0, 849.0, 1995.0, 6117.0, 25868.0, 151380.0, 669992.0, 154587.0, 26290.0, 6241.0, 2074.0, 874.0, 409.0, 236.0, 148.0, 108.0, 67.0, 43.0, 26.0, 24.0, 16.0, 12.0, 10.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.1912841796875, -3.066162109375, -2.9410400390625, -2.81591796875, -2.6907958984375, -2.565673828125, -2.4405517578125, -2.3154296875, -2.1903076171875, -2.065185546875, -1.9400634765625, -1.81494140625, -1.6898193359375, -1.564697265625, -1.4395751953125, -1.314453125, -1.1893310546875, -1.064208984375, -0.9390869140625, -0.81396484375, -0.6888427734375, -0.563720703125, -0.4385986328125, -0.3134765625, -0.1883544921875, -0.063232421875, 0.0618896484375, 0.18701171875, 0.3121337890625, 0.437255859375, 0.5623779296875, 0.6875, 0.8126220703125, 0.937744140625, 1.0628662109375, 1.18798828125, 1.3131103515625, 1.438232421875, 1.5633544921875, 1.6884765625, 1.8135986328125, 1.938720703125, 2.0638427734375, 2.18896484375, 2.3140869140625, 2.439208984375, 2.5643310546875, 2.689453125, 2.8145751953125, 2.939697265625, 3.0648193359375, 3.18994140625, 3.3150634765625, 3.440185546875, 3.5653076171875, 3.6904296875, 3.8155517578125, 3.940673828125, 4.0657958984375, 4.19091796875, 4.3160400390625, 4.441162109375, 4.5662841796875, 4.69140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 14.0, 6.0, 12.0, 19.0, 18.0, 22.0, 26.0, 25.0, 32.0, 38.0, 34.0, 36.0, 34.0, 42.0, 38.0, 60.0, 42.0, 43.0, 46.0, 36.0, 39.0, 38.0, 41.0, 41.0, 25.0, 26.0, 26.0, 16.0, 22.0, 15.0, 17.0, 4.0, 15.0, 10.0, 11.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.3251953125, -3.21484375, -3.1044921875, -2.994140625, -2.8837890625, -2.7734375, -2.6630859375, -2.552734375, -2.4423828125, -2.33203125, -2.2216796875, -2.111328125, -2.0009765625, -1.890625, -1.7802734375, -1.669921875, -1.5595703125, -1.44921875, -1.3388671875, -1.228515625, -1.1181640625, -1.0078125, -0.8974609375, -0.787109375, -0.6767578125, -0.56640625, -0.4560546875, -0.345703125, -0.2353515625, -0.125, -0.0146484375, 0.095703125, 0.2060546875, 0.31640625, 0.4267578125, 0.537109375, 0.6474609375, 0.7578125, 0.8681640625, 0.978515625, 1.0888671875, 1.19921875, 1.3095703125, 1.419921875, 1.5302734375, 1.640625, 1.7509765625, 1.861328125, 1.9716796875, 2.08203125, 2.1923828125, 2.302734375, 2.4130859375, 2.5234375, 2.6337890625, 2.744140625, 2.8544921875, 2.96484375, 3.0751953125, 3.185546875, 3.2958984375, 3.40625, 3.5166015625, 3.626953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 6.0, 9.0, 16.0, 21.0, 32.0, 36.0, 55.0, 83.0, 102.0, 228.0, 416.0, 778.0, 2047.0, 6587.0, 33757.0, 419538.0, 536545.0, 37231.0, 7044.0, 2123.0, 856.0, 384.0, 230.0, 113.0, 79.0, 52.0, 43.0, 31.0, 21.0, 21.0, 15.0, 5.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0], "bins": [-2.09375, -2.0322113037109375, -1.970672607421875, -1.9091339111328125, -1.84759521484375, -1.7860565185546875, -1.724517822265625, -1.6629791259765625, -1.6014404296875, -1.5399017333984375, -1.478363037109375, -1.4168243408203125, -1.35528564453125, -1.2937469482421875, -1.232208251953125, -1.1706695556640625, -1.109130859375, -1.0475921630859375, -0.986053466796875, -0.9245147705078125, -0.86297607421875, -0.8014373779296875, -0.739898681640625, -0.6783599853515625, -0.6168212890625, -0.5552825927734375, -0.493743896484375, -0.4322052001953125, -0.37066650390625, -0.3091278076171875, -0.247589111328125, -0.1860504150390625, -0.12451171875, -0.0629730224609375, -0.001434326171875, 0.0601043701171875, 0.12164306640625, 0.1831817626953125, 0.244720458984375, 0.3062591552734375, 0.3677978515625, 0.4293365478515625, 0.490875244140625, 0.5524139404296875, 0.61395263671875, 0.6754913330078125, 0.737030029296875, 0.7985687255859375, 0.860107421875, 0.9216461181640625, 0.983184814453125, 1.0447235107421875, 1.10626220703125, 1.1678009033203125, 1.229339599609375, 1.2908782958984375, 1.3524169921875, 1.4139556884765625, 1.475494384765625, 1.5370330810546875, 1.59857177734375, 1.6601104736328125, 1.721649169921875, 1.7831878662109375, 1.8447265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 22.0, 53.0, 84.0, 185.0, 241.0, 164.0, 108.0, 51.0, 22.0, 26.0, 7.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010929107666015625, -0.001069914549589157, -0.0010469183325767517, -0.0010239221155643463, -0.001000925898551941, -0.0009779296815395355, -0.0009549334645271301, -0.0009319372475147247, -0.0009089410305023193, -0.0008859448134899139, -0.0008629485964775085, -0.0008399523794651031, -0.0008169561624526978, -0.0007939599454402924, -0.000770963728427887, -0.0007479675114154816, -0.0007249712944030762, -0.0007019750773906708, -0.0006789788603782654, -0.00065598264336586, -0.0006329864263534546, -0.0006099902093410492, -0.0005869939923286438, -0.0005639977753162384, -0.000541001558303833, -0.0005180053412914276, -0.0004950091242790222, -0.0004720129072666168, -0.0004490166902542114, -0.00042602047324180603, -0.00040302425622940063, -0.00038002803921699524, -0.00035703182220458984, -0.00033403560519218445, -0.00031103938817977905, -0.00028804317116737366, -0.00026504695415496826, -0.00024205073714256287, -0.00021905452013015747, -0.00019605830311775208, -0.00017306208610534668, -0.00015006586909294128, -0.0001270696520805359, -0.00010407343506813049, -8.10772180557251e-05, -5.80810010433197e-05, -3.508478403091431e-05, -1.2088567018508911e-05, 1.0907649993896484e-05, 3.390386700630188e-05, 5.6900084018707275e-05, 7.989630103111267e-05, 0.00010289251804351807, 0.00012588873505592346, 0.00014888495206832886, 0.00017188116908073425, 0.00019487738609313965, 0.00021787360310554504, 0.00024086982011795044, 0.00026386603713035583, 0.00028686225414276123, 0.0003098584711551666, 0.000332854688167572, 0.0003558509051799774, 0.0003788471221923828]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 17.0, 19.0, 27.0, 36.0, 53.0, 100.0, 169.0, 351.0, 790.0, 2121.0, 8610.0, 66158.0, 792662.0, 157376.0, 14823.0, 3199.0, 1045.0, 447.0, 225.0, 119.0, 64.0, 42.0, 28.0, 15.0, 8.0, 6.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.0919189453125, -2.023681640625, -1.9554443359375, -1.88720703125, -1.8189697265625, -1.750732421875, -1.6824951171875, -1.6142578125, -1.5460205078125, -1.477783203125, -1.4095458984375, -1.34130859375, -1.2730712890625, -1.204833984375, -1.1365966796875, -1.068359375, -1.0001220703125, -0.931884765625, -0.8636474609375, -0.79541015625, -0.7271728515625, -0.658935546875, -0.5906982421875, -0.5224609375, -0.4542236328125, -0.385986328125, -0.3177490234375, -0.24951171875, -0.1812744140625, -0.113037109375, -0.0447998046875, 0.0234375, 0.0916748046875, 0.159912109375, 0.2281494140625, 0.29638671875, 0.3646240234375, 0.432861328125, 0.5010986328125, 0.5693359375, 0.6375732421875, 0.705810546875, 0.7740478515625, 0.84228515625, 0.9105224609375, 0.978759765625, 1.0469970703125, 1.115234375, 1.1834716796875, 1.251708984375, 1.3199462890625, 1.38818359375, 1.4564208984375, 1.524658203125, 1.5928955078125, 1.6611328125, 1.7293701171875, 1.797607421875, 1.8658447265625, 1.93408203125, 2.0023193359375, 2.070556640625, 2.1387939453125, 2.20703125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 10.0, 13.0, 13.0, 16.0, 19.0, 21.0, 28.0, 27.0, 45.0, 45.0, 57.0, 73.0, 74.0, 67.0, 67.0, 74.0, 67.0, 53.0, 26.0, 41.0, 29.0, 24.0, 14.0, 23.0, 10.0, 7.0, 14.0, 8.0, 5.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7265625, -1.6815948486328125, -1.636627197265625, -1.5916595458984375, -1.54669189453125, -1.5017242431640625, -1.456756591796875, -1.4117889404296875, -1.3668212890625, -1.3218536376953125, -1.276885986328125, -1.2319183349609375, -1.18695068359375, -1.1419830322265625, -1.097015380859375, -1.0520477294921875, -1.007080078125, -0.9621124267578125, -0.917144775390625, -0.8721771240234375, -0.82720947265625, -0.7822418212890625, -0.737274169921875, -0.6923065185546875, -0.6473388671875, -0.6023712158203125, -0.557403564453125, -0.5124359130859375, -0.46746826171875, -0.4225006103515625, -0.377532958984375, -0.3325653076171875, -0.28759765625, -0.2426300048828125, -0.197662353515625, -0.1526947021484375, -0.10772705078125, -0.0627593994140625, -0.017791748046875, 0.0271759033203125, 0.0721435546875, 0.1171112060546875, 0.162078857421875, 0.2070465087890625, 0.25201416015625, 0.2969818115234375, 0.341949462890625, 0.3869171142578125, 0.431884765625, 0.4768524169921875, 0.521820068359375, 0.5667877197265625, 0.61175537109375, 0.6567230224609375, 0.701690673828125, 0.7466583251953125, 0.7916259765625, 0.8365936279296875, 0.881561279296875, 0.9265289306640625, 0.97149658203125, 1.0164642333984375, 1.061431884765625, 1.1063995361328125, 1.1513671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 27.0, 62.0, 138.0, 188.0, 260.0, 159.0, 78.0, 48.0, 14.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-63.306217193603516, -62.02650833129883, -60.746795654296875, -59.46708679199219, -58.1873779296875, -56.90766525268555, -55.62795639038086, -54.348243713378906, -53.06853485107422, -51.78882598876953, -50.50911331176758, -49.22940444946289, -47.9496955871582, -46.66998291015625, -45.39027404785156, -44.110565185546875, -42.83085632324219, -41.5511474609375, -40.27143478393555, -38.99172592163086, -37.71201705932617, -36.43230438232422, -35.15259552001953, -33.872886657714844, -32.59317398071289, -31.31346321105957, -30.033754348754883, -28.754043579101562, -27.474332809448242, -26.194622039794922, -24.914913177490234, -23.635202407836914, -22.355491638183594, -21.075780868530273, -19.796072006225586, -18.516361236572266, -17.236650466918945, -15.956940650939941, -14.677230834960938, -13.397520065307617, -12.117810249328613, -10.83810043334961, -9.558389663696289, -8.278679847717285, -6.998969554901123, -5.719259262084961, -4.439549446105957, -3.1598386764526367, -1.8801288604736328, -0.6004186868667603, 0.6792914867401123, 1.9590015411376953, 3.2387118339538574, 4.5184221267700195, 5.798131942749023, 7.077842712402344, 8.357552528381348, 9.637262344360352, 10.916973114013672, 12.196682929992676, 13.47639274597168, 14.756103515625, 16.035812377929688, 17.31552505493164, 18.595233917236328]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 10.0, 17.0, 24.0, 21.0, 19.0, 39.0, 33.0, 24.0, 43.0, 44.0, 51.0, 62.0, 82.0, 67.0, 60.0, 51.0, 47.0, 40.0, 51.0, 28.0, 25.0, 34.0, 24.0, 16.0, 20.0, 13.0, 13.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.01881217956543, -21.38681411743164, -20.754817962646484, -20.122821807861328, -19.49082374572754, -18.85882568359375, -18.226829528808594, -17.594833374023438, -16.96283531188965, -16.33083724975586, -15.698841094970703, -15.06684398651123, -14.434846878051758, -13.802849769592285, -13.170852661132812, -12.53885555267334, -11.906858444213867, -11.274861335754395, -10.642864227294922, -10.01086711883545, -9.378870010375977, -8.746872901916504, -8.114875793457031, -7.482878684997559, -6.850881576538086, -6.218884468078613, -5.586887359619141, -4.954890251159668, -4.322893142700195, -3.6908960342407227, -3.05889892578125, -2.4269018173217773, -1.7949066162109375, -1.1629095077514648, -0.5309123992919922, 0.10108470916748047, 0.7330818176269531, 1.3650789260864258, 1.9970760345458984, 2.629073143005371, 3.2610702514648438, 3.8930673599243164, 4.525064468383789, 5.157061576843262, 5.789058685302734, 6.421055793762207, 7.05305290222168, 7.685050010681152, 8.317047119140625, 8.949044227600098, 9.58104133605957, 10.213038444519043, 10.845035552978516, 11.477032661437988, 12.109029769897461, 12.741026878356934, 13.373023986816406, 14.005021095275879, 14.637018203735352, 15.269015312194824, 15.901012420654297, 16.533008575439453, 17.165006637573242, 17.79700469970703, 18.429000854492188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 19.0, 29.0, 48.0, 72.0, 148.0, 273.0, 556.0, 1035.0, 2658.0, 7449.0, 27200.0, 205931.0, 3347835.0, 540802.0, 43622.0, 10152.0, 3437.0, 1451.0, 709.0, 329.0, 174.0, 83.0, 68.0, 51.0, 26.0, 21.0, 24.0, 9.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.427215576171875, -2.35052490234375, -2.273834228515625, -2.1971435546875, -2.120452880859375, -2.04376220703125, -1.967071533203125, -1.890380859375, -1.813690185546875, -1.73699951171875, -1.660308837890625, -1.5836181640625, -1.506927490234375, -1.43023681640625, -1.353546142578125, -1.27685546875, -1.200164794921875, -1.12347412109375, -1.046783447265625, -0.9700927734375, -0.893402099609375, -0.81671142578125, -0.740020751953125, -0.663330078125, -0.586639404296875, -0.50994873046875, -0.433258056640625, -0.3565673828125, -0.279876708984375, -0.20318603515625, -0.126495361328125, -0.0498046875, 0.026885986328125, 0.10357666015625, 0.180267333984375, 0.2569580078125, 0.333648681640625, 0.41033935546875, 0.487030029296875, 0.563720703125, 0.640411376953125, 0.71710205078125, 0.793792724609375, 0.8704833984375, 0.947174072265625, 1.02386474609375, 1.100555419921875, 1.17724609375, 1.253936767578125, 1.33062744140625, 1.407318115234375, 1.4840087890625, 1.560699462890625, 1.63739013671875, 1.714080810546875, 1.790771484375, 1.867462158203125, 1.94415283203125, 2.020843505859375, 2.0975341796875, 2.174224853515625, 2.25091552734375, 2.327606201171875, 2.404296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 1.0, 8.0, 7.0, 6.0, 5.0, 8.0, 12.0, 14.0, 16.0, 26.0, 34.0, 33.0, 27.0, 33.0, 41.0, 32.0, 49.0, 36.0, 49.0, 44.0, 43.0, 59.0, 47.0, 52.0, 43.0, 41.0, 44.0, 28.0, 25.0, 23.0, 17.0, 21.0, 12.0, 9.0, 11.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.751953125, -0.7252273559570312, -0.6985015869140625, -0.6717758178710938, -0.645050048828125, -0.6183242797851562, -0.5915985107421875, -0.5648727416992188, -0.53814697265625, -0.5114212036132812, -0.4846954345703125, -0.45796966552734375, -0.431243896484375, -0.40451812744140625, -0.3777923583984375, -0.35106658935546875, -0.3243408203125, -0.29761505126953125, -0.2708892822265625, -0.24416351318359375, -0.217437744140625, -0.19071197509765625, -0.1639862060546875, -0.13726043701171875, -0.11053466796875, -0.08380889892578125, -0.0570831298828125, -0.03035736083984375, -0.003631591796875, 0.02309417724609375, 0.0498199462890625, 0.07654571533203125, 0.103271484375, 0.12999725341796875, 0.1567230224609375, 0.18344879150390625, 0.210174560546875, 0.23690032958984375, 0.2636260986328125, 0.29035186767578125, 0.31707763671875, 0.34380340576171875, 0.3705291748046875, 0.39725494384765625, 0.423980712890625, 0.45070648193359375, 0.4774322509765625, 0.5041580200195312, 0.5308837890625, 0.5576095581054688, 0.5843353271484375, 0.6110610961914062, 0.637786865234375, 0.6645126342773438, 0.6912384033203125, 0.7179641723632812, 0.74468994140625, 0.7714157104492188, 0.7981414794921875, 0.8248672485351562, 0.851593017578125, 0.8783187866210938, 0.9050445556640625, 0.9317703247070312, 0.95849609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 16.0, 36.0, 56.0, 96.0, 153.0, 336.0, 907.0, 2474.0, 9311.0, 52051.0, 1291483.0, 2743678.0, 75479.0, 12515.0, 3386.0, 1187.0, 508.0, 260.0, 130.0, 59.0, 47.0, 42.0, 12.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.931640625, -2.814727783203125, -2.69781494140625, -2.580902099609375, -2.4639892578125, -2.347076416015625, -2.23016357421875, -2.113250732421875, -1.996337890625, -1.879425048828125, -1.76251220703125, -1.645599365234375, -1.5286865234375, -1.411773681640625, -1.29486083984375, -1.177947998046875, -1.06103515625, -0.944122314453125, -0.82720947265625, -0.710296630859375, -0.5933837890625, -0.476470947265625, -0.35955810546875, -0.242645263671875, -0.125732421875, -0.008819580078125, 0.10809326171875, 0.225006103515625, 0.3419189453125, 0.458831787109375, 0.57574462890625, 0.692657470703125, 0.8095703125, 0.926483154296875, 1.04339599609375, 1.160308837890625, 1.2772216796875, 1.394134521484375, 1.51104736328125, 1.627960205078125, 1.744873046875, 1.861785888671875, 1.97869873046875, 2.095611572265625, 2.2125244140625, 2.329437255859375, 2.44635009765625, 2.563262939453125, 2.68017578125, 2.797088623046875, 2.91400146484375, 3.030914306640625, 3.1478271484375, 3.264739990234375, 3.38165283203125, 3.498565673828125, 3.615478515625, 3.732391357421875, 3.84930419921875, 3.966217041015625, 4.0831298828125, 4.200042724609375, 4.31695556640625, 4.433868408203125, 4.55078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 9.0, 14.0, 19.0, 25.0, 39.0, 58.0, 89.0, 154.0, 315.0, 581.0, 1119.0, 748.0, 392.0, 169.0, 94.0, 56.0, 47.0, 33.0, 26.0, 25.0, 18.0, 6.0, 4.0, 4.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.57464599609375, -2.4656982421875, -2.35675048828125, -2.247802734375, -2.13885498046875, -2.0299072265625, -1.92095947265625, -1.81201171875, -1.70306396484375, -1.5941162109375, -1.48516845703125, -1.376220703125, -1.26727294921875, -1.1583251953125, -1.04937744140625, -0.9404296875, -0.83148193359375, -0.7225341796875, -0.61358642578125, -0.504638671875, -0.39569091796875, -0.2867431640625, -0.17779541015625, -0.06884765625, 0.04010009765625, 0.1490478515625, 0.25799560546875, 0.366943359375, 0.47589111328125, 0.5848388671875, 0.69378662109375, 0.802734375, 0.91168212890625, 1.0206298828125, 1.12957763671875, 1.238525390625, 1.34747314453125, 1.4564208984375, 1.56536865234375, 1.67431640625, 1.78326416015625, 1.8922119140625, 2.00115966796875, 2.110107421875, 2.21905517578125, 2.3280029296875, 2.43695068359375, 2.5458984375, 2.65484619140625, 2.7637939453125, 2.87274169921875, 2.981689453125, 3.09063720703125, 3.1995849609375, 3.30853271484375, 3.41748046875, 3.52642822265625, 3.6353759765625, 3.74432373046875, 3.853271484375, 3.96221923828125, 4.0711669921875, 4.18011474609375, 4.2890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 35.0, 72.0, 101.0, 144.0, 190.0, 159.0, 111.0, 65.0, 25.0, 18.0, 14.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.693740844726562, -15.918699264526367, -15.143657684326172, -14.368616104125977, -13.593574523925781, -12.818532943725586, -12.04349136352539, -11.268449783325195, -10.493408203125, -9.718366622924805, -8.94332504272461, -8.168283462524414, -7.393241882324219, -6.618200302124023, -5.84315824508667, -5.068116664886475, -4.293074607849121, -3.518033027648926, -2.7429914474487305, -1.967949628829956, -1.1929080486297607, -0.41786646842956543, 0.357175350189209, 1.1322169303894043, 1.9072585105895996, 2.682300090789795, 3.4573416709899902, 4.232383728027344, 5.007425308227539, 5.782466888427734, 6.55750846862793, 7.332550048828125, 8.10759162902832, 8.882633209228516, 9.657674789428711, 10.432716369628906, 11.207757949829102, 11.982799530029297, 12.757841110229492, 13.532882690429688, 14.307924270629883, 15.082965850830078, 15.858007431030273, 16.63304901123047, 17.408090591430664, 18.18313217163086, 18.958173751831055, 19.73321533203125, 20.508258819580078, 21.283300399780273, 22.05834197998047, 22.833383560180664, 23.60842514038086, 24.383466720581055, 25.15850830078125, 25.933549880981445, 26.70859146118164, 27.483633041381836, 28.25867462158203, 29.033716201782227, 29.808757781982422, 30.583799362182617, 31.358840942382812, 32.13388442993164, 32.9089241027832]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 12.0, 13.0, 16.0, 4.0, 20.0, 25.0, 22.0, 21.0, 31.0, 33.0, 23.0, 41.0, 44.0, 46.0, 29.0, 42.0, 32.0, 58.0, 47.0, 40.0, 33.0, 38.0, 38.0, 34.0, 23.0, 27.0, 25.0, 27.0, 22.0, 17.0, 17.0, 15.0, 12.0, 14.0, 6.0, 4.0, 2.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.627767562866211, -12.270913124084473, -11.914058685302734, -11.557204246520996, -11.200349807739258, -10.84349536895752, -10.486640930175781, -10.12978744506836, -9.772932052612305, -9.416077613830566, -9.059223175048828, -8.70236873626709, -8.345514297485352, -7.988659858703613, -7.631805896759033, -7.274951457977295, -6.918097496032715, -6.561243057250977, -6.204388618469238, -5.8475341796875, -5.490679740905762, -5.133825302124023, -4.776971340179443, -4.420116901397705, -4.063262462615967, -3.7064080238342285, -3.3495535850524902, -2.992699384689331, -2.6358449459075928, -2.2789905071258545, -1.9221363067626953, -1.565281867980957, -1.2084274291992188, -0.8515730500221252, -0.49471867084503174, -0.137864351272583, 0.21899008750915527, 0.5758445262908936, 0.9326987266540527, 1.289553165435791, 1.6464076042175293, 2.0032620429992676, 2.360116481781006, 2.716970682144165, 3.0738251209259033, 3.4306795597076416, 3.787533760070801, 4.144388198852539, 4.501242637634277, 4.858097076416016, 5.214951515197754, 5.571805953979492, 5.9286603927612305, 6.285514831542969, 6.642368793487549, 6.999223232269287, 7.356077671051025, 7.712932109832764, 8.069786071777344, 8.426640510559082, 8.78349494934082, 9.140349388122559, 9.497203826904297, 9.854058265686035, 10.210912704467773]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 12.0, 12.0, 20.0, 21.0, 21.0, 49.0, 82.0, 110.0, 207.0, 311.0, 517.0, 908.0, 1468.0, 2894.0, 5469.0, 11133.0, 24019.0, 52738.0, 116123.0, 236343.0, 286601.0, 166245.0, 76529.0, 34615.0, 15637.0, 7682.0, 3813.0, 2000.0, 1167.0, 673.0, 409.0, 238.0, 139.0, 88.0, 65.0, 58.0, 25.0, 27.0, 20.0, 16.0, 2.0, 9.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6767578125, -1.6247406005859375, -1.572723388671875, -1.5207061767578125, -1.46868896484375, -1.4166717529296875, -1.364654541015625, -1.3126373291015625, -1.2606201171875, -1.2086029052734375, -1.156585693359375, -1.1045684814453125, -1.05255126953125, -1.0005340576171875, -0.948516845703125, -0.8964996337890625, -0.844482421875, -0.7924652099609375, -0.740447998046875, -0.6884307861328125, -0.63641357421875, -0.5843963623046875, -0.532379150390625, -0.4803619384765625, -0.4283447265625, -0.3763275146484375, -0.324310302734375, -0.2722930908203125, -0.22027587890625, -0.1682586669921875, -0.116241455078125, -0.0642242431640625, -0.01220703125, 0.0398101806640625, 0.091827392578125, 0.1438446044921875, 0.19586181640625, 0.2478790283203125, 0.299896240234375, 0.3519134521484375, 0.4039306640625, 0.4559478759765625, 0.507965087890625, 0.5599822998046875, 0.61199951171875, 0.6640167236328125, 0.716033935546875, 0.7680511474609375, 0.820068359375, 0.8720855712890625, 0.924102783203125, 0.9761199951171875, 1.02813720703125, 1.0801544189453125, 1.132171630859375, 1.1841888427734375, 1.2362060546875, 1.2882232666015625, 1.340240478515625, 1.3922576904296875, 1.44427490234375, 1.4962921142578125, 1.548309326171875, 1.6003265380859375, 1.65234375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 1.0, 8.0, 2.0, 14.0, 11.0, 13.0, 11.0, 19.0, 18.0, 17.0, 20.0, 27.0, 29.0, 30.0, 28.0, 39.0, 37.0, 39.0, 34.0, 47.0, 39.0, 38.0, 57.0, 33.0, 51.0, 30.0, 34.0, 35.0, 36.0, 26.0, 26.0, 20.0, 21.0, 23.0, 15.0, 19.0, 7.0, 8.0, 14.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.71240234375, -0.6879043579101562, -0.6634063720703125, -0.6389083862304688, -0.614410400390625, -0.5899124145507812, -0.5654144287109375, -0.5409164428710938, -0.51641845703125, -0.49192047119140625, -0.4674224853515625, -0.44292449951171875, -0.418426513671875, -0.39392852783203125, -0.3694305419921875, -0.34493255615234375, -0.3204345703125, -0.29593658447265625, -0.2714385986328125, -0.24694061279296875, -0.222442626953125, -0.19794464111328125, -0.1734466552734375, -0.14894866943359375, -0.12445068359375, -0.09995269775390625, -0.0754547119140625, -0.05095672607421875, -0.026458740234375, -0.00196075439453125, 0.0225372314453125, 0.04703521728515625, 0.071533203125, 0.09603118896484375, 0.1205291748046875, 0.14502716064453125, 0.169525146484375, 0.19402313232421875, 0.2185211181640625, 0.24301910400390625, 0.26751708984375, 0.29201507568359375, 0.3165130615234375, 0.34101104736328125, 0.365509033203125, 0.39000701904296875, 0.4145050048828125, 0.43900299072265625, 0.4635009765625, 0.48799896240234375, 0.5124969482421875, 0.5369949340820312, 0.561492919921875, 0.5859909057617188, 0.6104888916015625, 0.6349868774414062, 0.65948486328125, 0.6839828491210938, 0.7084808349609375, 0.7329788208007812, 0.757476806640625, 0.7819747924804688, 0.8064727783203125, 0.8309707641601562, 0.85546875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 9.0, 7.0, 16.0, 27.0, 26.0, 38.0, 53.0, 77.0, 120.0, 189.0, 290.0, 406.0, 662.0, 1152.0, 1982.0, 5218.0, 19397.0, 128252.0, 694499.0, 161507.0, 23405.0, 5797.0, 2322.0, 1125.0, 674.0, 434.0, 257.0, 204.0, 116.0, 79.0, 52.0, 57.0, 29.0, 12.0, 20.0, 7.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.353515625, -3.24005126953125, -3.1265869140625, -3.01312255859375, -2.899658203125, -2.78619384765625, -2.6727294921875, -2.55926513671875, -2.44580078125, -2.33233642578125, -2.2188720703125, -2.10540771484375, -1.991943359375, -1.87847900390625, -1.7650146484375, -1.65155029296875, -1.5380859375, -1.42462158203125, -1.3111572265625, -1.19769287109375, -1.084228515625, -0.97076416015625, -0.8572998046875, -0.74383544921875, -0.63037109375, -0.51690673828125, -0.4034423828125, -0.28997802734375, -0.176513671875, -0.06304931640625, 0.0504150390625, 0.16387939453125, 0.27734375, 0.39080810546875, 0.5042724609375, 0.61773681640625, 0.731201171875, 0.84466552734375, 0.9581298828125, 1.07159423828125, 1.18505859375, 1.29852294921875, 1.4119873046875, 1.52545166015625, 1.638916015625, 1.75238037109375, 1.8658447265625, 1.97930908203125, 2.0927734375, 2.20623779296875, 2.3197021484375, 2.43316650390625, 2.546630859375, 2.66009521484375, 2.7735595703125, 2.88702392578125, 3.00048828125, 3.11395263671875, 3.2274169921875, 3.34088134765625, 3.454345703125, 3.56781005859375, 3.6812744140625, 3.79473876953125, 3.908203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 5.0, 9.0, 14.0, 14.0, 19.0, 19.0, 29.0, 34.0, 22.0, 33.0, 56.0, 39.0, 39.0, 49.0, 43.0, 50.0, 44.0, 50.0, 42.0, 56.0, 48.0, 40.0, 29.0, 32.0, 39.0, 29.0, 22.0, 17.0, 15.0, 11.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.84490966796875, -3.7249755859375, -3.60504150390625, -3.485107421875, -3.36517333984375, -3.2452392578125, -3.12530517578125, -3.00537109375, -2.88543701171875, -2.7655029296875, -2.64556884765625, -2.525634765625, -2.40570068359375, -2.2857666015625, -2.16583251953125, -2.0458984375, -1.92596435546875, -1.8060302734375, -1.68609619140625, -1.566162109375, -1.44622802734375, -1.3262939453125, -1.20635986328125, -1.08642578125, -0.96649169921875, -0.8465576171875, -0.72662353515625, -0.606689453125, -0.48675537109375, -0.3668212890625, -0.24688720703125, -0.126953125, -0.00701904296875, 0.1129150390625, 0.23284912109375, 0.352783203125, 0.47271728515625, 0.5926513671875, 0.71258544921875, 0.83251953125, 0.95245361328125, 1.0723876953125, 1.19232177734375, 1.312255859375, 1.43218994140625, 1.5521240234375, 1.67205810546875, 1.7919921875, 1.91192626953125, 2.0318603515625, 2.15179443359375, 2.271728515625, 2.39166259765625, 2.5115966796875, 2.63153076171875, 2.75146484375, 2.87139892578125, 2.9913330078125, 3.11126708984375, 3.231201171875, 3.35113525390625, 3.4710693359375, 3.59100341796875, 3.7109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 13.0, 10.0, 14.0, 17.0, 27.0, 35.0, 67.0, 105.0, 159.0, 231.0, 439.0, 927.0, 2297.0, 7670.0, 46329.0, 696454.0, 261447.0, 23988.0, 5026.0, 1614.0, 721.0, 345.0, 205.0, 132.0, 75.0, 41.0, 43.0, 28.0, 21.0, 15.0, 11.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.38671875, -1.3417510986328125, -1.296783447265625, -1.2518157958984375, -1.20684814453125, -1.1618804931640625, -1.116912841796875, -1.0719451904296875, -1.0269775390625, -0.9820098876953125, -0.937042236328125, -0.8920745849609375, -0.84710693359375, -0.8021392822265625, -0.757171630859375, -0.7122039794921875, -0.667236328125, -0.6222686767578125, -0.577301025390625, -0.5323333740234375, -0.48736572265625, -0.4423980712890625, -0.397430419921875, -0.3524627685546875, -0.3074951171875, -0.2625274658203125, -0.217559814453125, -0.1725921630859375, -0.12762451171875, -0.0826568603515625, -0.037689208984375, 0.0072784423828125, 0.05224609375, 0.0972137451171875, 0.142181396484375, 0.1871490478515625, 0.23211669921875, 0.2770843505859375, 0.322052001953125, 0.3670196533203125, 0.4119873046875, 0.4569549560546875, 0.501922607421875, 0.5468902587890625, 0.59185791015625, 0.6368255615234375, 0.681793212890625, 0.7267608642578125, 0.771728515625, 0.8166961669921875, 0.861663818359375, 0.9066314697265625, 0.95159912109375, 0.9965667724609375, 1.041534423828125, 1.0865020751953125, 1.1314697265625, 1.1764373779296875, 1.221405029296875, 1.2663726806640625, 1.31134033203125, 1.3563079833984375, 1.401275634765625, 1.4462432861328125, 1.4912109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 2.0, 7.0, 6.0, 7.0, 17.0, 20.0, 32.0, 40.0, 41.0, 60.0, 83.0, 106.0, 117.0, 105.0, 61.0, 52.0, 49.0, 33.0, 36.0, 21.0, 17.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002772808074951172, -0.0002675391733646393, -0.0002577975392341614, -0.00024805590510368347, -0.00023831427097320557, -0.00022857263684272766, -0.00021883100271224976, -0.00020908936858177185, -0.00019934773445129395, -0.00018960610032081604, -0.00017986446619033813, -0.00017012283205986023, -0.00016038119792938232, -0.00015063956379890442, -0.00014089792966842651, -0.0001311562955379486, -0.0001214146614074707, -0.0001116730272769928, -0.00010193139314651489, -9.218975901603699e-05, -8.244812488555908e-05, -7.270649075508118e-05, -6.296485662460327e-05, -5.3223222494125366e-05, -4.348158836364746e-05, -3.3739954233169556e-05, -2.399832010269165e-05, -1.4256685972213745e-05, -4.51505184173584e-06, 5.2265822887420654e-06, 1.496821641921997e-05, 2.4709850549697876e-05, 3.445148468017578e-05, 4.4193118810653687e-05, 5.393475294113159e-05, 6.36763870716095e-05, 7.34180212020874e-05, 8.315965533256531e-05, 9.290128946304321e-05, 0.00010264292359352112, 0.00011238455772399902, 0.00012212619185447693, 0.00013186782598495483, 0.00014160946011543274, 0.00015135109424591064, 0.00016109272837638855, 0.00017083436250686646, 0.00018057599663734436, 0.00019031763076782227, 0.00020005926489830017, 0.00020980089902877808, 0.00021954253315925598, 0.0002292841672897339, 0.0002390258014202118, 0.0002487674355506897, 0.0002585090696811676, 0.0002682507038116455, 0.0002779923379421234, 0.0002877339720726013, 0.0002974756062030792, 0.00030721724033355713, 0.00031695887446403503, 0.00032670050859451294, 0.00033644214272499084, 0.00034618377685546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 1.0, 11.0, 15.0, 11.0, 22.0, 35.0, 59.0, 101.0, 143.0, 279.0, 567.0, 1213.0, 3177.0, 11756.0, 75860.0, 794797.0, 136183.0, 17095.0, 4326.0, 1437.0, 663.0, 312.0, 161.0, 103.0, 57.0, 41.0, 45.0, 22.0, 11.0, 14.0, 9.0, 4.0, 2.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5009765625, -1.4549560546875, -1.408935546875, -1.3629150390625, -1.31689453125, -1.2708740234375, -1.224853515625, -1.1788330078125, -1.1328125, -1.0867919921875, -1.040771484375, -0.9947509765625, -0.94873046875, -0.9027099609375, -0.856689453125, -0.8106689453125, -0.7646484375, -0.7186279296875, -0.672607421875, -0.6265869140625, -0.58056640625, -0.5345458984375, -0.488525390625, -0.4425048828125, -0.396484375, -0.3504638671875, -0.304443359375, -0.2584228515625, -0.21240234375, -0.1663818359375, -0.120361328125, -0.0743408203125, -0.0283203125, 0.0177001953125, 0.063720703125, 0.1097412109375, 0.15576171875, 0.2017822265625, 0.247802734375, 0.2938232421875, 0.33984375, 0.3858642578125, 0.431884765625, 0.4779052734375, 0.52392578125, 0.5699462890625, 0.615966796875, 0.6619873046875, 0.7080078125, 0.7540283203125, 0.800048828125, 0.8460693359375, 0.89208984375, 0.9381103515625, 0.984130859375, 1.0301513671875, 1.076171875, 1.1221923828125, 1.168212890625, 1.2142333984375, 1.26025390625, 1.3062744140625, 1.352294921875, 1.3983154296875, 1.4443359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 11.0, 9.0, 6.0, 13.0, 19.0, 27.0, 19.0, 37.0, 48.0, 64.0, 74.0, 83.0, 85.0, 82.0, 70.0, 64.0, 69.0, 43.0, 36.0, 30.0, 22.0, 18.0, 13.0, 11.0, 5.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0528717041015625, -1.014923095703125, -0.9769744873046875, -0.93902587890625, -0.9010772705078125, -0.863128662109375, -0.8251800537109375, -0.7872314453125, -0.7492828369140625, -0.711334228515625, -0.6733856201171875, -0.63543701171875, -0.5974884033203125, -0.559539794921875, -0.5215911865234375, -0.483642578125, -0.4456939697265625, -0.407745361328125, -0.3697967529296875, -0.33184814453125, -0.2938995361328125, -0.255950927734375, -0.2180023193359375, -0.1800537109375, -0.1421051025390625, -0.104156494140625, -0.0662078857421875, -0.02825927734375, 0.0096893310546875, 0.047637939453125, 0.0855865478515625, 0.12353515625, 0.1614837646484375, 0.199432373046875, 0.2373809814453125, 0.27532958984375, 0.3132781982421875, 0.351226806640625, 0.3891754150390625, 0.4271240234375, 0.4650726318359375, 0.503021240234375, 0.5409698486328125, 0.57891845703125, 0.6168670654296875, 0.654815673828125, 0.6927642822265625, 0.730712890625, 0.7686614990234375, 0.806610107421875, 0.8445587158203125, 0.88250732421875, 0.9204559326171875, 0.958404541015625, 0.9963531494140625, 1.0343017578125, 1.0722503662109375, 1.110198974609375, 1.1481475830078125, 1.18609619140625, 1.2240447998046875, 1.261993408203125, 1.2999420166015625, 1.337890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 13.0, 14.0, 20.0, 48.0, 104.0, 144.0, 289.0, 174.0, 103.0, 41.0, 22.0, 7.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.962188720703125, -45.99844741821289, -45.034706115722656, -44.07096481323242, -43.10722351074219, -42.14348220825195, -41.17974090576172, -40.215999603271484, -39.25225830078125, -38.288516998291016, -37.32477569580078, -36.36103439331055, -35.39729309082031, -34.43355178833008, -33.469810485839844, -32.50606918334961, -31.542325973510742, -30.578584671020508, -29.614843368530273, -28.65110206604004, -27.687360763549805, -26.72361946105957, -25.759876251220703, -24.79613494873047, -23.832393646240234, -22.86865234375, -21.904911041259766, -20.94116973876953, -19.977428436279297, -19.013687133789062, -18.049945831298828, -17.086204528808594, -16.12246322631836, -15.158721923828125, -14.19498062133789, -13.231239318847656, -12.267498016357422, -11.303756713867188, -10.340014457702637, -9.376273155212402, -8.412530899047852, -7.448789596557617, -6.485048294067383, -5.52130651473999, -4.557565212249756, -3.5938239097595215, -2.630082130432129, -1.6663408279418945, -0.7025995254516602, 0.26114189624786377, 1.2248833179473877, 2.188624858856201, 3.1523661613464355, 4.11610746383667, 5.0798492431640625, 6.043590545654297, 7.007331848144531, 7.971073150634766, 8.934814453125, 9.898555755615234, 10.862297058105469, 11.826038360595703, 12.789780616760254, 13.753521919250488, 14.717263221740723]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 14.0, 7.0, 11.0, 9.0, 16.0, 11.0, 16.0, 19.0, 20.0, 35.0, 33.0, 27.0, 25.0, 30.0, 29.0, 36.0, 59.0, 61.0, 56.0, 61.0, 44.0, 44.0, 36.0, 35.0, 20.0, 26.0, 17.0, 15.0, 27.0, 24.0, 18.0, 19.0, 13.0, 8.0, 15.0, 13.0, 8.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.562311172485352, -12.178360939025879, -11.794410705566406, -11.410460472106934, -11.026510238647461, -10.642560005187988, -10.258609771728516, -9.874659538269043, -9.49070930480957, -9.106759071350098, -8.722808837890625, -8.338858604431152, -7.95490837097168, -7.570958137512207, -7.187007904052734, -6.803057670593262, -6.419106960296631, -6.035156726837158, -5.6512064933776855, -5.267256259918213, -4.88330602645874, -4.499355792999268, -4.115405082702637, -3.731455087661743, -3.3475048542022705, -2.963554620742798, -2.579604387283325, -2.1956539154052734, -1.8117038011550903, -1.4277535676956177, -1.0438032150268555, -0.6598529815673828, -0.27590274810791016, 0.10804751515388489, 0.49199777841567993, 0.8759480714797974, 1.25989830493927, 1.6438485383987427, 2.027798891067505, 2.4117491245269775, 2.79569935798645, 3.179649591445923, 3.5635998249053955, 3.9475502967834473, 4.33150053024292, 4.715450763702393, 5.099400997161865, 5.483351230621338, 5.8673014640808105, 6.251251697540283, 6.635201930999756, 7.0191521644592285, 7.403102397918701, 7.787052631378174, 8.171003341674805, 8.554953575134277, 8.93890380859375, 9.322854042053223, 9.706804275512695, 10.090754508972168, 10.47470474243164, 10.858654975891113, 11.242605209350586, 11.626555442810059, 12.010505676269531]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 15.0, 14.0, 28.0, 41.0, 81.0, 153.0, 329.0, 851.0, 2652.0, 10321.0, 74766.0, 2342433.0, 1694089.0, 56230.0, 8657.0, 2180.0, 752.0, 295.0, 172.0, 83.0, 39.0, 32.0, 17.0, 11.0, 9.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.37109375, -2.29913330078125, -2.2271728515625, -2.15521240234375, -2.083251953125, -2.01129150390625, -1.9393310546875, -1.86737060546875, -1.79541015625, -1.72344970703125, -1.6514892578125, -1.57952880859375, -1.507568359375, -1.43560791015625, -1.3636474609375, -1.29168701171875, -1.2197265625, -1.14776611328125, -1.0758056640625, -1.00384521484375, -0.931884765625, -0.85992431640625, -0.7879638671875, -0.71600341796875, -0.64404296875, -0.57208251953125, -0.5001220703125, -0.42816162109375, -0.356201171875, -0.28424072265625, -0.2122802734375, -0.14031982421875, -0.068359375, 0.00360107421875, 0.0755615234375, 0.14752197265625, 0.219482421875, 0.29144287109375, 0.3634033203125, 0.43536376953125, 0.50732421875, 0.57928466796875, 0.6512451171875, 0.72320556640625, 0.795166015625, 0.86712646484375, 0.9390869140625, 1.01104736328125, 1.0830078125, 1.15496826171875, 1.2269287109375, 1.29888916015625, 1.370849609375, 1.44281005859375, 1.5147705078125, 1.58673095703125, 1.65869140625, 1.73065185546875, 1.8026123046875, 1.87457275390625, 1.946533203125, 2.01849365234375, 2.0904541015625, 2.16241455078125, 2.234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 6.0, 11.0, 7.0, 17.0, 22.0, 12.0, 22.0, 24.0, 23.0, 34.0, 24.0, 22.0, 44.0, 37.0, 43.0, 42.0, 50.0, 47.0, 45.0, 54.0, 46.0, 47.0, 44.0, 43.0, 34.0, 30.0, 26.0, 24.0, 23.0, 14.0, 18.0, 13.0, 3.0, 12.0, 8.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6340484619140625, -0.608428955078125, -0.5828094482421875, -0.55718994140625, -0.5315704345703125, -0.505950927734375, -0.4803314208984375, -0.4547119140625, -0.4290924072265625, -0.403472900390625, -0.3778533935546875, -0.35223388671875, -0.3266143798828125, -0.300994873046875, -0.2753753662109375, -0.249755859375, -0.2241363525390625, -0.198516845703125, -0.1728973388671875, -0.14727783203125, -0.1216583251953125, -0.096038818359375, -0.0704193115234375, -0.0447998046875, -0.0191802978515625, 0.006439208984375, 0.0320587158203125, 0.05767822265625, 0.0832977294921875, 0.108917236328125, 0.1345367431640625, 0.16015625, 0.1857757568359375, 0.211395263671875, 0.2370147705078125, 0.26263427734375, 0.2882537841796875, 0.313873291015625, 0.3394927978515625, 0.3651123046875, 0.3907318115234375, 0.416351318359375, 0.4419708251953125, 0.46759033203125, 0.4932098388671875, 0.518829345703125, 0.5444488525390625, 0.570068359375, 0.5956878662109375, 0.621307373046875, 0.6469268798828125, 0.67254638671875, 0.6981658935546875, 0.723785400390625, 0.7494049072265625, 0.7750244140625, 0.8006439208984375, 0.826263427734375, 0.8518829345703125, 0.87750244140625, 0.9031219482421875, 0.928741455078125, 0.9543609619140625, 0.97998046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 6.0, 7.0, 8.0, 12.0, 15.0, 17.0, 37.0, 41.0, 83.0, 113.0, 159.0, 264.0, 481.0, 866.0, 1867.0, 4564.0, 13227.0, 47800.0, 304618.0, 3287082.0, 446566.0, 60656.0, 15962.0, 5310.0, 2187.0, 978.0, 483.0, 280.0, 163.0, 106.0, 76.0, 58.0, 42.0, 43.0, 22.0, 27.0, 16.0, 13.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8056640625, -1.7465972900390625, -1.687530517578125, -1.6284637451171875, -1.56939697265625, -1.5103302001953125, -1.451263427734375, -1.3921966552734375, -1.3331298828125, -1.2740631103515625, -1.214996337890625, -1.1559295654296875, -1.09686279296875, -1.0377960205078125, -0.978729248046875, -0.9196624755859375, -0.860595703125, -0.8015289306640625, -0.742462158203125, -0.6833953857421875, -0.62432861328125, -0.5652618408203125, -0.506195068359375, -0.4471282958984375, -0.3880615234375, -0.3289947509765625, -0.269927978515625, -0.2108612060546875, -0.15179443359375, -0.0927276611328125, -0.033660888671875, 0.0254058837890625, 0.08447265625, 0.1435394287109375, 0.202606201171875, 0.2616729736328125, 0.32073974609375, 0.3798065185546875, 0.438873291015625, 0.4979400634765625, 0.5570068359375, 0.6160736083984375, 0.675140380859375, 0.7342071533203125, 0.79327392578125, 0.8523406982421875, 0.911407470703125, 0.9704742431640625, 1.029541015625, 1.0886077880859375, 1.147674560546875, 1.2067413330078125, 1.26580810546875, 1.3248748779296875, 1.383941650390625, 1.4430084228515625, 1.5020751953125, 1.5611419677734375, 1.620208740234375, 1.6792755126953125, 1.73834228515625, 1.7974090576171875, 1.856475830078125, 1.9155426025390625, 1.974609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 6.0, 7.0, 8.0, 16.0, 13.0, 9.0, 21.0, 33.0, 29.0, 48.0, 77.0, 76.0, 140.0, 225.0, 357.0, 570.0, 686.0, 568.0, 371.0, 249.0, 146.0, 102.0, 78.0, 40.0, 31.0, 37.0, 23.0, 23.0, 14.0, 14.0, 10.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.9130859375, -1.8578033447265625, -1.802520751953125, -1.7472381591796875, -1.69195556640625, -1.6366729736328125, -1.581390380859375, -1.5261077880859375, -1.4708251953125, -1.4155426025390625, -1.360260009765625, -1.3049774169921875, -1.24969482421875, -1.1944122314453125, -1.139129638671875, -1.0838470458984375, -1.028564453125, -0.9732818603515625, -0.917999267578125, -0.8627166748046875, -0.80743408203125, -0.7521514892578125, -0.696868896484375, -0.6415863037109375, -0.5863037109375, -0.5310211181640625, -0.475738525390625, -0.4204559326171875, -0.36517333984375, -0.3098907470703125, -0.254608154296875, -0.1993255615234375, -0.14404296875, -0.0887603759765625, -0.033477783203125, 0.0218048095703125, 0.07708740234375, 0.1323699951171875, 0.187652587890625, 0.2429351806640625, 0.2982177734375, 0.3535003662109375, 0.408782958984375, 0.4640655517578125, 0.51934814453125, 0.5746307373046875, 0.629913330078125, 0.6851959228515625, 0.740478515625, 0.7957611083984375, 0.851043701171875, 0.9063262939453125, 0.96160888671875, 1.0168914794921875, 1.072174072265625, 1.1274566650390625, 1.1827392578125, 1.2380218505859375, 1.293304443359375, 1.3485870361328125, 1.40386962890625, 1.4591522216796875, 1.514434814453125, 1.5697174072265625, 1.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 12.0, 40.0, 95.0, 236.0, 318.0, 186.0, 64.0, 25.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.70520782470703, -16.62074089050293, -15.536274909973145, -14.45180892944336, -13.367341995239258, -12.282876014709473, -11.198410034179688, -10.113943099975586, -9.0294771194458, -7.945010662078857, -6.860544204711914, -5.776078224182129, -4.6916117668151855, -3.607145309448242, -2.522679328918457, -1.4382128715515137, -0.3537464141845703, 0.7307199239730835, 1.8151862621307373, 2.8996524810791016, 3.984118938446045, 5.068585395812988, 6.153051376342773, 7.237517833709717, 8.32198429107666, 9.406450271606445, 10.490917205810547, 11.575383186340332, 12.659849166870117, 13.744316101074219, 14.828782081604004, 15.913248062133789, 16.99771499633789, 18.082181930541992, 19.16664695739746, 20.251113891601562, 21.335580825805664, 22.420047760009766, 23.504512786865234, 24.588979721069336, 25.673446655273438, 26.75791358947754, 27.842378616333008, 28.92684555053711, 30.01131248474121, 31.095779418945312, 32.18024444580078, 33.26470947265625, 34.34917449951172, 35.43363952636719, 36.51810836791992, 37.60257339477539, 38.68703842163086, 39.771507263183594, 40.85597229003906, 41.94043731689453, 43.024906158447266, 44.109371185302734, 45.19384002685547, 46.27830505371094, 47.362770080566406, 48.44723892211914, 49.53170394897461, 50.61616897583008, 51.70063781738281]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 12.0, 12.0, 9.0, 5.0, 11.0, 18.0, 20.0, 20.0, 28.0, 32.0, 33.0, 45.0, 40.0, 44.0, 37.0, 51.0, 65.0, 63.0, 47.0, 50.0, 46.0, 50.0, 36.0, 40.0, 27.0, 37.0, 24.0, 15.0, 12.0, 12.0, 13.0, 15.0, 14.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.922636032104492, -11.611213684082031, -11.299790382385254, -10.988368034362793, -10.676944732666016, -10.365522384643555, -10.054099082946777, -9.742676734924316, -9.431253433227539, -9.119831085205078, -8.8084077835083, -8.49698543548584, -8.185562133789062, -7.874139785766602, -7.562716960906982, -7.251294136047363, -6.939871788024902, -6.628448963165283, -6.317026138305664, -6.005603313446045, -5.694180488586426, -5.382758140563965, -5.071335315704346, -4.759912490844727, -4.448489665985107, -4.137066841125488, -3.825644016265869, -3.514221429824829, -3.20279860496521, -2.891375780105591, -2.579953193664551, -2.2685303688049316, -1.9571075439453125, -1.6456847190856934, -1.3342620134353638, -1.0228393077850342, -0.711416482925415, -0.3999936580657959, -0.08857095241546631, 0.22285175323486328, 0.5342745780944824, 0.8456973433494568, 1.1571201086044312, 1.4685428142547607, 1.7799656391143799, 2.091388463973999, 2.402811050415039, 2.714233875274658, 3.0256567001342773, 3.3370795249938965, 3.6485023498535156, 3.9599249362945557, 4.271347999572754, 4.582770347595215, 4.894193172454834, 5.205615997314453, 5.517038822174072, 5.828461647033691, 6.1398844718933105, 6.45130729675293, 6.762729644775391, 7.074152946472168, 7.385575294494629, 7.696998119354248, 8.008420944213867]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 12.0, 30.0, 26.0, 46.0, 81.0, 150.0, 190.0, 330.0, 497.0, 997.0, 1807.0, 3472.0, 7143.0, 15250.0, 34097.0, 80273.0, 192433.0, 333833.0, 216301.0, 90162.0, 38189.0, 17015.0, 7787.0, 3809.0, 1974.0, 1061.0, 599.0, 356.0, 203.0, 148.0, 85.0, 55.0, 28.0, 35.0, 23.0, 14.0, 9.0, 2.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.3495941162109375, -1.298797607421875, -1.2480010986328125, -1.19720458984375, -1.1464080810546875, -1.095611572265625, -1.0448150634765625, -0.9940185546875, -0.9432220458984375, -0.892425537109375, -0.8416290283203125, -0.79083251953125, -0.7400360107421875, -0.689239501953125, -0.6384429931640625, -0.587646484375, -0.5368499755859375, -0.486053466796875, -0.4352569580078125, -0.38446044921875, -0.3336639404296875, -0.282867431640625, -0.2320709228515625, -0.1812744140625, -0.1304779052734375, -0.079681396484375, -0.0288848876953125, 0.02191162109375, 0.0727081298828125, 0.123504638671875, 0.1743011474609375, 0.22509765625, 0.2758941650390625, 0.326690673828125, 0.3774871826171875, 0.42828369140625, 0.4790802001953125, 0.529876708984375, 0.5806732177734375, 0.6314697265625, 0.6822662353515625, 0.733062744140625, 0.7838592529296875, 0.83465576171875, 0.8854522705078125, 0.936248779296875, 0.9870452880859375, 1.037841796875, 1.0886383056640625, 1.139434814453125, 1.1902313232421875, 1.24102783203125, 1.2918243408203125, 1.342620849609375, 1.3934173583984375, 1.4442138671875, 1.4950103759765625, 1.545806884765625, 1.5966033935546875, 1.64739990234375, 1.6981964111328125, 1.748992919921875, 1.7997894287109375, 1.8505859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 0.0, 7.0, 5.0, 6.0, 13.0, 8.0, 14.0, 12.0, 10.0, 21.0, 18.0, 21.0, 22.0, 27.0, 25.0, 27.0, 36.0, 36.0, 43.0, 36.0, 26.0, 43.0, 35.0, 38.0, 46.0, 41.0, 56.0, 33.0, 36.0, 27.0, 22.0, 22.0, 28.0, 27.0, 31.0, 15.0, 17.0, 11.0, 8.0, 10.0, 11.0, 3.0, 4.0, 5.0, 4.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.6923828125, -0.6698760986328125, -0.647369384765625, -0.6248626708984375, -0.60235595703125, -0.5798492431640625, -0.557342529296875, -0.5348358154296875, -0.5123291015625, -0.4898223876953125, -0.467315673828125, -0.4448089599609375, -0.42230224609375, -0.3997955322265625, -0.377288818359375, -0.3547821044921875, -0.332275390625, -0.3097686767578125, -0.287261962890625, -0.2647552490234375, -0.24224853515625, -0.2197418212890625, -0.197235107421875, -0.1747283935546875, -0.1522216796875, -0.1297149658203125, -0.107208251953125, -0.0847015380859375, -0.06219482421875, -0.0396881103515625, -0.017181396484375, 0.0053253173828125, 0.02783203125, 0.0503387451171875, 0.072845458984375, 0.0953521728515625, 0.11785888671875, 0.1403656005859375, 0.162872314453125, 0.1853790283203125, 0.2078857421875, 0.2303924560546875, 0.252899169921875, 0.2754058837890625, 0.29791259765625, 0.3204193115234375, 0.342926025390625, 0.3654327392578125, 0.387939453125, 0.4104461669921875, 0.432952880859375, 0.4554595947265625, 0.47796630859375, 0.5004730224609375, 0.522979736328125, 0.5454864501953125, 0.5679931640625, 0.5904998779296875, 0.613006591796875, 0.6355133056640625, 0.65802001953125, 0.6805267333984375, 0.703033447265625, 0.7255401611328125, 0.748046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 22.0, 24.0, 37.0, 58.0, 79.0, 108.0, 151.0, 251.0, 412.0, 661.0, 1196.0, 2426.0, 6943.0, 32041.0, 217883.0, 668347.0, 93325.0, 15976.0, 4368.0, 1755.0, 928.0, 529.0, 331.0, 223.0, 134.0, 94.0, 86.0, 44.0, 31.0, 20.0, 10.0, 9.0, 12.0, 10.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.157806396484375, -3.04998779296875, -2.942169189453125, -2.8343505859375, -2.726531982421875, -2.61871337890625, -2.510894775390625, -2.403076171875, -2.295257568359375, -2.18743896484375, -2.079620361328125, -1.9718017578125, -1.863983154296875, -1.75616455078125, -1.648345947265625, -1.54052734375, -1.432708740234375, -1.32489013671875, -1.217071533203125, -1.1092529296875, -1.001434326171875, -0.89361572265625, -0.785797119140625, -0.677978515625, -0.570159912109375, -0.46234130859375, -0.354522705078125, -0.2467041015625, -0.138885498046875, -0.03106689453125, 0.076751708984375, 0.1845703125, 0.292388916015625, 0.40020751953125, 0.508026123046875, 0.6158447265625, 0.723663330078125, 0.83148193359375, 0.939300537109375, 1.047119140625, 1.154937744140625, 1.26275634765625, 1.370574951171875, 1.4783935546875, 1.586212158203125, 1.69403076171875, 1.801849365234375, 1.90966796875, 2.017486572265625, 2.12530517578125, 2.233123779296875, 2.3409423828125, 2.448760986328125, 2.55657958984375, 2.664398193359375, 2.772216796875, 2.880035400390625, 2.98785400390625, 3.095672607421875, 3.2034912109375, 3.311309814453125, 3.41912841796875, 3.526947021484375, 3.634765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 6.0, 17.0, 12.0, 14.0, 24.0, 30.0, 36.0, 34.0, 41.0, 42.0, 57.0, 60.0, 55.0, 69.0, 56.0, 57.0, 54.0, 40.0, 47.0, 44.0, 34.0, 33.0, 23.0, 24.0, 25.0, 18.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.3321533203125, -4.207275390625, -4.0823974609375, -3.95751953125, -3.8326416015625, -3.707763671875, -3.5828857421875, -3.4580078125, -3.3331298828125, -3.208251953125, -3.0833740234375, -2.95849609375, -2.8336181640625, -2.708740234375, -2.5838623046875, -2.458984375, -2.3341064453125, -2.209228515625, -2.0843505859375, -1.95947265625, -1.8345947265625, -1.709716796875, -1.5848388671875, -1.4599609375, -1.3350830078125, -1.210205078125, -1.0853271484375, -0.96044921875, -0.8355712890625, -0.710693359375, -0.5858154296875, -0.4609375, -0.3360595703125, -0.211181640625, -0.0863037109375, 0.03857421875, 0.1634521484375, 0.288330078125, 0.4132080078125, 0.5380859375, 0.6629638671875, 0.787841796875, 0.9127197265625, 1.03759765625, 1.1624755859375, 1.287353515625, 1.4122314453125, 1.537109375, 1.6619873046875, 1.786865234375, 1.9117431640625, 2.03662109375, 2.1614990234375, 2.286376953125, 2.4112548828125, 2.5361328125, 2.6610107421875, 2.785888671875, 2.9107666015625, 3.03564453125, 3.1605224609375, 3.285400390625, 3.4102783203125, 3.53515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 10.0, 8.0, 18.0, 16.0, 26.0, 52.0, 74.0, 108.0, 197.0, 399.0, 812.0, 2015.0, 6748.0, 36921.0, 304424.0, 619747.0, 62173.0, 10102.0, 2632.0, 1036.0, 413.0, 255.0, 129.0, 70.0, 44.0, 40.0, 26.0, 11.0, 17.0, 3.0, 6.0, 4.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.2177734375, -1.1881637573242188, -1.1585540771484375, -1.1289443969726562, -1.099334716796875, -1.0697250366210938, -1.0401153564453125, -1.0105056762695312, -0.98089599609375, -0.9512863159179688, -0.9216766357421875, -0.8920669555664062, -0.862457275390625, -0.8328475952148438, -0.8032379150390625, -0.7736282348632812, -0.7440185546875, -0.7144088745117188, -0.6847991943359375, -0.6551895141601562, -0.625579833984375, -0.5959701538085938, -0.5663604736328125, -0.5367507934570312, -0.50714111328125, -0.47753143310546875, -0.4479217529296875, -0.41831207275390625, -0.388702392578125, -0.35909271240234375, -0.3294830322265625, -0.29987335205078125, -0.270263671875, -0.24065399169921875, -0.2110443115234375, -0.18143463134765625, -0.151824951171875, -0.12221527099609375, -0.0926055908203125, -0.06299591064453125, -0.03338623046875, -0.00377655029296875, 0.0258331298828125, 0.05544281005859375, 0.085052490234375, 0.11466217041015625, 0.1442718505859375, 0.17388153076171875, 0.2034912109375, 0.23310089111328125, 0.2627105712890625, 0.29232025146484375, 0.321929931640625, 0.35153961181640625, 0.3811492919921875, 0.41075897216796875, 0.44036865234375, 0.46997833251953125, 0.4995880126953125, 0.5291976928710938, 0.558807373046875, 0.5884170532226562, 0.6180267333984375, 0.6476364135742188, 0.67724609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 9.0, 25.0, 40.0, 46.0, 61.0, 79.0, 89.0, 120.0, 111.0, 109.0, 71.0, 51.0, 35.0, 27.0, 19.0, 13.0, 14.0, 14.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003390312194824219, -0.00033006444573402405, -0.0003210976719856262, -0.0003121308982372284, -0.00030316412448883057, -0.00029419735074043274, -0.0002852305769920349, -0.0002762638032436371, -0.00026729702949523926, -0.00025833025574684143, -0.0002493634819984436, -0.00024039670825004578, -0.00023142993450164795, -0.00022246316075325012, -0.0002134963870048523, -0.00020452961325645447, -0.00019556283950805664, -0.0001865960657596588, -0.00017762929201126099, -0.00016866251826286316, -0.00015969574451446533, -0.0001507289707660675, -0.00014176219701766968, -0.00013279542326927185, -0.00012382864952087402, -0.0001148618757724762, -0.00010589510202407837, -9.692832827568054e-05, -8.796155452728271e-05, -7.899478077888489e-05, -7.002800703048706e-05, -6.106123328208923e-05, -5.2094459533691406e-05, -4.312768578529358e-05, -3.416091203689575e-05, -2.5194138288497925e-05, -1.6227364540100098e-05, -7.2605907917022705e-06, 1.7061829566955566e-06, 1.0672956705093384e-05, 1.963973045349121e-05, 2.8606504201889038e-05, 3.7573277950286865e-05, 4.654005169868469e-05, 5.550682544708252e-05, 6.447359919548035e-05, 7.344037294387817e-05, 8.2407146692276e-05, 9.137392044067383e-05, 0.00010034069418907166, 0.00010930746793746948, 0.00011827424168586731, 0.00012724101543426514, 0.00013620778918266296, 0.0001451745629310608, 0.00015414133667945862, 0.00016310811042785645, 0.00017207488417625427, 0.0001810416579246521, 0.00019000843167304993, 0.00019897520542144775, 0.00020794197916984558, 0.0002169087529182434, 0.00022587552666664124, 0.00023484230041503906]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 9.0, 13.0, 31.0, 34.0, 41.0, 60.0, 100.0, 128.0, 198.0, 326.0, 556.0, 1105.0, 2069.0, 5036.0, 15565.0, 75298.0, 547263.0, 322525.0, 57049.0, 12753.0, 4214.0, 1897.0, 930.0, 489.0, 311.0, 170.0, 103.0, 95.0, 55.0, 30.0, 21.0, 9.0, 10.0, 15.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.7587890625, -0.735015869140625, -0.71124267578125, -0.687469482421875, -0.6636962890625, -0.639923095703125, -0.61614990234375, -0.592376708984375, -0.568603515625, -0.544830322265625, -0.52105712890625, -0.497283935546875, -0.4735107421875, -0.449737548828125, -0.42596435546875, -0.402191162109375, -0.37841796875, -0.354644775390625, -0.33087158203125, -0.307098388671875, -0.2833251953125, -0.259552001953125, -0.23577880859375, -0.212005615234375, -0.188232421875, -0.164459228515625, -0.14068603515625, -0.116912841796875, -0.0931396484375, -0.069366455078125, -0.04559326171875, -0.021820068359375, 0.001953125, 0.025726318359375, 0.04949951171875, 0.073272705078125, 0.0970458984375, 0.120819091796875, 0.14459228515625, 0.168365478515625, 0.192138671875, 0.215911865234375, 0.23968505859375, 0.263458251953125, 0.2872314453125, 0.311004638671875, 0.33477783203125, 0.358551025390625, 0.38232421875, 0.406097412109375, 0.42987060546875, 0.453643798828125, 0.4774169921875, 0.501190185546875, 0.52496337890625, 0.548736572265625, 0.572509765625, 0.596282958984375, 0.62005615234375, 0.643829345703125, 0.6676025390625, 0.691375732421875, 0.71514892578125, 0.738922119140625, 0.7626953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 7.0, 14.0, 15.0, 19.0, 20.0, 29.0, 30.0, 27.0, 39.0, 46.0, 44.0, 45.0, 51.0, 60.0, 63.0, 71.0, 59.0, 51.0, 62.0, 37.0, 27.0, 28.0, 17.0, 18.0, 17.0, 20.0, 15.0, 18.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5965042114257812, -0.5753326416015625, -0.5541610717773438, -0.532989501953125, -0.5118179321289062, -0.4906463623046875, -0.46947479248046875, -0.44830322265625, -0.42713165283203125, -0.4059600830078125, -0.38478851318359375, -0.363616943359375, -0.34244537353515625, -0.3212738037109375, -0.30010223388671875, -0.2789306640625, -0.25775909423828125, -0.2365875244140625, -0.21541595458984375, -0.194244384765625, -0.17307281494140625, -0.1519012451171875, -0.13072967529296875, -0.10955810546875, -0.08838653564453125, -0.0672149658203125, -0.04604339599609375, -0.024871826171875, -0.00370025634765625, 0.0174713134765625, 0.03864288330078125, 0.059814453125, 0.08098602294921875, 0.1021575927734375, 0.12332916259765625, 0.144500732421875, 0.16567230224609375, 0.1868438720703125, 0.20801544189453125, 0.22918701171875, 0.25035858154296875, 0.2715301513671875, 0.29270172119140625, 0.313873291015625, 0.33504486083984375, 0.3562164306640625, 0.37738800048828125, 0.3985595703125, 0.41973114013671875, 0.4409027099609375, 0.46207427978515625, 0.483245849609375, 0.5044174194335938, 0.5255889892578125, 0.5467605590820312, 0.56793212890625, 0.5891036987304688, 0.6102752685546875, 0.6314468383789062, 0.652618408203125, 0.6737899780273438, 0.6949615478515625, 0.7161331176757812, 0.7373046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 11.0, 18.0, 24.0, 58.0, 106.0, 185.0, 282.0, 162.0, 79.0, 38.0, 13.0, 7.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.03028869628906, -41.14311218261719, -40.25593948364258, -39.36876678466797, -38.481590270996094, -37.59441375732422, -36.70724105834961, -35.820068359375, -34.932891845703125, -34.04571533203125, -33.15854263305664, -32.27136993408203, -31.384193420410156, -30.497018814086914, -29.609844207763672, -28.72266960144043, -27.835494995117188, -26.948320388793945, -26.061145782470703, -25.17397117614746, -24.28679656982422, -23.399621963500977, -22.512447357177734, -21.625272750854492, -20.73809814453125, -19.850923538208008, -18.963748931884766, -18.076574325561523, -17.18939971923828, -16.30222511291504, -15.415050506591797, -14.527875900268555, -13.64069938659668, -12.753524780273438, -11.866350173950195, -10.979175567626953, -10.092000961303711, -9.204826354980469, -8.317651748657227, -7.430477142333984, -6.543302536010742, -5.6561279296875, -4.768953323364258, -3.8817787170410156, -2.9946041107177734, -2.1074295043945312, -1.220254898071289, -0.3330802917480469, 0.5540943145751953, 1.4412689208984375, 2.3284435272216797, 3.215618133544922, 4.102792739868164, 4.989967346191406, 5.877141952514648, 6.764316558837891, 7.651491165161133, 8.538665771484375, 9.425840377807617, 10.31301498413086, 11.200189590454102, 12.087364196777344, 12.974538803100586, 13.861713409423828, 14.74888801574707]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 3.0, 9.0, 7.0, 12.0, 13.0, 12.0, 13.0, 23.0, 19.0, 20.0, 28.0, 27.0, 23.0, 29.0, 32.0, 47.0, 47.0, 62.0, 61.0, 66.0, 46.0, 45.0, 34.0, 39.0, 38.0, 25.0, 35.0, 15.0, 26.0, 21.0, 13.0, 12.0, 15.0, 10.0, 12.0, 7.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.115571975708008, -11.708925247192383, -11.302278518676758, -10.895631790161133, -10.488985061645508, -10.082338333129883, -9.675691604614258, -9.269044876098633, -8.862398147583008, -8.455751419067383, -8.049104690551758, -7.642457962036133, -7.235811233520508, -6.829164505004883, -6.422517776489258, -6.015871047973633, -5.609224319458008, -5.202577590942383, -4.795930862426758, -4.389284133911133, -3.982637405395508, -3.575990676879883, -3.169343948364258, -2.762697219848633, -2.356050491333008, -1.9494037628173828, -1.5427570343017578, -1.1361103057861328, -0.7294635772705078, -0.3228168487548828, 0.08382987976074219, 0.4904766082763672, 0.8971233367919922, 1.3037700653076172, 1.7104167938232422, 2.117063522338867, 2.523710250854492, 2.930356979370117, 3.337003707885742, 3.743650436401367, 4.150297164916992, 4.556943893432617, 4.963590621948242, 5.370237350463867, 5.776884078979492, 6.183530807495117, 6.590177536010742, 6.996824264526367, 7.403470993041992, 7.810117721557617, 8.216764450073242, 8.623411178588867, 9.030057907104492, 9.436704635620117, 9.843351364135742, 10.249998092651367, 10.656644821166992, 11.063291549682617, 11.469938278198242, 11.876585006713867, 12.283231735229492, 12.689878463745117, 13.096525192260742, 13.503171920776367, 13.909818649291992]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 9.0, 24.0, 21.0, 42.0, 66.0, 110.0, 205.0, 351.0, 832.0, 2163.0, 7041.0, 34913.0, 492003.0, 3325531.0, 295979.0, 25935.0, 5634.0, 1807.0, 753.0, 360.0, 173.0, 105.0, 69.0, 49.0, 27.0, 22.0, 13.0, 12.0, 3.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.880859375, -1.822845458984375, -1.76483154296875, -1.706817626953125, -1.6488037109375, -1.590789794921875, -1.53277587890625, -1.474761962890625, -1.416748046875, -1.358734130859375, -1.30072021484375, -1.242706298828125, -1.1846923828125, -1.126678466796875, -1.06866455078125, -1.010650634765625, -0.95263671875, -0.894622802734375, -0.83660888671875, -0.778594970703125, -0.7205810546875, -0.662567138671875, -0.60455322265625, -0.546539306640625, -0.488525390625, -0.430511474609375, -0.37249755859375, -0.314483642578125, -0.2564697265625, -0.198455810546875, -0.14044189453125, -0.082427978515625, -0.0244140625, 0.033599853515625, 0.09161376953125, 0.149627685546875, 0.2076416015625, 0.265655517578125, 0.32366943359375, 0.381683349609375, 0.439697265625, 0.497711181640625, 0.55572509765625, 0.613739013671875, 0.6717529296875, 0.729766845703125, 0.78778076171875, 0.845794677734375, 0.90380859375, 0.961822509765625, 1.01983642578125, 1.077850341796875, 1.1358642578125, 1.193878173828125, 1.25189208984375, 1.309906005859375, 1.367919921875, 1.425933837890625, 1.48394775390625, 1.541961669921875, 1.5999755859375, 1.657989501953125, 1.71600341796875, 1.774017333984375, 1.83203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 13.0, 11.0, 11.0, 12.0, 18.0, 27.0, 20.0, 26.0, 31.0, 27.0, 27.0, 28.0, 39.0, 49.0, 40.0, 41.0, 50.0, 59.0, 45.0, 47.0, 38.0, 30.0, 42.0, 53.0, 28.0, 34.0, 24.0, 30.0, 18.0, 19.0, 10.0, 11.0, 10.0, 8.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7461166381835938, -0.7212371826171875, -0.6963577270507812, -0.671478271484375, -0.6465988159179688, -0.6217193603515625, -0.5968399047851562, -0.57196044921875, -0.5470809936523438, -0.5222015380859375, -0.49732208251953125, -0.472442626953125, -0.44756317138671875, -0.4226837158203125, -0.39780426025390625, -0.3729248046875, -0.34804534912109375, -0.3231658935546875, -0.29828643798828125, -0.273406982421875, -0.24852752685546875, -0.2236480712890625, -0.19876861572265625, -0.17388916015625, -0.14900970458984375, -0.1241302490234375, -0.09925079345703125, -0.074371337890625, -0.04949188232421875, -0.0246124267578125, 0.00026702880859375, 0.025146484375, 0.05002593994140625, 0.0749053955078125, 0.09978485107421875, 0.124664306640625, 0.14954376220703125, 0.1744232177734375, 0.19930267333984375, 0.22418212890625, 0.24906158447265625, 0.2739410400390625, 0.29882049560546875, 0.323699951171875, 0.34857940673828125, 0.3734588623046875, 0.39833831787109375, 0.4232177734375, 0.44809722900390625, 0.4729766845703125, 0.49785614013671875, 0.522735595703125, 0.5476150512695312, 0.5724945068359375, 0.5973739624023438, 0.62225341796875, 0.6471328735351562, 0.6720123291015625, 0.6968917846679688, 0.721771240234375, 0.7466506958007812, 0.7715301513671875, 0.7964096069335938, 0.8212890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 14.0, 8.0, 12.0, 24.0, 30.0, 58.0, 95.0, 105.0, 237.0, 553.0, 1477.0, 5696.0, 36087.0, 884042.0, 3180725.0, 71869.0, 9300.0, 2213.0, 824.0, 352.0, 206.0, 118.0, 84.0, 46.0, 27.0, 22.0, 22.0, 5.0, 10.0, 7.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.13671875, -3.0474853515625, -2.958251953125, -2.8690185546875, -2.77978515625, -2.6905517578125, -2.601318359375, -2.5120849609375, -2.4228515625, -2.3336181640625, -2.244384765625, -2.1551513671875, -2.06591796875, -1.9766845703125, -1.887451171875, -1.7982177734375, -1.708984375, -1.6197509765625, -1.530517578125, -1.4412841796875, -1.35205078125, -1.2628173828125, -1.173583984375, -1.0843505859375, -0.9951171875, -0.9058837890625, -0.816650390625, -0.7274169921875, -0.63818359375, -0.5489501953125, -0.459716796875, -0.3704833984375, -0.28125, -0.1920166015625, -0.102783203125, -0.0135498046875, 0.07568359375, 0.1649169921875, 0.254150390625, 0.3433837890625, 0.4326171875, 0.5218505859375, 0.611083984375, 0.7003173828125, 0.78955078125, 0.8787841796875, 0.968017578125, 1.0572509765625, 1.146484375, 1.2357177734375, 1.324951171875, 1.4141845703125, 1.50341796875, 1.5926513671875, 1.681884765625, 1.7711181640625, 1.8603515625, 1.9495849609375, 2.038818359375, 2.1280517578125, 2.21728515625, 2.3065185546875, 2.395751953125, 2.4849853515625, 2.57421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 11.0, 10.0, 11.0, 21.0, 26.0, 22.0, 34.0, 45.0, 98.0, 128.0, 185.0, 377.0, 627.0, 751.0, 660.0, 422.0, 226.0, 138.0, 79.0, 51.0, 35.0, 33.0, 24.0, 15.0, 11.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.571380615234375, -1.50994873046875, -1.448516845703125, -1.3870849609375, -1.325653076171875, -1.26422119140625, -1.202789306640625, -1.141357421875, -1.079925537109375, -1.01849365234375, -0.957061767578125, -0.8956298828125, -0.834197998046875, -0.77276611328125, -0.711334228515625, -0.64990234375, -0.588470458984375, -0.52703857421875, -0.465606689453125, -0.4041748046875, -0.342742919921875, -0.28131103515625, -0.219879150390625, -0.158447265625, -0.097015380859375, -0.03558349609375, 0.025848388671875, 0.0872802734375, 0.148712158203125, 0.21014404296875, 0.271575927734375, 0.3330078125, 0.394439697265625, 0.45587158203125, 0.517303466796875, 0.5787353515625, 0.640167236328125, 0.70159912109375, 0.763031005859375, 0.824462890625, 0.885894775390625, 0.94732666015625, 1.008758544921875, 1.0701904296875, 1.131622314453125, 1.19305419921875, 1.254486083984375, 1.31591796875, 1.377349853515625, 1.43878173828125, 1.500213623046875, 1.5616455078125, 1.623077392578125, 1.68450927734375, 1.745941162109375, 1.807373046875, 1.868804931640625, 1.93023681640625, 1.991668701171875, 2.0531005859375, 2.114532470703125, 2.17596435546875, 2.237396240234375, 2.298828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 10.0, 10.0, 24.0, 66.0, 125.0, 213.0, 239.0, 154.0, 75.0, 34.0, 11.0, 12.0, 10.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.545472145080566, -12.797033309936523, -12.048593521118164, -11.300153732299805, -10.551714897155762, -9.803276062011719, -9.05483627319336, -8.306396484375, -7.557957649230957, -6.809518337249756, -6.061079025268555, -5.3126397132873535, -4.564200401306152, -3.815761089324951, -3.06732177734375, -2.318882465362549, -1.5704431533813477, -0.8220038414001465, -0.07356452941894531, 0.6748747825622559, 1.423314094543457, 2.171753406524658, 2.9201927185058594, 3.6686320304870605, 4.417071342468262, 5.165510654449463, 5.913949966430664, 6.662389278411865, 7.410828590393066, 8.15926742553711, 8.907707214355469, 9.656147003173828, 10.404586791992188, 11.153026580810547, 11.90146541595459, 12.649904251098633, 13.398344039916992, 14.146783828735352, 14.895222663879395, 15.643661499023438, 16.392101287841797, 17.140541076660156, 17.888980865478516, 18.637418746948242, 19.3858585357666, 20.13429832458496, 20.882736206054688, 21.631175994873047, 22.379615783691406, 23.128055572509766, 23.876495361328125, 24.62493324279785, 25.37337303161621, 26.12181282043457, 26.870250701904297, 27.618690490722656, 28.367130279541016, 29.115570068359375, 29.864009857177734, 30.61244773864746, 31.36088752746582, 32.10932540893555, 32.857765197753906, 33.606204986572266, 34.354644775390625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 6.0, 9.0, 13.0, 23.0, 21.0, 20.0, 28.0, 34.0, 37.0, 40.0, 47.0, 55.0, 52.0, 51.0, 49.0, 50.0, 53.0, 51.0, 43.0, 46.0, 35.0, 29.0, 46.0, 24.0, 27.0, 16.0, 13.0, 19.0, 17.0, 7.0, 10.0, 6.0, 8.0, 5.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258282661437988, -5.999912261962891, -5.741541862487793, -5.483171463012695, -5.224801063537598, -4.9664306640625, -4.7080607414245605, -4.449690341949463, -4.191319942474365, -3.9329495429992676, -3.67457914352417, -3.4162089824676514, -3.1578385829925537, -2.899468183517456, -2.6410980224609375, -2.38272762298584, -2.124357223510742, -1.8659868240356445, -1.6076165437698364, -1.3492462635040283, -1.0908758640289307, -0.832505464553833, -0.5741351842880249, -0.3157649040222168, -0.05739450454711914, 0.20097583532333374, 0.4593461751937866, 0.7177165150642395, 0.9760868549346924, 1.23445725440979, 1.4928275346755981, 1.7511978149414062, 2.0095672607421875, 2.267937660217285, 2.526308059692383, 2.7846782207489014, 3.043048620223999, 3.3014190196990967, 3.5597891807556152, 3.818159580230713, 4.0765299797058105, 4.334900379180908, 4.593270778656006, 4.8516411781311035, 5.110011100769043, 5.368381500244141, 5.626751899719238, 5.885122299194336, 6.143492698669434, 6.401863098144531, 6.660233497619629, 6.918603897094727, 7.176974296569824, 7.435344696044922, 7.693714618682861, 7.952085018157959, 8.210454940795898, 8.468825340270996, 8.727195739746094, 8.985566139221191, 9.243936538696289, 9.502306938171387, 9.760677337646484, 10.019046783447266, 10.27741813659668]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 7.0, 6.0, 10.0, 6.0, 8.0, 27.0, 24.0, 33.0, 62.0, 88.0, 128.0, 192.0, 347.0, 569.0, 956.0, 1644.0, 3022.0, 5800.0, 11887.0, 26329.0, 59870.0, 136719.0, 255048.0, 268942.0, 152363.0, 67537.0, 29392.0, 13451.0, 6427.0, 3288.0, 1856.0, 956.0, 583.0, 343.0, 211.0, 131.0, 86.0, 56.0, 34.0, 34.0, 29.0, 18.0, 9.0, 7.0, 3.0, 6.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3251953125, -1.28387451171875, -1.2425537109375, -1.20123291015625, -1.159912109375, -1.11859130859375, -1.0772705078125, -1.03594970703125, -0.99462890625, -0.95330810546875, -0.9119873046875, -0.87066650390625, -0.829345703125, -0.78802490234375, -0.7467041015625, -0.70538330078125, -0.6640625, -0.62274169921875, -0.5814208984375, -0.54010009765625, -0.498779296875, -0.45745849609375, -0.4161376953125, -0.37481689453125, -0.33349609375, -0.29217529296875, -0.2508544921875, -0.20953369140625, -0.168212890625, -0.12689208984375, -0.0855712890625, -0.04425048828125, -0.0029296875, 0.03839111328125, 0.0797119140625, 0.12103271484375, 0.162353515625, 0.20367431640625, 0.2449951171875, 0.28631591796875, 0.32763671875, 0.36895751953125, 0.4102783203125, 0.45159912109375, 0.492919921875, 0.53424072265625, 0.5755615234375, 0.61688232421875, 0.658203125, 0.69952392578125, 0.7408447265625, 0.78216552734375, 0.823486328125, 0.86480712890625, 0.9061279296875, 0.94744873046875, 0.98876953125, 1.03009033203125, 1.0714111328125, 1.11273193359375, 1.154052734375, 1.19537353515625, 1.2366943359375, 1.27801513671875, 1.3193359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 14.0, 9.0, 15.0, 17.0, 21.0, 19.0, 26.0, 37.0, 23.0, 34.0, 29.0, 30.0, 41.0, 44.0, 45.0, 53.0, 36.0, 45.0, 52.0, 44.0, 35.0, 48.0, 29.0, 30.0, 32.0, 29.0, 21.0, 20.0, 21.0, 19.0, 10.0, 13.0, 7.0, 5.0, 10.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.86328125, -0.8387222290039062, -0.8141632080078125, -0.7896041870117188, -0.765045166015625, -0.7404861450195312, -0.7159271240234375, -0.6913681030273438, -0.66680908203125, -0.6422500610351562, -0.6176910400390625, -0.5931320190429688, -0.568572998046875, -0.5440139770507812, -0.5194549560546875, -0.49489593505859375, -0.4703369140625, -0.44577789306640625, -0.4212188720703125, -0.39665985107421875, -0.372100830078125, -0.34754180908203125, -0.3229827880859375, -0.29842376708984375, -0.27386474609375, -0.24930572509765625, -0.2247467041015625, -0.20018768310546875, -0.175628662109375, -0.15106964111328125, -0.1265106201171875, -0.10195159912109375, -0.077392578125, -0.05283355712890625, -0.0282745361328125, -0.00371551513671875, 0.020843505859375, 0.04540252685546875, 0.0699615478515625, 0.09452056884765625, 0.11907958984375, 0.14363861083984375, 0.1681976318359375, 0.19275665283203125, 0.217315673828125, 0.24187469482421875, 0.2664337158203125, 0.29099273681640625, 0.3155517578125, 0.34011077880859375, 0.3646697998046875, 0.38922882080078125, 0.413787841796875, 0.43834686279296875, 0.4629058837890625, 0.48746490478515625, 0.51202392578125, 0.5365829467773438, 0.5611419677734375, 0.5857009887695312, 0.610260009765625, 0.6348190307617188, 0.6593780517578125, 0.6839370727539062, 0.70849609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 9.0, 10.0, 11.0, 11.0, 17.0, 34.0, 36.0, 62.0, 97.0, 142.0, 237.0, 439.0, 665.0, 1510.0, 3723.0, 10195.0, 36750.0, 156043.0, 580076.0, 192791.0, 45424.0, 12426.0, 4206.0, 1704.0, 789.0, 418.0, 240.0, 140.0, 84.0, 75.0, 51.0, 31.0, 25.0, 17.0, 12.0, 6.0, 12.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.14306640625, -2.0751953125, -2.00732421875, -1.939453125, -1.87158203125, -1.8037109375, -1.73583984375, -1.66796875, -1.60009765625, -1.5322265625, -1.46435546875, -1.396484375, -1.32861328125, -1.2607421875, -1.19287109375, -1.125, -1.05712890625, -0.9892578125, -0.92138671875, -0.853515625, -0.78564453125, -0.7177734375, -0.64990234375, -0.58203125, -0.51416015625, -0.4462890625, -0.37841796875, -0.310546875, -0.24267578125, -0.1748046875, -0.10693359375, -0.0390625, 0.02880859375, 0.0966796875, 0.16455078125, 0.232421875, 0.30029296875, 0.3681640625, 0.43603515625, 0.50390625, 0.57177734375, 0.6396484375, 0.70751953125, 0.775390625, 0.84326171875, 0.9111328125, 0.97900390625, 1.046875, 1.11474609375, 1.1826171875, 1.25048828125, 1.318359375, 1.38623046875, 1.4541015625, 1.52197265625, 1.58984375, 1.65771484375, 1.7255859375, 1.79345703125, 1.861328125, 1.92919921875, 1.9970703125, 2.06494140625, 2.1328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 11.0, 17.0, 18.0, 13.0, 25.0, 43.0, 32.0, 47.0, 45.0, 53.0, 68.0, 55.0, 66.0, 58.0, 42.0, 59.0, 56.0, 55.0, 36.0, 26.0, 34.0, 22.0, 18.0, 16.0, 23.0, 14.0, 9.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.662109375, -3.557403564453125, -3.45269775390625, -3.347991943359375, -3.2432861328125, -3.138580322265625, -3.03387451171875, -2.929168701171875, -2.824462890625, -2.719757080078125, -2.61505126953125, -2.510345458984375, -2.4056396484375, -2.300933837890625, -2.19622802734375, -2.091522216796875, -1.98681640625, -1.882110595703125, -1.77740478515625, -1.672698974609375, -1.5679931640625, -1.463287353515625, -1.35858154296875, -1.253875732421875, -1.149169921875, -1.044464111328125, -0.93975830078125, -0.835052490234375, -0.7303466796875, -0.625640869140625, -0.52093505859375, -0.416229248046875, -0.3115234375, -0.206817626953125, -0.10211181640625, 0.002593994140625, 0.1072998046875, 0.212005615234375, 0.31671142578125, 0.421417236328125, 0.526123046875, 0.630828857421875, 0.73553466796875, 0.840240478515625, 0.9449462890625, 1.049652099609375, 1.15435791015625, 1.259063720703125, 1.36376953125, 1.468475341796875, 1.57318115234375, 1.677886962890625, 1.7825927734375, 1.887298583984375, 1.99200439453125, 2.096710205078125, 2.201416015625, 2.306121826171875, 2.41082763671875, 2.515533447265625, 2.6202392578125, 2.724945068359375, 2.82965087890625, 2.934356689453125, 3.0390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 11.0, 17.0, 25.0, 36.0, 78.0, 180.0, 384.0, 953.0, 3400.0, 19205.0, 203813.0, 742946.0, 66477.0, 8064.0, 1838.0, 595.0, 259.0, 121.0, 61.0, 31.0, 31.0, 9.0, 7.0, 1.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1162109375, -1.075286865234375, -1.03436279296875, -0.993438720703125, -0.9525146484375, -0.911590576171875, -0.87066650390625, -0.829742431640625, -0.788818359375, -0.747894287109375, -0.70697021484375, -0.666046142578125, -0.6251220703125, -0.584197998046875, -0.54327392578125, -0.502349853515625, -0.46142578125, -0.420501708984375, -0.37957763671875, -0.338653564453125, -0.2977294921875, -0.256805419921875, -0.21588134765625, -0.174957275390625, -0.134033203125, -0.093109130859375, -0.05218505859375, -0.011260986328125, 0.0296630859375, 0.070587158203125, 0.11151123046875, 0.152435302734375, 0.193359375, 0.234283447265625, 0.27520751953125, 0.316131591796875, 0.3570556640625, 0.397979736328125, 0.43890380859375, 0.479827880859375, 0.520751953125, 0.561676025390625, 0.60260009765625, 0.643524169921875, 0.6844482421875, 0.725372314453125, 0.76629638671875, 0.807220458984375, 0.84814453125, 0.889068603515625, 0.92999267578125, 0.970916748046875, 1.0118408203125, 1.052764892578125, 1.09368896484375, 1.134613037109375, 1.175537109375, 1.216461181640625, 1.25738525390625, 1.298309326171875, 1.3392333984375, 1.380157470703125, 1.42108154296875, 1.462005615234375, 1.5029296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 4.0, 14.0, 14.0, 18.0, 18.0, 34.0, 39.0, 39.0, 56.0, 68.0, 92.0, 93.0, 92.0, 99.0, 56.0, 48.0, 48.0, 32.0, 23.0, 17.0, 26.0, 15.0, 10.0, 4.0, 3.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002880096435546875, -0.0002794116735458374, -0.0002708137035369873, -0.0002622157335281372, -0.0002536177635192871, -0.000245019793510437, -0.00023642182350158691, -0.00022782385349273682, -0.00021922588348388672, -0.00021062791347503662, -0.00020202994346618652, -0.00019343197345733643, -0.00018483400344848633, -0.00017623603343963623, -0.00016763806343078613, -0.00015904009342193604, -0.00015044212341308594, -0.00014184415340423584, -0.00013324618339538574, -0.00012464821338653564, -0.00011605024337768555, -0.00010745227336883545, -9.885430335998535e-05, -9.025633335113525e-05, -8.165836334228516e-05, -7.306039333343506e-05, -6.446242332458496e-05, -5.586445331573486e-05, -4.7266483306884766e-05, -3.866851329803467e-05, -3.007054328918457e-05, -2.1472573280334473e-05, -1.2874603271484375e-05, -4.276633262634277e-06, 4.32133674621582e-06, 1.2919306755065918e-05, 2.1517276763916016e-05, 3.0115246772766113e-05, 3.871321678161621e-05, 4.731118679046631e-05, 5.5909156799316406e-05, 6.45071268081665e-05, 7.31050968170166e-05, 8.17030668258667e-05, 9.03010368347168e-05, 9.88990068435669e-05, 0.00010749697685241699, 0.00011609494686126709, 0.0001246929168701172, 0.00013329088687896729, 0.00014188885688781738, 0.00015048682689666748, 0.00015908479690551758, 0.00016768276691436768, 0.00017628073692321777, 0.00018487870693206787, 0.00019347667694091797, 0.00020207464694976807, 0.00021067261695861816, 0.00021927058696746826, 0.00022786855697631836, 0.00023646652698516846, 0.00024506449699401855, 0.00025366246700286865, 0.00026226043701171875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 16.0, 28.0, 45.0, 80.0, 164.0, 353.0, 965.0, 3287.0, 17210.0, 157894.0, 755436.0, 97445.0, 11702.0, 2442.0, 800.0, 329.0, 156.0, 72.0, 41.0, 20.0, 17.0, 11.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86865234375, -0.8298721313476562, -0.7910919189453125, -0.7523117065429688, -0.713531494140625, -0.6747512817382812, -0.6359710693359375, -0.5971908569335938, -0.55841064453125, -0.5196304321289062, -0.4808502197265625, -0.44207000732421875, -0.403289794921875, -0.36450958251953125, -0.3257293701171875, -0.28694915771484375, -0.2481689453125, -0.20938873291015625, -0.1706085205078125, -0.13182830810546875, -0.093048095703125, -0.05426788330078125, -0.0154876708984375, 0.02329254150390625, 0.06207275390625, 0.10085296630859375, 0.1396331787109375, 0.17841339111328125, 0.217193603515625, 0.25597381591796875, 0.2947540283203125, 0.33353424072265625, 0.372314453125, 0.41109466552734375, 0.4498748779296875, 0.48865509033203125, 0.527435302734375, 0.5662155151367188, 0.6049957275390625, 0.6437759399414062, 0.68255615234375, 0.7213363647460938, 0.7601165771484375, 0.7988967895507812, 0.837677001953125, 0.8764572143554688, 0.9152374267578125, 0.9540176391601562, 0.9927978515625, 1.0315780639648438, 1.0703582763671875, 1.1091384887695312, 1.147918701171875, 1.1866989135742188, 1.2254791259765625, 1.2642593383789062, 1.30303955078125, 1.3418197631835938, 1.3805999755859375, 1.4193801879882812, 1.458160400390625, 1.4969406127929688, 1.5357208251953125, 1.5745010375976562, 1.61328125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 7.0, 7.0, 9.0, 11.0, 14.0, 16.0, 20.0, 21.0, 26.0, 25.0, 33.0, 32.0, 49.0, 40.0, 62.0, 59.0, 47.0, 68.0, 62.0, 62.0, 46.0, 41.0, 57.0, 32.0, 35.0, 24.0, 18.0, 13.0, 14.0, 11.0, 8.0, 3.0, 4.0, 7.0, 8.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8349609375, -0.81304931640625, -0.7911376953125, -0.76922607421875, -0.747314453125, -0.72540283203125, -0.7034912109375, -0.68157958984375, -0.65966796875, -0.63775634765625, -0.6158447265625, -0.59393310546875, -0.572021484375, -0.55010986328125, -0.5281982421875, -0.50628662109375, -0.484375, -0.46246337890625, -0.4405517578125, -0.41864013671875, -0.396728515625, -0.37481689453125, -0.3529052734375, -0.33099365234375, -0.30908203125, -0.28717041015625, -0.2652587890625, -0.24334716796875, -0.221435546875, -0.19952392578125, -0.1776123046875, -0.15570068359375, -0.1337890625, -0.11187744140625, -0.0899658203125, -0.06805419921875, -0.046142578125, -0.02423095703125, -0.0023193359375, 0.01959228515625, 0.04150390625, 0.06341552734375, 0.0853271484375, 0.10723876953125, 0.129150390625, 0.15106201171875, 0.1729736328125, 0.19488525390625, 0.216796875, 0.23870849609375, 0.2606201171875, 0.28253173828125, 0.304443359375, 0.32635498046875, 0.3482666015625, 0.37017822265625, 0.39208984375, 0.41400146484375, 0.4359130859375, 0.45782470703125, 0.479736328125, 0.50164794921875, 0.5235595703125, 0.54547119140625, 0.5673828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 5.0, 14.0, 30.0, 72.0, 155.0, 314.0, 203.0, 102.0, 56.0, 18.0, 10.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671852111816406, -21.85114860534668, -21.03044319152832, -20.209739685058594, -19.389036178588867, -18.56833267211914, -17.74762725830078, -16.926923751831055, -16.106220245361328, -15.285515785217285, -14.464812278747559, -13.644107818603516, -12.823404312133789, -12.002699851989746, -11.181995391845703, -10.361291885375977, -9.540587425231934, -8.71988296508789, -7.899179458618164, -7.078474998474121, -6.2577714920043945, -5.437067031860352, -4.616363048553467, -3.795659065246582, -2.9749550819396973, -2.1542510986328125, -1.3335469961166382, -0.5128428936004639, 0.3078610897064209, 1.1285653114318848, 1.9492692947387695, 2.7699732780456543, 3.590677261352539, 4.411381244659424, 5.232085227966309, 6.052789688110352, 6.873493194580078, 7.694197654724121, 8.514902114868164, 9.33560562133789, 10.156309127807617, 10.97701358795166, 11.797717094421387, 12.61842155456543, 13.439125061035156, 14.2598295211792, 15.080533981323242, 15.901237487792969, 16.721942901611328, 17.542646408081055, 18.363351821899414, 19.18405532836914, 20.004758834838867, 20.825462341308594, 21.646167755126953, 22.46687126159668, 23.287574768066406, 24.108278274536133, 24.928983688354492, 25.74968719482422, 26.570390701293945, 27.391094207763672, 28.21179962158203, 29.032503128051758, 29.853206634521484]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 5.0, 7.0, 14.0, 12.0, 15.0, 14.0, 18.0, 17.0, 22.0, 23.0, 28.0, 19.0, 34.0, 29.0, 33.0, 48.0, 59.0, 71.0, 64.0, 81.0, 46.0, 45.0, 27.0, 36.0, 27.0, 23.0, 22.0, 16.0, 19.0, 13.0, 20.0, 21.0, 9.0, 10.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.576784133911133, -9.259346008300781, -8.941906929016113, -8.624468803405762, -8.30703067779541, -7.9895920753479, -7.672153472900391, -7.354715347290039, -7.037276744842529, -6.7198381423950195, -6.402400016784668, -6.084961414337158, -5.767522811889648, -5.450084686279297, -5.132646083831787, -4.815207481384277, -4.497769355773926, -4.180330753326416, -3.8628926277160645, -3.5454540252685547, -3.228015661239624, -2.9105772972106934, -2.5931386947631836, -2.275700330734253, -1.9582619667053223, -1.6408236026763916, -1.3233851194381714, -1.0059466361999512, -0.6885082721710205, -0.37106990814208984, -0.05363142490386963, 0.2638070583343506, 0.5812463760375977, 0.8986847996711731, 1.2161232233047485, 1.5335617065429688, 1.8510000705718994, 2.16843843460083, 2.48587703704834, 2.8033154010772705, 3.120753765106201, 3.438192129135132, 3.7556304931640625, 4.073069095611572, 4.390507698059082, 4.707945823669434, 5.025384426116943, 5.342823028564453, 5.660261154174805, 5.9776997566223145, 6.295137882232666, 6.612576484680176, 6.930014610290527, 7.247453212738037, 7.564891815185547, 7.882329940795898, 8.19976806640625, 8.517206192016602, 8.83464527130127, 9.152083396911621, 9.469521522521973, 9.78696060180664, 10.104398727416992, 10.421836853027344, 10.739275932312012]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 15.0, 26.0, 36.0, 51.0, 100.0, 147.0, 230.0, 500.0, 1091.0, 2932.0, 10086.0, 55258.0, 851831.0, 2989630.0, 248372.0, 24684.0, 5518.0, 1931.0, 836.0, 395.0, 214.0, 133.0, 85.0, 53.0, 27.0, 23.0, 19.0, 9.0, 10.0, 5.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6103515625, -1.56048583984375, -1.5106201171875, -1.46075439453125, -1.410888671875, -1.36102294921875, -1.3111572265625, -1.26129150390625, -1.21142578125, -1.16156005859375, -1.1116943359375, -1.06182861328125, -1.011962890625, -0.96209716796875, -0.9122314453125, -0.86236572265625, -0.8125, -0.76263427734375, -0.7127685546875, -0.66290283203125, -0.613037109375, -0.56317138671875, -0.5133056640625, -0.46343994140625, -0.41357421875, -0.36370849609375, -0.3138427734375, -0.26397705078125, -0.214111328125, -0.16424560546875, -0.1143798828125, -0.06451416015625, -0.0146484375, 0.03521728515625, 0.0850830078125, 0.13494873046875, 0.184814453125, 0.23468017578125, 0.2845458984375, 0.33441162109375, 0.38427734375, 0.43414306640625, 0.4840087890625, 0.53387451171875, 0.583740234375, 0.63360595703125, 0.6834716796875, 0.73333740234375, 0.783203125, 0.83306884765625, 0.8829345703125, 0.93280029296875, 0.982666015625, 1.03253173828125, 1.0823974609375, 1.13226318359375, 1.18212890625, 1.23199462890625, 1.2818603515625, 1.33172607421875, 1.381591796875, 1.43145751953125, 1.4813232421875, 1.53118896484375, 1.5810546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 6.0, 14.0, 9.0, 17.0, 17.0, 23.0, 23.0, 27.0, 34.0, 33.0, 27.0, 39.0, 37.0, 48.0, 53.0, 55.0, 45.0, 55.0, 36.0, 39.0, 42.0, 42.0, 36.0, 27.0, 33.0, 30.0, 24.0, 19.0, 22.0, 17.0, 14.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.8623046875, -0.837982177734375, -0.81365966796875, -0.789337158203125, -0.7650146484375, -0.740692138671875, -0.71636962890625, -0.692047119140625, -0.667724609375, -0.643402099609375, -0.61907958984375, -0.594757080078125, -0.5704345703125, -0.546112060546875, -0.52178955078125, -0.497467041015625, -0.47314453125, -0.448822021484375, -0.42449951171875, -0.400177001953125, -0.3758544921875, -0.351531982421875, -0.32720947265625, -0.302886962890625, -0.278564453125, -0.254241943359375, -0.22991943359375, -0.205596923828125, -0.1812744140625, -0.156951904296875, -0.13262939453125, -0.108306884765625, -0.083984375, -0.059661865234375, -0.03533935546875, -0.011016845703125, 0.0133056640625, 0.037628173828125, 0.06195068359375, 0.086273193359375, 0.110595703125, 0.134918212890625, 0.15924072265625, 0.183563232421875, 0.2078857421875, 0.232208251953125, 0.25653076171875, 0.280853271484375, 0.30517578125, 0.329498291015625, 0.35382080078125, 0.378143310546875, 0.4024658203125, 0.426788330078125, 0.45111083984375, 0.475433349609375, 0.499755859375, 0.524078369140625, 0.54840087890625, 0.572723388671875, 0.5970458984375, 0.621368408203125, 0.64569091796875, 0.670013427734375, 0.6943359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 19.0, 19.0, 37.0, 70.0, 129.0, 276.0, 646.0, 2090.0, 10933.0, 170057.0, 3872837.0, 124064.0, 9783.0, 1998.0, 656.0, 342.0, 132.0, 67.0, 41.0, 22.0, 14.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.85546875, -3.755218505859375, -3.65496826171875, -3.554718017578125, -3.4544677734375, -3.354217529296875, -3.25396728515625, -3.153717041015625, -3.053466796875, -2.953216552734375, -2.85296630859375, -2.752716064453125, -2.6524658203125, -2.552215576171875, -2.45196533203125, -2.351715087890625, -2.25146484375, -2.151214599609375, -2.05096435546875, -1.950714111328125, -1.8504638671875, -1.750213623046875, -1.64996337890625, -1.549713134765625, -1.449462890625, -1.349212646484375, -1.24896240234375, -1.148712158203125, -1.0484619140625, -0.948211669921875, -0.84796142578125, -0.747711181640625, -0.6474609375, -0.547210693359375, -0.44696044921875, -0.346710205078125, -0.2464599609375, -0.146209716796875, -0.04595947265625, 0.054290771484375, 0.154541015625, 0.254791259765625, 0.35504150390625, 0.455291748046875, 0.5555419921875, 0.655792236328125, 0.75604248046875, 0.856292724609375, 0.95654296875, 1.056793212890625, 1.15704345703125, 1.257293701171875, 1.3575439453125, 1.457794189453125, 1.55804443359375, 1.658294677734375, 1.758544921875, 1.858795166015625, 1.95904541015625, 2.059295654296875, 2.1595458984375, 2.259796142578125, 2.36004638671875, 2.460296630859375, 2.560546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 11.0, 9.0, 11.0, 19.0, 28.0, 46.0, 48.0, 82.0, 142.0, 226.0, 439.0, 743.0, 803.0, 576.0, 321.0, 198.0, 126.0, 71.0, 46.0, 27.0, 25.0, 19.0, 10.0, 11.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8160858154296875, -1.754241943359375, -1.6923980712890625, -1.63055419921875, -1.5687103271484375, -1.506866455078125, -1.4450225830078125, -1.3831787109375, -1.3213348388671875, -1.259490966796875, -1.1976470947265625, -1.13580322265625, -1.0739593505859375, -1.012115478515625, -0.9502716064453125, -0.888427734375, -0.8265838623046875, -0.764739990234375, -0.7028961181640625, -0.64105224609375, -0.5792083740234375, -0.517364501953125, -0.4555206298828125, -0.3936767578125, -0.3318328857421875, -0.269989013671875, -0.2081451416015625, -0.14630126953125, -0.0844573974609375, -0.022613525390625, 0.0392303466796875, 0.10107421875, 0.1629180908203125, 0.224761962890625, 0.2866058349609375, 0.34844970703125, 0.4102935791015625, 0.472137451171875, 0.5339813232421875, 0.5958251953125, 0.6576690673828125, 0.719512939453125, 0.7813568115234375, 0.84320068359375, 0.9050445556640625, 0.966888427734375, 1.0287322998046875, 1.090576171875, 1.1524200439453125, 1.214263916015625, 1.2761077880859375, 1.33795166015625, 1.3997955322265625, 1.461639404296875, 1.5234832763671875, 1.5853271484375, 1.6471710205078125, 1.709014892578125, 1.7708587646484375, 1.83270263671875, 1.8945465087890625, 1.956390380859375, 2.0182342529296875, 2.080078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 18.0, 36.0, 53.0, 129.0, 177.0, 205.0, 169.0, 98.0, 50.0, 29.0, 15.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.004962921142578, -8.413089752197266, -7.821216583251953, -7.229342937469482, -6.63746976852417, -6.045596599578857, -5.453722953796387, -4.861849784851074, -4.269976615905762, -3.678103446960449, -3.0862300395965576, -2.494356632232666, -1.9024834632873535, -1.310610294342041, -0.7187368869781494, -0.1268634796142578, 0.4650096893310547, 1.0568829774856567, 1.6487562656402588, 2.2406296730041504, 2.832502841949463, 3.4243760108947754, 4.016249656677246, 4.608122825622559, 5.199995994567871, 5.791869163513184, 6.383742332458496, 6.975615978240967, 7.567489147186279, 8.15936279296875, 8.751235961914062, 9.343109130859375, 9.934982299804688, 10.52685546875, 11.118728637695312, 11.710601806640625, 12.302474975585938, 12.89434814453125, 13.486222267150879, 14.078095436096191, 14.669968605041504, 15.261841773986816, 15.853714942932129, 16.445589065551758, 17.03746223449707, 17.629335403442383, 18.221208572387695, 18.813081741333008, 19.40495491027832, 19.996828079223633, 20.588701248168945, 21.180574417114258, 21.77244758605957, 22.364320755004883, 22.956193923950195, 23.54806900024414, 24.139942169189453, 24.731815338134766, 25.323688507080078, 25.91556167602539, 26.507434844970703, 27.099308013916016, 27.691181182861328, 28.28305435180664, 28.874927520751953]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 10.0, 19.0, 9.0, 17.0, 17.0, 20.0, 32.0, 29.0, 40.0, 38.0, 41.0, 46.0, 50.0, 45.0, 46.0, 68.0, 57.0, 51.0, 33.0, 52.0, 42.0, 27.0, 22.0, 38.0, 25.0, 25.0, 14.0, 14.0, 18.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.077053070068359, -6.8152337074279785, -6.553414344787598, -6.291594982147217, -6.029775619506836, -5.767956733703613, -5.506137371063232, -5.244318008422852, -4.982498645782471, -4.72067928314209, -4.458859920501709, -4.197040557861328, -3.9352214336395264, -3.6734020709991455, -3.4115829467773438, -3.149763584136963, -2.887944221496582, -2.626124858856201, -2.3643054962158203, -2.1024863719940186, -1.8406670093536377, -1.5788476467132568, -1.3170284032821655, -1.0552091598510742, -0.7933897972106934, -0.5315704941749573, -0.2697511911392212, -0.007931888103485107, 0.253887414932251, 0.5157067775726318, 0.7775260210037231, 1.0393452644348145, 1.3011655807495117, 1.5629849433898926, 1.8248041868209839, 2.086623430252075, 2.348442792892456, 2.610262155532837, 2.8720812797546387, 3.1339006423950195, 3.3957200050354004, 3.6575393676757812, 3.919358730316162, 4.181178092956543, 4.442996978759766, 4.704816818237305, 4.966635704040527, 5.228455066680908, 5.490274429321289, 5.75209379196167, 6.013913154602051, 6.275732517242432, 6.5375518798828125, 6.799370765686035, 7.061190128326416, 7.323009490966797, 7.584828853607178, 7.846648216247559, 8.108467102050781, 8.37028694152832, 8.632105827331543, 8.893925666809082, 9.155744552612305, 9.417564392089844, 9.679383277893066]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 6.0, 16.0, 18.0, 29.0, 33.0, 46.0, 80.0, 118.0, 146.0, 277.0, 464.0, 769.0, 1386.0, 2673.0, 5388.0, 10952.0, 24057.0, 53030.0, 121259.0, 255098.0, 291717.0, 154855.0, 68322.0, 29882.0, 13953.0, 6653.0, 3218.0, 1699.0, 917.0, 555.0, 333.0, 210.0, 104.0, 87.0, 51.0, 38.0, 23.0, 21.0, 16.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.2568359375, -1.217742919921875, -1.17864990234375, -1.139556884765625, -1.1004638671875, -1.061370849609375, -1.02227783203125, -0.983184814453125, -0.944091796875, -0.904998779296875, -0.86590576171875, -0.826812744140625, -0.7877197265625, -0.748626708984375, -0.70953369140625, -0.670440673828125, -0.63134765625, -0.592254638671875, -0.55316162109375, -0.514068603515625, -0.4749755859375, -0.435882568359375, -0.39678955078125, -0.357696533203125, -0.318603515625, -0.279510498046875, -0.24041748046875, -0.201324462890625, -0.1622314453125, -0.123138427734375, -0.08404541015625, -0.044952392578125, -0.005859375, 0.033233642578125, 0.07232666015625, 0.111419677734375, 0.1505126953125, 0.189605712890625, 0.22869873046875, 0.267791748046875, 0.306884765625, 0.345977783203125, 0.38507080078125, 0.424163818359375, 0.4632568359375, 0.502349853515625, 0.54144287109375, 0.580535888671875, 0.61962890625, 0.658721923828125, 0.69781494140625, 0.736907958984375, 0.7760009765625, 0.815093994140625, 0.85418701171875, 0.893280029296875, 0.932373046875, 0.971466064453125, 1.01055908203125, 1.049652099609375, 1.0887451171875, 1.127838134765625, 1.16693115234375, 1.206024169921875, 1.2451171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 1.0, 9.0, 2.0, 16.0, 10.0, 9.0, 13.0, 13.0, 17.0, 22.0, 33.0, 32.0, 38.0, 43.0, 36.0, 32.0, 46.0, 57.0, 47.0, 50.0, 43.0, 39.0, 44.0, 43.0, 31.0, 35.0, 41.0, 35.0, 22.0, 20.0, 23.0, 14.0, 10.0, 13.0, 13.0, 9.0, 6.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7297592163085938, -0.7041473388671875, -0.6785354614257812, -0.652923583984375, -0.6273117065429688, -0.6016998291015625, -0.5760879516601562, -0.55047607421875, -0.5248641967773438, -0.4992523193359375, -0.47364044189453125, -0.448028564453125, -0.42241668701171875, -0.3968048095703125, -0.37119293212890625, -0.3455810546875, -0.31996917724609375, -0.2943572998046875, -0.26874542236328125, -0.243133544921875, -0.21752166748046875, -0.1919097900390625, -0.16629791259765625, -0.14068603515625, -0.11507415771484375, -0.0894622802734375, -0.06385040283203125, -0.038238525390625, -0.01262664794921875, 0.0129852294921875, 0.03859710693359375, 0.064208984375, 0.08982086181640625, 0.1154327392578125, 0.14104461669921875, 0.166656494140625, 0.19226837158203125, 0.2178802490234375, 0.24349212646484375, 0.26910400390625, 0.29471588134765625, 0.3203277587890625, 0.34593963623046875, 0.371551513671875, 0.39716339111328125, 0.4227752685546875, 0.44838714599609375, 0.4739990234375, 0.49961090087890625, 0.5252227783203125, 0.5508346557617188, 0.576446533203125, 0.6020584106445312, 0.6276702880859375, 0.6532821655273438, 0.67889404296875, 0.7045059204101562, 0.7301177978515625, 0.7557296752929688, 0.781341552734375, 0.8069534301757812, 0.8325653076171875, 0.8581771850585938, 0.8837890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 5.0, 9.0, 10.0, 30.0, 32.0, 45.0, 64.0, 83.0, 143.0, 187.0, 318.0, 461.0, 726.0, 1406.0, 2921.0, 8107.0, 27973.0, 124150.0, 624447.0, 195922.0, 42300.0, 11263.0, 3818.0, 1724.0, 906.0, 521.0, 302.0, 193.0, 141.0, 88.0, 60.0, 51.0, 33.0, 23.0, 20.0, 11.0, 16.0, 8.0, 9.0, 1.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.03515625, -1.96875, -1.90234375, -1.8359375, -1.76953125, -1.703125, -1.63671875, -1.5703125, -1.50390625, -1.4375, -1.37109375, -1.3046875, -1.23828125, -1.171875, -1.10546875, -1.0390625, -0.97265625, -0.90625, -0.83984375, -0.7734375, -0.70703125, -0.640625, -0.57421875, -0.5078125, -0.44140625, -0.375, -0.30859375, -0.2421875, -0.17578125, -0.109375, -0.04296875, 0.0234375, 0.08984375, 0.15625, 0.22265625, 0.2890625, 0.35546875, 0.421875, 0.48828125, 0.5546875, 0.62109375, 0.6875, 0.75390625, 0.8203125, 0.88671875, 0.953125, 1.01953125, 1.0859375, 1.15234375, 1.21875, 1.28515625, 1.3515625, 1.41796875, 1.484375, 1.55078125, 1.6171875, 1.68359375, 1.75, 1.81640625, 1.8828125, 1.94921875, 2.015625, 2.08203125, 2.1484375, 2.21484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 5.0, 9.0, 11.0, 16.0, 25.0, 14.0, 26.0, 29.0, 36.0, 55.0, 51.0, 47.0, 57.0, 59.0, 78.0, 60.0, 55.0, 52.0, 50.0, 55.0, 38.0, 40.0, 35.0, 32.0, 16.0, 9.0, 13.0, 8.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.76470947265625, -3.6387939453125, -3.51287841796875, -3.386962890625, -3.26104736328125, -3.1351318359375, -3.00921630859375, -2.88330078125, -2.75738525390625, -2.6314697265625, -2.50555419921875, -2.379638671875, -2.25372314453125, -2.1278076171875, -2.00189208984375, -1.8759765625, -1.75006103515625, -1.6241455078125, -1.49822998046875, -1.372314453125, -1.24639892578125, -1.1204833984375, -0.99456787109375, -0.86865234375, -0.74273681640625, -0.6168212890625, -0.49090576171875, -0.364990234375, -0.23907470703125, -0.1131591796875, 0.01275634765625, 0.138671875, 0.26458740234375, 0.3905029296875, 0.51641845703125, 0.642333984375, 0.76824951171875, 0.8941650390625, 1.02008056640625, 1.14599609375, 1.27191162109375, 1.3978271484375, 1.52374267578125, 1.649658203125, 1.77557373046875, 1.9014892578125, 2.02740478515625, 2.1533203125, 2.27923583984375, 2.4051513671875, 2.53106689453125, 2.656982421875, 2.78289794921875, 2.9088134765625, 3.03472900390625, 3.16064453125, 3.28656005859375, 3.4124755859375, 3.53839111328125, 3.664306640625, 3.79022216796875, 3.9161376953125, 4.04205322265625, 4.16796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 7.0, 9.0, 13.0, 22.0, 18.0, 29.0, 36.0, 67.0, 88.0, 125.0, 212.0, 273.0, 564.0, 1096.0, 2267.0, 5530.0, 14879.0, 46587.0, 193096.0, 638455.0, 100095.0, 27995.0, 9650.0, 3714.0, 1680.0, 815.0, 425.0, 261.0, 159.0, 111.0, 75.0, 72.0, 30.0, 21.0, 14.0, 21.0, 12.0, 6.0, 10.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7607421875, -0.7403411865234375, -0.719940185546875, -0.6995391845703125, -0.67913818359375, -0.6587371826171875, -0.638336181640625, -0.6179351806640625, -0.5975341796875, -0.5771331787109375, -0.556732177734375, -0.5363311767578125, -0.51593017578125, -0.4955291748046875, -0.475128173828125, -0.4547271728515625, -0.434326171875, -0.4139251708984375, -0.393524169921875, -0.3731231689453125, -0.35272216796875, -0.3323211669921875, -0.311920166015625, -0.2915191650390625, -0.2711181640625, -0.2507171630859375, -0.230316162109375, -0.2099151611328125, -0.18951416015625, -0.1691131591796875, -0.148712158203125, -0.1283111572265625, -0.10791015625, -0.0875091552734375, -0.067108154296875, -0.0467071533203125, -0.02630615234375, -0.0059051513671875, 0.014495849609375, 0.0348968505859375, 0.0552978515625, 0.0756988525390625, 0.096099853515625, 0.1165008544921875, 0.13690185546875, 0.1573028564453125, 0.177703857421875, 0.1981048583984375, 0.218505859375, 0.2389068603515625, 0.259307861328125, 0.2797088623046875, 0.30010986328125, 0.3205108642578125, 0.340911865234375, 0.3613128662109375, 0.3817138671875, 0.4021148681640625, 0.422515869140625, 0.4429168701171875, 0.46331787109375, 0.4837188720703125, 0.504119873046875, 0.5245208740234375, 0.544921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 14.0, 13.0, 14.0, 18.0, 20.0, 23.0, 29.0, 44.0, 54.0, 61.0, 78.0, 92.0, 93.0, 64.0, 89.0, 49.0, 45.0, 33.0, 26.0, 30.0, 12.0, 11.0, 10.0, 14.0, 6.0, 4.0, 5.0, 4.0, 1.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001958608627319336, -0.00019012577831745148, -0.00018439069390296936, -0.00017865560948848724, -0.00017292052507400513, -0.000167185440659523, -0.0001614503562450409, -0.00015571527183055878, -0.00014998018741607666, -0.00014424510300159454, -0.00013851001858711243, -0.0001327749341726303, -0.0001270398497581482, -0.00012130476534366608, -0.00011556968092918396, -0.00010983459651470184, -0.00010409951210021973, -9.836442768573761e-05, -9.262934327125549e-05, -8.689425885677338e-05, -8.115917444229126e-05, -7.542409002780914e-05, -6.968900561332703e-05, -6.395392119884491e-05, -5.821883678436279e-05, -5.2483752369880676e-05, -4.674866795539856e-05, -4.101358354091644e-05, -3.5278499126434326e-05, -2.954341471195221e-05, -2.3808330297470093e-05, -1.8073245882987976e-05, -1.233816146850586e-05, -6.603077054023743e-06, -8.67992639541626e-07, 4.867091774940491e-06, 1.0602176189422607e-05, 1.6337260603904724e-05, 2.207234501838684e-05, 2.7807429432868958e-05, 3.3542513847351074e-05, 3.927759826183319e-05, 4.501268267631531e-05, 5.0747767090797424e-05, 5.648285150527954e-05, 6.221793591976166e-05, 6.795302033424377e-05, 7.368810474872589e-05, 7.942318916320801e-05, 8.515827357769012e-05, 9.089335799217224e-05, 9.662844240665436e-05, 0.00010236352682113647, 0.00010809861123561859, 0.00011383369565010071, 0.00011956878006458282, 0.00012530386447906494, 0.00013103894889354706, 0.00013677403330802917, 0.0001425091177225113, 0.0001482442021369934, 0.00015397928655147552, 0.00015971437096595764, 0.00016544945538043976, 0.00017118453979492188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 13.0, 14.0, 19.0, 35.0, 41.0, 83.0, 94.0, 180.0, 285.0, 459.0, 917.0, 1976.0, 4778.0, 13973.0, 49610.0, 246174.0, 614926.0, 81917.0, 20983.0, 6751.0, 2591.0, 1229.0, 628.0, 292.0, 210.0, 129.0, 83.0, 46.0, 27.0, 19.0, 29.0, 7.0, 7.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68408203125, -0.6628189086914062, -0.6415557861328125, -0.6202926635742188, -0.599029541015625, -0.5777664184570312, -0.5565032958984375, -0.5352401733398438, -0.51397705078125, -0.49271392822265625, -0.4714508056640625, -0.45018768310546875, -0.428924560546875, -0.40766143798828125, -0.3863983154296875, -0.36513519287109375, -0.3438720703125, -0.32260894775390625, -0.3013458251953125, -0.28008270263671875, -0.258819580078125, -0.23755645751953125, -0.2162933349609375, -0.19503021240234375, -0.17376708984375, -0.15250396728515625, -0.1312408447265625, -0.10997772216796875, -0.088714599609375, -0.06745147705078125, -0.0461883544921875, -0.02492523193359375, -0.003662109375, 0.01760101318359375, 0.0388641357421875, 0.06012725830078125, 0.081390380859375, 0.10265350341796875, 0.1239166259765625, 0.14517974853515625, 0.16644287109375, 0.18770599365234375, 0.2089691162109375, 0.23023223876953125, 0.251495361328125, 0.27275848388671875, 0.2940216064453125, 0.31528472900390625, 0.3365478515625, 0.35781097412109375, 0.3790740966796875, 0.40033721923828125, 0.421600341796875, 0.44286346435546875, 0.4641265869140625, 0.48538970947265625, 0.50665283203125, 0.5279159545898438, 0.5491790771484375, 0.5704421997070312, 0.591705322265625, 0.6129684448242188, 0.6342315673828125, 0.6554946899414062, 0.6767578125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 8.0, 11.0, 9.0, 12.0, 15.0, 16.0, 31.0, 41.0, 40.0, 71.0, 73.0, 88.0, 85.0, 104.0, 81.0, 69.0, 71.0, 41.0, 27.0, 31.0, 13.0, 13.0, 12.0, 4.0, 8.0, 4.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83154296875, -0.8071060180664062, -0.7826690673828125, -0.7582321166992188, -0.733795166015625, -0.7093582153320312, -0.6849212646484375, -0.6604843139648438, -0.63604736328125, -0.6116104125976562, -0.5871734619140625, -0.5627365112304688, -0.538299560546875, -0.5138626098632812, -0.4894256591796875, -0.46498870849609375, -0.4405517578125, -0.41611480712890625, -0.3916778564453125, -0.36724090576171875, -0.342803955078125, -0.31836700439453125, -0.2939300537109375, -0.26949310302734375, -0.24505615234375, -0.22061920166015625, -0.1961822509765625, -0.17174530029296875, -0.147308349609375, -0.12287139892578125, -0.0984344482421875, -0.07399749755859375, -0.049560546875, -0.02512359619140625, -0.0006866455078125, 0.02375030517578125, 0.048187255859375, 0.07262420654296875, 0.0970611572265625, 0.12149810791015625, 0.14593505859375, 0.17037200927734375, 0.1948089599609375, 0.21924591064453125, 0.243682861328125, 0.26811981201171875, 0.2925567626953125, 0.31699371337890625, 0.3414306640625, 0.36586761474609375, 0.3903045654296875, 0.41474151611328125, 0.439178466796875, 0.46361541748046875, 0.4880523681640625, 0.5124893188476562, 0.53692626953125, 0.5613632202148438, 0.5858001708984375, 0.6102371215820312, 0.634674072265625, 0.6591110229492188, 0.6835479736328125, 0.7079849243164062, 0.732421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 20.0, 42.0, 91.0, 158.0, 387.0, 153.0, 72.0, 40.0, 14.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.47957420349121, -15.631742477416992, -14.783909797668457, -13.936078071594238, -13.088245391845703, -12.240413665771484, -11.392581939697266, -10.544750213623047, -9.696917533874512, -8.849085807800293, -8.001253128051758, -7.153421401977539, -6.305589199066162, -5.457756996154785, -4.609925270080566, -3.7620930671691895, -2.9142608642578125, -2.0664286613464355, -1.2185966968536377, -0.37076473236083984, 0.4770674705505371, 1.324899673461914, 2.172731399536133, 3.0205636024475098, 3.8683958053588867, 4.716228008270264, 5.564060211181641, 6.411891937255859, 7.259724140167236, 8.107556343078613, 8.955388069152832, 9.803220748901367, 10.651054382324219, 11.498886108398438, 12.346718788146973, 13.194550514221191, 14.042383193969727, 14.890214920043945, 15.738046646118164, 16.585878372192383, 17.433712005615234, 18.281543731689453, 19.129375457763672, 19.97720718383789, 20.825040817260742, 21.67287254333496, 22.52070426940918, 23.3685359954834, 24.216367721557617, 25.064199447631836, 25.912031173706055, 26.759864807128906, 27.607696533203125, 28.455528259277344, 29.303359985351562, 30.15119171142578, 30.9990234375, 31.84685516357422, 32.69468688964844, 33.542518615722656, 34.390350341796875, 35.238182067871094, 36.08601379394531, 36.9338493347168, 37.781681060791016]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 5.0, 6.0, 12.0, 10.0, 14.0, 24.0, 18.0, 27.0, 23.0, 34.0, 33.0, 25.0, 27.0, 46.0, 56.0, 91.0, 96.0, 72.0, 57.0, 43.0, 43.0, 35.0, 30.0, 31.0, 23.0, 20.0, 21.0, 17.0, 10.0, 8.0, 3.0, 7.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.414369583129883, -12.051536560058594, -11.688702583312988, -11.3258695602417, -10.963035583496094, -10.600202560424805, -10.237369537353516, -9.87453556060791, -9.511701583862305, -9.148868560791016, -8.78603458404541, -8.423201560974121, -8.060367584228516, -7.697534561157227, -7.334701061248779, -6.971867561340332, -6.609034538269043, -6.246201038360596, -5.883367538452148, -5.520534515380859, -5.157700538635254, -4.794867515563965, -4.432034015655518, -4.06920051574707, -3.706367015838623, -3.343533515930176, -2.9807000160217285, -2.6178667545318604, -2.255033254623413, -1.8921997547149658, -1.5293664932250977, -1.1665329933166504, -0.8036994934082031, -0.44086605310440063, -0.07803261280059814, 0.28480076789855957, 0.6476342678070068, 1.010467767715454, 1.3733010292053223, 1.7361345291137695, 2.098968029022217, 2.461801528930664, 2.8246350288391113, 3.1874682903289795, 3.5503017902374268, 3.913135290145874, 4.275968551635742, 4.6388020515441895, 5.001635551452637, 5.364469051361084, 5.727302551269531, 6.09013557434082, 6.452969551086426, 6.815802574157715, 7.178636074066162, 7.541469573974609, 7.904303073883057, 8.267136573791504, 8.629969596862793, 8.992803573608398, 9.355636596679688, 9.718470573425293, 10.081303596496582, 10.444137573242188, 10.806970596313477]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 14.0, 28.0, 27.0, 40.0, 56.0, 94.0, 159.0, 312.0, 609.0, 1287.0, 3261.0, 10315.0, 47231.0, 416061.0, 2712647.0, 896600.0, 83283.0, 14597.0, 4264.0, 1553.0, 803.0, 409.0, 182.0, 134.0, 81.0, 42.0, 40.0, 31.0, 24.0, 21.0, 12.0, 11.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4270782470703125, -1.380523681640625, -1.3339691162109375, -1.28741455078125, -1.2408599853515625, -1.194305419921875, -1.1477508544921875, -1.1011962890625, -1.0546417236328125, -1.008087158203125, -0.9615325927734375, -0.91497802734375, -0.8684234619140625, -0.821868896484375, -0.7753143310546875, -0.728759765625, -0.6822052001953125, -0.635650634765625, -0.5890960693359375, -0.54254150390625, -0.4959869384765625, -0.449432373046875, -0.4028778076171875, -0.3563232421875, -0.3097686767578125, -0.263214111328125, -0.2166595458984375, -0.17010498046875, -0.1235504150390625, -0.076995849609375, -0.0304412841796875, 0.01611328125, 0.0626678466796875, 0.109222412109375, 0.1557769775390625, 0.20233154296875, 0.2488861083984375, 0.295440673828125, 0.3419952392578125, 0.3885498046875, 0.4351043701171875, 0.481658935546875, 0.5282135009765625, 0.57476806640625, 0.6213226318359375, 0.667877197265625, 0.7144317626953125, 0.760986328125, 0.8075408935546875, 0.854095458984375, 0.9006500244140625, 0.94720458984375, 0.9937591552734375, 1.040313720703125, 1.0868682861328125, 1.1334228515625, 1.1799774169921875, 1.226531982421875, 1.2730865478515625, 1.31964111328125, 1.3661956787109375, 1.412750244140625, 1.4593048095703125, 1.505859375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 15.0, 11.0, 9.0, 17.0, 14.0, 20.0, 21.0, 34.0, 29.0, 39.0, 38.0, 28.0, 22.0, 42.0, 72.0, 47.0, 47.0, 52.0, 42.0, 50.0, 36.0, 53.0, 29.0, 40.0, 32.0, 21.0, 24.0, 19.0, 11.0, 15.0, 11.0, 4.0, 10.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7490234375, -0.723480224609375, -0.69793701171875, -0.672393798828125, -0.6468505859375, -0.621307373046875, -0.59576416015625, -0.570220947265625, -0.544677734375, -0.519134521484375, -0.49359130859375, -0.468048095703125, -0.4425048828125, -0.416961669921875, -0.39141845703125, -0.365875244140625, -0.34033203125, -0.314788818359375, -0.28924560546875, -0.263702392578125, -0.2381591796875, -0.212615966796875, -0.18707275390625, -0.161529541015625, -0.135986328125, -0.110443115234375, -0.08489990234375, -0.059356689453125, -0.0338134765625, -0.008270263671875, 0.01727294921875, 0.042816162109375, 0.068359375, 0.093902587890625, 0.11944580078125, 0.144989013671875, 0.1705322265625, 0.196075439453125, 0.22161865234375, 0.247161865234375, 0.272705078125, 0.298248291015625, 0.32379150390625, 0.349334716796875, 0.3748779296875, 0.400421142578125, 0.42596435546875, 0.451507568359375, 0.47705078125, 0.502593994140625, 0.52813720703125, 0.553680419921875, 0.5792236328125, 0.604766845703125, 0.63031005859375, 0.655853271484375, 0.681396484375, 0.706939697265625, 0.73248291015625, 0.758026123046875, 0.7835693359375, 0.809112548828125, 0.83465576171875, 0.860198974609375, 0.8857421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 10.0, 5.0, 15.0, 22.0, 39.0, 64.0, 122.0, 196.0, 410.0, 986.0, 3867.0, 47146.0, 3791599.0, 336237.0, 10488.0, 1827.0, 612.0, 281.0, 123.0, 90.0, 48.0, 40.0, 23.0, 16.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2337646484375, -4.100341796875, -3.9669189453125, -3.83349609375, -3.7000732421875, -3.566650390625, -3.4332275390625, -3.2998046875, -3.1663818359375, -3.032958984375, -2.8995361328125, -2.76611328125, -2.6326904296875, -2.499267578125, -2.3658447265625, -2.232421875, -2.0989990234375, -1.965576171875, -1.8321533203125, -1.69873046875, -1.5653076171875, -1.431884765625, -1.2984619140625, -1.1650390625, -1.0316162109375, -0.898193359375, -0.7647705078125, -0.63134765625, -0.4979248046875, -0.364501953125, -0.2310791015625, -0.09765625, 0.0357666015625, 0.169189453125, 0.3026123046875, 0.43603515625, 0.5694580078125, 0.702880859375, 0.8363037109375, 0.9697265625, 1.1031494140625, 1.236572265625, 1.3699951171875, 1.50341796875, 1.6368408203125, 1.770263671875, 1.9036865234375, 2.037109375, 2.1705322265625, 2.303955078125, 2.4373779296875, 2.57080078125, 2.7042236328125, 2.837646484375, 2.9710693359375, 3.1044921875, 3.2379150390625, 3.371337890625, 3.5047607421875, 3.63818359375, 3.7716064453125, 3.905029296875, 4.0384521484375, 4.171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 10.0, 9.0, 30.0, 39.0, 50.0, 109.0, 201.0, 412.0, 729.0, 1025.0, 698.0, 321.0, 145.0, 101.0, 59.0, 37.0, 34.0, 19.0, 15.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.489471435546875, -3.39105224609375, -3.292633056640625, -3.1942138671875, -3.095794677734375, -2.99737548828125, -2.898956298828125, -2.800537109375, -2.702117919921875, -2.60369873046875, -2.505279541015625, -2.4068603515625, -2.308441162109375, -2.21002197265625, -2.111602783203125, -2.01318359375, -1.914764404296875, -1.81634521484375, -1.717926025390625, -1.6195068359375, -1.521087646484375, -1.42266845703125, -1.324249267578125, -1.225830078125, -1.127410888671875, -1.02899169921875, -0.930572509765625, -0.8321533203125, -0.733734130859375, -0.63531494140625, -0.536895751953125, -0.4384765625, -0.340057373046875, -0.24163818359375, -0.143218994140625, -0.0447998046875, 0.053619384765625, 0.15203857421875, 0.250457763671875, 0.348876953125, 0.447296142578125, 0.54571533203125, 0.644134521484375, 0.7425537109375, 0.840972900390625, 0.93939208984375, 1.037811279296875, 1.13623046875, 1.234649658203125, 1.33306884765625, 1.431488037109375, 1.5299072265625, 1.628326416015625, 1.72674560546875, 1.825164794921875, 1.923583984375, 2.022003173828125, 2.12042236328125, 2.218841552734375, 2.3172607421875, 2.415679931640625, 2.51409912109375, 2.612518310546875, 2.7109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 10.0, 10.0, 63.0, 165.0, 328.0, 260.0, 98.0, 38.0, 23.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.391866683959961, -7.300963878631592, -6.210061073303223, -5.119158744812012, -4.028255939483643, -2.9373531341552734, -1.8464508056640625, -0.7555480003356934, 0.3353548049926758, 1.4262574911117554, 2.517160177230835, 3.608062744140625, 4.698965549468994, 5.789868354797363, 6.880770683288574, 7.971673488616943, 9.062576293945312, 10.153478622436523, 11.24438190460205, 12.335284233093262, 13.426187515258789, 14.51708984375, 15.607992172241211, 16.698894500732422, 17.789798736572266, 18.880701065063477, 19.971603393554688, 21.06250762939453, 22.153409957885742, 23.244312286376953, 24.335214614868164, 25.426116943359375, 26.517017364501953, 27.607919692993164, 28.698822021484375, 29.78972625732422, 30.88062858581543, 31.97153091430664, 33.06243133544922, 34.15333557128906, 35.244239807128906, 36.33514404296875, 37.42604446411133, 38.51694869995117, 39.60784912109375, 40.698753356933594, 41.78965759277344, 42.880558013916016, 43.971458435058594, 45.06236267089844, 46.153263092041016, 47.24416732788086, 48.33506774902344, 49.42597198486328, 50.516876220703125, 51.6077766418457, 52.69868087768555, 53.78958511352539, 54.88048553466797, 55.97138977050781, 57.06229019165039, 58.153194427490234, 59.24409484863281, 60.334999084472656, 61.4259033203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 9.0, 10.0, 16.0, 22.0, 19.0, 27.0, 39.0, 34.0, 30.0, 38.0, 43.0, 49.0, 66.0, 60.0, 71.0, 48.0, 52.0, 48.0, 27.0, 31.0, 44.0, 32.0, 21.0, 19.0, 15.0, 22.0, 20.0, 6.0, 11.0, 8.0, 11.0, 6.0, 7.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.874604225158691, -8.557976722717285, -8.241349220275879, -7.924721717834473, -7.608094215393066, -7.29146671295166, -6.974839210510254, -6.658211708068848, -6.341584205627441, -6.024956703186035, -5.708329200744629, -5.391701698303223, -5.075074195861816, -4.75844669342041, -4.441819190979004, -4.125191688537598, -3.808563709259033, -3.491936206817627, -3.1753087043762207, -2.8586812019348145, -2.542053699493408, -2.225426197052002, -1.9087984561920166, -1.5921709537506104, -1.275543451309204, -0.9589159488677979, -0.6422883868217468, -0.3256608247756958, -0.00903332233428955, 0.3075941801071167, 0.6242218017578125, 0.9408493041992188, 1.257476806640625, 1.5741043090820312, 1.8907318115234375, 2.2073593139648438, 2.52398681640625, 2.8406143188476562, 3.1572420597076416, 3.473869562149048, 3.790497064590454, 4.1071248054504395, 4.423752307891846, 4.740379810333252, 5.057007312774658, 5.3736348152160645, 5.690262317657471, 6.006889820098877, 6.323517322540283, 6.6401448249816895, 6.956772327423096, 7.273399829864502, 7.590027332305908, 7.9066548347473145, 8.223282814025879, 8.539910316467285, 8.856537818908691, 9.173165321350098, 9.489792823791504, 9.80642032623291, 10.123047828674316, 10.439675331115723, 10.756302833557129, 11.072930335998535, 11.389557838439941]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 8.0, 13.0, 17.0, 16.0, 42.0, 58.0, 83.0, 109.0, 190.0, 303.0, 471.0, 834.0, 1569.0, 2864.0, 5573.0, 11376.0, 24068.0, 56065.0, 136507.0, 301432.0, 285810.0, 125160.0, 51384.0, 22589.0, 10510.0, 5279.0, 2669.0, 1408.0, 853.0, 483.0, 264.0, 175.0, 115.0, 72.0, 42.0, 33.0, 20.0, 24.0, 20.0, 12.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4873046875, -1.442169189453125, -1.39703369140625, -1.351898193359375, -1.3067626953125, -1.261627197265625, -1.21649169921875, -1.171356201171875, -1.126220703125, -1.081085205078125, -1.03594970703125, -0.990814208984375, -0.9456787109375, -0.900543212890625, -0.85540771484375, -0.810272216796875, -0.76513671875, -0.720001220703125, -0.67486572265625, -0.629730224609375, -0.5845947265625, -0.539459228515625, -0.49432373046875, -0.449188232421875, -0.404052734375, -0.358917236328125, -0.31378173828125, -0.268646240234375, -0.2235107421875, -0.178375244140625, -0.13323974609375, -0.088104248046875, -0.04296875, 0.002166748046875, 0.04730224609375, 0.092437744140625, 0.1375732421875, 0.182708740234375, 0.22784423828125, 0.272979736328125, 0.318115234375, 0.363250732421875, 0.40838623046875, 0.453521728515625, 0.4986572265625, 0.543792724609375, 0.58892822265625, 0.634063720703125, 0.67919921875, 0.724334716796875, 0.76947021484375, 0.814605712890625, 0.8597412109375, 0.904876708984375, 0.95001220703125, 0.995147705078125, 1.040283203125, 1.085418701171875, 1.13055419921875, 1.175689697265625, 1.2208251953125, 1.265960693359375, 1.31109619140625, 1.356231689453125, 1.4013671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 15.0, 10.0, 12.0, 21.0, 18.0, 27.0, 34.0, 40.0, 40.0, 39.0, 46.0, 59.0, 58.0, 53.0, 69.0, 56.0, 57.0, 44.0, 48.0, 36.0, 29.0, 30.0, 25.0, 21.0, 24.0, 22.0, 14.0, 13.0, 5.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9149322509765625, -0.882598876953125, -0.8502655029296875, -0.81793212890625, -0.7855987548828125, -0.753265380859375, -0.7209320068359375, -0.6885986328125, -0.6562652587890625, -0.623931884765625, -0.5915985107421875, -0.55926513671875, -0.5269317626953125, -0.494598388671875, -0.4622650146484375, -0.429931640625, -0.3975982666015625, -0.365264892578125, -0.3329315185546875, -0.30059814453125, -0.2682647705078125, -0.235931396484375, -0.2035980224609375, -0.1712646484375, -0.1389312744140625, -0.106597900390625, -0.0742645263671875, -0.04193115234375, -0.0095977783203125, 0.022735595703125, 0.0550689697265625, 0.08740234375, 0.1197357177734375, 0.152069091796875, 0.1844024658203125, 0.21673583984375, 0.2490692138671875, 0.281402587890625, 0.3137359619140625, 0.3460693359375, 0.3784027099609375, 0.410736083984375, 0.4430694580078125, 0.47540283203125, 0.5077362060546875, 0.540069580078125, 0.5724029541015625, 0.604736328125, 0.6370697021484375, 0.669403076171875, 0.7017364501953125, 0.73406982421875, 0.7664031982421875, 0.798736572265625, 0.8310699462890625, 0.8634033203125, 0.8957366943359375, 0.928070068359375, 0.9604034423828125, 0.99273681640625, 1.0250701904296875, 1.057403564453125, 1.0897369384765625, 1.1220703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 17.0, 18.0, 19.0, 20.0, 45.0, 52.0, 75.0, 90.0, 148.0, 192.0, 275.0, 391.0, 623.0, 996.0, 1964.0, 4341.0, 12916.0, 52197.0, 315146.0, 576936.0, 58262.0, 13878.0, 4670.0, 2081.0, 1078.0, 653.0, 404.0, 311.0, 206.0, 126.0, 106.0, 74.0, 61.0, 50.0, 24.0, 31.0, 19.0, 15.0, 6.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.537109375, -2.457916259765625, -2.37872314453125, -2.299530029296875, -2.2203369140625, -2.141143798828125, -2.06195068359375, -1.982757568359375, -1.903564453125, -1.824371337890625, -1.74517822265625, -1.665985107421875, -1.5867919921875, -1.507598876953125, -1.42840576171875, -1.349212646484375, -1.27001953125, -1.190826416015625, -1.11163330078125, -1.032440185546875, -0.9532470703125, -0.874053955078125, -0.79486083984375, -0.715667724609375, -0.636474609375, -0.557281494140625, -0.47808837890625, -0.398895263671875, -0.3197021484375, -0.240509033203125, -0.16131591796875, -0.082122802734375, -0.0029296875, 0.076263427734375, 0.15545654296875, 0.234649658203125, 0.3138427734375, 0.393035888671875, 0.47222900390625, 0.551422119140625, 0.630615234375, 0.709808349609375, 0.78900146484375, 0.868194580078125, 0.9473876953125, 1.026580810546875, 1.10577392578125, 1.184967041015625, 1.26416015625, 1.343353271484375, 1.42254638671875, 1.501739501953125, 1.5809326171875, 1.660125732421875, 1.73931884765625, 1.818511962890625, 1.897705078125, 1.976898193359375, 2.05609130859375, 2.135284423828125, 2.2144775390625, 2.293670654296875, 2.37286376953125, 2.452056884765625, 2.53125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 8.0, 6.0, 12.0, 11.0, 11.0, 16.0, 19.0, 21.0, 25.0, 23.0, 35.0, 34.0, 49.0, 44.0, 57.0, 49.0, 55.0, 65.0, 55.0, 57.0, 51.0, 35.0, 44.0, 25.0, 28.0, 26.0, 29.0, 14.0, 18.0, 15.0, 7.0, 8.0, 13.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.17578125, -3.07257080078125, -2.9693603515625, -2.86614990234375, -2.762939453125, -2.65972900390625, -2.5565185546875, -2.45330810546875, -2.35009765625, -2.24688720703125, -2.1436767578125, -2.04046630859375, -1.937255859375, -1.83404541015625, -1.7308349609375, -1.62762451171875, -1.5244140625, -1.42120361328125, -1.3179931640625, -1.21478271484375, -1.111572265625, -1.00836181640625, -0.9051513671875, -0.80194091796875, -0.69873046875, -0.59552001953125, -0.4923095703125, -0.38909912109375, -0.285888671875, -0.18267822265625, -0.0794677734375, 0.02374267578125, 0.126953125, 0.23016357421875, 0.3333740234375, 0.43658447265625, 0.539794921875, 0.64300537109375, 0.7462158203125, 0.84942626953125, 0.95263671875, 1.05584716796875, 1.1590576171875, 1.26226806640625, 1.365478515625, 1.46868896484375, 1.5718994140625, 1.67510986328125, 1.7783203125, 1.88153076171875, 1.9847412109375, 2.08795166015625, 2.191162109375, 2.29437255859375, 2.3975830078125, 2.50079345703125, 2.60400390625, 2.70721435546875, 2.8104248046875, 2.91363525390625, 3.016845703125, 3.12005615234375, 3.2232666015625, 3.32647705078125, 3.4296875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 6.0, 14.0, 23.0, 35.0, 47.0, 55.0, 102.0, 153.0, 338.0, 716.0, 1724.0, 6063.0, 33057.0, 325285.0, 633021.0, 37557.0, 6938.0, 1908.0, 709.0, 326.0, 177.0, 94.0, 48.0, 60.0, 28.0, 25.0, 13.0, 10.0, 5.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0245819091796875, -0.994476318359375, -0.9643707275390625, -0.93426513671875, -0.9041595458984375, -0.874053955078125, -0.8439483642578125, -0.8138427734375, -0.7837371826171875, -0.753631591796875, -0.7235260009765625, -0.69342041015625, -0.6633148193359375, -0.633209228515625, -0.6031036376953125, -0.572998046875, -0.5428924560546875, -0.512786865234375, -0.4826812744140625, -0.45257568359375, -0.4224700927734375, -0.392364501953125, -0.3622589111328125, -0.3321533203125, -0.3020477294921875, -0.271942138671875, -0.2418365478515625, -0.21173095703125, -0.1816253662109375, -0.151519775390625, -0.1214141845703125, -0.09130859375, -0.0612030029296875, -0.031097412109375, -0.0009918212890625, 0.02911376953125, 0.0592193603515625, 0.089324951171875, 0.1194305419921875, 0.1495361328125, 0.1796417236328125, 0.209747314453125, 0.2398529052734375, 0.26995849609375, 0.3000640869140625, 0.330169677734375, 0.3602752685546875, 0.390380859375, 0.4204864501953125, 0.450592041015625, 0.4806976318359375, 0.51080322265625, 0.5409088134765625, 0.571014404296875, 0.6011199951171875, 0.6312255859375, 0.6613311767578125, 0.691436767578125, 0.7215423583984375, 0.75164794921875, 0.7817535400390625, 0.811859130859375, 0.8419647216796875, 0.8720703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 8.0, 4.0, 12.0, 23.0, 34.0, 36.0, 30.0, 33.0, 67.0, 59.0, 93.0, 115.0, 94.0, 82.0, 70.0, 51.0, 41.0, 27.0, 25.0, 17.0, 14.0, 13.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002989768981933594, -0.00029057078063488007, -0.00028216466307640076, -0.00027375854551792145, -0.00026535242795944214, -0.00025694631040096283, -0.0002485401928424835, -0.0002401340752840042, -0.0002317279577255249, -0.0002233218401670456, -0.00021491572260856628, -0.00020650960505008698, -0.00019810348749160767, -0.00018969736993312836, -0.00018129125237464905, -0.00017288513481616974, -0.00016447901725769043, -0.00015607289969921112, -0.0001476667821407318, -0.0001392606645822525, -0.0001308545470237732, -0.00012244842946529388, -0.00011404231190681458, -0.00010563619434833527, -9.723007678985596e-05, -8.882395923137665e-05, -8.041784167289734e-05, -7.201172411441803e-05, -6.360560655593872e-05, -5.519948899745941e-05, -4.67933714389801e-05, -3.8387253880500793e-05, -2.9981136322021484e-05, -2.1575018763542175e-05, -1.3168901205062866e-05, -4.762783646583557e-06, 3.643333911895752e-06, 1.2049451470375061e-05, 2.045556902885437e-05, 2.886168658733368e-05, 3.726780414581299e-05, 4.56739217042923e-05, 5.4080039262771606e-05, 6.248615682125092e-05, 7.089227437973022e-05, 7.929839193820953e-05, 8.770450949668884e-05, 9.611062705516815e-05, 0.00010451674461364746, 0.00011292286217212677, 0.00012132897973060608, 0.0001297350972890854, 0.0001381412148475647, 0.000146547332406044, 0.00015495344996452332, 0.00016335956752300262, 0.00017176568508148193, 0.00018017180263996124, 0.00018857792019844055, 0.00019698403775691986, 0.00020539015531539917, 0.00021379627287387848, 0.0002222023904323578, 0.0002306085079908371, 0.0002390146255493164]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 11.0, 11.0, 14.0, 9.0, 26.0, 41.0, 50.0, 65.0, 104.0, 144.0, 232.0, 344.0, 629.0, 994.0, 1962.0, 4409.0, 12340.0, 46250.0, 215397.0, 643347.0, 88117.0, 21110.0, 6815.0, 2791.0, 1347.0, 752.0, 429.0, 262.0, 167.0, 125.0, 83.0, 44.0, 30.0, 26.0, 24.0, 11.0, 15.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.599609375, -0.5820846557617188, -0.5645599365234375, -0.5470352172851562, -0.529510498046875, -0.5119857788085938, -0.4944610595703125, -0.47693634033203125, -0.45941162109375, -0.44188690185546875, -0.4243621826171875, -0.40683746337890625, -0.389312744140625, -0.37178802490234375, -0.3542633056640625, -0.33673858642578125, -0.3192138671875, -0.30168914794921875, -0.2841644287109375, -0.26663970947265625, -0.249114990234375, -0.23159027099609375, -0.2140655517578125, -0.19654083251953125, -0.17901611328125, -0.16149139404296875, -0.1439666748046875, -0.12644195556640625, -0.108917236328125, -0.09139251708984375, -0.0738677978515625, -0.05634307861328125, -0.038818359375, -0.02129364013671875, -0.0037689208984375, 0.01375579833984375, 0.031280517578125, 0.04880523681640625, 0.0663299560546875, 0.08385467529296875, 0.10137939453125, 0.11890411376953125, 0.1364288330078125, 0.15395355224609375, 0.171478271484375, 0.18900299072265625, 0.2065277099609375, 0.22405242919921875, 0.2415771484375, 0.25910186767578125, 0.2766265869140625, 0.29415130615234375, 0.311676025390625, 0.32920074462890625, 0.3467254638671875, 0.36425018310546875, 0.38177490234375, 0.39929962158203125, 0.4168243408203125, 0.43434906005859375, 0.451873779296875, 0.46939849853515625, 0.4869232177734375, 0.5044479370117188, 0.52197265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 15.0, 10.0, 18.0, 21.0, 27.0, 22.0, 31.0, 34.0, 40.0, 42.0, 42.0, 55.0, 88.0, 57.0, 67.0, 62.0, 61.0, 37.0, 52.0, 31.0, 23.0, 23.0, 26.0, 15.0, 13.0, 8.0, 10.0, 11.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.6171875, -0.5996856689453125, -0.582183837890625, -0.5646820068359375, -0.54718017578125, -0.5296783447265625, -0.512176513671875, -0.4946746826171875, -0.4771728515625, -0.4596710205078125, -0.442169189453125, -0.4246673583984375, -0.40716552734375, -0.3896636962890625, -0.372161865234375, -0.3546600341796875, -0.337158203125, -0.3196563720703125, -0.302154541015625, -0.2846527099609375, -0.26715087890625, -0.2496490478515625, -0.232147216796875, -0.2146453857421875, -0.1971435546875, -0.1796417236328125, -0.162139892578125, -0.1446380615234375, -0.12713623046875, -0.1096343994140625, -0.092132568359375, -0.0746307373046875, -0.05712890625, -0.0396270751953125, -0.022125244140625, -0.0046234130859375, 0.01287841796875, 0.0303802490234375, 0.047882080078125, 0.0653839111328125, 0.0828857421875, 0.1003875732421875, 0.117889404296875, 0.1353912353515625, 0.15289306640625, 0.1703948974609375, 0.187896728515625, 0.2053985595703125, 0.222900390625, 0.2404022216796875, 0.257904052734375, 0.2754058837890625, 0.29290771484375, 0.3104095458984375, 0.327911376953125, 0.3454132080078125, 0.3629150390625, 0.3804168701171875, 0.397918701171875, 0.4154205322265625, 0.43292236328125, 0.4504241943359375, 0.467926025390625, 0.4854278564453125, 0.5029296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 6.0, 26.0, 23.0, 67.0, 158.0, 388.0, 162.0, 90.0, 39.0, 19.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.272552490234375, -31.393699645996094, -30.514846801757812, -29.63599395751953, -28.757139205932617, -27.878286361694336, -26.999433517456055, -26.120580673217773, -25.24172592163086, -24.362873077392578, -23.484020233154297, -22.605167388916016, -21.7263126373291, -20.84745979309082, -19.96860694885254, -19.089754104614258, -18.210901260375977, -17.332048416137695, -16.453195571899414, -15.574341773986816, -14.695487976074219, -13.816635131835938, -12.937782287597656, -12.058929443359375, -11.180075645446777, -10.301222801208496, -9.422369003295898, -8.543516159057617, -7.664662837982178, -6.785809516906738, -5.906956672668457, -5.028103351593018, -4.149250030517578, -3.2703967094421387, -2.3915436267852783, -1.512690544128418, -0.6338372230529785, 0.24501609802246094, 1.1238689422607422, 2.0027222633361816, 2.881575584411621, 3.7604289054870605, 4.6392822265625, 5.518135070800781, 6.396988391876221, 7.27584171295166, 8.154694557189941, 9.033548355102539, 9.91240119934082, 10.791254043579102, 11.6701078414917, 12.54896068572998, 13.427814483642578, 14.30666732788086, 15.18552017211914, 16.064373016357422, 16.943225860595703, 17.822078704833984, 18.700931549072266, 19.579784393310547, 20.45863914489746, 21.337491989135742, 22.216344833374023, 23.095197677612305, 23.97405242919922]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 11.0, 13.0, 13.0, 14.0, 24.0, 27.0, 37.0, 26.0, 32.0, 29.0, 49.0, 78.0, 175.0, 137.0, 46.0, 39.0, 39.0, 31.0, 31.0, 17.0, 25.0, 16.0, 17.0, 17.0, 11.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.693618774414062, -13.216774940490723, -12.739931106567383, -12.26308822631836, -11.78624439239502, -11.30940055847168, -10.83255672454834, -10.355712890625, -9.878870010375977, -9.402026176452637, -8.925182342529297, -8.448339462280273, -7.971495628356934, -7.494651794433594, -7.017807960510254, -6.540964603424072, -6.064120769500732, -5.587276935577393, -5.110433578491211, -4.633589744567871, -4.1567463874816895, -3.6799025535583496, -3.203058958053589, -2.726215362548828, -2.2493717670440674, -1.7725281715393066, -1.295684576034546, -0.8188408613204956, -0.34199726581573486, 0.13484644889831543, 0.6116900444030762, 1.088533639907837, 1.5653772354125977, 2.0422208309173584, 2.519064426422119, 2.995908260345459, 3.4727516174316406, 3.9495954513549805, 4.42643928527832, 4.903282642364502, 5.380125999450684, 5.856969833374023, 6.333813190460205, 6.810657024383545, 7.287500381469727, 7.764344215393066, 8.241188049316406, 8.71803092956543, 9.194875717163086, 9.671719551086426, 10.148563385009766, 10.625406265258789, 11.102250099182129, 11.579093933105469, 12.055937767028809, 12.532781600952148, 13.009624481201172, 13.486468315124512, 13.963312149047852, 14.440155029296875, 14.916998863220215, 15.393842697143555, 15.870686531066895, 16.347530364990234, 16.824373245239258]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 12.0, 10.0, 16.0, 12.0, 22.0, 32.0, 52.0, 82.0, 133.0, 225.0, 320.0, 495.0, 932.0, 1581.0, 3039.0, 6469.0, 16811.0, 51803.0, 197820.0, 818904.0, 1835094.0, 945474.0, 227536.0, 55396.0, 17473.0, 6934.0, 3294.0, 1640.0, 968.0, 559.0, 382.0, 258.0, 142.0, 117.0, 74.0, 41.0, 23.0, 20.0, 18.0, 14.0, 5.0, 11.0, 12.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.267578125, -1.2274017333984375, -1.187225341796875, -1.1470489501953125, -1.10687255859375, -1.0666961669921875, -1.026519775390625, -0.9863433837890625, -0.9461669921875, -0.9059906005859375, -0.865814208984375, -0.8256378173828125, -0.78546142578125, -0.7452850341796875, -0.705108642578125, -0.6649322509765625, -0.624755859375, -0.5845794677734375, -0.544403076171875, -0.5042266845703125, -0.46405029296875, -0.4238739013671875, -0.383697509765625, -0.3435211181640625, -0.3033447265625, -0.2631683349609375, -0.222991943359375, -0.1828155517578125, -0.14263916015625, -0.1024627685546875, -0.062286376953125, -0.0221099853515625, 0.01806640625, 0.0582427978515625, 0.098419189453125, 0.1385955810546875, 0.17877197265625, 0.2189483642578125, 0.259124755859375, 0.2993011474609375, 0.3394775390625, 0.3796539306640625, 0.419830322265625, 0.4600067138671875, 0.50018310546875, 0.5403594970703125, 0.580535888671875, 0.6207122802734375, 0.660888671875, 0.7010650634765625, 0.741241455078125, 0.7814178466796875, 0.82159423828125, 0.8617706298828125, 0.901947021484375, 0.9421234130859375, 0.9822998046875, 1.0224761962890625, 1.062652587890625, 1.1028289794921875, 1.14300537109375, 1.1831817626953125, 1.223358154296875, 1.2635345458984375, 1.3037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 11.0, 18.0, 20.0, 27.0, 25.0, 23.0, 29.0, 46.0, 41.0, 51.0, 53.0, 60.0, 50.0, 65.0, 52.0, 49.0, 44.0, 48.0, 41.0, 34.0, 40.0, 31.0, 28.0, 14.0, 15.0, 12.0, 14.0, 11.0, 9.0, 8.0, 2.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6739730834960938, -0.6453094482421875, -0.6166458129882812, -0.587982177734375, -0.5593185424804688, -0.5306549072265625, -0.5019912719726562, -0.47332763671875, -0.44466400146484375, -0.4160003662109375, -0.38733673095703125, -0.358673095703125, -0.33000946044921875, -0.3013458251953125, -0.27268218994140625, -0.2440185546875, -0.21535491943359375, -0.1866912841796875, -0.15802764892578125, -0.129364013671875, -0.10070037841796875, -0.0720367431640625, -0.04337310791015625, -0.01470947265625, 0.01395416259765625, 0.0426177978515625, 0.07128143310546875, 0.099945068359375, 0.12860870361328125, 0.1572723388671875, 0.18593597412109375, 0.214599609375, 0.24326324462890625, 0.2719268798828125, 0.30059051513671875, 0.329254150390625, 0.35791778564453125, 0.3865814208984375, 0.41524505615234375, 0.44390869140625, 0.47257232666015625, 0.5012359619140625, 0.5298995971679688, 0.558563232421875, 0.5872268676757812, 0.6158905029296875, 0.6445541381835938, 0.6732177734375, 0.7018814086914062, 0.7305450439453125, 0.7592086791992188, 0.787872314453125, 0.8165359497070312, 0.8451995849609375, 0.8738632202148438, 0.90252685546875, 0.9311904907226562, 0.9598541259765625, 0.9885177612304688, 1.017181396484375, 1.0458450317382812, 1.0745086669921875, 1.1031723022460938, 1.1318359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 11.0, 10.0, 20.0, 43.0, 68.0, 153.0, 251.0, 628.0, 1675.0, 6606.0, 123414.0, 4012209.0, 42145.0, 4498.0, 1388.0, 561.0, 244.0, 138.0, 68.0, 44.0, 26.0, 20.0, 13.0, 7.0, 5.0, 4.0, 6.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.23724365234375, -6.0174560546875, -5.79766845703125, -5.577880859375, -5.35809326171875, -5.1383056640625, -4.91851806640625, -4.69873046875, -4.47894287109375, -4.2591552734375, -4.03936767578125, -3.819580078125, -3.59979248046875, -3.3800048828125, -3.16021728515625, -2.9404296875, -2.72064208984375, -2.5008544921875, -2.28106689453125, -2.061279296875, -1.84149169921875, -1.6217041015625, -1.40191650390625, -1.18212890625, -0.96234130859375, -0.7425537109375, -0.52276611328125, -0.302978515625, -0.08319091796875, 0.1365966796875, 0.35638427734375, 0.576171875, 0.79595947265625, 1.0157470703125, 1.23553466796875, 1.455322265625, 1.67510986328125, 1.8948974609375, 2.11468505859375, 2.33447265625, 2.55426025390625, 2.7740478515625, 2.99383544921875, 3.213623046875, 3.43341064453125, 3.6531982421875, 3.87298583984375, 4.0927734375, 4.31256103515625, 4.5323486328125, 4.75213623046875, 4.971923828125, 5.19171142578125, 5.4114990234375, 5.63128662109375, 5.85107421875, 6.07086181640625, 6.2906494140625, 6.51043701171875, 6.730224609375, 6.95001220703125, 7.1697998046875, 7.38958740234375, 7.609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 9.0, 13.0, 14.0, 24.0, 34.0, 37.0, 68.0, 92.0, 154.0, 194.0, 322.0, 444.0, 616.0, 615.0, 463.0, 317.0, 221.0, 138.0, 79.0, 77.0, 34.0, 22.0, 34.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -1.978363037109375, -1.86883544921875, -1.759307861328125, -1.6497802734375, -1.540252685546875, -1.43072509765625, -1.321197509765625, -1.211669921875, -1.102142333984375, -0.99261474609375, -0.883087158203125, -0.7735595703125, -0.664031982421875, -0.55450439453125, -0.444976806640625, -0.33544921875, -0.225921630859375, -0.11639404296875, -0.006866455078125, 0.1026611328125, 0.212188720703125, 0.32171630859375, 0.431243896484375, 0.540771484375, 0.650299072265625, 0.75982666015625, 0.869354248046875, 0.9788818359375, 1.088409423828125, 1.19793701171875, 1.307464599609375, 1.4169921875, 1.526519775390625, 1.63604736328125, 1.745574951171875, 1.8551025390625, 1.964630126953125, 2.07415771484375, 2.183685302734375, 2.293212890625, 2.402740478515625, 2.51226806640625, 2.621795654296875, 2.7313232421875, 2.840850830078125, 2.95037841796875, 3.059906005859375, 3.16943359375, 3.278961181640625, 3.38848876953125, 3.498016357421875, 3.6075439453125, 3.717071533203125, 3.82659912109375, 3.936126708984375, 4.045654296875, 4.155181884765625, 4.26470947265625, 4.374237060546875, 4.4837646484375, 4.593292236328125, 4.70281982421875, 4.812347412109375, 4.921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 8.0, 6.0, 17.0, 43.0, 89.0, 212.0, 333.0, 173.0, 66.0, 33.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6939582824707, -32.69845199584961, -30.70294761657715, -28.707443237304688, -26.711936950683594, -24.716432571411133, -22.720928192138672, -20.725421905517578, -18.729917526245117, -16.734413146972656, -14.738906860351562, -12.743402481079102, -10.747897148132324, -8.752391815185547, -6.756887435913086, -4.761382102966309, -2.7658767700195312, -0.770371675491333, 1.2251334190368652, 3.2206382751464844, 5.216143608093262, 7.211648941040039, 9.2071533203125, 11.202658653259277, 13.198163986206055, 15.193669319152832, 17.18917465209961, 19.18467903137207, 21.18018341064453, 23.175689697265625, 25.171194076538086, 27.166698455810547, 29.162208557128906, 31.157712936401367, 33.15321731567383, 35.14872360229492, 37.144229888916016, 39.139732360839844, 41.13523864746094, 43.13074493408203, 45.126251220703125, 47.12175750732422, 49.11725997924805, 51.11276626586914, 53.108272552490234, 55.10377502441406, 57.099281311035156, 59.09478759765625, 61.09029006958008, 63.08579635620117, 65.081298828125, 67.0768051147461, 69.07231140136719, 71.06781768798828, 73.06332397460938, 75.05882263183594, 77.05432891845703, 79.04983520507812, 81.04534149169922, 83.04084777832031, 85.03634643554688, 87.03185272216797, 89.02735900878906, 91.02286529541016, 93.01837158203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 11.0, 13.0, 16.0, 13.0, 21.0, 18.0, 20.0, 19.0, 34.0, 38.0, 36.0, 36.0, 36.0, 58.0, 76.0, 69.0, 69.0, 47.0, 51.0, 39.0, 37.0, 43.0, 19.0, 25.0, 21.0, 20.0, 19.0, 15.0, 10.0, 13.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.473234176635742, -19.86264419555664, -19.25205421447754, -18.641464233398438, -18.030874252319336, -17.420284271240234, -16.809694290161133, -16.19910430908203, -15.588515281677246, -14.977925300598145, -14.367335319519043, -13.756745338439941, -13.146156311035156, -12.535566329956055, -11.924976348876953, -11.314386367797852, -10.70379638671875, -10.093206405639648, -9.482616424560547, -8.872026443481445, -8.261436462402344, -7.6508469581604, -7.040257453918457, -6.4296674728393555, -5.819077491760254, -5.208487510681152, -4.597897529602051, -3.9873080253601074, -3.376718044281006, -2.7661280632019043, -2.155538320541382, -1.5449485778808594, -0.934356689453125, -0.323766827583313, 0.286823034286499, 0.897412896156311, 1.508002758026123, 2.1185927391052246, 2.729182481765747, 3.3397722244262695, 3.950362205505371, 4.560952186584473, 5.171542167663574, 5.782131671905518, 6.392721652984619, 7.003311634063721, 7.613901138305664, 8.224491119384766, 8.835081100463867, 9.445671081542969, 10.05626106262207, 10.666851043701172, 11.277441024780273, 11.888031005859375, 12.49862003326416, 13.109210014343262, 13.719799995422363, 14.330389976501465, 14.940979957580566, 15.551569938659668, 16.162158966064453, 16.772748947143555, 17.383338928222656, 17.993928909301758, 18.60451889038086]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 8.0, 9.0, 15.0, 16.0, 30.0, 37.0, 54.0, 101.0, 171.0, 376.0, 809.0, 2093.0, 5788.0, 19708.0, 92192.0, 635707.0, 234704.0, 40599.0, 10328.0, 3371.0, 1298.0, 532.0, 249.0, 138.0, 89.0, 45.0, 29.0, 18.0, 13.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.828125, -2.739044189453125, -2.64996337890625, -2.560882568359375, -2.4718017578125, -2.382720947265625, -2.29364013671875, -2.204559326171875, -2.115478515625, -2.026397705078125, -1.93731689453125, -1.848236083984375, -1.7591552734375, -1.670074462890625, -1.58099365234375, -1.491912841796875, -1.40283203125, -1.313751220703125, -1.22467041015625, -1.135589599609375, -1.0465087890625, -0.957427978515625, -0.86834716796875, -0.779266357421875, -0.690185546875, -0.601104736328125, -0.51202392578125, -0.422943115234375, -0.3338623046875, -0.244781494140625, -0.15570068359375, -0.066619873046875, 0.0224609375, 0.111541748046875, 0.20062255859375, 0.289703369140625, 0.3787841796875, 0.467864990234375, 0.55694580078125, 0.646026611328125, 0.735107421875, 0.824188232421875, 0.91326904296875, 1.002349853515625, 1.0914306640625, 1.180511474609375, 1.26959228515625, 1.358673095703125, 1.44775390625, 1.536834716796875, 1.62591552734375, 1.714996337890625, 1.8040771484375, 1.893157958984375, 1.98223876953125, 2.071319580078125, 2.160400390625, 2.249481201171875, 2.33856201171875, 2.427642822265625, 2.5167236328125, 2.605804443359375, 2.69488525390625, 2.783966064453125, 2.873046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 7.0, 13.0, 22.0, 24.0, 34.0, 35.0, 44.0, 55.0, 71.0, 82.0, 71.0, 81.0, 66.0, 67.0, 58.0, 56.0, 47.0, 34.0, 30.0, 25.0, 18.0, 17.0, 11.0, 10.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.4566497802734375, -1.405487060546875, -1.3543243408203125, -1.30316162109375, -1.2519989013671875, -1.200836181640625, -1.1496734619140625, -1.0985107421875, -1.0473480224609375, -0.996185302734375, -0.9450225830078125, -0.89385986328125, -0.8426971435546875, -0.791534423828125, -0.7403717041015625, -0.689208984375, -0.6380462646484375, -0.586883544921875, -0.5357208251953125, -0.48455810546875, -0.4333953857421875, -0.382232666015625, -0.3310699462890625, -0.2799072265625, -0.2287445068359375, -0.177581787109375, -0.1264190673828125, -0.07525634765625, -0.0240936279296875, 0.027069091796875, 0.0782318115234375, 0.12939453125, 0.1805572509765625, 0.231719970703125, 0.2828826904296875, 0.33404541015625, 0.3852081298828125, 0.436370849609375, 0.4875335693359375, 0.5386962890625, 0.5898590087890625, 0.641021728515625, 0.6921844482421875, 0.74334716796875, 0.7945098876953125, 0.845672607421875, 0.8968353271484375, 0.947998046875, 0.9991607666015625, 1.050323486328125, 1.1014862060546875, 1.15264892578125, 1.2038116455078125, 1.254974365234375, 1.3061370849609375, 1.3572998046875, 1.4084625244140625, 1.459625244140625, 1.5107879638671875, 1.56195068359375, 1.6131134033203125, 1.664276123046875, 1.7154388427734375, 1.7666015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 7.0, 8.0, 5.0, 8.0, 13.0, 14.0, 29.0, 34.0, 60.0, 83.0, 112.0, 213.0, 286.0, 515.0, 1015.0, 2383.0, 7031.0, 31743.0, 700090.0, 266509.0, 27463.0, 6460.0, 2163.0, 967.0, 505.0, 279.0, 191.0, 111.0, 88.0, 51.0, 32.0, 25.0, 16.0, 9.0, 8.0, 5.0, 5.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1015625, -3.01531982421875, -2.9290771484375, -2.84283447265625, -2.756591796875, -2.67034912109375, -2.5841064453125, -2.49786376953125, -2.41162109375, -2.32537841796875, -2.2391357421875, -2.15289306640625, -2.066650390625, -1.98040771484375, -1.8941650390625, -1.80792236328125, -1.7216796875, -1.63543701171875, -1.5491943359375, -1.46295166015625, -1.376708984375, -1.29046630859375, -1.2042236328125, -1.11798095703125, -1.03173828125, -0.94549560546875, -0.8592529296875, -0.77301025390625, -0.686767578125, -0.60052490234375, -0.5142822265625, -0.42803955078125, -0.341796875, -0.25555419921875, -0.1693115234375, -0.08306884765625, 0.003173828125, 0.08941650390625, 0.1756591796875, 0.26190185546875, 0.34814453125, 0.43438720703125, 0.5206298828125, 0.60687255859375, 0.693115234375, 0.77935791015625, 0.8656005859375, 0.95184326171875, 1.0380859375, 1.12432861328125, 1.2105712890625, 1.29681396484375, 1.383056640625, 1.46929931640625, 1.5555419921875, 1.64178466796875, 1.72802734375, 1.81427001953125, 1.9005126953125, 1.98675537109375, 2.072998046875, 2.15924072265625, 2.2454833984375, 2.33172607421875, 2.41796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 6.0, 12.0, 11.0, 14.0, 11.0, 11.0, 20.0, 18.0, 14.0, 19.0, 28.0, 29.0, 28.0, 56.0, 58.0, 62.0, 76.0, 78.0, 59.0, 56.0, 48.0, 42.0, 35.0, 21.0, 16.0, 18.0, 20.0, 15.0, 18.0, 12.0, 16.0, 12.0, 13.0, 7.0, 7.0, 2.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-4.78515625, -4.65924072265625, -4.5333251953125, -4.40740966796875, -4.281494140625, -4.15557861328125, -4.0296630859375, -3.90374755859375, -3.77783203125, -3.65191650390625, -3.5260009765625, -3.40008544921875, -3.274169921875, -3.14825439453125, -3.0223388671875, -2.89642333984375, -2.7705078125, -2.64459228515625, -2.5186767578125, -2.39276123046875, -2.266845703125, -2.14093017578125, -2.0150146484375, -1.88909912109375, -1.76318359375, -1.63726806640625, -1.5113525390625, -1.38543701171875, -1.259521484375, -1.13360595703125, -1.0076904296875, -0.88177490234375, -0.755859375, -0.62994384765625, -0.5040283203125, -0.37811279296875, -0.252197265625, -0.12628173828125, -0.0003662109375, 0.12554931640625, 0.25146484375, 0.37738037109375, 0.5032958984375, 0.62921142578125, 0.755126953125, 0.88104248046875, 1.0069580078125, 1.13287353515625, 1.2587890625, 1.38470458984375, 1.5106201171875, 1.63653564453125, 1.762451171875, 1.88836669921875, 2.0142822265625, 2.14019775390625, 2.26611328125, 2.39202880859375, 2.5179443359375, 2.64385986328125, 2.769775390625, 2.89569091796875, 3.0216064453125, 3.14752197265625, 3.2734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 15.0, 16.0, 16.0, 26.0, 34.0, 36.0, 60.0, 89.0, 135.0, 253.0, 520.0, 1129.0, 3118.0, 10839.0, 54129.0, 886679.0, 72276.0, 12830.0, 3697.0, 1282.0, 597.0, 286.0, 156.0, 86.0, 74.0, 39.0, 29.0, 24.0, 7.0, 15.0, 13.0, 10.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.6442337036132812, -0.6190338134765625, -0.5938339233398438, -0.568634033203125, -0.5434341430664062, -0.5182342529296875, -0.49303436279296875, -0.46783447265625, -0.44263458251953125, -0.4174346923828125, -0.39223480224609375, -0.367034912109375, -0.34183502197265625, -0.3166351318359375, -0.29143524169921875, -0.2662353515625, -0.24103546142578125, -0.2158355712890625, -0.19063568115234375, -0.165435791015625, -0.14023590087890625, -0.1150360107421875, -0.08983612060546875, -0.06463623046875, -0.03943634033203125, -0.0142364501953125, 0.01096343994140625, 0.036163330078125, 0.06136322021484375, 0.0865631103515625, 0.11176300048828125, 0.136962890625, 0.16216278076171875, 0.1873626708984375, 0.21256256103515625, 0.237762451171875, 0.26296234130859375, 0.2881622314453125, 0.31336212158203125, 0.33856201171875, 0.36376190185546875, 0.3889617919921875, 0.41416168212890625, 0.439361572265625, 0.46456146240234375, 0.4897613525390625, 0.5149612426757812, 0.5401611328125, 0.5653610229492188, 0.5905609130859375, 0.6157608032226562, 0.640960693359375, 0.6661605834960938, 0.6913604736328125, 0.7165603637695312, 0.74176025390625, 0.7669601440429688, 0.7921600341796875, 0.8173599243164062, 0.842559814453125, 0.8677597045898438, 0.8929595947265625, 0.9181594848632812, 0.943359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 2.0, 8.0, 4.0, 20.0, 15.0, 30.0, 33.0, 58.0, 74.0, 103.0, 146.0, 143.0, 95.0, 60.0, 54.0, 26.0, 27.0, 20.0, 17.0, 6.0, 11.0, 12.0, 3.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003075599670410156, -0.00029921717941761017, -0.0002908743917942047, -0.00028253160417079926, -0.0002741888165473938, -0.00026584602892398834, -0.0002575032413005829, -0.00024916045367717743, -0.00024081766605377197, -0.00023247487843036652, -0.00022413209080696106, -0.0002157893031835556, -0.00020744651556015015, -0.0001991037279367447, -0.00019076094031333923, -0.00018241815268993378, -0.00017407536506652832, -0.00016573257744312286, -0.0001573897898197174, -0.00014904700219631195, -0.0001407042145729065, -0.00013236142694950104, -0.00012401863932609558, -0.00011567585170269012, -0.00010733306407928467, -9.899027645587921e-05, -9.064748883247375e-05, -8.23047012090683e-05, -7.396191358566284e-05, -6.561912596225739e-05, -5.727633833885193e-05, -4.893355071544647e-05, -4.0590763092041016e-05, -3.224797546863556e-05, -2.3905187845230103e-05, -1.5562400221824646e-05, -7.2196125984191895e-06, 1.123175024986267e-06, 9.465962648391724e-06, 1.780875027179718e-05, 2.6151537895202637e-05, 3.449432551860809e-05, 4.283711314201355e-05, 5.1179900765419006e-05, 5.952268838882446e-05, 6.786547601222992e-05, 7.620826363563538e-05, 8.455105125904083e-05, 9.289383888244629e-05, 0.00010123662650585175, 0.0001095794141292572, 0.00011792220175266266, 0.00012626498937606812, 0.00013460777699947357, 0.00014295056462287903, 0.00015129335224628448, 0.00015963613986968994, 0.0001679789274930954, 0.00017632171511650085, 0.0001846645027399063, 0.00019300729036331177, 0.00020135007798671722, 0.00020969286561012268, 0.00021803565323352814, 0.0002263784408569336]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 11.0, 14.0, 25.0, 50.0, 90.0, 198.0, 452.0, 1354.0, 4828.0, 27074.0, 890518.0, 108929.0, 10966.0, 2560.0, 822.0, 311.0, 155.0, 73.0, 37.0, 23.0, 18.0, 4.0, 4.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8313751220703125, -0.804351806640625, -0.7773284912109375, -0.75030517578125, -0.7232818603515625, -0.696258544921875, -0.6692352294921875, -0.6422119140625, -0.6151885986328125, -0.588165283203125, -0.5611419677734375, -0.53411865234375, -0.5070953369140625, -0.480072021484375, -0.4530487060546875, -0.426025390625, -0.3990020751953125, -0.371978759765625, -0.3449554443359375, -0.31793212890625, -0.2909088134765625, -0.263885498046875, -0.2368621826171875, -0.2098388671875, -0.1828155517578125, -0.155792236328125, -0.1287689208984375, -0.10174560546875, -0.0747222900390625, -0.047698974609375, -0.0206756591796875, 0.00634765625, 0.0333709716796875, 0.060394287109375, 0.0874176025390625, 0.11444091796875, 0.1414642333984375, 0.168487548828125, 0.1955108642578125, 0.2225341796875, 0.2495574951171875, 0.276580810546875, 0.3036041259765625, 0.33062744140625, 0.3576507568359375, 0.384674072265625, 0.4116973876953125, 0.438720703125, 0.4657440185546875, 0.492767333984375, 0.5197906494140625, 0.54681396484375, 0.5738372802734375, 0.600860595703125, 0.6278839111328125, 0.6549072265625, 0.6819305419921875, 0.708953857421875, 0.7359771728515625, 0.76300048828125, 0.7900238037109375, 0.817047119140625, 0.8440704345703125, 0.87109375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 11.0, 9.0, 24.0, 26.0, 42.0, 71.0, 122.0, 212.0, 167.0, 101.0, 62.0, 44.0, 25.0, 19.0, 11.0, 11.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7747116088867188, -0.7422943115234375, -0.7098770141601562, -0.677459716796875, -0.6450424194335938, -0.6126251220703125, -0.5802078247070312, -0.54779052734375, -0.5153732299804688, -0.4829559326171875, -0.45053863525390625, -0.418121337890625, -0.38570404052734375, -0.3532867431640625, -0.32086944580078125, -0.2884521484375, -0.25603485107421875, -0.2236175537109375, -0.19120025634765625, -0.158782958984375, -0.12636566162109375, -0.0939483642578125, -0.06153106689453125, -0.02911376953125, 0.00330352783203125, 0.0357208251953125, 0.06813812255859375, 0.100555419921875, 0.13297271728515625, 0.1653900146484375, 0.19780731201171875, 0.230224609375, 0.26264190673828125, 0.2950592041015625, 0.32747650146484375, 0.359893798828125, 0.39231109619140625, 0.4247283935546875, 0.45714569091796875, 0.48956298828125, 0.5219802856445312, 0.5543975830078125, 0.5868148803710938, 0.619232177734375, 0.6516494750976562, 0.6840667724609375, 0.7164840698242188, 0.7489013671875, 0.7813186645507812, 0.8137359619140625, 0.8461532592773438, 0.878570556640625, 0.9109878540039062, 0.9434051513671875, 0.9758224487304688, 1.00823974609375, 1.0406570434570312, 1.0730743408203125, 1.1054916381835938, 1.137908935546875, 1.1703262329101562, 1.2027435302734375, 1.2351608276367188, 1.267578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 9.0, 14.0, 47.0, 111.0, 365.0, 327.0, 72.0, 27.0, 16.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-60.41972351074219, -59.30076217651367, -58.18180465698242, -57.062843322753906, -55.943885803222656, -54.82492446899414, -53.705963134765625, -52.587005615234375, -51.46804428100586, -50.349082946777344, -49.230125427246094, -48.11116409301758, -46.99220275878906, -45.87324523925781, -44.7542839050293, -43.63532638549805, -42.51636505126953, -41.397403717041016, -40.278446197509766, -39.15948486328125, -38.04052734375, -36.921566009521484, -35.80260467529297, -34.68364715576172, -33.5646858215332, -32.44572448730469, -31.326766967773438, -30.207805633544922, -29.08884620666504, -27.969886779785156, -26.85092544555664, -25.731966018676758, -24.61301040649414, -23.494050979614258, -22.375091552734375, -21.25613021850586, -20.137170791625977, -19.018211364746094, -17.899250030517578, -16.780290603637695, -15.661331176757812, -14.54237174987793, -13.42341136932373, -12.304450988769531, -11.185491561889648, -10.066532135009766, -8.947571754455566, -7.828611850738525, -6.709651947021484, -5.590692043304443, -4.471732139587402, -3.3527722358703613, -2.2338123321533203, -1.1148524284362793, 0.004107475280761719, 1.1230673789978027, 2.2420272827148438, 3.3609871864318848, 4.479947090148926, 5.598906993865967, 6.717866897583008, 7.836826801300049, 8.95578670501709, 10.074747085571289, 11.193706512451172]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 6.0, 13.0, 13.0, 12.0, 15.0, 9.0, 23.0, 18.0, 36.0, 24.0, 19.0, 22.0, 44.0, 190.0, 248.0, 53.0, 28.0, 26.0, 25.0, 21.0, 28.0, 18.0, 16.0, 12.0, 7.0, 12.0, 5.0, 8.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.198326110839844, -11.779027938842773, -11.35973072052002, -10.94043254852295, -10.521134376525879, -10.101837158203125, -9.682538986206055, -9.263240814208984, -8.843942642211914, -8.424644470214844, -8.00534725189209, -7.5860490798950195, -7.166750907897949, -6.747453212738037, -6.328155517578125, -5.908857345581055, -5.489559650421143, -5.0702619552612305, -4.65096378326416, -4.231666088104248, -3.8123679161071777, -3.3930702209472656, -2.9737722873687744, -2.554474353790283, -2.135176420211792, -1.7158784866333008, -1.2965805530548096, -0.8772827386856079, -0.4579848051071167, -0.03868699073791504, 0.38061094284057617, 0.7999088764190674, 1.2192068099975586, 1.6385047435760498, 2.057802677154541, 2.477100372314453, 2.8963985443115234, 3.3156962394714355, 3.7349941730499268, 4.154292106628418, 4.573590278625488, 4.9928879737854, 5.412186145782471, 5.831483840942383, 6.250782012939453, 6.670079708099365, 7.089377403259277, 7.508675575256348, 7.92797327041626, 8.347270965576172, 8.766569137573242, 9.185867309570312, 9.605164527893066, 10.024462699890137, 10.443760871887207, 10.863058090209961, 11.282356262207031, 11.701654434204102, 12.120951652526855, 12.540249824523926, 12.959547996520996, 13.37884521484375, 13.79814338684082, 14.21744155883789, 14.636739730834961]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 10.0, 7.0, 15.0, 14.0, 13.0, 15.0, 17.0, 28.0, 22.0, 38.0, 29.0, 52.0, 67.0, 224.0, 119.0, 51.0, 37.0, 37.0, 32.0, 20.0, 16.0, 15.0, 22.0, 17.0, 11.0, 11.0, 13.0, 9.0, 3.0, 6.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7628860473632812, -0.7293853759765625, -0.6958847045898438, -0.662384033203125, -0.6288833618164062, -0.5953826904296875, -0.5618820190429688, -0.52838134765625, -0.49488067626953125, -0.4613800048828125, -0.42787933349609375, -0.394378662109375, -0.36087799072265625, -0.3273773193359375, -0.29387664794921875, -0.2603759765625, -0.22687530517578125, -0.1933746337890625, -0.15987396240234375, -0.126373291015625, -0.09287261962890625, -0.0593719482421875, -0.02587127685546875, 0.00762939453125, 0.04113006591796875, 0.0746307373046875, 0.10813140869140625, 0.141632080078125, 0.17513275146484375, 0.2086334228515625, 0.24213409423828125, 0.275634765625, 0.30913543701171875, 0.3426361083984375, 0.37613677978515625, 0.409637451171875, 0.44313812255859375, 0.4766387939453125, 0.5101394653320312, 0.54364013671875, 0.5771408081054688, 0.6106414794921875, 0.6441421508789062, 0.677642822265625, 0.7111434936523438, 0.7446441650390625, 0.7781448364257812, 0.8116455078125, 0.8451461791992188, 0.8786468505859375, 0.9121475219726562, 0.945648193359375, 0.9791488647460938, 1.0126495361328125, 1.0461502075195312, 1.07965087890625, 1.1131515502929688, 1.1466522216796875, 1.1801528930664062, 1.213653564453125, 1.2471542358398438, 1.2806549072265625, 1.3141555786132812, 1.34765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 14.0, 14.0, 14.0, 15.0, 8.0, 18.0, 36.0, 60.0, 132.0, 238.0, 492.0, 1477.0, 5672.0, 196711.0, 8174326.0, 6720.0, 1600.0, 539.0, 207.0, 120.0, 68.0, 26.0, 25.0, 18.0, 10.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.052157402038574, -12.690153121948242, -12.328149795532227, -11.966145515441895, -11.604141235351562, -11.24213695526123, -10.880132675170898, -10.518129348754883, -10.15612506866455, -9.794120788574219, -9.432117462158203, -9.070113182067871, -8.708108901977539, -8.346104621887207, -7.984100818634033, -7.622097015380859, -7.260092735290527, -6.898088455200195, -6.5360846519470215, -6.174080848693848, -5.812076568603516, -5.450072288513184, -5.08806848526001, -4.726064682006836, -4.364060401916504, -4.002056121826172, -3.640052318572998, -3.278048276901245, -2.916044235229492, -2.5540401935577393, -2.1920361518859863, -1.8300321102142334, -1.4680290222167969, -1.106024980545044, -0.744020938873291, -0.3820168972015381, -0.020012855529785156, 0.3419911861419678, 0.7039952278137207, 1.0659992694854736, 1.4280033111572266, 1.7900073528289795, 2.1520113945007324, 2.5140154361724854, 2.8760194778442383, 3.238023519515991, 3.600027561187744, 3.962031602859497, 4.32403564453125, 4.686039924621582, 5.048043727874756, 5.41004753112793, 5.772051811218262, 6.134056091308594, 6.496059894561768, 6.858063697814941, 7.220067977905273, 7.5820722579956055, 7.944076061248779, 8.306079864501953, 8.668084144592285, 9.030088424682617, 9.392091751098633, 9.754096031188965, 10.116100311279297]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 1.0, 4.0, 6.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 2.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.049534797668457, -10.772295951843262, -10.495057106018066, -10.217818260192871, -9.940579414367676, -9.66334056854248, -9.386101722717285, -9.108863830566406, -8.831624984741211, -8.554386138916016, -8.27714729309082, -7.999908447265625, -7.72266960144043, -7.445430755615234, -7.168192386627197, -6.890953540802002, -6.613714218139648, -6.336475372314453, -6.059236526489258, -5.7819976806640625, -5.504758834838867, -5.227519989013672, -4.950281620025635, -4.6730427742004395, -4.395803928375244, -4.118565082550049, -3.8413262367248535, -3.5640876293182373, -3.286848783493042, -3.0096099376678467, -2.7323713302612305, -2.455132484436035, -2.177894115447998, -1.9006552696228027, -1.623416543006897, -1.3461778163909912, -1.068938970565796, -0.7917001247406006, -0.5144613981246948, -0.23722267150878906, 0.04001617431640625, 0.3172549605369568, 0.5944937467575073, 0.8717325329780579, 1.1489713191986084, 1.4262101650238037, 1.7034488916397095, 1.9806876182556152, 2.2579264640808105, 2.535165309906006, 2.812404155731201, 3.0896427631378174, 3.3668816089630127, 3.644120454788208, 3.921359062194824, 4.1985979080200195, 4.475836753845215, 4.75307559967041, 5.0303144454956055, 5.307553291320801, 5.584792137145996, 5.862030982971191, 6.1392693519592285, 6.416508197784424, 6.693747043609619]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 7.0, 10.0, 14.0, 32.0, 38.0, 68.0, 105.0, 212.0, 637.0, 2515.0, 15599.0, 145855.0, 313839.0, 38476.0, 5139.0, 1059.0, 343.0, 129.0, 73.0, 40.0, 22.0, 18.0, 6.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.09375, -13.51171875, -12.9296875, -12.34765625, -11.765625, -11.18359375, -10.6015625, -10.01953125, -9.4375, -8.85546875, -8.2734375, -7.69140625, -7.109375, -6.52734375, -5.9453125, -5.36328125, -4.78125, -4.19921875, -3.6171875, -3.03515625, -2.453125, -1.87109375, -1.2890625, -0.70703125, -0.125, 0.45703125, 1.0390625, 1.62109375, 2.203125, 2.78515625, 3.3671875, 3.94921875, 4.53125, 5.11328125, 5.6953125, 6.27734375, 6.859375, 7.44140625, 8.0234375, 8.60546875, 9.1875, 9.76953125, 10.3515625, 10.93359375, 11.515625, 12.09765625, 12.6796875, 13.26171875, 13.84375, 14.42578125, 15.0078125, 15.58984375, 16.171875, 16.75390625, 17.3359375, 17.91796875, 18.5, 19.08203125, 19.6640625, 20.24609375, 20.828125, 21.41015625, 21.9921875, 22.57421875, 23.15625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 18.0, 20.0, 17.0, 29.0, 39.0, 44.0, 54.0, 68.0, 75.0, 84.0, 88.0, 68.0, 78.0, 65.0, 51.0, 36.0, 56.0, 29.0, 18.0, 5.0, 13.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.705078125, -1.655426025390625, -1.60577392578125, -1.556121826171875, -1.5064697265625, -1.456817626953125, -1.40716552734375, -1.357513427734375, -1.307861328125, -1.258209228515625, -1.20855712890625, -1.158905029296875, -1.1092529296875, -1.059600830078125, -1.00994873046875, -0.960296630859375, -0.91064453125, -0.860992431640625, -0.81134033203125, -0.761688232421875, -0.7120361328125, -0.662384033203125, -0.61273193359375, -0.563079833984375, -0.513427734375, -0.463775634765625, -0.41412353515625, -0.364471435546875, -0.3148193359375, -0.265167236328125, -0.21551513671875, -0.165863037109375, -0.1162109375, -0.066558837890625, -0.01690673828125, 0.032745361328125, 0.0823974609375, 0.132049560546875, 0.18170166015625, 0.231353759765625, 0.281005859375, 0.330657958984375, 0.38031005859375, 0.429962158203125, 0.4796142578125, 0.529266357421875, 0.57891845703125, 0.628570556640625, 0.67822265625, 0.727874755859375, 0.77752685546875, 0.827178955078125, 0.8768310546875, 0.926483154296875, 0.97613525390625, 1.025787353515625, 1.075439453125, 1.125091552734375, 1.17474365234375, 1.224395751953125, 1.2740478515625, 1.323699951171875, 1.37335205078125, 1.423004150390625, 1.47265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 11.0, 9.0, 13.0, 69.0, 135.0, 163.0, 50.0, 16.0, 9.0, 7.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.818909645080566, -8.232321739196777, -7.6457343101501465, -7.059146881103516, -6.472558975219727, -5.885971546173096, -5.299384117126465, -4.712796211242676, -4.126208782196045, -3.539621114730835, -2.953033447265625, -2.366446018218994, -1.7798583507537842, -1.1932706832885742, -0.6066832542419434, -0.020095348358154297, 0.5664920806884766, 1.1530797481536865, 1.739667296409607, 2.3262548446655273, 2.9128425121307373, 3.4994301795959473, 4.086017608642578, 4.672605514526367, 5.259192943572998, 5.845780372619629, 6.432368278503418, 7.018955707550049, 7.60554313659668, 8.192131042480469, 8.778718948364258, 9.365306854248047, 9.951892852783203, 10.538480758666992, 11.125067710876465, 11.711655616760254, 12.298243522644043, 12.884830474853516, 13.471418380737305, 14.058006286621094, 14.644594192504883, 15.231182098388672, 15.817769050598145, 16.40435791015625, 16.990943908691406, 17.577531814575195, 18.164119720458984, 18.750707626342773, 19.337295532226562, 19.92388343811035, 20.51047134399414, 21.097057342529297, 21.683645248413086, 22.270233154296875, 22.856821060180664, 23.443408966064453, 24.02999496459961, 24.6165828704834, 25.203170776367188, 25.789756774902344, 26.376344680786133, 26.962932586669922, 27.54952049255371, 28.1361083984375, 28.72269630432129]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 10.0, 6.0, 6.0, 8.0, 39.0, 82.0, 121.0, 99.0, 46.0, 11.0, 12.0, 8.0, 7.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.361876487731934, -8.096219062805176, -7.830562114715576, -7.564904689788818, -7.299247741699219, -7.033590316772461, -6.767932891845703, -6.502275466918945, -6.236618518829346, -5.970961093902588, -5.705304145812988, -5.4396467208862305, -5.173989295959473, -4.908332347869873, -4.642674922943115, -4.377017974853516, -4.111360549926758, -3.845703363418579, -3.5800461769104004, -3.3143887519836426, -3.048731565475464, -2.783074378967285, -2.5174169540405273, -2.2517597675323486, -1.98610258102417, -1.7204453945159912, -1.454788088798523, -1.1891307830810547, -0.923473596572876, -0.6578164100646973, -0.392159104347229, -0.12650179862976074, 0.13915634155273438, 0.40481358766555786, 0.6704708337783813, 0.9361280798912048, 1.2017853260040283, 1.467442512512207, 1.7330998182296753, 1.9987571239471436, 2.2644143104553223, 2.530071496963501, 2.7957286834716797, 3.0613861083984375, 3.327043294906616, 3.592700481414795, 3.8583579063415527, 4.124014854431152, 4.38967227935791, 4.655329704284668, 4.920986652374268, 5.186644077301025, 5.452301025390625, 5.717958450317383, 5.983615875244141, 6.249273300170898, 6.514930248260498, 6.780587673187256, 7.0462446212768555, 7.311902046203613, 7.577559471130371, 7.843216419219971, 8.10887336730957, 8.374530792236328, 8.640188217163086]}, "eval/loss": 4.239526271820068, "eval/wer": 2.4202697342324475, "eval/runtime": 935.6243, "eval/samples_per_second": 2.824, "eval/steps_per_second": 0.236, "train/train_runtime": 6633.4843, "train/train_samples_per_second": 4.302, "train/train_steps_per_second": 0.179, "train/total_flos": 0.0, "train/train_loss": 4.355411059521546} \ No newline at end of file