diff --git "a/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" "b/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" --- "a/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" +++ "b/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3147, "train/learning_rate": 9.92e-05, "train/epoch": 0.28, "train/global_step": 500, "_runtime": 2417, "_timestamp": 1646157313, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 19.0, 100.0, 336.0, 399.0, 142.0, 16.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-236.66116333007812, -232.30247497558594, -227.9437713623047, -223.5850830078125, -219.22637939453125, -214.86769104003906, -210.5089874267578, -206.15029907226562, -201.79159545898438, -197.4329071044922, -193.07420349121094, -188.71551513671875, -184.3568115234375, -179.9981231689453, -175.63941955566406, -171.28073120117188, -166.92202758789062, -162.56333923339844, -158.2046356201172, -153.845947265625, -149.48724365234375, -145.12855529785156, -140.7698516845703, -136.41116333007812, -132.05247497558594, -127.69377899169922, -123.3350830078125, -118.97638702392578, -114.61769104003906, -110.25899505615234, -105.90029907226562, -101.54161071777344, -97.18289947509766, -92.82420349121094, -88.46550750732422, -84.1068115234375, -79.74811553955078, -75.38941955566406, -71.03073120117188, -66.67202758789062, -62.31333541870117, -57.95463943481445, -53.595943450927734, -49.23725128173828, -44.87855529785156, -40.519859313964844, -36.161163330078125, -31.802467346191406, -27.443771362304688, -23.08507537841797, -18.72637939453125, -14.367685317993164, -10.008989334106445, -5.650293350219727, -1.2915992736816406, 3.067096710205078, 7.425792694091797, 11.784488677978516, 16.143184661865234, 20.50187873840332, 24.86057472229004, 29.219270706176758, 33.577964782714844, 37.93666076660156, 42.29535675048828]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 7.0, 11.0, 7.0, 21.0, 23.0, 26.0, 26.0, 28.0, 43.0, 36.0, 56.0, 65.0, 61.0, 68.0, 64.0, 47.0, 63.0, 42.0, 56.0, 50.0, 38.0, 35.0, 28.0, 22.0, 20.0, 9.0, 10.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.33270263671875, -111.34042358398438, -108.34813690185547, -105.35585021972656, -102.36357116699219, -99.37129211425781, -96.3790054321289, -93.38671875, -90.39443969726562, -87.40216064453125, -84.40987396240234, -81.41758728027344, -78.42530822753906, -75.43302917480469, -72.44074249267578, -69.44845581054688, -66.4561767578125, -63.46389389038086, -60.47161102294922, -57.47932815551758, -54.48704528808594, -51.4947624206543, -48.502479553222656, -45.510196685791016, -42.517913818359375, -39.525630950927734, -36.533348083496094, -33.54106521606445, -30.548782348632812, -27.556499481201172, -24.56421661376953, -21.57193374633789, -18.57965850830078, -15.58737564086914, -12.5950927734375, -9.60280990600586, -6.610527038574219, -3.618244171142578, -0.6259613037109375, 2.366321563720703, 5.358604431152344, 8.350887298583984, 11.343170166015625, 14.335453033447266, 17.327735900878906, 20.320018768310547, 23.312301635742188, 26.304584503173828, 29.29686737060547, 32.28915023803711, 35.28143310546875, 38.27371597290039, 41.26599884033203, 44.25828170776367, 47.25056457519531, 50.24284744262695, 53.235130310058594, 56.227413177490234, 59.219696044921875, 62.211978912353516, 65.20426177978516, 68.19654846191406, 71.18882751464844, 74.18110656738281, 77.17339324951172]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 14.0, 14.0, 17.0, 15.0, 24.0, 38.0, 38.0, 49.0, 44.0, 63.0, 67.0, 78.0, 86.0, 63.0, 54.0, 66.0, 49.0, 50.0, 34.0, 39.0, 29.0, 14.0, 15.0, 12.0, 8.0, 9.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4296875, -5.295623779296875, -5.16156005859375, -5.027496337890625, -4.8934326171875, -4.759368896484375, -4.62530517578125, -4.491241455078125, -4.357177734375, -4.223114013671875, -4.08905029296875, -3.954986572265625, -3.8209228515625, -3.686859130859375, -3.55279541015625, -3.418731689453125, -3.28466796875, -3.150604248046875, -3.01654052734375, -2.882476806640625, -2.7484130859375, -2.614349365234375, -2.48028564453125, -2.346221923828125, -2.212158203125, -2.078094482421875, -1.94403076171875, -1.809967041015625, -1.6759033203125, -1.541839599609375, -1.40777587890625, -1.273712158203125, -1.1396484375, -1.005584716796875, -0.87152099609375, -0.737457275390625, -0.6033935546875, -0.469329833984375, -0.33526611328125, -0.201202392578125, -0.067138671875, 0.066925048828125, 0.20098876953125, 0.335052490234375, 0.4691162109375, 0.603179931640625, 0.73724365234375, 0.871307373046875, 1.00537109375, 1.139434814453125, 1.27349853515625, 1.407562255859375, 1.5416259765625, 1.675689697265625, 1.80975341796875, 1.943817138671875, 2.077880859375, 2.211944580078125, 2.34600830078125, 2.480072021484375, 2.6141357421875, 2.748199462890625, 2.88226318359375, 3.016326904296875, 3.150390625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 12.0, 21.0, 29.0, 49.0, 42.0, 95.0, 130.0, 226.0, 336.0, 513.0, 1049.0, 1993.0, 5698.0, 27959.0, 823494.0, 3250014.0, 67442.0, 9284.0, 2896.0, 1277.0, 641.0, 391.0, 248.0, 160.0, 97.0, 57.0, 47.0, 22.0, 18.0, 16.0, 9.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-28.359375, -27.670654296875, -26.98193359375, -26.293212890625, -25.6044921875, -24.915771484375, -24.22705078125, -23.538330078125, -22.849609375, -22.160888671875, -21.47216796875, -20.783447265625, -20.0947265625, -19.406005859375, -18.71728515625, -18.028564453125, -17.33984375, -16.651123046875, -15.96240234375, -15.273681640625, -14.5849609375, -13.896240234375, -13.20751953125, -12.518798828125, -11.830078125, -11.141357421875, -10.45263671875, -9.763916015625, -9.0751953125, -8.386474609375, -7.69775390625, -7.009033203125, -6.3203125, -5.631591796875, -4.94287109375, -4.254150390625, -3.5654296875, -2.876708984375, -2.18798828125, -1.499267578125, -0.810546875, -0.121826171875, 0.56689453125, 1.255615234375, 1.9443359375, 2.633056640625, 3.32177734375, 4.010498046875, 4.69921875, 5.387939453125, 6.07666015625, 6.765380859375, 7.4541015625, 8.142822265625, 8.83154296875, 9.520263671875, 10.208984375, 10.897705078125, 11.58642578125, 12.275146484375, 12.9638671875, 13.652587890625, 14.34130859375, 15.030029296875, 15.71875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 15.0, 13.0, 26.0, 29.0, 33.0, 53.0, 101.0, 127.0, 203.0, 276.0, 443.0, 578.0, 611.0, 449.0, 301.0, 240.0, 167.0, 98.0, 73.0, 52.0, 56.0, 30.0, 21.0, 15.0, 10.0, 11.0, 9.0, 5.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-12.5859375, -12.180419921875, -11.77490234375, -11.369384765625, -10.9638671875, -10.558349609375, -10.15283203125, -9.747314453125, -9.341796875, -8.936279296875, -8.53076171875, -8.125244140625, -7.7197265625, -7.314208984375, -6.90869140625, -6.503173828125, -6.09765625, -5.692138671875, -5.28662109375, -4.881103515625, -4.4755859375, -4.070068359375, -3.66455078125, -3.259033203125, -2.853515625, -2.447998046875, -2.04248046875, -1.636962890625, -1.2314453125, -0.825927734375, -0.42041015625, -0.014892578125, 0.390625, 0.796142578125, 1.20166015625, 1.607177734375, 2.0126953125, 2.418212890625, 2.82373046875, 3.229248046875, 3.634765625, 4.040283203125, 4.44580078125, 4.851318359375, 5.2568359375, 5.662353515625, 6.06787109375, 6.473388671875, 6.87890625, 7.284423828125, 7.68994140625, 8.095458984375, 8.5009765625, 8.906494140625, 9.31201171875, 9.717529296875, 10.123046875, 10.528564453125, 10.93408203125, 11.339599609375, 11.7451171875, 12.150634765625, 12.55615234375, 12.961669921875, 13.3671875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 15.0, 15.0, 30.0, 33.0, 44.0, 70.0, 116.0, 141.0, 224.0, 397.0, 664.0, 1604.0, 6938.0, 197968.0, 3860011.0, 117513.0, 5245.0, 1447.0, 633.0, 366.0, 230.0, 151.0, 106.0, 86.0, 64.0, 32.0, 21.0, 17.0, 13.0, 19.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-41.4375, -40.16015625, -38.8828125, -37.60546875, -36.328125, -35.05078125, -33.7734375, -32.49609375, -31.21875, -29.94140625, -28.6640625, -27.38671875, -26.109375, -24.83203125, -23.5546875, -22.27734375, -21.0, -19.72265625, -18.4453125, -17.16796875, -15.890625, -14.61328125, -13.3359375, -12.05859375, -10.78125, -9.50390625, -8.2265625, -6.94921875, -5.671875, -4.39453125, -3.1171875, -1.83984375, -0.5625, 0.71484375, 1.9921875, 3.26953125, 4.546875, 5.82421875, 7.1015625, 8.37890625, 9.65625, 10.93359375, 12.2109375, 13.48828125, 14.765625, 16.04296875, 17.3203125, 18.59765625, 19.875, 21.15234375, 22.4296875, 23.70703125, 24.984375, 26.26171875, 27.5390625, 28.81640625, 30.09375, 31.37109375, 32.6484375, 33.92578125, 35.203125, 36.48046875, 37.7578125, 39.03515625, 40.3125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 577.0, 408.0, 23.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-483.75653076171875, -473.193115234375, -462.62969970703125, -452.0663146972656, -441.5028991699219, -430.9394836425781, -420.3760681152344, -409.81268310546875, -399.249267578125, -388.68585205078125, -378.1224365234375, -367.5590515136719, -356.9956359863281, -346.4322204589844, -335.8688049316406, -325.305419921875, -314.74200439453125, -304.1785888671875, -293.61517333984375, -283.0517883300781, -272.4883728027344, -261.9249572753906, -251.36154174804688, -240.7981414794922, -230.23471069335938, -219.67129516601562, -209.10789489746094, -198.5444793701172, -187.9810791015625, -177.41766357421875, -166.854248046875, -156.2908477783203, -145.7274627685547, -135.16404724121094, -124.60064697265625, -114.0372314453125, -103.47383117675781, -92.91041564941406, -82.34700775146484, -71.78359985351562, -61.220191955566406, -50.65678405761719, -40.09337615966797, -29.529964447021484, -18.966556549072266, -8.403148651123047, 2.1602630615234375, 12.723670959472656, 23.287078857421875, 33.850486755371094, 44.41389465332031, 54.9773063659668, 65.54071044921875, 76.1041259765625, 86.66753387451172, 97.23094177246094, 107.79434967041016, 118.35775756835938, 128.92117309570312, 139.4845733642578, 150.04798889160156, 160.61138916015625, 171.1748046875, 181.73822021484375, 192.30162048339844]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 10.0, 16.0, 25.0, 14.0, 36.0, 37.0, 40.0, 47.0, 36.0, 57.0, 66.0, 62.0, 73.0, 71.0, 62.0, 54.0, 43.0, 53.0, 44.0, 27.0, 26.0, 20.0, 18.0, 14.0, 19.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-114.12615966796875, -111.22850799560547, -108.33086395263672, -105.43321228027344, -102.53556823730469, -99.6379165649414, -96.74026489257812, -93.84262084960938, -90.9449691772461, -88.04731750488281, -85.14967346191406, -82.25202178955078, -79.3543701171875, -76.45672607421875, -73.55907440185547, -70.66142272949219, -67.76377868652344, -64.86612701416016, -61.968482971191406, -59.070831298828125, -56.17318344116211, -53.275535583496094, -50.37788391113281, -47.4802360534668, -44.58258819580078, -41.684940338134766, -38.78729248046875, -35.88964080810547, -32.99199295043945, -30.094345092773438, -27.19669532775879, -24.29904556274414, -21.401397705078125, -18.50374984741211, -15.606100082397461, -12.708451271057129, -9.810802459716797, -6.913153648376465, -4.015504837036133, -1.1178550720214844, 1.7797927856445312, 4.677441596984863, 7.575090408325195, 10.472739219665527, 13.37038803100586, 16.268035888671875, 19.165685653686523, 22.063335418701172, 24.960983276367188, 27.858631134033203, 30.75628089904785, 33.6539306640625, 36.551578521728516, 39.44922637939453, 42.34687805175781, 45.24452590942383, 48.142173767089844, 51.03982162475586, 53.937469482421875, 56.835121154785156, 59.73276901245117, 62.63041687011719, 65.52806854248047, 68.42572021484375, 71.3233642578125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 10.0, 5.0, 3.0, 14.0, 21.0, 21.0, 14.0, 29.0, 33.0, 37.0, 39.0, 33.0, 27.0, 46.0, 58.0, 51.0, 53.0, 56.0, 44.0, 42.0, 59.0, 40.0, 42.0, 29.0, 38.0, 19.0, 24.0, 33.0, 14.0, 12.0, 8.0, 10.0, 6.0, 1.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.845703125, -3.73492431640625, -3.6241455078125, -3.51336669921875, -3.402587890625, -3.29180908203125, -3.1810302734375, -3.07025146484375, -2.95947265625, -2.84869384765625, -2.7379150390625, -2.62713623046875, -2.516357421875, -2.40557861328125, -2.2947998046875, -2.18402099609375, -2.0732421875, -1.96246337890625, -1.8516845703125, -1.74090576171875, -1.630126953125, -1.51934814453125, -1.4085693359375, -1.29779052734375, -1.18701171875, -1.07623291015625, -0.9654541015625, -0.85467529296875, -0.743896484375, -0.63311767578125, -0.5223388671875, -0.41156005859375, -0.30078125, -0.19000244140625, -0.0792236328125, 0.03155517578125, 0.142333984375, 0.25311279296875, 0.3638916015625, 0.47467041015625, 0.58544921875, 0.69622802734375, 0.8070068359375, 0.91778564453125, 1.028564453125, 1.13934326171875, 1.2501220703125, 1.36090087890625, 1.4716796875, 1.58245849609375, 1.6932373046875, 1.80401611328125, 1.914794921875, 2.02557373046875, 2.1363525390625, 2.24713134765625, 2.35791015625, 2.46868896484375, 2.5794677734375, 2.69024658203125, 2.801025390625, 2.91180419921875, 3.0225830078125, 3.13336181640625, 3.244140625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 11.0, 14.0, 15.0, 24.0, 46.0, 71.0, 92.0, 137.0, 198.0, 280.0, 434.0, 676.0, 1153.0, 1924.0, 3250.0, 5564.0, 9950.0, 18110.0, 34142.0, 67444.0, 134608.0, 242023.0, 244886.0, 137317.0, 68931.0, 34591.0, 18423.0, 10100.0, 5677.0, 3252.0, 1948.0, 1152.0, 730.0, 450.0, 302.0, 198.0, 130.0, 84.0, 63.0, 48.0, 30.0, 26.0, 12.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.1381816864013672, -0.13341903686523438, -0.12865638732910156, -0.12389373779296875, -0.11913108825683594, -0.11436843872070312, -0.10960578918457031, -0.1048431396484375, -0.10008049011230469, -0.09531784057617188, -0.09055519104003906, -0.08579254150390625, -0.08102989196777344, -0.07626724243164062, -0.07150459289550781, -0.066741943359375, -0.06197929382324219, -0.057216644287109375, -0.05245399475097656, -0.04769134521484375, -0.04292869567871094, -0.038166046142578125, -0.03340339660644531, -0.0286407470703125, -0.023878097534179688, -0.019115447998046875, -0.014352798461914062, -0.00959014892578125, -0.0048274993896484375, -6.4849853515625e-05, 0.0046977996826171875, 0.00946044921875, 0.014223098754882812, 0.018985748291015625, 0.023748397827148438, 0.02851104736328125, 0.03327369689941406, 0.038036346435546875, 0.04279899597167969, 0.0475616455078125, 0.05232429504394531, 0.057086944580078125, 0.06184959411621094, 0.06661224365234375, 0.07137489318847656, 0.07613754272460938, 0.08090019226074219, 0.085662841796875, 0.09042549133300781, 0.09518814086914062, 0.09995079040527344, 0.10471343994140625, 0.10947608947753906, 0.11423873901367188, 0.11900138854980469, 0.1237640380859375, 0.1285266876220703, 0.13328933715820312, 0.13805198669433594, 0.14281463623046875, 0.14757728576660156, 0.15233993530273438, 0.1571025848388672, 0.161865234375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 15.0, 11.0, 11.0, 17.0, 31.0, 25.0, 22.0, 22.0, 21.0, 30.0, 26.0, 27.0, 45.0, 40.0, 40.0, 48.0, 43.0, 1064.0, 35.0, 34.0, 37.0, 40.0, 39.0, 24.0, 30.0, 28.0, 28.0, 21.0, 23.0, 19.0, 20.0, 16.0, 16.0, 5.0, 11.0, 6.0, 8.0, 2.0, 2.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.8603515625, -1.8026275634765625, -1.744903564453125, -1.6871795654296875, -1.62945556640625, -1.5717315673828125, -1.514007568359375, -1.4562835693359375, -1.3985595703125, -1.3408355712890625, -1.283111572265625, -1.2253875732421875, -1.16766357421875, -1.1099395751953125, -1.052215576171875, -0.9944915771484375, -0.936767578125, -0.8790435791015625, -0.821319580078125, -0.7635955810546875, -0.70587158203125, -0.6481475830078125, -0.590423583984375, -0.5326995849609375, -0.4749755859375, -0.4172515869140625, -0.359527587890625, -0.3018035888671875, -0.24407958984375, -0.1863555908203125, -0.128631591796875, -0.0709075927734375, -0.01318359375, 0.0445404052734375, 0.102264404296875, 0.1599884033203125, 0.21771240234375, 0.2754364013671875, 0.333160400390625, 0.3908843994140625, 0.4486083984375, 0.5063323974609375, 0.564056396484375, 0.6217803955078125, 0.67950439453125, 0.7372283935546875, 0.794952392578125, 0.8526763916015625, 0.910400390625, 0.9681243896484375, 1.025848388671875, 1.0835723876953125, 1.14129638671875, 1.1990203857421875, 1.256744384765625, 1.3144683837890625, 1.3721923828125, 1.4299163818359375, 1.487640380859375, 1.5453643798828125, 1.60308837890625, 1.6608123779296875, 1.718536376953125, 1.7762603759765625, 1.833984375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 19.0, 27.0, 45.0, 68.0, 104.0, 150.0, 231.0, 305.0, 410.0, 627.0, 1010.0, 1491.0, 2131.0, 3214.0, 4929.0, 7564.0, 11432.0, 18355.0, 29696.0, 48274.0, 80386.0, 128306.0, 217594.0, 1185935.0, 133879.0, 84309.0, 51150.0, 30721.0, 19083.0, 12267.0, 7891.0, 5192.0, 3295.0, 2327.0, 1545.0, 1055.0, 667.0, 429.0, 307.0, 234.0, 156.0, 115.0, 76.0, 38.0, 32.0, 18.0, 13.0, 10.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1055908203125, -0.10239601135253906, -0.09920120239257812, -0.09600639343261719, -0.09281158447265625, -0.08961677551269531, -0.08642196655273438, -0.08322715759277344, -0.0800323486328125, -0.07683753967285156, -0.07364273071289062, -0.07044792175292969, -0.06725311279296875, -0.06405830383300781, -0.060863494873046875, -0.05766868591308594, -0.054473876953125, -0.05127906799316406, -0.048084259033203125, -0.04488945007324219, -0.04169464111328125, -0.03849983215332031, -0.035305023193359375, -0.03211021423339844, -0.0289154052734375, -0.025720596313476562, -0.022525787353515625, -0.019330978393554688, -0.01613616943359375, -0.012941360473632812, -0.009746551513671875, -0.0065517425537109375, -0.00335693359375, -0.0001621246337890625, 0.003032684326171875, 0.0062274932861328125, 0.00942230224609375, 0.012617111206054688, 0.015811920166015625, 0.019006729125976562, 0.0222015380859375, 0.025396347045898438, 0.028591156005859375, 0.03178596496582031, 0.03498077392578125, 0.03817558288574219, 0.041370391845703125, 0.04456520080566406, 0.047760009765625, 0.05095481872558594, 0.054149627685546875, 0.05734443664550781, 0.06053924560546875, 0.06373405456542969, 0.06692886352539062, 0.07012367248535156, 0.0733184814453125, 0.07651329040527344, 0.07970809936523438, 0.08290290832519531, 0.08609771728515625, 0.08929252624511719, 0.09248733520507812, 0.09568214416503906, 0.098876953125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 8.0, 5.0, 10.0, 25.0, 11.0, 12.0, 32.0, 22.0, 29.0, 21.0, 35.0, 46.0, 42.0, 54.0, 45.0, 48.0, 58.0, 53.0, 53.0, 55.0, 38.0, 34.0, 32.0, 21.0, 28.0, 25.0, 15.0, 17.0, 23.0, 11.0, 11.0, 17.0, 10.0, 7.0, 5.0, 2.0, 14.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00036644935607910156, -0.0003550387918949127, -0.0003436282277107239, -0.00033221766352653503, -0.0003208070993423462, -0.00030939653515815735, -0.0002979859709739685, -0.00028657540678977966, -0.0002751648426055908, -0.000263754278421402, -0.00025234371423721313, -0.0002409331500530243, -0.00022952258586883545, -0.0002181120216846466, -0.00020670145750045776, -0.00019529089331626892, -0.00018388032913208008, -0.00017246976494789124, -0.0001610592007637024, -0.00014964863657951355, -0.0001382380723953247, -0.00012682750821113586, -0.00011541694402694702, -0.00010400637984275818, -9.259581565856934e-05, -8.118525147438049e-05, -6.977468729019165e-05, -5.836412310600281e-05, -4.6953558921813965e-05, -3.554299473762512e-05, -2.413243055343628e-05, -1.2721866369247437e-05, -1.3113021850585938e-06, 1.0099261999130249e-05, 2.1509826183319092e-05, 3.2920390367507935e-05, 4.433095455169678e-05, 5.574151873588562e-05, 6.715208292007446e-05, 7.85626471042633e-05, 8.997321128845215e-05, 0.00010138377547264099, 0.00011279433965682983, 0.00012420490384101868, 0.00013561546802520752, 0.00014702603220939636, 0.0001584365963935852, 0.00016984716057777405, 0.0001812577247619629, 0.00019266828894615173, 0.00020407885313034058, 0.00021548941731452942, 0.00022689998149871826, 0.0002383105456829071, 0.00024972110986709595, 0.0002611316740512848, 0.00027254223823547363, 0.0002839528024196625, 0.0002953633666038513, 0.00030677393078804016, 0.000318184494972229, 0.00032959505915641785, 0.0003410056233406067, 0.00035241618752479553, 0.0003638267517089844]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 4.0, 8.0, 7.0, 12.0, 9.0, 26.0, 22.0, 25.0, 31.0, 60.0, 47.0, 52.0, 52.0, 96.0, 88.0, 96.0, 129.0, 154.0, 238.0, 404.0, 1721.0, 873780.0, 168970.0, 984.0, 353.0, 211.0, 168.0, 124.0, 120.0, 94.0, 77.0, 65.0, 48.0, 45.0, 43.0, 39.0, 28.0, 20.0, 19.0, 17.0, 15.0, 13.0, 16.0, 5.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.006717681884765625, -0.006506860256195068, -0.006296038627624512, -0.006085216999053955, -0.0058743953704833984, -0.005663573741912842, -0.005452752113342285, -0.0052419304847717285, -0.005031108856201172, -0.004820287227630615, -0.004609465599060059, -0.004398643970489502, -0.004187822341918945, -0.003977000713348389, -0.003766179084777832, -0.0035553574562072754, -0.0033445358276367188, -0.003133714199066162, -0.0029228925704956055, -0.002712070941925049, -0.002501249313354492, -0.0022904276847839355, -0.002079606056213379, -0.0018687844276428223, -0.0016579627990722656, -0.001447141170501709, -0.0012363195419311523, -0.0010254979133605957, -0.0008146762847900391, -0.0006038546562194824, -0.0003930330276489258, -0.00018221139907836914, 2.86102294921875e-05, 0.00023943185806274414, 0.0004502534866333008, 0.0006610751152038574, 0.0008718967437744141, 0.0010827183723449707, 0.0012935400009155273, 0.001504361629486084, 0.0017151832580566406, 0.0019260048866271973, 0.002136826515197754, 0.0023476481437683105, 0.002558469772338867, 0.002769291400909424, 0.0029801130294799805, 0.003190934658050537, 0.0034017562866210938, 0.0036125779151916504, 0.003823399543762207, 0.004034221172332764, 0.00424504280090332, 0.004455864429473877, 0.004666686058044434, 0.00487750768661499, 0.005088329315185547, 0.0052991509437561035, 0.00550997257232666, 0.005720794200897217, 0.0059316158294677734, 0.00614243745803833, 0.006353259086608887, 0.006564080715179443, 0.00677490234375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 137.0, 855.0, 23.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027874226216226816, -0.0027231096755713224, -0.002658796962350607, -0.0025944840162992477, -0.0025301710702478886, -0.0024658581241965294, -0.002401545410975814, -0.0023372324649244547, -0.002272919751703739, -0.00220860680565238, -0.0021442940924316645, -0.0020799811463803053, -0.002015668200328946, -0.0019513553706929088, -0.0018870425410568714, -0.0018227295950055122, -0.001758416648954153, -0.0016941038193181157, -0.0016297908732667565, -0.0015654780436307192, -0.00150116509757936, -0.0014368522679433227, -0.0013725394383072853, -0.0013082264922559261, -0.0012439136626198888, -0.0011796008329838514, -0.0011152878869324923, -0.001050975057296455, -0.0009866622276604176, -0.0009223492816090584, -0.000858036451973021, -0.0007937235641293228, -0.0007294106762856245, -0.0006650977884419262, -0.000600784900598228, -0.0005364720709621906, -0.00047215918311849236, -0.0004078462952747941, -0.0003435334365349263, -0.0002792205777950585, -0.00021490768995136023, -0.0001505948166595772, -8.628194336779416e-05, -2.196907007601112e-05, 4.2343803215771914e-05, 0.00010665669105947018, 0.00017096954979933798, 0.0002352824085392058, 0.00029959529638290405, 0.0003639081842266023, 0.0004282210429664701, 0.0004925339017063379, 0.0005568467895500362, 0.0006211596773937345, 0.0006854725070297718, 0.0007497853948734701, 0.0008140982827171683, 0.0008784111705608666, 0.0009427240584045649, 0.0010070368880406022, 0.0010713497176766396, 0.0011356626637279987, 0.001199975493364036, 0.0012642883230000734, 0.0013286012690514326]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 16.0, 15.0, 10.0, 14.0, 22.0, 17.0, 24.0, 31.0, 24.0, 24.0, 39.0, 41.0, 44.0, 49.0, 31.0, 50.0, 27.0, 50.0, 45.0, 34.0, 33.0, 35.0, 38.0, 30.0, 30.0, 27.0, 31.0, 32.0, 21.0, 18.0, 11.0, 20.0, 18.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002200603485107422, -0.00021316763013601303, -0.00020627491176128387, -0.00019938219338655472, -0.00019248947501182556, -0.0001855967566370964, -0.00017870403826236725, -0.0001718113198876381, -0.00016491860151290894, -0.00015802588313817978, -0.00015113316476345062, -0.00014424044638872147, -0.0001373477280139923, -0.00013045500963926315, -0.000123562291264534, -0.00011666957288980484, -0.00010977685451507568, -0.00010288413614034653, -9.599141776561737e-05, -8.909869939088821e-05, -8.220598101615906e-05, -7.53132626414299e-05, -6.842054426670074e-05, -6.152782589197159e-05, -5.463510751724243e-05, -4.7742389142513275e-05, -4.084967076778412e-05, -3.395695239305496e-05, -2.7064234018325806e-05, -2.017151564359665e-05, -1.3278797268867493e-05, -6.386078894138336e-06, 5.066394805908203e-07, 7.399357855319977e-06, 1.4292076230049133e-05, 2.118479460477829e-05, 2.8077512979507446e-05, 3.49702313542366e-05, 4.186294972896576e-05, 4.8755668103694916e-05, 5.564838647842407e-05, 6.254110485315323e-05, 6.943382322788239e-05, 7.632654160261154e-05, 8.32192599773407e-05, 9.011197835206985e-05, 9.700469672679901e-05, 0.00010389741510152817, 0.00011079013347625732, 0.00011768285185098648, 0.00012457557022571564, 0.0001314682886004448, 0.00013836100697517395, 0.0001452537253499031, 0.00015214644372463226, 0.00015903916209936142, 0.00016593188047409058, 0.00017282459884881973, 0.0001797173172235489, 0.00018661003559827805, 0.0001935027539730072, 0.00020039547234773636, 0.00020728819072246552, 0.00021418090909719467, 0.00022107362747192383]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 10.0, 5.0, 3.0, 14.0, 21.0, 21.0, 14.0, 29.0, 33.0, 37.0, 39.0, 33.0, 27.0, 46.0, 58.0, 51.0, 53.0, 56.0, 44.0, 42.0, 59.0, 40.0, 42.0, 29.0, 38.0, 19.0, 24.0, 33.0, 14.0, 12.0, 8.0, 10.0, 6.0, 1.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.845703125, -3.73492431640625, -3.6241455078125, -3.51336669921875, -3.402587890625, -3.29180908203125, -3.1810302734375, -3.07025146484375, -2.95947265625, -2.84869384765625, -2.7379150390625, -2.62713623046875, -2.516357421875, -2.40557861328125, -2.2947998046875, -2.18402099609375, -2.0732421875, -1.96246337890625, -1.8516845703125, -1.74090576171875, -1.630126953125, -1.51934814453125, -1.4085693359375, -1.29779052734375, -1.18701171875, -1.07623291015625, -0.9654541015625, -0.85467529296875, -0.743896484375, -0.63311767578125, -0.5223388671875, -0.41156005859375, -0.30078125, -0.19000244140625, -0.0792236328125, 0.03155517578125, 0.142333984375, 0.25311279296875, 0.3638916015625, 0.47467041015625, 0.58544921875, 0.69622802734375, 0.8070068359375, 0.91778564453125, 1.028564453125, 1.13934326171875, 1.2501220703125, 1.36090087890625, 1.4716796875, 1.58245849609375, 1.6932373046875, 1.80401611328125, 1.914794921875, 2.02557373046875, 2.1363525390625, 2.24713134765625, 2.35791015625, 2.46868896484375, 2.5794677734375, 2.69024658203125, 2.801025390625, 2.91180419921875, 3.0225830078125, 3.13336181640625, 3.244140625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 8.0, 11.0, 19.0, 32.0, 55.0, 95.0, 132.0, 239.0, 351.0, 582.0, 986.0, 1619.0, 2856.0, 5351.0, 10997.0, 27423.0, 117451.0, 641894.0, 176596.0, 34954.0, 12916.0, 6002.0, 3291.0, 1866.0, 1069.0, 657.0, 400.0, 276.0, 156.0, 78.0, 60.0, 40.0, 18.0, 22.0, 11.0, 14.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.9140625, -13.511962890625, -13.10986328125, -12.707763671875, -12.3056640625, -11.903564453125, -11.50146484375, -11.099365234375, -10.697265625, -10.295166015625, -9.89306640625, -9.490966796875, -9.0888671875, -8.686767578125, -8.28466796875, -7.882568359375, -7.48046875, -7.078369140625, -6.67626953125, -6.274169921875, -5.8720703125, -5.469970703125, -5.06787109375, -4.665771484375, -4.263671875, -3.861572265625, -3.45947265625, -3.057373046875, -2.6552734375, -2.253173828125, -1.85107421875, -1.448974609375, -1.046875, -0.644775390625, -0.24267578125, 0.159423828125, 0.5615234375, 0.963623046875, 1.36572265625, 1.767822265625, 2.169921875, 2.572021484375, 2.97412109375, 3.376220703125, 3.7783203125, 4.180419921875, 4.58251953125, 4.984619140625, 5.38671875, 5.788818359375, 6.19091796875, 6.593017578125, 6.9951171875, 7.397216796875, 7.79931640625, 8.201416015625, 8.603515625, 9.005615234375, 9.40771484375, 9.809814453125, 10.2119140625, 10.614013671875, 11.01611328125, 11.418212890625, 11.8203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 6.0, 4.0, 4.0, 3.0, 10.0, 9.0, 11.0, 15.0, 8.0, 26.0, 24.0, 14.0, 32.0, 21.0, 37.0, 47.0, 45.0, 37.0, 70.0, 86.0, 156.0, 1553.0, 274.0, 104.0, 66.0, 61.0, 49.0, 40.0, 40.0, 25.0, 41.0, 31.0, 20.0, 12.0, 16.0, 11.0, 10.0, 7.0, 11.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.796875, -11.44775390625, -11.0986328125, -10.74951171875, -10.400390625, -10.05126953125, -9.7021484375, -9.35302734375, -9.00390625, -8.65478515625, -8.3056640625, -7.95654296875, -7.607421875, -7.25830078125, -6.9091796875, -6.56005859375, -6.2109375, -5.86181640625, -5.5126953125, -5.16357421875, -4.814453125, -4.46533203125, -4.1162109375, -3.76708984375, -3.41796875, -3.06884765625, -2.7197265625, -2.37060546875, -2.021484375, -1.67236328125, -1.3232421875, -0.97412109375, -0.625, -0.27587890625, 0.0732421875, 0.42236328125, 0.771484375, 1.12060546875, 1.4697265625, 1.81884765625, 2.16796875, 2.51708984375, 2.8662109375, 3.21533203125, 3.564453125, 3.91357421875, 4.2626953125, 4.61181640625, 4.9609375, 5.31005859375, 5.6591796875, 6.00830078125, 6.357421875, 6.70654296875, 7.0556640625, 7.40478515625, 7.75390625, 8.10302734375, 8.4521484375, 8.80126953125, 9.150390625, 9.49951171875, 9.8486328125, 10.19775390625, 10.546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 9.0, 7.0, 8.0, 6.0, 12.0, 9.0, 23.0, 18.0, 24.0, 27.0, 32.0, 42.0, 41.0, 88.0, 135.0, 286.0, 949.0, 31650.0, 3103678.0, 7258.0, 683.0, 233.0, 135.0, 70.0, 52.0, 47.0, 28.0, 18.0, 25.0, 16.0, 16.0, 15.0, 6.0, 14.0, 10.0, 12.0, 3.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-44.875, -43.34765625, -41.8203125, -40.29296875, -38.765625, -37.23828125, -35.7109375, -34.18359375, -32.65625, -31.12890625, -29.6015625, -28.07421875, -26.546875, -25.01953125, -23.4921875, -21.96484375, -20.4375, -18.91015625, -17.3828125, -15.85546875, -14.328125, -12.80078125, -11.2734375, -9.74609375, -8.21875, -6.69140625, -5.1640625, -3.63671875, -2.109375, -0.58203125, 0.9453125, 2.47265625, 4.0, 5.52734375, 7.0546875, 8.58203125, 10.109375, 11.63671875, 13.1640625, 14.69140625, 16.21875, 17.74609375, 19.2734375, 20.80078125, 22.328125, 23.85546875, 25.3828125, 26.91015625, 28.4375, 29.96484375, 31.4921875, 33.01953125, 34.546875, 36.07421875, 37.6015625, 39.12890625, 40.65625, 42.18359375, 43.7109375, 45.23828125, 46.765625, 48.29296875, 49.8203125, 51.34765625, 52.875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 20.0, 995.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.25436401367188, -61.881752014160156, -47.50914001464844, -33.13652801513672, -18.763916015625, -4.391304016113281, 9.981307983398438, 24.353919982910156, 38.726531982421875, 53.099143981933594, 67.47175598144531, 81.84436798095703, 96.21697998046875, 110.58959197998047, 124.96220397949219, 139.33480834960938, 153.70742797851562, 168.08004760742188, 182.45265197753906, 196.82525634765625, 211.1978759765625, 225.57049560546875, 239.94309997558594, 254.31570434570312, 268.6883239746094, 283.0609436035156, 297.43353271484375, 311.80615234375, 326.17877197265625, 340.5513916015625, 354.92401123046875, 369.2966003417969, 383.669189453125, 398.04180908203125, 412.4144287109375, 426.7870178222656, 441.1596374511719, 455.5322570800781, 469.90484619140625, 484.2774658203125, 498.65008544921875, 513.022705078125, 527.3953247070312, 541.7679443359375, 556.1405029296875, 570.5131225585938, 584.8857421875, 599.2583618164062, 613.6309814453125, 628.0036010742188, 642.376220703125, 656.7488403320312, 671.1214599609375, 685.4940185546875, 699.8666381835938, 714.2392578125, 728.6118774414062, 742.9844970703125, 757.3571166992188, 771.729736328125, 786.102294921875, 800.4749145507812, 814.8475341796875, 829.2201538085938, 843.5927734375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 11.0, 5.0, 7.0, 14.0, 15.0, 22.0, 11.0, 20.0, 24.0, 33.0, 32.0, 33.0, 41.0, 45.0, 44.0, 44.0, 59.0, 52.0, 73.0, 50.0, 47.0, 35.0, 45.0, 32.0, 43.0, 31.0, 32.0, 30.0, 15.0, 7.0, 16.0, 15.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-50.80261993408203, -49.36222839355469, -47.921836853027344, -46.4814453125, -45.041053771972656, -43.60065841674805, -42.1602668762207, -40.71987533569336, -39.279483795166016, -37.83909225463867, -36.39870071411133, -34.958309173583984, -33.517913818359375, -32.07752227783203, -30.637130737304688, -29.196739196777344, -27.75634765625, -26.315956115722656, -24.875564575195312, -23.435171127319336, -21.994779586791992, -20.55438804626465, -19.113994598388672, -17.673603057861328, -16.233211517333984, -14.79281997680664, -13.35242748260498, -11.91203498840332, -10.471643447875977, -9.031251907348633, -7.590859413146973, -6.1504669189453125, -4.710071563720703, -3.269679546356201, -1.8292875289916992, -0.38889551162719727, 1.0514965057373047, 2.4918885231018066, 3.9322805404663086, 5.372673034667969, 6.8130645751953125, 8.253456115722656, 9.693848609924316, 11.134241104125977, 12.57463264465332, 14.015024185180664, 15.455416679382324, 16.895809173583984, 18.336200714111328, 19.776592254638672, 21.216983795166016, 22.657377243041992, 24.097768783569336, 25.53816032409668, 26.978553771972656, 28.4189453125, 29.859336853027344, 31.299728393554688, 32.74011993408203, 34.180511474609375, 35.62090301513672, 37.06129837036133, 38.50168991088867, 39.942081451416016, 41.38247299194336]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 3.0, 7.0, 6.0, 10.0, 9.0, 11.0, 13.0, 16.0, 27.0, 26.0, 31.0, 28.0, 40.0, 38.0, 38.0, 41.0, 61.0, 51.0, 57.0, 51.0, 50.0, 60.0, 59.0, 38.0, 30.0, 36.0, 28.0, 27.0, 26.0, 20.0, 17.0, 12.0, 7.0, 7.0, 10.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.4296875, -4.3089599609375, -4.188232421875, -4.0675048828125, -3.94677734375, -3.8260498046875, -3.705322265625, -3.5845947265625, -3.4638671875, -3.3431396484375, -3.222412109375, -3.1016845703125, -2.98095703125, -2.8602294921875, -2.739501953125, -2.6187744140625, -2.498046875, -2.3773193359375, -2.256591796875, -2.1358642578125, -2.01513671875, -1.8944091796875, -1.773681640625, -1.6529541015625, -1.5322265625, -1.4114990234375, -1.290771484375, -1.1700439453125, -1.04931640625, -0.9285888671875, -0.807861328125, -0.6871337890625, -0.56640625, -0.4456787109375, -0.324951171875, -0.2042236328125, -0.08349609375, 0.0372314453125, 0.157958984375, 0.2786865234375, 0.3994140625, 0.5201416015625, 0.640869140625, 0.7615966796875, 0.88232421875, 1.0030517578125, 1.123779296875, 1.2445068359375, 1.365234375, 1.4859619140625, 1.606689453125, 1.7274169921875, 1.84814453125, 1.9688720703125, 2.089599609375, 2.2103271484375, 2.3310546875, 2.4517822265625, 2.572509765625, 2.6932373046875, 2.81396484375, 2.9346923828125, 3.055419921875, 3.1761474609375, 3.296875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 7.0, 5.0, 13.0, 23.0, 24.0, 35.0, 47.0, 46.0, 82.0, 150.0, 227.0, 401.0, 851.0, 2916.0, 31941.0, 2838493.0, 1295524.0, 19540.0, 2301.0, 700.0, 323.0, 229.0, 128.0, 80.0, 49.0, 48.0, 24.0, 25.0, 16.0, 11.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.1875, -31.338623046875, -30.48974609375, -29.640869140625, -28.7919921875, -27.943115234375, -27.09423828125, -26.245361328125, -25.396484375, -24.547607421875, -23.69873046875, -22.849853515625, -22.0009765625, -21.152099609375, -20.30322265625, -19.454345703125, -18.60546875, -17.756591796875, -16.90771484375, -16.058837890625, -15.2099609375, -14.361083984375, -13.51220703125, -12.663330078125, -11.814453125, -10.965576171875, -10.11669921875, -9.267822265625, -8.4189453125, -7.570068359375, -6.72119140625, -5.872314453125, -5.0234375, -4.174560546875, -3.32568359375, -2.476806640625, -1.6279296875, -0.779052734375, 0.06982421875, 0.918701171875, 1.767578125, 2.616455078125, 3.46533203125, 4.314208984375, 5.1630859375, 6.011962890625, 6.86083984375, 7.709716796875, 8.55859375, 9.407470703125, 10.25634765625, 11.105224609375, 11.9541015625, 12.802978515625, 13.65185546875, 14.500732421875, 15.349609375, 16.198486328125, 17.04736328125, 17.896240234375, 18.7451171875, 19.593994140625, 20.44287109375, 21.291748046875, 22.140625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 6.0, 18.0, 20.0, 58.0, 68.0, 99.0, 184.0, 266.0, 455.0, 600.0, 761.0, 570.0, 364.0, 213.0, 148.0, 89.0, 45.0, 32.0, 24.0, 14.0, 12.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.4375, -17.9437255859375, -17.449951171875, -16.9561767578125, -16.46240234375, -15.9686279296875, -15.474853515625, -14.9810791015625, -14.4873046875, -13.9935302734375, -13.499755859375, -13.0059814453125, -12.51220703125, -12.0184326171875, -11.524658203125, -11.0308837890625, -10.537109375, -10.0433349609375, -9.549560546875, -9.0557861328125, -8.56201171875, -8.0682373046875, -7.574462890625, -7.0806884765625, -6.5869140625, -6.0931396484375, -5.599365234375, -5.1055908203125, -4.61181640625, -4.1180419921875, -3.624267578125, -3.1304931640625, -2.63671875, -2.1429443359375, -1.649169921875, -1.1553955078125, -0.66162109375, -0.1678466796875, 0.325927734375, 0.8197021484375, 1.3134765625, 1.8072509765625, 2.301025390625, 2.7947998046875, 3.28857421875, 3.7823486328125, 4.276123046875, 4.7698974609375, 5.263671875, 5.7574462890625, 6.251220703125, 6.7449951171875, 7.23876953125, 7.7325439453125, 8.226318359375, 8.7200927734375, 9.2138671875, 9.7076416015625, 10.201416015625, 10.6951904296875, 11.18896484375, 11.6827392578125, 12.176513671875, 12.6702880859375, 13.1640625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 18.0, 31.0, 59.0, 53.0, 120.0, 242.0, 405.0, 829.0, 2213.0, 13686.0, 240437.0, 3583583.0, 330970.0, 17081.0, 2599.0, 922.0, 448.0, 209.0, 152.0, 73.0, 47.0, 33.0, 14.0, 10.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.5, -37.474609375, -36.44921875, -35.423828125, -34.3984375, -33.373046875, -32.34765625, -31.322265625, -30.296875, -29.271484375, -28.24609375, -27.220703125, -26.1953125, -25.169921875, -24.14453125, -23.119140625, -22.09375, -21.068359375, -20.04296875, -19.017578125, -17.9921875, -16.966796875, -15.94140625, -14.916015625, -13.890625, -12.865234375, -11.83984375, -10.814453125, -9.7890625, -8.763671875, -7.73828125, -6.712890625, -5.6875, -4.662109375, -3.63671875, -2.611328125, -1.5859375, -0.560546875, 0.46484375, 1.490234375, 2.515625, 3.541015625, 4.56640625, 5.591796875, 6.6171875, 7.642578125, 8.66796875, 9.693359375, 10.71875, 11.744140625, 12.76953125, 13.794921875, 14.8203125, 15.845703125, 16.87109375, 17.896484375, 18.921875, 19.947265625, 20.97265625, 21.998046875, 23.0234375, 24.048828125, 25.07421875, 26.099609375, 27.125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [5.0, 43.0, 340.0, 494.0, 129.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.865354537963867, -15.233367919921875, -8.6013822555542, -1.9693965911865234, 4.662590026855469, 11.294576644897461, 17.92656135559082, 24.558549880981445, 31.190534591674805, 37.8225212097168, 44.454505920410156, 51.08649444580078, 57.71847915649414, 64.3504638671875, 70.98245239257812, 77.61444091796875, 84.24642181396484, 90.87841033935547, 97.51039123535156, 104.14237976074219, 110.77436828613281, 117.40635681152344, 124.03833770751953, 130.67031860351562, 137.30230712890625, 143.93429565429688, 150.5662841796875, 157.19827270507812, 163.8302459716797, 170.4622344970703, 177.09422302246094, 183.72621154785156, 190.3582000732422, 196.9901885986328, 203.62217712402344, 210.254150390625, 216.88613891601562, 223.51812744140625, 230.15011596679688, 236.7821044921875, 243.41409301757812, 250.04608154296875, 256.6780700683594, 263.31005859375, 269.9420471191406, 276.57403564453125, 283.20599365234375, 289.8380126953125, 296.469970703125, 303.1019592285156, 309.73394775390625, 316.3659362792969, 322.9979248046875, 329.6299133300781, 336.26190185546875, 342.89385986328125, 349.52587890625, 356.1578674316406, 362.78985595703125, 369.4218444824219, 376.0538330078125, 382.6858215332031, 389.31781005859375, 395.94976806640625, 402.5817565917969]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 14.0, 10.0, 11.0, 14.0, 23.0, 27.0, 31.0, 29.0, 33.0, 29.0, 37.0, 39.0, 42.0, 47.0, 45.0, 42.0, 40.0, 34.0, 51.0, 40.0, 36.0, 40.0, 46.0, 32.0, 32.0, 23.0, 24.0, 14.0, 13.0, 18.0, 10.0, 12.0, 8.0, 13.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.60449981689453, -34.446632385253906, -33.28876495361328, -32.13090133666992, -30.973033905029297, -29.815166473388672, -28.65730094909668, -27.499435424804688, -26.341567993164062, -25.183700561523438, -24.025835037231445, -22.867969512939453, -21.710102081298828, -20.552234649658203, -19.39436912536621, -18.23650360107422, -17.078636169433594, -15.920769691467285, -14.762903213500977, -13.605036735534668, -12.44717025756836, -11.28930377960205, -10.131437301635742, -8.973570823669434, -7.815704345703125, -6.657837867736816, -5.499971389770508, -4.342104911804199, -3.1842384338378906, -2.026371955871582, -0.8685054779052734, 0.28936100006103516, 1.4472274780273438, 2.6050939559936523, 3.762960433959961, 4.9208269119262695, 6.078693389892578, 7.236559867858887, 8.394426345825195, 9.552292823791504, 10.710159301757812, 11.868025779724121, 13.02589225769043, 14.183758735656738, 15.341625213623047, 16.499492645263672, 17.657358169555664, 18.815223693847656, 19.97309112548828, 21.130958557128906, 22.2888240814209, 23.44668960571289, 24.604557037353516, 25.76242446899414, 26.920289993286133, 28.078155517578125, 29.23602294921875, 30.393890380859375, 31.551755905151367, 32.70962142944336, 33.867488861083984, 35.02535629272461, 36.18321990966797, 37.341087341308594, 38.49895477294922]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 13.0, 7.0, 12.0, 9.0, 22.0, 20.0, 29.0, 20.0, 34.0, 27.0, 22.0, 28.0, 34.0, 46.0, 49.0, 39.0, 44.0, 42.0, 44.0, 42.0, 40.0, 35.0, 37.0, 49.0, 44.0, 26.0, 24.0, 28.0, 23.0, 19.0, 17.0, 16.0, 9.0, 10.0, 7.0, 3.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16796875, -3.06109619140625, -2.9542236328125, -2.84735107421875, -2.740478515625, -2.63360595703125, -2.5267333984375, -2.41986083984375, -2.31298828125, -2.20611572265625, -2.0992431640625, -1.99237060546875, -1.885498046875, -1.77862548828125, -1.6717529296875, -1.56488037109375, -1.4580078125, -1.35113525390625, -1.2442626953125, -1.13739013671875, -1.030517578125, -0.92364501953125, -0.8167724609375, -0.70989990234375, -0.60302734375, -0.49615478515625, -0.3892822265625, -0.28240966796875, -0.175537109375, -0.06866455078125, 0.0382080078125, 0.14508056640625, 0.251953125, 0.35882568359375, 0.4656982421875, 0.57257080078125, 0.679443359375, 0.78631591796875, 0.8931884765625, 1.00006103515625, 1.10693359375, 1.21380615234375, 1.3206787109375, 1.42755126953125, 1.534423828125, 1.64129638671875, 1.7481689453125, 1.85504150390625, 1.9619140625, 2.06878662109375, 2.1756591796875, 2.28253173828125, 2.389404296875, 2.49627685546875, 2.6031494140625, 2.71002197265625, 2.81689453125, 2.92376708984375, 3.0306396484375, 3.13751220703125, 3.244384765625, 3.35125732421875, 3.4581298828125, 3.56500244140625, 3.671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 14.0, 23.0, 33.0, 41.0, 47.0, 77.0, 113.0, 190.0, 252.0, 358.0, 542.0, 857.0, 1224.0, 1870.0, 2982.0, 4526.0, 7232.0, 11770.0, 19365.0, 32593.0, 56667.0, 98627.0, 162869.0, 211582.0, 173663.0, 108355.0, 61872.0, 35399.0, 20622.0, 12582.0, 7912.0, 4980.0, 3189.0, 2063.0, 1379.0, 851.0, 611.0, 383.0, 298.0, 173.0, 136.0, 75.0, 52.0, 32.0, 20.0, 24.0, 10.0, 8.0, 2.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1201171875, -0.11605644226074219, -0.11199569702148438, -0.10793495178222656, -0.10387420654296875, -0.09981346130371094, -0.09575271606445312, -0.09169197082519531, -0.0876312255859375, -0.08357048034667969, -0.07950973510742188, -0.07544898986816406, -0.07138824462890625, -0.06732749938964844, -0.06326675415039062, -0.05920600891113281, -0.055145263671875, -0.05108451843261719, -0.047023773193359375, -0.04296302795410156, -0.03890228271484375, -0.03484153747558594, -0.030780792236328125, -0.026720046997070312, -0.0226593017578125, -0.018598556518554688, -0.014537811279296875, -0.010477066040039062, -0.00641632080078125, -0.0023555755615234375, 0.001705169677734375, 0.0057659149169921875, 0.00982666015625, 0.013887405395507812, 0.017948150634765625, 0.022008895874023438, 0.02606964111328125, 0.030130386352539062, 0.034191131591796875, 0.03825187683105469, 0.0423126220703125, 0.04637336730957031, 0.050434112548828125, 0.05449485778808594, 0.05855560302734375, 0.06261634826660156, 0.06667709350585938, 0.07073783874511719, 0.074798583984375, 0.07885932922363281, 0.08292007446289062, 0.08698081970214844, 0.09104156494140625, 0.09510231018066406, 0.09916305541992188, 0.10322380065917969, 0.1072845458984375, 0.11134529113769531, 0.11540603637695312, 0.11946678161621094, 0.12352752685546875, 0.12758827209472656, 0.13164901733398438, 0.1357097625732422, 0.1397705078125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 9.0, 14.0, 10.0, 10.0, 26.0, 21.0, 19.0, 21.0, 21.0, 25.0, 38.0, 34.0, 41.0, 30.0, 32.0, 41.0, 45.0, 33.0, 1069.0, 35.0, 41.0, 48.0, 30.0, 41.0, 29.0, 35.0, 26.0, 22.0, 19.0, 17.0, 16.0, 20.0, 18.0, 13.0, 9.0, 10.0, 11.0, 8.0, 3.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.12109375, -2.059417724609375, -1.99774169921875, -1.936065673828125, -1.8743896484375, -1.812713623046875, -1.75103759765625, -1.689361572265625, -1.627685546875, -1.566009521484375, -1.50433349609375, -1.442657470703125, -1.3809814453125, -1.319305419921875, -1.25762939453125, -1.195953369140625, -1.13427734375, -1.072601318359375, -1.01092529296875, -0.949249267578125, -0.8875732421875, -0.825897216796875, -0.76422119140625, -0.702545166015625, -0.640869140625, -0.579193115234375, -0.51751708984375, -0.455841064453125, -0.3941650390625, -0.332489013671875, -0.27081298828125, -0.209136962890625, -0.1474609375, -0.085784912109375, -0.02410888671875, 0.037567138671875, 0.0992431640625, 0.160919189453125, 0.22259521484375, 0.284271240234375, 0.345947265625, 0.407623291015625, 0.46929931640625, 0.530975341796875, 0.5926513671875, 0.654327392578125, 0.71600341796875, 0.777679443359375, 0.83935546875, 0.901031494140625, 0.96270751953125, 1.024383544921875, 1.0860595703125, 1.147735595703125, 1.20941162109375, 1.271087646484375, 1.332763671875, 1.394439697265625, 1.45611572265625, 1.517791748046875, 1.5794677734375, 1.641143798828125, 1.70281982421875, 1.764495849609375, 1.826171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 8.0, 9.0, 18.0, 29.0, 48.0, 71.0, 108.0, 180.0, 224.0, 344.0, 555.0, 803.0, 1227.0, 1877.0, 2957.0, 4457.0, 7111.0, 11283.0, 18208.0, 30401.0, 51324.0, 87375.0, 141241.0, 1238460.0, 183333.0, 125125.0, 75942.0, 44338.0, 26091.0, 15999.0, 10128.0, 6227.0, 4181.0, 2613.0, 1627.0, 1090.0, 725.0, 477.0, 301.0, 211.0, 148.0, 90.0, 71.0, 35.0, 28.0, 14.0, 15.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.12396240234375, -0.12030220031738281, -0.11664199829101562, -0.11298179626464844, -0.10932159423828125, -0.10566139221191406, -0.10200119018554688, -0.09834098815917969, -0.0946807861328125, -0.09102058410644531, -0.08736038208007812, -0.08370018005371094, -0.08003997802734375, -0.07637977600097656, -0.07271957397460938, -0.06905937194824219, -0.065399169921875, -0.06173896789550781, -0.058078765869140625, -0.05441856384277344, -0.05075836181640625, -0.04709815979003906, -0.043437957763671875, -0.03977775573730469, -0.0361175537109375, -0.03245735168457031, -0.028797149658203125, -0.025136947631835938, -0.02147674560546875, -0.017816543579101562, -0.014156341552734375, -0.010496139526367188, -0.0068359375, -0.0031757354736328125, 0.000484466552734375, 0.0041446685791015625, 0.00780487060546875, 0.011465072631835938, 0.015125274658203125, 0.018785476684570312, 0.0224456787109375, 0.026105880737304688, 0.029766082763671875, 0.03342628479003906, 0.03708648681640625, 0.04074668884277344, 0.044406890869140625, 0.04806709289550781, 0.051727294921875, 0.05538749694824219, 0.059047698974609375, 0.06270790100097656, 0.06636810302734375, 0.07002830505371094, 0.07368850708007812, 0.07734870910644531, 0.0810089111328125, 0.08466911315917969, 0.08832931518554688, 0.09198951721191406, 0.09564971923828125, 0.09930992126464844, 0.10297012329101562, 0.10663032531738281, 0.11029052734375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 7.0, 4.0, 6.0, 9.0, 10.0, 13.0, 12.0, 18.0, 27.0, 31.0, 39.0, 44.0, 51.0, 40.0, 71.0, 78.0, 60.0, 61.0, 66.0, 69.0, 38.0, 30.0, 49.0, 45.0, 19.0, 22.0, 15.0, 15.0, 8.0, 10.0, 10.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004169940948486328, -0.000401865690946579, -0.00038673728704452515, -0.0003716088831424713, -0.0003564804792404175, -0.00034135207533836365, -0.0003262236714363098, -0.000311095267534256, -0.00029596686363220215, -0.0002808384597301483, -0.0002657100558280945, -0.00025058165192604065, -0.00023545324802398682, -0.00022032484412193298, -0.00020519644021987915, -0.00019006803631782532, -0.00017493963241577148, -0.00015981122851371765, -0.00014468282461166382, -0.00012955442070960999, -0.00011442601680755615, -9.929761290550232e-05, -8.416920900344849e-05, -6.904080510139465e-05, -5.391240119934082e-05, -3.878399729728699e-05, -2.3655593395233154e-05, -8.527189493179321e-06, 6.601214408874512e-06, 2.1729618310928345e-05, 3.685802221298218e-05, 5.198642611503601e-05, 6.711483001708984e-05, 8.224323391914368e-05, 9.737163782119751e-05, 0.00011250004172325134, 0.00012762844562530518, 0.000142756849527359, 0.00015788525342941284, 0.00017301365733146667, 0.0001881420612335205, 0.00020327046513557434, 0.00021839886903762817, 0.000233527272939682, 0.00024865567684173584, 0.00026378408074378967, 0.0002789124846458435, 0.00029404088854789734, 0.00030916929244995117, 0.000324297696352005, 0.00033942610025405884, 0.00035455450415611267, 0.0003696829080581665, 0.00038481131196022034, 0.00039993971586227417, 0.000415068119764328, 0.00043019652366638184, 0.00044532492756843567, 0.0004604533314704895, 0.00047558173537254333, 0.0004907101392745972, 0.000505838543176651, 0.0005209669470787048, 0.0005360953509807587, 0.0005512237548828125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 12.0, 3.0, 21.0, 23.0, 17.0, 27.0, 28.0, 52.0, 73.0, 94.0, 113.0, 132.0, 248.0, 409.0, 1050.0, 192225.0, 850208.0, 2409.0, 448.0, 228.0, 174.0, 156.0, 101.0, 86.0, 46.0, 40.0, 31.0, 23.0, 18.0, 9.0, 10.0, 6.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01009368896484375, -0.009806513786315918, -0.009519338607788086, -0.009232163429260254, -0.008944988250732422, -0.00865781307220459, -0.008370637893676758, -0.008083462715148926, -0.007796287536621094, -0.007509112358093262, -0.00722193717956543, -0.006934762001037598, -0.006647586822509766, -0.006360411643981934, -0.0060732364654541016, -0.0057860612869262695, -0.0054988861083984375, -0.0052117109298706055, -0.0049245357513427734, -0.004637360572814941, -0.004350185394287109, -0.004063010215759277, -0.0037758350372314453, -0.0034886598587036133, -0.0032014846801757812, -0.0029143095016479492, -0.002627134323120117, -0.002339959144592285, -0.002052783966064453, -0.001765608787536621, -0.001478433609008789, -0.001191258430480957, -0.000904083251953125, -0.000616908073425293, -0.00032973289489746094, -4.2557716369628906e-05, 0.0002446174621582031, 0.0005317926406860352, 0.0008189678192138672, 0.0011061429977416992, 0.0013933181762695312, 0.0016804933547973633, 0.0019676685333251953, 0.0022548437118530273, 0.0025420188903808594, 0.0028291940689086914, 0.0031163692474365234, 0.0034035444259643555, 0.0036907196044921875, 0.0039778947830200195, 0.0042650699615478516, 0.004552245140075684, 0.004839420318603516, 0.005126595497131348, 0.00541377067565918, 0.005700945854187012, 0.005988121032714844, 0.006275296211242676, 0.006562471389770508, 0.00684964656829834, 0.007136821746826172, 0.007423996925354004, 0.007711172103881836, 0.007998347282409668, 0.0082855224609375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 9.0, 54.0, 143.0, 323.0, 277.0, 146.0, 45.0, 13.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007299691787920892, -0.0007018558098934591, -0.0006737424992024899, -0.0006456291303038597, -0.0006175157614052296, -0.0005894023925065994, -0.0005612890236079693, -0.0005331757129170001, -0.0005050623440183699, -0.00047694897511973977, -0.0004488356353249401, -0.0004207222955301404, -0.00039260892663151026, -0.0003644955577328801, -0.00033638221793808043, -0.00030826887814328074, -0.0002801555092446506, -0.00025204214034602046, -0.00022392880055122077, -0.00019581544620450586, -0.00016770209185779095, -0.00013958873751107603, -0.00011147538316436112, -8.33620288176462e-05, -5.524867447093129e-05, -2.7135320124216378e-05, 9.780342224985361e-07, 2.909138856921345e-05, 5.7204742915928364e-05, 8.531809726264328e-05, 0.00011343145160935819, 0.0001415448059560731, 0.00016965821851044893, 0.00019777157285716385, 0.00022588492720387876, 0.00025399826699867845, 0.0002821116358973086, 0.00031022500479593873, 0.0003383383445907384, 0.0003664516843855381, 0.00039456505328416824, 0.0004226784221827984, 0.00045079176197759807, 0.00047890510177239776, 0.0005070184706710279, 0.000535131839569658, 0.0005632451502606273, 0.0005913585191592574, 0.0006194718880578876, 0.0006475852569565177, 0.0006756986258551478, 0.0007038119365461171, 0.0007319253054447472, 0.0007600386743433774, 0.0007881519850343466, 0.0008162653539329767, 0.0008443787228316069, 0.000872492091730237, 0.0009006054606288671, 0.0009287187713198364, 0.0009568321402184665, 0.0009849454509094357, 0.0010130588198080659, 0.001041172188706696, 0.0010692855576053262]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 10.0, 8.0, 15.0, 10.0, 10.0, 22.0, 24.0, 19.0, 21.0, 16.0, 41.0, 36.0, 36.0, 37.0, 41.0, 48.0, 38.0, 46.0, 41.0, 34.0, 42.0, 32.0, 34.0, 35.0, 26.0, 35.0, 39.0, 20.0, 21.0, 30.0, 22.0, 20.0, 16.0, 8.0, 12.0, 11.0, 11.0, 4.0, 6.0, 5.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020772218704223633, -0.00020059477537870407, -0.00019346736371517181, -0.00018633995205163956, -0.0001792125403881073, -0.00017208512872457504, -0.00016495771706104279, -0.00015783030539751053, -0.00015070289373397827, -0.00014357548207044601, -0.00013644807040691376, -0.0001293206587433815, -0.00012219324707984924, -0.00011506583541631699, -0.00010793842375278473, -0.00010081101208925247, -9.368360042572021e-05, -8.655618876218796e-05, -7.94287770986557e-05, -7.230136543512344e-05, -6.517395377159119e-05, -5.804654210805893e-05, -5.091913044452667e-05, -4.3791718780994415e-05, -3.666430711746216e-05, -2.95368954539299e-05, -2.2409483790397644e-05, -1.5282072126865387e-05, -8.15466046333313e-06, -1.0272487998008728e-06, 6.100162863731384e-06, 1.3227574527263641e-05, 2.03549861907959e-05, 2.7482397854328156e-05, 3.460980951786041e-05, 4.173722118139267e-05, 4.886463284492493e-05, 5.5992044508457184e-05, 6.311945617198944e-05, 7.02468678355217e-05, 7.737427949905396e-05, 8.450169116258621e-05, 9.162910282611847e-05, 9.875651448965073e-05, 0.00010588392615318298, 0.00011301133781671524, 0.0001201387494802475, 0.00012726616114377975, 0.000134393572807312, 0.00014152098447084427, 0.00014864839613437653, 0.00015577580779790878, 0.00016290321946144104, 0.0001700306311249733, 0.00017715804278850555, 0.0001842854544520378, 0.00019141286611557007, 0.00019854027777910233, 0.00020566768944263458, 0.00021279510110616684, 0.0002199225127696991, 0.00022704992443323135, 0.0002341773360967636, 0.00024130474776029587, 0.0002484321594238281]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 13.0, 7.0, 12.0, 9.0, 22.0, 20.0, 29.0, 20.0, 34.0, 27.0, 22.0, 28.0, 34.0, 46.0, 49.0, 39.0, 44.0, 42.0, 44.0, 42.0, 39.0, 36.0, 37.0, 48.0, 45.0, 26.0, 24.0, 28.0, 23.0, 19.0, 17.0, 16.0, 9.0, 10.0, 7.0, 3.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16796875, -3.06109619140625, -2.9542236328125, -2.84735107421875, -2.740478515625, -2.63360595703125, -2.5267333984375, -2.41986083984375, -2.31298828125, -2.20611572265625, -2.0992431640625, -1.99237060546875, -1.885498046875, -1.77862548828125, -1.6717529296875, -1.56488037109375, -1.4580078125, -1.35113525390625, -1.2442626953125, -1.13739013671875, -1.030517578125, -0.92364501953125, -0.8167724609375, -0.70989990234375, -0.60302734375, -0.49615478515625, -0.3892822265625, -0.28240966796875, -0.175537109375, -0.06866455078125, 0.0382080078125, 0.14508056640625, 0.251953125, 0.35882568359375, 0.4656982421875, 0.57257080078125, 0.679443359375, 0.78631591796875, 0.8931884765625, 1.00006103515625, 1.10693359375, 1.21380615234375, 1.3206787109375, 1.42755126953125, 1.534423828125, 1.64129638671875, 1.7481689453125, 1.85504150390625, 1.9619140625, 2.06878662109375, 2.1756591796875, 2.28253173828125, 2.389404296875, 2.49627685546875, 2.6031494140625, 2.71002197265625, 2.81689453125, 2.92376708984375, 3.0306396484375, 3.13751220703125, 3.244384765625, 3.35125732421875, 3.4581298828125, 3.56500244140625, 3.671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 13.0, 15.0, 21.0, 24.0, 32.0, 41.0, 54.0, 69.0, 92.0, 147.0, 171.0, 286.0, 362.0, 636.0, 963.0, 1723.0, 3329.0, 7274.0, 17375.0, 44204.0, 126292.0, 391240.0, 298319.0, 94810.0, 34353.0, 13797.0, 6035.0, 2860.0, 1461.0, 847.0, 505.0, 329.0, 239.0, 162.0, 123.0, 91.0, 77.0, 35.0, 26.0, 31.0, 23.0, 15.0, 11.0, 11.0, 7.0, 4.0, 6.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.8338623046875, -2.732177734375, -2.6304931640625, -2.52880859375, -2.4271240234375, -2.325439453125, -2.2237548828125, -2.1220703125, -2.0203857421875, -1.918701171875, -1.8170166015625, -1.71533203125, -1.6136474609375, -1.511962890625, -1.4102783203125, -1.30859375, -1.2069091796875, -1.105224609375, -1.0035400390625, -0.90185546875, -0.8001708984375, -0.698486328125, -0.5968017578125, -0.4951171875, -0.3934326171875, -0.291748046875, -0.1900634765625, -0.08837890625, 0.0133056640625, 0.114990234375, 0.2166748046875, 0.318359375, 0.4200439453125, 0.521728515625, 0.6234130859375, 0.72509765625, 0.8267822265625, 0.928466796875, 1.0301513671875, 1.1318359375, 1.2335205078125, 1.335205078125, 1.4368896484375, 1.53857421875, 1.6402587890625, 1.741943359375, 1.8436279296875, 1.9453125, 2.0469970703125, 2.148681640625, 2.2503662109375, 2.35205078125, 2.4537353515625, 2.555419921875, 2.6571044921875, 2.7587890625, 2.8604736328125, 2.962158203125, 3.0638427734375, 3.16552734375, 3.2672119140625, 3.368896484375, 3.4705810546875, 3.572265625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 11.0, 5.0, 9.0, 8.0, 15.0, 9.0, 19.0, 23.0, 26.0, 25.0, 31.0, 39.0, 33.0, 42.0, 51.0, 47.0, 71.0, 222.0, 1739.0, 123.0, 65.0, 60.0, 47.0, 43.0, 44.0, 36.0, 25.0, 30.0, 24.0, 18.0, 17.0, 17.0, 13.0, 10.0, 11.0, 5.0, 4.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.9765625, -12.59765625, -12.21875, -11.83984375, -11.4609375, -11.08203125, -10.703125, -10.32421875, -9.9453125, -9.56640625, -9.1875, -8.80859375, -8.4296875, -8.05078125, -7.671875, -7.29296875, -6.9140625, -6.53515625, -6.15625, -5.77734375, -5.3984375, -5.01953125, -4.640625, -4.26171875, -3.8828125, -3.50390625, -3.125, -2.74609375, -2.3671875, -1.98828125, -1.609375, -1.23046875, -0.8515625, -0.47265625, -0.09375, 0.28515625, 0.6640625, 1.04296875, 1.421875, 1.80078125, 2.1796875, 2.55859375, 2.9375, 3.31640625, 3.6953125, 4.07421875, 4.453125, 4.83203125, 5.2109375, 5.58984375, 5.96875, 6.34765625, 6.7265625, 7.10546875, 7.484375, 7.86328125, 8.2421875, 8.62109375, 9.0, 9.37890625, 9.7578125, 10.13671875, 10.515625, 10.89453125, 11.2734375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 12.0, 13.0, 20.0, 15.0, 22.0, 31.0, 41.0, 39.0, 52.0, 96.0, 161.0, 283.0, 557.0, 1704.0, 8734.0, 2820271.0, 305889.0, 5354.0, 1227.0, 452.0, 243.0, 134.0, 78.0, 47.0, 41.0, 26.0, 26.0, 19.0, 16.0, 17.0, 10.0, 11.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.390625, -25.507568359375, -24.62451171875, -23.741455078125, -22.8583984375, -21.975341796875, -21.09228515625, -20.209228515625, -19.326171875, -18.443115234375, -17.56005859375, -16.677001953125, -15.7939453125, -14.910888671875, -14.02783203125, -13.144775390625, -12.26171875, -11.378662109375, -10.49560546875, -9.612548828125, -8.7294921875, -7.846435546875, -6.96337890625, -6.080322265625, -5.197265625, -4.314208984375, -3.43115234375, -2.548095703125, -1.6650390625, -0.781982421875, 0.10107421875, 0.984130859375, 1.8671875, 2.750244140625, 3.63330078125, 4.516357421875, 5.3994140625, 6.282470703125, 7.16552734375, 8.048583984375, 8.931640625, 9.814697265625, 10.69775390625, 11.580810546875, 12.4638671875, 13.346923828125, 14.22998046875, 15.113037109375, 15.99609375, 16.879150390625, 17.76220703125, 18.645263671875, 19.5283203125, 20.411376953125, 21.29443359375, 22.177490234375, 23.060546875, 23.943603515625, 24.82666015625, 25.709716796875, 26.5927734375, 27.475830078125, 28.35888671875, 29.241943359375, 30.125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [9.0, 802.0, 205.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.181434631347656, -4.676226615905762, 0.8289813995361328, 6.334190368652344, 11.839397430419922, 17.3446044921875, 22.849815368652344, 28.355022430419922, 33.8602294921875, 39.36543655395508, 44.870643615722656, 50.3758544921875, 55.88106155395508, 61.386268615722656, 66.8914794921875, 72.39668273925781, 77.90189361572266, 83.4071044921875, 88.91230773925781, 94.41751861572266, 99.9227294921875, 105.42793273925781, 110.93314361572266, 116.4383544921875, 121.94355773925781, 127.44876861572266, 132.9539794921875, 138.4591827392578, 143.96438598632812, 149.4696044921875, 154.9748077392578, 160.48001098632812, 165.9852294921875, 171.4904327392578, 176.9956512451172, 182.5008544921875, 188.0060577392578, 193.51126098632812, 199.0164794921875, 204.5216827392578, 210.02688598632812, 215.53208923339844, 221.0373077392578, 226.54251098632812, 232.04771423339844, 237.55291748046875, 243.05813598632812, 248.56333923339844, 254.0685577392578, 259.5737609863281, 265.0789794921875, 270.58416748046875, 276.0893859863281, 281.5946044921875, 287.09979248046875, 292.6050109863281, 298.1102294921875, 303.6154479980469, 309.1206359863281, 314.6258544921875, 320.1310729980469, 325.6362609863281, 331.1414794921875, 336.6466979980469, 342.1518859863281]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 5.0, 6.0, 3.0, 3.0, 7.0, 7.0, 13.0, 17.0, 16.0, 26.0, 26.0, 23.0, 27.0, 32.0, 22.0, 37.0, 27.0, 36.0, 39.0, 32.0, 43.0, 53.0, 47.0, 33.0, 47.0, 45.0, 36.0, 37.0, 35.0, 26.0, 29.0, 23.0, 19.0, 11.0, 19.0, 17.0, 12.0, 17.0, 11.0, 9.0, 3.0, 10.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-39.39646530151367, -38.245079040527344, -37.093692779541016, -35.94230270385742, -34.790916442871094, -33.639530181884766, -32.48814392089844, -31.33675765991211, -30.18536949157715, -29.03398323059082, -27.88259506225586, -26.73120880126953, -25.579822540283203, -24.428434371948242, -23.277048110961914, -22.125659942626953, -20.974273681640625, -19.822887420654297, -18.671499252319336, -17.520112991333008, -16.368724822998047, -15.217338562011719, -14.06595230102539, -12.914565086364746, -11.763177871704102, -10.611790657043457, -9.460403442382812, -8.309017181396484, -7.15762996673584, -6.006242752075195, -4.854856014251709, -3.7034692764282227, -2.5520782470703125, -1.400691270828247, -0.24930429458618164, 0.9020826816558838, 2.053469657897949, 3.2048568725585938, 4.35624361038208, 5.507630348205566, 6.659017562866211, 7.8104047775268555, 8.9617919921875, 10.113178253173828, 11.264565467834473, 12.415952682495117, 13.567338943481445, 14.71872615814209, 15.870113372802734, 17.021499633789062, 18.172887802124023, 19.32427406311035, 20.475662231445312, 21.62704849243164, 22.77843475341797, 23.929821014404297, 25.081209182739258, 26.232595443725586, 27.383983612060547, 28.535369873046875, 29.686756134033203, 30.838144302368164, 31.989530563354492, 33.14091873168945, 34.29230499267578]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 3.0, 12.0, 7.0, 9.0, 10.0, 19.0, 17.0, 24.0, 23.0, 26.0, 28.0, 25.0, 28.0, 30.0, 36.0, 45.0, 53.0, 40.0, 35.0, 37.0, 50.0, 40.0, 39.0, 36.0, 38.0, 39.0, 46.0, 30.0, 26.0, 23.0, 20.0, 23.0, 17.0, 12.0, 12.0, 6.0, 10.0, 3.0, 5.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.185546875, -3.077117919921875, -2.96868896484375, -2.860260009765625, -2.7518310546875, -2.643402099609375, -2.53497314453125, -2.426544189453125, -2.318115234375, -2.209686279296875, -2.10125732421875, -1.992828369140625, -1.8843994140625, -1.775970458984375, -1.66754150390625, -1.559112548828125, -1.45068359375, -1.342254638671875, -1.23382568359375, -1.125396728515625, -1.0169677734375, -0.908538818359375, -0.80010986328125, -0.691680908203125, -0.583251953125, -0.474822998046875, -0.36639404296875, -0.257965087890625, -0.1495361328125, -0.041107177734375, 0.06732177734375, 0.175750732421875, 0.2841796875, 0.392608642578125, 0.50103759765625, 0.609466552734375, 0.7178955078125, 0.826324462890625, 0.93475341796875, 1.043182373046875, 1.151611328125, 1.260040283203125, 1.36846923828125, 1.476898193359375, 1.5853271484375, 1.693756103515625, 1.80218505859375, 1.910614013671875, 2.01904296875, 2.127471923828125, 2.23590087890625, 2.344329833984375, 2.4527587890625, 2.561187744140625, 2.66961669921875, 2.778045654296875, 2.886474609375, 2.994903564453125, 3.10333251953125, 3.211761474609375, 3.3201904296875, 3.428619384765625, 3.53704833984375, 3.645477294921875, 3.75390625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 15.0, 12.0, 8.0, 22.0, 25.0, 36.0, 32.0, 49.0, 52.0, 62.0, 79.0, 110.0, 183.0, 386.0, 1382.0, 7994.0, 80017.0, 2513025.0, 1530958.0, 51936.0, 5776.0, 1103.0, 339.0, 169.0, 118.0, 95.0, 59.0, 47.0, 46.0, 27.0, 26.0, 19.0, 21.0, 12.0, 7.0, 7.0, 5.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.546875, -16.01171875, -15.4765625, -14.94140625, -14.40625, -13.87109375, -13.3359375, -12.80078125, -12.265625, -11.73046875, -11.1953125, -10.66015625, -10.125, -9.58984375, -9.0546875, -8.51953125, -7.984375, -7.44921875, -6.9140625, -6.37890625, -5.84375, -5.30859375, -4.7734375, -4.23828125, -3.703125, -3.16796875, -2.6328125, -2.09765625, -1.5625, -1.02734375, -0.4921875, 0.04296875, 0.578125, 1.11328125, 1.6484375, 2.18359375, 2.71875, 3.25390625, 3.7890625, 4.32421875, 4.859375, 5.39453125, 5.9296875, 6.46484375, 7.0, 7.53515625, 8.0703125, 8.60546875, 9.140625, 9.67578125, 10.2109375, 10.74609375, 11.28125, 11.81640625, 12.3515625, 12.88671875, 13.421875, 13.95703125, 14.4921875, 15.02734375, 15.5625, 16.09765625, 16.6328125, 17.16796875, 17.703125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 11.0, 15.0, 19.0, 21.0, 32.0, 75.0, 95.0, 148.0, 253.0, 385.0, 484.0, 675.0, 579.0, 419.0, 311.0, 192.0, 113.0, 94.0, 51.0, 29.0, 28.0, 17.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.59375, -12.15625, -11.71875, -11.28125, -10.84375, -10.40625, -9.96875, -9.53125, -9.09375, -8.65625, -8.21875, -7.78125, -7.34375, -6.90625, -6.46875, -6.03125, -5.59375, -5.15625, -4.71875, -4.28125, -3.84375, -3.40625, -2.96875, -2.53125, -2.09375, -1.65625, -1.21875, -0.78125, -0.34375, 0.09375, 0.53125, 0.96875, 1.40625, 1.84375, 2.28125, 2.71875, 3.15625, 3.59375, 4.03125, 4.46875, 4.90625, 5.34375, 5.78125, 6.21875, 6.65625, 7.09375, 7.53125, 7.96875, 8.40625, 8.84375, 9.28125, 9.71875, 10.15625, 10.59375, 11.03125, 11.46875, 11.90625, 12.34375, 12.78125, 13.21875, 13.65625, 14.09375, 14.53125, 14.96875, 15.40625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 7.0, 8.0, 14.0, 48.0, 100.0, 225.0, 552.0, 2226.0, 18943.0, 501599.0, 3524279.0, 136463.0, 7782.0, 1241.0, 475.0, 183.0, 89.0, 28.0, 18.0, 11.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.40625, -15.2607421875, -14.115234375, -12.9697265625, -11.82421875, -10.6787109375, -9.533203125, -8.3876953125, -7.2421875, -6.0966796875, -4.951171875, -3.8056640625, -2.66015625, -1.5146484375, -0.369140625, 0.7763671875, 1.921875, 3.0673828125, 4.212890625, 5.3583984375, 6.50390625, 7.6494140625, 8.794921875, 9.9404296875, 11.0859375, 12.2314453125, 13.376953125, 14.5224609375, 15.66796875, 16.8134765625, 17.958984375, 19.1044921875, 20.25, 21.3955078125, 22.541015625, 23.6865234375, 24.83203125, 25.9775390625, 27.123046875, 28.2685546875, 29.4140625, 30.5595703125, 31.705078125, 32.8505859375, 33.99609375, 35.1416015625, 36.287109375, 37.4326171875, 38.578125, 39.7236328125, 40.869140625, 42.0146484375, 43.16015625, 44.3056640625, 45.451171875, 46.5966796875, 47.7421875, 48.8876953125, 50.033203125, 51.1787109375, 52.32421875, 53.4697265625, 54.615234375, 55.7607421875, 56.90625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 8.0, 32.0, 103.0, 217.0, 322.0, 205.0, 84.0, 28.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.20258331298828, -30.18130874633789, -26.160032272338867, -22.138755798339844, -18.117481231689453, -14.096206665039062, -10.074930191040039, -6.053653717041016, -2.032379150390625, 1.988896369934082, 6.010171890258789, 10.031447410583496, 14.052722930908203, 18.073997497558594, 22.095273971557617, 26.11655044555664, 30.13782501220703, 34.15909957885742, 38.18037414550781, 42.20165252685547, 46.22292709350586, 50.24420166015625, 54.265480041503906, 58.2867546081543, 62.30802917480469, 66.32930755615234, 70.35057830810547, 74.37185668945312, 78.39312744140625, 82.4144058227539, 86.43568420410156, 90.45695495605469, 94.47824096679688, 98.49951934814453, 102.52079010009766, 106.54206848144531, 110.56333923339844, 114.5846176147461, 118.60589599609375, 122.62716674804688, 126.64844512939453, 130.6697235107422, 134.6909942626953, 138.71226501464844, 142.73355102539062, 146.75482177734375, 150.77609252929688, 154.79737854003906, 158.8186492919922, 162.8399200439453, 166.8612060546875, 170.88247680664062, 174.90374755859375, 178.92501831054688, 182.94630432128906, 186.9675750732422, 190.98886108398438, 195.0101318359375, 199.0314178466797, 203.0526885986328, 207.07395935058594, 211.09524536132812, 215.11651611328125, 219.13778686523438, 223.1590576171875]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 1.0, 9.0, 8.0, 13.0, 5.0, 16.0, 19.0, 18.0, 11.0, 25.0, 25.0, 23.0, 23.0, 22.0, 37.0, 31.0, 29.0, 33.0, 27.0, 37.0, 45.0, 48.0, 35.0, 36.0, 39.0, 31.0, 36.0, 26.0, 31.0, 25.0, 23.0, 26.0, 23.0, 18.0, 20.0, 18.0, 19.0, 17.0, 17.0, 11.0, 9.0, 14.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.316314697265625, -29.36502456665039, -28.413732528686523, -27.46244239807129, -26.511150360107422, -25.559860229492188, -24.608570098876953, -23.657278060913086, -22.70598602294922, -21.754695892333984, -20.803403854370117, -19.852113723754883, -18.900821685791016, -17.94953155517578, -16.998241424560547, -16.04694938659668, -15.095659255981445, -14.144368171691895, -13.193077087402344, -12.24178695678711, -11.290494918823242, -10.339204788208008, -9.387913703918457, -8.436622619628906, -7.4853315353393555, -6.534040451049805, -5.582749366760254, -4.631458759307861, -3.6801676750183105, -2.7288765907287598, -1.7775859832763672, -0.8262948989868164, 0.12499618530273438, 1.0762871503829956, 2.027578115463257, 2.9788689613342285, 3.9301600456237793, 4.88145112991333, 5.832741737365723, 6.784032821655273, 7.735323905944824, 8.686614990234375, 9.637906074523926, 10.589197158813477, 11.540487289428711, 12.491779327392578, 13.443069458007812, 14.394360542297363, 15.345651626586914, 16.29694175720215, 17.248233795166016, 18.19952392578125, 19.150815963745117, 20.10210609436035, 21.05339813232422, 22.004688262939453, 22.955978393554688, 23.907268524169922, 24.85856056213379, 25.809850692749023, 26.76114273071289, 27.712432861328125, 28.66372299194336, 29.615015029907227, 30.566307067871094]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 9.0, 15.0, 8.0, 8.0, 13.0, 16.0, 18.0, 23.0, 19.0, 32.0, 25.0, 31.0, 29.0, 38.0, 41.0, 31.0, 39.0, 35.0, 57.0, 50.0, 46.0, 34.0, 51.0, 44.0, 35.0, 46.0, 33.0, 18.0, 30.0, 20.0, 21.0, 18.0, 14.0, 10.0, 8.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.71875, -3.602935791015625, -3.48712158203125, -3.371307373046875, -3.2554931640625, -3.139678955078125, -3.02386474609375, -2.908050537109375, -2.792236328125, -2.676422119140625, -2.56060791015625, -2.444793701171875, -2.3289794921875, -2.213165283203125, -2.09735107421875, -1.981536865234375, -1.86572265625, -1.749908447265625, -1.63409423828125, -1.518280029296875, -1.4024658203125, -1.286651611328125, -1.17083740234375, -1.055023193359375, -0.939208984375, -0.823394775390625, -0.70758056640625, -0.591766357421875, -0.4759521484375, -0.360137939453125, -0.24432373046875, -0.128509521484375, -0.0126953125, 0.103118896484375, 0.21893310546875, 0.334747314453125, 0.4505615234375, 0.566375732421875, 0.68218994140625, 0.798004150390625, 0.913818359375, 1.029632568359375, 1.14544677734375, 1.261260986328125, 1.3770751953125, 1.492889404296875, 1.60870361328125, 1.724517822265625, 1.84033203125, 1.956146240234375, 2.07196044921875, 2.187774658203125, 2.3035888671875, 2.419403076171875, 2.53521728515625, 2.651031494140625, 2.766845703125, 2.882659912109375, 2.99847412109375, 3.114288330078125, 3.2301025390625, 3.345916748046875, 3.46173095703125, 3.577545166015625, 3.693359375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 11.0, 8.0, 17.0, 23.0, 42.0, 46.0, 70.0, 90.0, 142.0, 179.0, 270.0, 378.0, 535.0, 745.0, 1029.0, 1509.0, 2127.0, 3002.0, 4338.0, 6383.0, 9078.0, 13575.0, 20911.0, 31516.0, 48872.0, 76060.0, 114206.0, 155955.0, 167501.0, 130959.0, 88969.0, 58071.0, 37294.0, 23935.0, 16050.0, 10548.0, 7328.0, 5011.0, 3409.0, 2498.0, 1718.0, 1238.0, 871.0, 615.0, 445.0, 316.0, 199.0, 160.0, 96.0, 69.0, 42.0, 34.0, 15.0, 19.0, 17.0, 11.0, 5.0, 2.0, 3.0], "bins": [-0.11834716796875, -0.11478137969970703, -0.11121559143066406, -0.1076498031616211, -0.10408401489257812, -0.10051822662353516, -0.09695243835449219, -0.09338665008544922, -0.08982086181640625, -0.08625507354736328, -0.08268928527832031, -0.07912349700927734, -0.07555770874023438, -0.0719919204711914, -0.06842613220214844, -0.06486034393310547, -0.0612945556640625, -0.05772876739501953, -0.05416297912597656, -0.050597190856933594, -0.047031402587890625, -0.043465614318847656, -0.03989982604980469, -0.03633403778076172, -0.03276824951171875, -0.02920246124267578, -0.025636672973632812, -0.022070884704589844, -0.018505096435546875, -0.014939308166503906, -0.011373519897460938, -0.007807731628417969, -0.004241943359375, -0.0006761550903320312, 0.0028896331787109375, 0.006455421447753906, 0.010021209716796875, 0.013586997985839844, 0.017152786254882812, 0.02071857452392578, 0.02428436279296875, 0.02785015106201172, 0.03141593933105469, 0.034981727600097656, 0.038547515869140625, 0.042113304138183594, 0.04567909240722656, 0.04924488067626953, 0.0528106689453125, 0.05637645721435547, 0.05994224548339844, 0.0635080337524414, 0.06707382202148438, 0.07063961029052734, 0.07420539855957031, 0.07777118682861328, 0.08133697509765625, 0.08490276336669922, 0.08846855163574219, 0.09203433990478516, 0.09560012817382812, 0.0991659164428711, 0.10273170471191406, 0.10629749298095703, 0.10986328125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 10.0, 5.0, 11.0, 13.0, 11.0, 21.0, 20.0, 17.0, 20.0, 31.0, 33.0, 37.0, 35.0, 40.0, 32.0, 42.0, 36.0, 49.0, 1057.0, 40.0, 31.0, 30.0, 40.0, 40.0, 40.0, 40.0, 35.0, 25.0, 27.0, 31.0, 21.0, 18.0, 13.0, 9.0, 7.0, 10.0, 7.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.369140625, -2.30108642578125, -2.2330322265625, -2.16497802734375, -2.096923828125, -2.02886962890625, -1.9608154296875, -1.89276123046875, -1.82470703125, -1.75665283203125, -1.6885986328125, -1.62054443359375, -1.552490234375, -1.48443603515625, -1.4163818359375, -1.34832763671875, -1.2802734375, -1.21221923828125, -1.1441650390625, -1.07611083984375, -1.008056640625, -0.94000244140625, -0.8719482421875, -0.80389404296875, -0.73583984375, -0.66778564453125, -0.5997314453125, -0.53167724609375, -0.463623046875, -0.39556884765625, -0.3275146484375, -0.25946044921875, -0.19140625, -0.12335205078125, -0.0552978515625, 0.01275634765625, 0.080810546875, 0.14886474609375, 0.2169189453125, 0.28497314453125, 0.35302734375, 0.42108154296875, 0.4891357421875, 0.55718994140625, 0.625244140625, 0.69329833984375, 0.7613525390625, 0.82940673828125, 0.8974609375, 0.96551513671875, 1.0335693359375, 1.10162353515625, 1.169677734375, 1.23773193359375, 1.3057861328125, 1.37384033203125, 1.44189453125, 1.50994873046875, 1.5780029296875, 1.64605712890625, 1.714111328125, 1.78216552734375, 1.8502197265625, 1.91827392578125, 1.986328125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 10.0, 12.0, 15.0, 28.0, 48.0, 63.0, 100.0, 159.0, 259.0, 438.0, 590.0, 944.0, 1435.0, 2078.0, 3196.0, 4772.0, 7103.0, 11286.0, 18023.0, 29241.0, 47772.0, 77608.0, 121478.0, 166950.0, 1223941.0, 137819.0, 91677.0, 56410.0, 34407.0, 21240.0, 13193.0, 8461.0, 5589.0, 3638.0, 2422.0, 1631.0, 1061.0, 701.0, 487.0, 303.0, 188.0, 129.0, 91.0, 48.0, 33.0, 15.0, 17.0, 7.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.125244140625, -0.12157917022705078, -0.11791419982910156, -0.11424922943115234, -0.11058425903320312, -0.1069192886352539, -0.10325431823730469, -0.09958934783935547, -0.09592437744140625, -0.09225940704345703, -0.08859443664550781, -0.0849294662475586, -0.08126449584960938, -0.07759952545166016, -0.07393455505371094, -0.07026958465576172, -0.0666046142578125, -0.06293964385986328, -0.05927467346191406, -0.055609703063964844, -0.051944732666015625, -0.048279762268066406, -0.04461479187011719, -0.04094982147216797, -0.03728485107421875, -0.03361988067626953, -0.029954910278320312, -0.026289939880371094, -0.022624969482421875, -0.018959999084472656, -0.015295028686523438, -0.011630058288574219, -0.007965087890625, -0.004300117492675781, -0.0006351470947265625, 0.0030298233032226562, 0.006694793701171875, 0.010359764099121094, 0.014024734497070312, 0.01768970489501953, 0.02135467529296875, 0.02501964569091797, 0.028684616088867188, 0.032349586486816406, 0.036014556884765625, 0.039679527282714844, 0.04334449768066406, 0.04700946807861328, 0.0506744384765625, 0.05433940887451172, 0.05800437927246094, 0.061669349670410156, 0.06533432006835938, 0.0689992904663086, 0.07266426086425781, 0.07632923126220703, 0.07999420166015625, 0.08365917205810547, 0.08732414245605469, 0.0909891128540039, 0.09465408325195312, 0.09831905364990234, 0.10198402404785156, 0.10564899444580078, 0.10931396484375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 3.0, 3.0, 11.0, 8.0, 7.0, 10.0, 12.0, 19.0, 25.0, 33.0, 35.0, 36.0, 32.0, 40.0, 39.0, 38.0, 55.0, 52.0, 50.0, 43.0, 41.0, 54.0, 33.0, 43.0, 45.0, 31.0, 35.0, 26.0, 19.0, 18.0, 20.0, 16.0, 19.0, 11.0, 8.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004069805145263672, -0.0003936551511287689, -0.00038032978773117065, -0.0003670044243335724, -0.0003536790609359741, -0.00034035369753837585, -0.0003270283341407776, -0.0003137029707431793, -0.00030037760734558105, -0.0002870522439479828, -0.0002737268805503845, -0.00026040151715278625, -0.000247076153755188, -0.00023375079035758972, -0.00022042542695999146, -0.0002071000635623932, -0.00019377470016479492, -0.00018044933676719666, -0.0001671239733695984, -0.00015379860997200012, -0.00014047324657440186, -0.0001271478831768036, -0.00011382251977920532, -0.00010049715638160706, -8.717179298400879e-05, -7.384642958641052e-05, -6.0521066188812256e-05, -4.719570279121399e-05, -3.387033939361572e-05, -2.0544975996017456e-05, -7.2196125984191895e-06, 6.105750799179077e-06, 1.9431114196777344e-05, 3.275647759437561e-05, 4.608184099197388e-05, 5.9407204389572144e-05, 7.273256778717041e-05, 8.605793118476868e-05, 9.938329458236694e-05, 0.00011270865797996521, 0.00012603402137756348, 0.00013935938477516174, 0.00015268474817276, 0.00016601011157035828, 0.00017933547496795654, 0.0001926608383655548, 0.00020598620176315308, 0.00021931156516075134, 0.0002326369285583496, 0.0002459622919559479, 0.00025928765535354614, 0.0002726130187511444, 0.0002859383821487427, 0.00029926374554634094, 0.0003125891089439392, 0.0003259144723415375, 0.00033923983573913574, 0.000352565199136734, 0.0003658905625343323, 0.00037921592593193054, 0.0003925412893295288, 0.0004058666527271271, 0.00041919201612472534, 0.0004325173795223236, 0.0004458427429199219]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 8.0, 10.0, 12.0, 14.0, 18.0, 35.0, 30.0, 43.0, 50.0, 62.0, 88.0, 125.0, 146.0, 196.0, 295.0, 483.0, 2613.0, 300203.0, 735187.0, 7065.0, 600.0, 340.0, 183.0, 156.0, 144.0, 111.0, 89.0, 59.0, 48.0, 26.0, 26.0, 27.0, 15.0, 10.0, 14.0, 7.0, 9.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008087158203125, -0.007843077182769775, -0.007598996162414551, -0.007354915142059326, -0.0071108341217041016, -0.006866753101348877, -0.006622672080993652, -0.006378591060638428, -0.006134510040283203, -0.0058904290199279785, -0.005646347999572754, -0.005402266979217529, -0.005158185958862305, -0.00491410493850708, -0.0046700239181518555, -0.004425942897796631, -0.004181861877441406, -0.003937780857086182, -0.003693699836730957, -0.0034496188163757324, -0.003205537796020508, -0.002961456775665283, -0.0027173757553100586, -0.002473294734954834, -0.0022292137145996094, -0.0019851326942443848, -0.0017410516738891602, -0.0014969706535339355, -0.001252889633178711, -0.0010088086128234863, -0.0007647275924682617, -0.0005206465721130371, -0.0002765655517578125, -3.248453140258789e-05, 0.00021159648895263672, 0.00045567750930786133, 0.0006997585296630859, 0.0009438395500183105, 0.0011879205703735352, 0.0014320015907287598, 0.0016760826110839844, 0.001920163631439209, 0.0021642446517944336, 0.002408325672149658, 0.002652406692504883, 0.0028964877128601074, 0.003140568733215332, 0.0033846497535705566, 0.0036287307739257812, 0.003872811794281006, 0.0041168928146362305, 0.004360973834991455, 0.00460505485534668, 0.004849135875701904, 0.005093216896057129, 0.0053372979164123535, 0.005581378936767578, 0.005825459957122803, 0.006069540977478027, 0.006313621997833252, 0.0065577030181884766, 0.006801784038543701, 0.007045865058898926, 0.00728994607925415, 0.007534027099609375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 45.0, 247.0, 487.0, 201.0, 28.0, 3.0, 2.0], "bins": [-0.0031702760607004166, -0.0031169261783361435, -0.0030635762959718704, -0.0030102261807769537, -0.0029568762984126806, -0.0029035264160484076, -0.0028501765336841345, -0.0027968264184892178, -0.0027434765361249447, -0.0026901266537606716, -0.0026367767713963985, -0.002583426656201482, -0.0025300767738372087, -0.0024767268914729357, -0.0024233770091086626, -0.002370026893913746, -0.002316677011549473, -0.0022633271291851997, -0.0022099772468209267, -0.00215662713162601, -0.002103277249261737, -0.002049927366897464, -0.0019965774845331907, -0.0019432274857535958, -0.0018898777198046446, -0.0018365278374403715, -0.0017831778386607766, -0.0017298279562965035, -0.0016764779575169086, -0.0016231280751526356, -0.0015697781927883625, -0.0015164281940087676, -0.0014630780788138509, -0.0014097281964495778, -0.001356378197669983, -0.0013030283153057098, -0.001249678316526115, -0.0011963284341618419, -0.001142978435382247, -0.001089628553017974, -0.0010362786706537008, -0.0009829287882894278, -0.0009295787895098329, -0.0008762289071455598, -0.0008228789083659649, -0.0007695290260016918, -0.0007161790854297578, -0.0006628291448578238, -0.000609479146078229, -0.000556129205506295, -0.000502779264934361, -0.00044942935346625745, -0.00039607941289432347, -0.0003427294723223895, -0.00028937956085428596, -0.00023602962028235197, -0.00018267969426233321, -0.00012932976824231446, -7.597982767038047e-05, -2.2629901650361717e-05, 3.072003892157227e-05, 8.406997949350625e-05, 0.00013741989096160978, 0.00019076983153354377, 0.00024411977210547775]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 2.0, 6.0, 5.0, 8.0, 5.0, 11.0, 11.0, 11.0, 8.0, 16.0, 24.0, 22.0, 33.0, 32.0, 38.0, 33.0, 32.0, 39.0, 37.0, 38.0, 35.0, 47.0, 40.0, 36.0, 38.0, 40.0, 31.0, 35.0, 37.0, 33.0, 33.0, 24.0, 25.0, 16.0, 24.0, 14.0, 17.0, 10.0, 16.0, 9.0, 4.0, 2.0, 5.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0002645254135131836, -0.0002567218616604805, -0.0002489183098077774, -0.0002411147579550743, -0.00023331120610237122, -0.00022550765424966812, -0.00021770410239696503, -0.00020990055054426193, -0.00020209699869155884, -0.00019429344683885574, -0.00018648989498615265, -0.00017868634313344955, -0.00017088279128074646, -0.00016307923942804337, -0.00015527568757534027, -0.00014747213572263718, -0.00013966858386993408, -0.000131865032017231, -0.0001240614801645279, -0.0001162579283118248, -0.0001084543764591217, -0.00010065082460641861, -9.284727275371552e-05, -8.504372090101242e-05, -7.724016904830933e-05, -6.943661719560623e-05, -6.163306534290314e-05, -5.382951349020004e-05, -4.602596163749695e-05, -3.8222409784793854e-05, -3.041885793209076e-05, -2.2615306079387665e-05, -1.481175422668457e-05, -7.008202373981476e-06, 7.953494787216187e-07, 8.598901331424713e-06, 1.6402453184127808e-05, 2.4206005036830902e-05, 3.2009556889533997e-05, 3.981310874223709e-05, 4.7616660594940186e-05, 5.542021244764328e-05, 6.322376430034637e-05, 7.102731615304947e-05, 7.883086800575256e-05, 8.663441985845566e-05, 9.443797171115875e-05, 0.00010224152356386185, 0.00011004507541656494, 0.00011784862726926804, 0.00012565217912197113, 0.00013345573097467422, 0.00014125928282737732, 0.00014906283468008041, 0.0001568663865327835, 0.0001646699383854866, 0.0001724734902381897, 0.0001802770420908928, 0.00018808059394359589, 0.00019588414579629898, 0.00020368769764900208, 0.00021149124950170517, 0.00021929480135440826, 0.00022709835320711136, 0.00023490190505981445]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 9.0, 15.0, 8.0, 8.0, 13.0, 16.0, 18.0, 23.0, 19.0, 32.0, 25.0, 31.0, 29.0, 38.0, 41.0, 31.0, 39.0, 35.0, 57.0, 50.0, 46.0, 34.0, 51.0, 44.0, 35.0, 46.0, 33.0, 18.0, 30.0, 20.0, 21.0, 18.0, 14.0, 10.0, 8.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.71875, -3.602935791015625, -3.48712158203125, -3.371307373046875, -3.2554931640625, -3.139678955078125, -3.02386474609375, -2.908050537109375, -2.792236328125, -2.676422119140625, -2.56060791015625, -2.444793701171875, -2.3289794921875, -2.213165283203125, -2.09735107421875, -1.981536865234375, -1.86572265625, -1.749908447265625, -1.63409423828125, -1.518280029296875, -1.4024658203125, -1.286651611328125, -1.17083740234375, -1.055023193359375, -0.939208984375, -0.823394775390625, -0.70758056640625, -0.591766357421875, -0.4759521484375, -0.360137939453125, -0.24432373046875, -0.128509521484375, -0.0126953125, 0.103118896484375, 0.21893310546875, 0.334747314453125, 0.4505615234375, 0.566375732421875, 0.68218994140625, 0.798004150390625, 0.913818359375, 1.029632568359375, 1.14544677734375, 1.261260986328125, 1.3770751953125, 1.492889404296875, 1.60870361328125, 1.724517822265625, 1.84033203125, 1.956146240234375, 2.07196044921875, 2.187774658203125, 2.3035888671875, 2.419403076171875, 2.53521728515625, 2.651031494140625, 2.766845703125, 2.882659912109375, 2.99847412109375, 3.114288330078125, 3.2301025390625, 3.345916748046875, 3.46173095703125, 3.577545166015625, 3.693359375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 26.0, 35.0, 59.0, 93.0, 124.0, 197.0, 276.0, 401.0, 671.0, 990.0, 1425.0, 2062.0, 3160.0, 4783.0, 7376.0, 12308.0, 23019.0, 49983.0, 126542.0, 413377.0, 241009.0, 81070.0, 34415.0, 17308.0, 9822.0, 6146.0, 3892.0, 2637.0, 1801.0, 1170.0, 771.0, 525.0, 393.0, 242.0, 131.0, 85.0, 65.0, 54.0, 32.0, 25.0, 11.0, 11.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.453125, -2.3734130859375, -2.293701171875, -2.2139892578125, -2.13427734375, -2.0545654296875, -1.974853515625, -1.8951416015625, -1.8154296875, -1.7357177734375, -1.656005859375, -1.5762939453125, -1.49658203125, -1.4168701171875, -1.337158203125, -1.2574462890625, -1.177734375, -1.0980224609375, -1.018310546875, -0.9385986328125, -0.85888671875, -0.7791748046875, -0.699462890625, -0.6197509765625, -0.5400390625, -0.4603271484375, -0.380615234375, -0.3009033203125, -0.22119140625, -0.1414794921875, -0.061767578125, 0.0179443359375, 0.09765625, 0.1773681640625, 0.257080078125, 0.3367919921875, 0.41650390625, 0.4962158203125, 0.575927734375, 0.6556396484375, 0.7353515625, 0.8150634765625, 0.894775390625, 0.9744873046875, 1.05419921875, 1.1339111328125, 1.213623046875, 1.2933349609375, 1.373046875, 1.4527587890625, 1.532470703125, 1.6121826171875, 1.69189453125, 1.7716064453125, 1.851318359375, 1.9310302734375, 2.0107421875, 2.0904541015625, 2.170166015625, 2.2498779296875, 2.32958984375, 2.4093017578125, 2.489013671875, 2.5687255859375, 2.6484375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 12.0, 12.0, 11.0, 16.0, 10.0, 17.0, 30.0, 18.0, 14.0, 27.0, 27.0, 28.0, 41.0, 39.0, 34.0, 42.0, 73.0, 98.0, 1684.0, 271.0, 89.0, 47.0, 41.0, 40.0, 21.0, 40.0, 35.0, 23.0, 29.0, 18.0, 19.0, 20.0, 13.0, 15.0, 12.0, 16.0, 10.0, 10.0, 5.0, 6.0, 3.0, 4.0, 1.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-11.8125, -11.4295654296875, -11.046630859375, -10.6636962890625, -10.28076171875, -9.8978271484375, -9.514892578125, -9.1319580078125, -8.7490234375, -8.3660888671875, -7.983154296875, -7.6002197265625, -7.21728515625, -6.8343505859375, -6.451416015625, -6.0684814453125, -5.685546875, -5.3026123046875, -4.919677734375, -4.5367431640625, -4.15380859375, -3.7708740234375, -3.387939453125, -3.0050048828125, -2.6220703125, -2.2391357421875, -1.856201171875, -1.4732666015625, -1.09033203125, -0.7073974609375, -0.324462890625, 0.0584716796875, 0.44140625, 0.8243408203125, 1.207275390625, 1.5902099609375, 1.97314453125, 2.3560791015625, 2.739013671875, 3.1219482421875, 3.5048828125, 3.8878173828125, 4.270751953125, 4.6536865234375, 5.03662109375, 5.4195556640625, 5.802490234375, 6.1854248046875, 6.568359375, 6.9512939453125, 7.334228515625, 7.7171630859375, 8.10009765625, 8.4830322265625, 8.865966796875, 9.2489013671875, 9.6318359375, 10.0147705078125, 10.397705078125, 10.7806396484375, 11.16357421875, 11.5465087890625, 11.929443359375, 12.3123779296875, 12.6953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 1.0, 4.0, 9.0, 3.0, 6.0, 8.0, 14.0, 16.0, 21.0, 22.0, 16.0, 32.0, 26.0, 50.0, 62.0, 100.0, 133.0, 227.0, 499.0, 1696.0, 16291.0, 2748327.0, 367453.0, 8440.0, 1177.0, 398.0, 213.0, 134.0, 84.0, 44.0, 36.0, 26.0, 27.0, 25.0, 16.0, 19.0, 14.0, 14.0, 4.0, 4.0, 9.0, 0.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-29.28125, -28.50830078125, -27.7353515625, -26.96240234375, -26.189453125, -25.41650390625, -24.6435546875, -23.87060546875, -23.09765625, -22.32470703125, -21.5517578125, -20.77880859375, -20.005859375, -19.23291015625, -18.4599609375, -17.68701171875, -16.9140625, -16.14111328125, -15.3681640625, -14.59521484375, -13.822265625, -13.04931640625, -12.2763671875, -11.50341796875, -10.73046875, -9.95751953125, -9.1845703125, -8.41162109375, -7.638671875, -6.86572265625, -6.0927734375, -5.31982421875, -4.546875, -3.77392578125, -3.0009765625, -2.22802734375, -1.455078125, -0.68212890625, 0.0908203125, 0.86376953125, 1.63671875, 2.40966796875, 3.1826171875, 3.95556640625, 4.728515625, 5.50146484375, 6.2744140625, 7.04736328125, 7.8203125, 8.59326171875, 9.3662109375, 10.13916015625, 10.912109375, 11.68505859375, 12.4580078125, 13.23095703125, 14.00390625, 14.77685546875, 15.5498046875, 16.32275390625, 17.095703125, 17.86865234375, 18.6416015625, 19.41455078125, 20.1875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 16.0, 998.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.581470489501953, -13.88715934753418, -4.192848205566406, 5.501462936401367, 15.19577407836914, 24.890087127685547, 34.58439636230469, 44.27870559692383, 53.973018646240234, 63.667327880859375, 73.36164093017578, 83.05595397949219, 92.75025939941406, 102.444580078125, 112.13888549804688, 121.83319091796875, 131.5275115966797, 141.22181701660156, 150.9161376953125, 160.61044311523438, 170.30474853515625, 179.9990692138672, 189.69337463378906, 199.3876953125, 209.08200073242188, 218.77630615234375, 228.4706268310547, 238.16493225097656, 247.8592529296875, 257.5535583496094, 267.24786376953125, 276.9421691894531, 286.636474609375, 296.3307800292969, 306.02508544921875, 315.71942138671875, 325.4137268066406, 335.1080322265625, 344.8023376464844, 354.49664306640625, 364.19097900390625, 373.8852844238281, 383.57958984375, 393.27392578125, 402.9682312011719, 412.66253662109375, 422.3568420410156, 432.0511474609375, 441.7454528808594, 451.43975830078125, 461.1340637207031, 470.8283996582031, 480.522705078125, 490.2170104980469, 499.91131591796875, 509.6056213378906, 519.2999267578125, 528.9942626953125, 538.6885375976562, 548.3828735351562, 558.0771484375, 567.771484375, 577.4658203125, 587.1600952148438, 596.8544311523438]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 5.0, 7.0, 6.0, 9.0, 12.0, 14.0, 10.0, 9.0, 15.0, 22.0, 17.0, 20.0, 26.0, 26.0, 25.0, 33.0, 36.0, 43.0, 33.0, 41.0, 34.0, 36.0, 44.0, 39.0, 47.0, 44.0, 33.0, 33.0, 31.0, 33.0, 26.0, 25.0, 25.0, 19.0, 21.0, 18.0, 17.0, 16.0, 6.0, 10.0, 5.0, 7.0, 5.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.25785446166992, -34.98994827270508, -33.72203826904297, -32.454132080078125, -31.18622398376465, -29.918315887451172, -28.650409698486328, -27.38250160217285, -26.114593505859375, -24.8466854095459, -23.578777313232422, -22.310871124267578, -21.0429630279541, -19.775054931640625, -18.50714874267578, -17.239240646362305, -15.971332550048828, -14.703424453735352, -13.435517311096191, -12.167610168457031, -10.899702072143555, -9.631793975830078, -8.363886833190918, -7.095979690551758, -5.828071594238281, -4.560163974761963, -3.2922563552856445, -2.024348735809326, -0.7564411163330078, 0.5114665031433105, 1.779374122619629, 3.047281265258789, 4.315193176269531, 5.58310079574585, 6.851008415222168, 8.118915557861328, 9.386823654174805, 10.654731750488281, 11.922638893127441, 13.190546035766602, 14.458454132080078, 15.726362228393555, 16.99427032470703, 18.262176513671875, 19.53008460998535, 20.797992706298828, 22.065898895263672, 23.33380699157715, 24.601715087890625, 25.8696231842041, 27.137531280517578, 28.405437469482422, 29.6733455657959, 30.941253662109375, 32.20915985107422, 33.47706604003906, 34.74497604370117, 36.012882232666016, 37.280792236328125, 38.54869842529297, 39.81660461425781, 41.08451461791992, 42.352420806884766, 43.620330810546875, 44.88823699951172]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 6.0, 17.0, 7.0, 10.0, 21.0, 25.0, 25.0, 17.0, 36.0, 27.0, 24.0, 35.0, 40.0, 29.0, 47.0, 32.0, 37.0, 56.0, 50.0, 59.0, 34.0, 46.0, 32.0, 44.0, 40.0, 27.0, 37.0, 22.0, 17.0, 19.0, 12.0, 16.0, 4.0, 7.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.0078125, -3.885009765625, -3.76220703125, -3.639404296875, -3.5166015625, -3.393798828125, -3.27099609375, -3.148193359375, -3.025390625, -2.902587890625, -2.77978515625, -2.656982421875, -2.5341796875, -2.411376953125, -2.28857421875, -2.165771484375, -2.04296875, -1.920166015625, -1.79736328125, -1.674560546875, -1.5517578125, -1.428955078125, -1.30615234375, -1.183349609375, -1.060546875, -0.937744140625, -0.81494140625, -0.692138671875, -0.5693359375, -0.446533203125, -0.32373046875, -0.200927734375, -0.078125, 0.044677734375, 0.16748046875, 0.290283203125, 0.4130859375, 0.535888671875, 0.65869140625, 0.781494140625, 0.904296875, 1.027099609375, 1.14990234375, 1.272705078125, 1.3955078125, 1.518310546875, 1.64111328125, 1.763916015625, 1.88671875, 2.009521484375, 2.13232421875, 2.255126953125, 2.3779296875, 2.500732421875, 2.62353515625, 2.746337890625, 2.869140625, 2.991943359375, 3.11474609375, 3.237548828125, 3.3603515625, 3.483154296875, 3.60595703125, 3.728759765625, 3.8515625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 13.0, 19.0, 17.0, 27.0, 22.0, 38.0, 42.0, 58.0, 81.0, 113.0, 210.0, 563.0, 2303.0, 12521.0, 106593.0, 2542329.0, 1452792.0, 65267.0, 8514.0, 1673.0, 467.0, 172.0, 101.0, 78.0, 47.0, 55.0, 32.0, 25.0, 17.0, 13.0, 6.0, 10.0, 13.0, 6.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.140625, -16.61962890625, -16.0986328125, -15.57763671875, -15.056640625, -14.53564453125, -14.0146484375, -13.49365234375, -12.97265625, -12.45166015625, -11.9306640625, -11.40966796875, -10.888671875, -10.36767578125, -9.8466796875, -9.32568359375, -8.8046875, -8.28369140625, -7.7626953125, -7.24169921875, -6.720703125, -6.19970703125, -5.6787109375, -5.15771484375, -4.63671875, -4.11572265625, -3.5947265625, -3.07373046875, -2.552734375, -2.03173828125, -1.5107421875, -0.98974609375, -0.46875, 0.05224609375, 0.5732421875, 1.09423828125, 1.615234375, 2.13623046875, 2.6572265625, 3.17822265625, 3.69921875, 4.22021484375, 4.7412109375, 5.26220703125, 5.783203125, 6.30419921875, 6.8251953125, 7.34619140625, 7.8671875, 8.38818359375, 8.9091796875, 9.43017578125, 9.951171875, 10.47216796875, 10.9931640625, 11.51416015625, 12.03515625, 12.55615234375, 13.0771484375, 13.59814453125, 14.119140625, 14.64013671875, 15.1611328125, 15.68212890625, 16.203125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 7.0, 13.0, 38.0, 40.0, 73.0, 103.0, 157.0, 220.0, 320.0, 545.0, 693.0, 598.0, 447.0, 279.0, 188.0, 101.0, 90.0, 48.0, 29.0, 24.0, 17.0, 10.0, 9.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.71875, -11.26220703125, -10.8056640625, -10.34912109375, -9.892578125, -9.43603515625, -8.9794921875, -8.52294921875, -8.06640625, -7.60986328125, -7.1533203125, -6.69677734375, -6.240234375, -5.78369140625, -5.3271484375, -4.87060546875, -4.4140625, -3.95751953125, -3.5009765625, -3.04443359375, -2.587890625, -2.13134765625, -1.6748046875, -1.21826171875, -0.76171875, -0.30517578125, 0.1513671875, 0.60791015625, 1.064453125, 1.52099609375, 1.9775390625, 2.43408203125, 2.890625, 3.34716796875, 3.8037109375, 4.26025390625, 4.716796875, 5.17333984375, 5.6298828125, 6.08642578125, 6.54296875, 6.99951171875, 7.4560546875, 7.91259765625, 8.369140625, 8.82568359375, 9.2822265625, 9.73876953125, 10.1953125, 10.65185546875, 11.1083984375, 11.56494140625, 12.021484375, 12.47802734375, 12.9345703125, 13.39111328125, 13.84765625, 14.30419921875, 14.7607421875, 15.21728515625, 15.673828125, 16.13037109375, 16.5869140625, 17.04345703125, 17.5]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 14.0, 11.0, 22.0, 49.0, 81.0, 135.0, 309.0, 714.0, 3233.0, 29671.0, 733271.0, 3298261.0, 118004.0, 8176.0, 1423.0, 468.0, 217.0, 110.0, 41.0, 25.0, 15.0, 6.0, 7.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.125, -30.9873046875, -29.849609375, -28.7119140625, -27.57421875, -26.4365234375, -25.298828125, -24.1611328125, -23.0234375, -21.8857421875, -20.748046875, -19.6103515625, -18.47265625, -17.3349609375, -16.197265625, -15.0595703125, -13.921875, -12.7841796875, -11.646484375, -10.5087890625, -9.37109375, -8.2333984375, -7.095703125, -5.9580078125, -4.8203125, -3.6826171875, -2.544921875, -1.4072265625, -0.26953125, 0.8681640625, 2.005859375, 3.1435546875, 4.28125, 5.4189453125, 6.556640625, 7.6943359375, 8.83203125, 9.9697265625, 11.107421875, 12.2451171875, 13.3828125, 14.5205078125, 15.658203125, 16.7958984375, 17.93359375, 19.0712890625, 20.208984375, 21.3466796875, 22.484375, 23.6220703125, 24.759765625, 25.8974609375, 27.03515625, 28.1728515625, 29.310546875, 30.4482421875, 31.5859375, 32.7236328125, 33.861328125, 34.9990234375, 36.13671875, 37.2744140625, 38.412109375, 39.5498046875, 40.6875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 17.0, 35.0, 72.0, 129.0, 153.0, 184.0, 165.0, 109.0, 63.0, 50.0, 11.0, 7.0, 3.0, 5.0, 1.0], "bins": [-157.37026977539062, -154.48284912109375, -151.5954132080078, -148.70799255371094, -145.820556640625, -142.93313598632812, -140.0457000732422, -137.1582794189453, -134.27084350585938, -131.3834228515625, -128.49598693847656, -125.60855865478516, -122.72113037109375, -119.83370971679688, -116.94628143310547, -114.05885314941406, -111.17143249511719, -108.28400421142578, -105.39657592773438, -102.50914764404297, -99.62171936035156, -96.73429870605469, -93.84687042236328, -90.95944213867188, -88.07201385498047, -85.18458557128906, -82.29715728759766, -79.40972900390625, -76.52230834960938, -73.63488006591797, -70.74745178222656, -67.86002349853516, -64.97260284423828, -62.085174560546875, -59.19774627685547, -56.31032180786133, -53.42289352416992, -50.535465240478516, -47.648040771484375, -44.76061248779297, -41.87318420410156, -38.985755920410156, -36.09832763671875, -33.21090316772461, -30.323474884033203, -27.436046600341797, -24.548620223999023, -21.66119384765625, -18.773765563964844, -15.886338233947754, -12.998910903930664, -10.111483573913574, -7.224056243896484, -4.3366289138793945, -1.4492015838623047, 1.4382247924804688, 4.325653076171875, 7.213080406188965, 10.100507736206055, 12.987935066223145, 15.875362396240234, 18.76279067993164, 21.650217056274414, 24.537643432617188, 27.425071716308594]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 7.0, 17.0, 20.0, 17.0, 15.0, 19.0, 26.0, 21.0, 34.0, 34.0, 27.0, 39.0, 35.0, 40.0, 37.0, 43.0, 32.0, 49.0, 40.0, 34.0, 36.0, 32.0, 31.0, 37.0, 43.0, 22.0, 23.0, 21.0, 15.0, 22.0, 26.0, 17.0, 10.0, 8.0, 3.0, 7.0, 7.0, 0.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-37.487037658691406, -36.40272903442383, -35.318416595458984, -34.234107971191406, -33.14979553222656, -32.065486907958984, -30.981176376342773, -29.896865844726562, -28.812557220458984, -27.728246688842773, -26.643936157226562, -25.559627532958984, -24.475317001342773, -23.391006469726562, -22.30669593811035, -21.22238540649414, -20.13807487487793, -19.05376434326172, -17.969453811645508, -16.885143280029297, -15.800834655761719, -14.716524124145508, -13.632213592529297, -12.547903060913086, -11.463593482971191, -10.37928295135498, -9.294973373413086, -8.210662841796875, -7.126352787017822, -6.0420427322387695, -4.957732200622559, -3.873422145843506, -2.789112091064453, -1.7048019170761108, -0.6204917430877686, 0.4638185501098633, 1.548128604888916, 2.6324386596679688, 3.7167491912841797, 4.801059246063232, 5.885369300842285, 6.969679355621338, 8.05398941040039, 9.138299942016602, 10.222610473632812, 11.306920051574707, 12.391230583190918, 13.475540161132812, 14.559850692749023, 15.644161224365234, 16.728471755981445, 17.812782287597656, 18.897090911865234, 19.981401443481445, 21.065711975097656, 22.150022506713867, 23.234333038330078, 24.31864356994629, 25.4029541015625, 26.487262725830078, 27.57157325744629, 28.6558837890625, 29.74019432067871, 30.824504852294922, 31.9088134765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 13.0, 12.0, 15.0, 15.0, 18.0, 27.0, 30.0, 29.0, 27.0, 26.0, 38.0, 40.0, 34.0, 43.0, 43.0, 56.0, 37.0, 33.0, 47.0, 48.0, 42.0, 39.0, 41.0, 37.0, 37.0, 28.0, 26.0, 12.0, 20.0, 15.0, 14.0, 6.0, 8.0, 4.0, 5.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.203125, -4.0733642578125, -3.943603515625, -3.8138427734375, -3.68408203125, -3.5543212890625, -3.424560546875, -3.2947998046875, -3.1650390625, -3.0352783203125, -2.905517578125, -2.7757568359375, -2.64599609375, -2.5162353515625, -2.386474609375, -2.2567138671875, -2.126953125, -1.9971923828125, -1.867431640625, -1.7376708984375, -1.60791015625, -1.4781494140625, -1.348388671875, -1.2186279296875, -1.0888671875, -0.9591064453125, -0.829345703125, -0.6995849609375, -0.56982421875, -0.4400634765625, -0.310302734375, -0.1805419921875, -0.05078125, 0.0789794921875, 0.208740234375, 0.3385009765625, 0.46826171875, 0.5980224609375, 0.727783203125, 0.8575439453125, 0.9873046875, 1.1170654296875, 1.246826171875, 1.3765869140625, 1.50634765625, 1.6361083984375, 1.765869140625, 1.8956298828125, 2.025390625, 2.1551513671875, 2.284912109375, 2.4146728515625, 2.54443359375, 2.6741943359375, 2.803955078125, 2.9337158203125, 3.0634765625, 3.1932373046875, 3.322998046875, 3.4527587890625, 3.58251953125, 3.7122802734375, 3.842041015625, 3.9718017578125, 4.1015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 27.0, 22.0, 52.0, 58.0, 96.0, 115.0, 167.0, 211.0, 387.0, 585.0, 879.0, 1240.0, 1945.0, 3160.0, 4876.0, 7704.0, 12344.0, 19668.0, 32045.0, 53487.0, 89712.0, 143711.0, 192554.0, 176804.0, 120241.0, 72870.0, 43509.0, 25984.0, 16095.0, 9986.0, 6306.0, 4076.0, 2548.0, 1809.0, 1118.0, 725.0, 475.0, 305.0, 186.0, 138.0, 91.0, 78.0, 45.0, 42.0, 30.0, 13.0, 8.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1512451171875, -0.14648818969726562, -0.14173126220703125, -0.13697433471679688, -0.1322174072265625, -0.12746047973632812, -0.12270355224609375, -0.11794662475585938, -0.113189697265625, -0.10843276977539062, -0.10367584228515625, -0.09891891479492188, -0.0941619873046875, -0.08940505981445312, -0.08464813232421875, -0.07989120483398438, -0.07513427734375, -0.07037734985351562, -0.06562042236328125, -0.060863494873046875, -0.0561065673828125, -0.051349639892578125, -0.04659271240234375, -0.041835784912109375, -0.037078857421875, -0.032321929931640625, -0.02756500244140625, -0.022808074951171875, -0.0180511474609375, -0.013294219970703125, -0.00853729248046875, -0.003780364990234375, 0.0009765625, 0.005733489990234375, 0.01049041748046875, 0.015247344970703125, 0.0200042724609375, 0.024761199951171875, 0.02951812744140625, 0.034275054931640625, 0.039031982421875, 0.043788909912109375, 0.04854583740234375, 0.053302764892578125, 0.0580596923828125, 0.06281661987304688, 0.06757354736328125, 0.07233047485351562, 0.07708740234375, 0.08184432983398438, 0.08660125732421875, 0.09135818481445312, 0.0961151123046875, 0.10087203979492188, 0.10562896728515625, 0.11038589477539062, 0.115142822265625, 0.11989974975585938, 0.12465667724609375, 0.12941360473632812, 0.1341705322265625, 0.13892745971679688, 0.14368438720703125, 0.14844131469726562, 0.1531982421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 3.0, 8.0, 7.0, 6.0, 7.0, 8.0, 8.0, 18.0, 10.0, 17.0, 21.0, 20.0, 29.0, 27.0, 25.0, 34.0, 31.0, 40.0, 31.0, 22.0, 35.0, 39.0, 27.0, 1057.0, 36.0, 41.0, 32.0, 29.0, 28.0, 27.0, 36.0, 20.0, 27.0, 31.0, 22.0, 22.0, 18.0, 22.0, 14.0, 12.0, 13.0, 9.0, 10.0, 10.0, 12.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-1.966796875, -1.902099609375, -1.83740234375, -1.772705078125, -1.7080078125, -1.643310546875, -1.57861328125, -1.513916015625, -1.44921875, -1.384521484375, -1.31982421875, -1.255126953125, -1.1904296875, -1.125732421875, -1.06103515625, -0.996337890625, -0.931640625, -0.866943359375, -0.80224609375, -0.737548828125, -0.6728515625, -0.608154296875, -0.54345703125, -0.478759765625, -0.4140625, -0.349365234375, -0.28466796875, -0.219970703125, -0.1552734375, -0.090576171875, -0.02587890625, 0.038818359375, 0.103515625, 0.168212890625, 0.23291015625, 0.297607421875, 0.3623046875, 0.427001953125, 0.49169921875, 0.556396484375, 0.62109375, 0.685791015625, 0.75048828125, 0.815185546875, 0.8798828125, 0.944580078125, 1.00927734375, 1.073974609375, 1.138671875, 1.203369140625, 1.26806640625, 1.332763671875, 1.3974609375, 1.462158203125, 1.52685546875, 1.591552734375, 1.65625, 1.720947265625, 1.78564453125, 1.850341796875, 1.9150390625, 1.979736328125, 2.04443359375, 2.109130859375, 2.173828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 10.0, 11.0, 22.0, 25.0, 54.0, 71.0, 93.0, 161.0, 220.0, 320.0, 510.0, 617.0, 1038.0, 1446.0, 2129.0, 3008.0, 4509.0, 6893.0, 9905.0, 14987.0, 22847.0, 35934.0, 54824.0, 83784.0, 120512.0, 266988.0, 1089277.0, 124397.0, 86759.0, 57582.0, 36740.0, 23957.0, 15556.0, 10172.0, 6923.0, 4607.0, 3190.0, 2190.0, 1502.0, 1050.0, 756.0, 518.0, 337.0, 225.0, 151.0, 117.0, 82.0, 47.0, 31.0, 20.0, 12.0, 10.0, 8.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.1059112548828125, -0.102264404296875, -0.0986175537109375, -0.094970703125, -0.0913238525390625, -0.087677001953125, -0.0840301513671875, -0.08038330078125, -0.0767364501953125, -0.073089599609375, -0.0694427490234375, -0.0657958984375, -0.0621490478515625, -0.058502197265625, -0.0548553466796875, -0.05120849609375, -0.0475616455078125, -0.043914794921875, -0.0402679443359375, -0.03662109375, -0.0329742431640625, -0.029327392578125, -0.0256805419921875, -0.02203369140625, -0.0183868408203125, -0.014739990234375, -0.0110931396484375, -0.0074462890625, -0.0037994384765625, -0.000152587890625, 0.0034942626953125, 0.00714111328125, 0.0107879638671875, 0.014434814453125, 0.0180816650390625, 0.021728515625, 0.0253753662109375, 0.029022216796875, 0.0326690673828125, 0.03631591796875, 0.0399627685546875, 0.043609619140625, 0.0472564697265625, 0.0509033203125, 0.0545501708984375, 0.058197021484375, 0.0618438720703125, 0.06549072265625, 0.0691375732421875, 0.072784423828125, 0.0764312744140625, 0.080078125, 0.0837249755859375, 0.087371826171875, 0.0910186767578125, 0.09466552734375, 0.0983123779296875, 0.101959228515625, 0.1056060791015625, 0.1092529296875, 0.1128997802734375, 0.116546630859375, 0.1201934814453125, 0.12384033203125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 7.0, 11.0, 8.0, 11.0, 11.0, 13.0, 16.0, 17.0, 25.0, 26.0, 37.0, 50.0, 56.0, 66.0, 57.0, 56.0, 46.0, 72.0, 49.0, 51.0, 62.0, 37.0, 45.0, 31.0, 29.0, 24.0, 21.0, 7.0, 10.0, 11.0, 5.0, 8.0, 4.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0007777214050292969, -0.0007544606924057007, -0.0007311999797821045, -0.0007079392671585083, -0.0006846785545349121, -0.0006614178419113159, -0.0006381571292877197, -0.0006148964166641235, -0.0005916357040405273, -0.0005683749914169312, -0.000545114278793335, -0.0005218535661697388, -0.0004985928535461426, -0.0004753321409225464, -0.0004520714282989502, -0.000428810715675354, -0.0004055500030517578, -0.0003822892904281616, -0.00035902857780456543, -0.00033576786518096924, -0.00031250715255737305, -0.00028924643993377686, -0.00026598572731018066, -0.00024272501468658447, -0.00021946430206298828, -0.0001962035894393921, -0.0001729428768157959, -0.0001496821641921997, -0.00012642145156860352, -0.00010316073894500732, -7.990002632141113e-05, -5.663931369781494e-05, -3.337860107421875e-05, -1.0117888450622559e-05, 1.3142824172973633e-05, 3.6403536796569824e-05, 5.9664249420166016e-05, 8.292496204376221e-05, 0.0001061856746673584, 0.0001294463872909546, 0.00015270709991455078, 0.00017596781253814697, 0.00019922852516174316, 0.00022248923778533936, 0.00024574995040893555, 0.00026901066303253174, 0.00029227137565612793, 0.0003155320882797241, 0.0003387928009033203, 0.0003620535135269165, 0.0003853142261505127, 0.0004085749387741089, 0.0004318356513977051, 0.00045509636402130127, 0.00047835707664489746, 0.0005016177892684937, 0.0005248785018920898, 0.000548139214515686, 0.0005713999271392822, 0.0005946606397628784, 0.0006179213523864746, 0.0006411820650100708, 0.000664442777633667, 0.0006877034902572632, 0.0007109642028808594]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 4.0, 0.0, 10.0, 7.0, 19.0, 10.0, 19.0, 31.0, 36.0, 66.0, 76.0, 113.0, 150.0, 233.0, 428.0, 921.0, 44371.0, 991526.0, 8845.0, 628.0, 341.0, 201.0, 172.0, 122.0, 49.0, 39.0, 36.0, 20.0, 13.0, 18.0, 12.0, 10.0, 8.0, 6.0, 7.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0134429931640625, -0.013000249862670898, -0.012557506561279297, -0.012114763259887695, -0.011672019958496094, -0.011229276657104492, -0.01078653335571289, -0.010343790054321289, -0.009901046752929688, -0.009458303451538086, -0.009015560150146484, -0.008572816848754883, -0.008130073547363281, -0.00768733024597168, -0.007244586944580078, -0.0068018436431884766, -0.006359100341796875, -0.0059163570404052734, -0.005473613739013672, -0.00503087043762207, -0.004588127136230469, -0.004145383834838867, -0.0037026405334472656, -0.003259897232055664, -0.0028171539306640625, -0.002374410629272461, -0.0019316673278808594, -0.0014889240264892578, -0.0010461807250976562, -0.0006034374237060547, -0.00016069412231445312, 0.00028204917907714844, 0.00072479248046875, 0.0011675357818603516, 0.0016102790832519531, 0.0020530223846435547, 0.0024957656860351562, 0.002938508987426758, 0.0033812522888183594, 0.003823995590209961, 0.0042667388916015625, 0.004709482192993164, 0.005152225494384766, 0.005594968795776367, 0.006037712097167969, 0.00648045539855957, 0.006923198699951172, 0.0073659420013427734, 0.007808685302734375, 0.008251428604125977, 0.008694171905517578, 0.00913691520690918, 0.009579658508300781, 0.010022401809692383, 0.010465145111083984, 0.010907888412475586, 0.011350631713867188, 0.011793375015258789, 0.01223611831665039, 0.012678861618041992, 0.013121604919433594, 0.013564348220825195, 0.014007091522216797, 0.014449834823608398, 0.014892578125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 46.0, 185.0, 341.0, 281.0, 121.0, 23.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014068412128835917, -0.0013561598025262356, -0.0013054783921688795, -0.0012547969818115234, -0.0012041155714541674, -0.0011534341610968113, -0.0011027527507394552, -0.0010520713403820992, -0.001001389930024743, -0.000950708519667387, -0.0009000271093100309, -0.0008493456989526749, -0.0007986642885953188, -0.0007479828782379627, -0.0006973014678806067, -0.0006466200575232506, -0.0005959385889582336, -0.0005452571786008775, -0.0004945757682435215, -0.0004438943578861654, -0.0003932129475288093, -0.0003425315080676228, -0.0002918500977102667, -0.00024116868735291064, -0.00019048727699555457, -0.0001398058666381985, -8.912444900488481e-05, -3.8443031371571124e-05, 1.2238378985784948e-05, 6.291980389505625e-05, 0.00011360121425241232, 0.0001642826246097684, 0.00021496403496712446, 0.00026564544532448053, 0.0003163268556818366, 0.0003670082660391927, 0.00041768967639654875, 0.0004683711158577353, 0.0005190524971112609, 0.000569733907468617, 0.000620415317825973, 0.0006710967281833291, 0.0007217781385406852, 0.0007724595488980412, 0.0008231409592553973, 0.0008738223696127534, 0.0009245037799701095, 0.0009751851903274655, 0.0010258667171001434, 0.0010765481274574995, 0.0011272295378148556, 0.0011779109481722116, 0.0012285923585295677, 0.0012792737688869238, 0.0013299551792442799, 0.001380636589601636, 0.001431317999958992, 0.001481999410316348, 0.0015326808206737041, 0.0015833622310310602, 0.0016340436413884163, 0.0016847250517457724, 0.0017354064621031284, 0.0017860878724604845, 0.0018367692828178406]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 8.0, 6.0, 6.0, 12.0, 15.0, 19.0, 10.0, 17.0, 16.0, 27.0, 28.0, 24.0, 34.0, 26.0, 25.0, 29.0, 37.0, 31.0, 46.0, 33.0, 37.0, 30.0, 26.0, 44.0, 37.0, 28.0, 26.0, 30.0, 41.0, 34.0, 28.0, 28.0, 19.0, 20.0, 19.0, 11.0, 16.0, 8.0, 7.0, 12.0, 7.0, 7.0, 5.0, 5.0, 3.0, 5.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.00031512975692749023, -0.00030435342341661453, -0.00029357708990573883, -0.00028280075639486313, -0.0002720244228839874, -0.0002612480893731117, -0.000250471755862236, -0.00023969542235136032, -0.00022891908884048462, -0.00021814275532960892, -0.00020736642181873322, -0.0001965900883078575, -0.0001858137547969818, -0.0001750374212861061, -0.0001642610877752304, -0.0001534847542643547, -0.000142708420753479, -0.0001319320872426033, -0.0001211557537317276, -0.0001103794202208519, -9.96030867099762e-05, -8.88267531991005e-05, -7.805041968822479e-05, -6.727408617734909e-05, -5.649775266647339e-05, -4.572141915559769e-05, -3.4945085644721985e-05, -2.4168752133846283e-05, -1.3392418622970581e-05, -2.616085112094879e-06, 8.160248398780823e-06, 1.8936581909656525e-05, 2.9712915420532227e-05, 4.048924893140793e-05, 5.126558244228363e-05, 6.204191595315933e-05, 7.281824946403503e-05, 8.359458297491074e-05, 9.437091648578644e-05, 0.00010514724999666214, 0.00011592358350753784, 0.00012669991701841354, 0.00013747625052928925, 0.00014825258404016495, 0.00015902891755104065, 0.00016980525106191635, 0.00018058158457279205, 0.00019135791808366776, 0.00020213425159454346, 0.00021291058510541916, 0.00022368691861629486, 0.00023446325212717056, 0.00024523958563804626, 0.00025601591914892197, 0.00026679225265979767, 0.00027756858617067337, 0.00028834491968154907, 0.0002991212531924248, 0.0003098975867033005, 0.0003206739202141762, 0.0003314502537250519, 0.0003422265872359276, 0.0003530029207468033, 0.000363779254257679, 0.0003745555877685547]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 13.0, 12.0, 15.0, 15.0, 18.0, 27.0, 30.0, 29.0, 27.0, 26.0, 38.0, 40.0, 34.0, 43.0, 43.0, 56.0, 37.0, 33.0, 47.0, 48.0, 42.0, 39.0, 41.0, 37.0, 37.0, 28.0, 26.0, 12.0, 20.0, 15.0, 14.0, 6.0, 8.0, 4.0, 5.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.203125, -4.0733642578125, -3.943603515625, -3.8138427734375, -3.68408203125, -3.5543212890625, -3.424560546875, -3.2947998046875, -3.1650390625, -3.0352783203125, -2.905517578125, -2.7757568359375, -2.64599609375, -2.5162353515625, -2.386474609375, -2.2567138671875, -2.126953125, -1.9971923828125, -1.867431640625, -1.7376708984375, -1.60791015625, -1.4781494140625, -1.348388671875, -1.2186279296875, -1.0888671875, -0.9591064453125, -0.829345703125, -0.6995849609375, -0.56982421875, -0.4400634765625, -0.310302734375, -0.1805419921875, -0.05078125, 0.0789794921875, 0.208740234375, 0.3385009765625, 0.46826171875, 0.5980224609375, 0.727783203125, 0.8575439453125, 0.9873046875, 1.1170654296875, 1.246826171875, 1.3765869140625, 1.50634765625, 1.6361083984375, 1.765869140625, 1.8956298828125, 2.025390625, 2.1551513671875, 2.284912109375, 2.4146728515625, 2.54443359375, 2.6741943359375, 2.803955078125, 2.9337158203125, 3.0634765625, 3.1932373046875, 3.322998046875, 3.4527587890625, 3.58251953125, 3.7122802734375, 3.842041015625, 3.9718017578125, 4.1015625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 14.0, 9.0, 12.0, 16.0, 15.0, 22.0, 33.0, 45.0, 81.0, 117.0, 185.0, 334.0, 534.0, 1016.0, 1819.0, 3245.0, 6294.0, 13079.0, 31343.0, 97905.0, 431495.0, 333067.0, 77757.0, 26385.0, 11364.0, 5596.0, 2916.0, 1577.0, 914.0, 506.0, 324.0, 177.0, 113.0, 67.0, 39.0, 29.0, 21.0, 22.0, 18.0, 13.0, 6.0, 9.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.818359375, -3.698699951171875, -3.57904052734375, -3.459381103515625, -3.3397216796875, -3.220062255859375, -3.10040283203125, -2.980743408203125, -2.861083984375, -2.741424560546875, -2.62176513671875, -2.502105712890625, -2.3824462890625, -2.262786865234375, -2.14312744140625, -2.023468017578125, -1.90380859375, -1.784149169921875, -1.66448974609375, -1.544830322265625, -1.4251708984375, -1.305511474609375, -1.18585205078125, -1.066192626953125, -0.946533203125, -0.826873779296875, -0.70721435546875, -0.587554931640625, -0.4678955078125, -0.348236083984375, -0.22857666015625, -0.108917236328125, 0.0107421875, 0.130401611328125, 0.25006103515625, 0.369720458984375, 0.4893798828125, 0.609039306640625, 0.72869873046875, 0.848358154296875, 0.968017578125, 1.087677001953125, 1.20733642578125, 1.326995849609375, 1.4466552734375, 1.566314697265625, 1.68597412109375, 1.805633544921875, 1.92529296875, 2.044952392578125, 2.16461181640625, 2.284271240234375, 2.4039306640625, 2.523590087890625, 2.64324951171875, 2.762908935546875, 2.882568359375, 3.002227783203125, 3.12188720703125, 3.241546630859375, 3.3612060546875, 3.480865478515625, 3.60052490234375, 3.720184326171875, 3.83984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 4.0, 5.0, 9.0, 15.0, 19.0, 21.0, 15.0, 25.0, 33.0, 34.0, 29.0, 40.0, 37.0, 56.0, 53.0, 105.0, 421.0, 1542.0, 118.0, 63.0, 50.0, 49.0, 41.0, 29.0, 39.0, 25.0, 32.0, 18.0, 22.0, 18.0, 16.0, 18.0, 3.0, 7.0, 3.0, 14.0, 5.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.2493896484375, -14.787841796875, -14.3262939453125, -13.86474609375, -13.4031982421875, -12.941650390625, -12.4801025390625, -12.0185546875, -11.5570068359375, -11.095458984375, -10.6339111328125, -10.17236328125, -9.7108154296875, -9.249267578125, -8.7877197265625, -8.326171875, -7.8646240234375, -7.403076171875, -6.9415283203125, -6.47998046875, -6.0184326171875, -5.556884765625, -5.0953369140625, -4.6337890625, -4.1722412109375, -3.710693359375, -3.2491455078125, -2.78759765625, -2.3260498046875, -1.864501953125, -1.4029541015625, -0.94140625, -0.4798583984375, -0.018310546875, 0.4432373046875, 0.90478515625, 1.3663330078125, 1.827880859375, 2.2894287109375, 2.7509765625, 3.2125244140625, 3.674072265625, 4.1356201171875, 4.59716796875, 5.0587158203125, 5.520263671875, 5.9818115234375, 6.443359375, 6.9049072265625, 7.366455078125, 7.8280029296875, 8.28955078125, 8.7510986328125, 9.212646484375, 9.6741943359375, 10.1357421875, 10.5972900390625, 11.058837890625, 11.5203857421875, 11.98193359375, 12.4434814453125, 12.905029296875, 13.3665771484375, 13.828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 11.0, 5.0, 3.0, 8.0, 11.0, 17.0, 22.0, 22.0, 25.0, 44.0, 34.0, 62.0, 69.0, 123.0, 229.0, 388.0, 1120.0, 6214.0, 344926.0, 2775879.0, 13577.0, 1649.0, 551.0, 249.0, 125.0, 76.0, 66.0, 51.0, 23.0, 28.0, 23.0, 24.0, 14.0, 13.0, 6.0, 1.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.375, -21.6328125, -20.890625, -20.1484375, -19.40625, -18.6640625, -17.921875, -17.1796875, -16.4375, -15.6953125, -14.953125, -14.2109375, -13.46875, -12.7265625, -11.984375, -11.2421875, -10.5, -9.7578125, -9.015625, -8.2734375, -7.53125, -6.7890625, -6.046875, -5.3046875, -4.5625, -3.8203125, -3.078125, -2.3359375, -1.59375, -0.8515625, -0.109375, 0.6328125, 1.375, 2.1171875, 2.859375, 3.6015625, 4.34375, 5.0859375, 5.828125, 6.5703125, 7.3125, 8.0546875, 8.796875, 9.5390625, 10.28125, 11.0234375, 11.765625, 12.5078125, 13.25, 13.9921875, 14.734375, 15.4765625, 16.21875, 16.9609375, 17.703125, 18.4453125, 19.1875, 19.9296875, 20.671875, 21.4140625, 22.15625, 22.8984375, 23.640625, 24.3828125, 25.125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 19.0, 48.0, 87.0, 155.0, 235.0, 174.0, 141.0, 70.0, 45.0, 20.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.086982727050781, -10.286264419555664, -9.48554515838623, -8.684825897216797, -7.88410758972168, -7.083388805389404, -6.282670021057129, -5.4819512367248535, -4.681232452392578, -3.8805136680603027, -3.0797948837280273, -2.279076099395752, -1.4783573150634766, -0.6776385307312012, 0.12308025360107422, 0.9237990379333496, 1.724517822265625, 2.5252366065979004, 3.325955390930176, 4.126674175262451, 4.927392959594727, 5.728111743927002, 6.528830528259277, 7.329549312591553, 8.130268096923828, 8.930986404418945, 9.731705665588379, 10.532424926757812, 11.33314323425293, 12.133861541748047, 12.93458080291748, 13.735300064086914, 14.536018371582031, 15.336736679077148, 16.137454986572266, 16.938175201416016, 17.738893508911133, 18.53961181640625, 19.34033203125, 20.141050338745117, 20.941768646240234, 21.74248695373535, 22.54320526123047, 23.34392547607422, 24.144643783569336, 24.945362091064453, 25.746082305908203, 26.54680061340332, 27.347518920898438, 28.148237228393555, 28.948955535888672, 29.749675750732422, 30.55039405822754, 31.351112365722656, 32.151832580566406, 32.95254898071289, 33.75326919555664, 34.55398941040039, 35.354705810546875, 36.155426025390625, 36.956146240234375, 37.75686264038086, 38.55758285522461, 39.358299255371094, 40.159019470214844]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 6.0, 20.0, 13.0, 16.0, 15.0, 26.0, 24.0, 28.0, 22.0, 30.0, 28.0, 33.0, 36.0, 39.0, 22.0, 45.0, 30.0, 54.0, 42.0, 38.0, 33.0, 31.0, 47.0, 44.0, 36.0, 19.0, 31.0, 29.0, 19.0, 26.0, 20.0, 14.0, 13.0, 15.0, 8.0, 13.0, 8.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-46.61693572998047, -45.26165771484375, -43.906375885009766, -42.55109405517578, -41.19581604003906, -39.840538024902344, -38.48525619506836, -37.129974365234375, -35.774696350097656, -34.41941833496094, -33.06413650512695, -31.7088565826416, -30.35357666015625, -28.9982967376709, -27.643016815185547, -26.287736892700195, -24.932456970214844, -23.577177047729492, -22.22189712524414, -20.86661720275879, -19.511337280273438, -18.156057357788086, -16.800777435302734, -15.445497512817383, -14.090217590332031, -12.73493766784668, -11.379657745361328, -10.024377822875977, -8.669097900390625, -7.313817977905273, -5.958538055419922, -4.60325813293457, -3.247974395751953, -1.8926944732666016, -0.53741455078125, 0.8178653717041016, 2.173145294189453, 3.5284252166748047, 4.883705139160156, 6.238985061645508, 7.594264984130859, 8.949544906616211, 10.304824829101562, 11.660104751586914, 13.015384674072266, 14.370664596557617, 15.725944519042969, 17.08122444152832, 18.436504364013672, 19.791784286499023, 21.147064208984375, 22.502344131469727, 23.857624053955078, 25.21290397644043, 26.56818389892578, 27.923463821411133, 29.278743743896484, 30.634023666381836, 31.989303588867188, 33.344581604003906, 34.69986343383789, 36.055145263671875, 37.410423278808594, 38.76570129394531, 40.1209831237793]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 10.0, 9.0, 18.0, 15.0, 14.0, 23.0, 29.0, 23.0, 31.0, 29.0, 28.0, 39.0, 31.0, 47.0, 41.0, 57.0, 35.0, 42.0, 38.0, 51.0, 40.0, 41.0, 42.0, 40.0, 40.0, 31.0, 27.0, 15.0, 16.0, 24.0, 12.0, 8.0, 11.0, 5.0, 4.0, 7.0, 6.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.25, -4.11724853515625, -3.9844970703125, -3.85174560546875, -3.718994140625, -3.58624267578125, -3.4534912109375, -3.32073974609375, -3.18798828125, -3.05523681640625, -2.9224853515625, -2.78973388671875, -2.656982421875, -2.52423095703125, -2.3914794921875, -2.25872802734375, -2.1259765625, -1.99322509765625, -1.8604736328125, -1.72772216796875, -1.594970703125, -1.46221923828125, -1.3294677734375, -1.19671630859375, -1.06396484375, -0.93121337890625, -0.7984619140625, -0.66571044921875, -0.532958984375, -0.40020751953125, -0.2674560546875, -0.13470458984375, -0.001953125, 0.13079833984375, 0.2635498046875, 0.39630126953125, 0.529052734375, 0.66180419921875, 0.7945556640625, 0.92730712890625, 1.06005859375, 1.19281005859375, 1.3255615234375, 1.45831298828125, 1.591064453125, 1.72381591796875, 1.8565673828125, 1.98931884765625, 2.1220703125, 2.25482177734375, 2.3875732421875, 2.52032470703125, 2.653076171875, 2.78582763671875, 2.9185791015625, 3.05133056640625, 3.18408203125, 3.31683349609375, 3.4495849609375, 3.58233642578125, 3.715087890625, 3.84783935546875, 3.9805908203125, 4.11334228515625, 4.24609375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 6.0, 4.0, 9.0, 11.0, 12.0, 20.0, 22.0, 36.0, 50.0, 66.0, 152.0, 288.0, 674.0, 1713.0, 4841.0, 15105.0, 56319.0, 315289.0, 2325291.0, 1275512.0, 150718.0, 33094.0, 9602.0, 3243.0, 1175.0, 483.0, 227.0, 108.0, 52.0, 34.0, 26.0, 19.0, 15.0, 9.0, 9.0, 14.0, 3.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.2890625, -9.9754638671875, -9.661865234375, -9.3482666015625, -9.03466796875, -8.7210693359375, -8.407470703125, -8.0938720703125, -7.7802734375, -7.4666748046875, -7.153076171875, -6.8394775390625, -6.52587890625, -6.2122802734375, -5.898681640625, -5.5850830078125, -5.271484375, -4.9578857421875, -4.644287109375, -4.3306884765625, -4.01708984375, -3.7034912109375, -3.389892578125, -3.0762939453125, -2.7626953125, -2.4490966796875, -2.135498046875, -1.8218994140625, -1.50830078125, -1.1947021484375, -0.881103515625, -0.5675048828125, -0.25390625, 0.0596923828125, 0.373291015625, 0.6868896484375, 1.00048828125, 1.3140869140625, 1.627685546875, 1.9412841796875, 2.2548828125, 2.5684814453125, 2.882080078125, 3.1956787109375, 3.50927734375, 3.8228759765625, 4.136474609375, 4.4500732421875, 4.763671875, 5.0772705078125, 5.390869140625, 5.7044677734375, 6.01806640625, 6.3316650390625, 6.645263671875, 6.9588623046875, 7.2724609375, 7.5860595703125, 7.899658203125, 8.2132568359375, 8.52685546875, 8.8404541015625, 9.154052734375, 9.4676513671875, 9.78125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 5.0, 16.0, 19.0, 15.0, 11.0, 29.0, 33.0, 34.0, 87.0, 73.0, 110.0, 141.0, 216.0, 267.0, 369.0, 458.0, 463.0, 418.0, 315.0, 263.0, 186.0, 148.0, 100.0, 67.0, 55.0, 50.0, 37.0, 25.0, 11.0, 9.0, 9.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.09375, -11.76953125, -11.4453125, -11.12109375, -10.796875, -10.47265625, -10.1484375, -9.82421875, -9.5, -9.17578125, -8.8515625, -8.52734375, -8.203125, -7.87890625, -7.5546875, -7.23046875, -6.90625, -6.58203125, -6.2578125, -5.93359375, -5.609375, -5.28515625, -4.9609375, -4.63671875, -4.3125, -3.98828125, -3.6640625, -3.33984375, -3.015625, -2.69140625, -2.3671875, -2.04296875, -1.71875, -1.39453125, -1.0703125, -0.74609375, -0.421875, -0.09765625, 0.2265625, 0.55078125, 0.875, 1.19921875, 1.5234375, 1.84765625, 2.171875, 2.49609375, 2.8203125, 3.14453125, 3.46875, 3.79296875, 4.1171875, 4.44140625, 4.765625, 5.08984375, 5.4140625, 5.73828125, 6.0625, 6.38671875, 6.7109375, 7.03515625, 7.359375, 7.68359375, 8.0078125, 8.33203125, 8.65625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 11.0, 19.0, 34.0, 61.0, 141.0, 334.0, 1030.0, 4990.0, 44382.0, 890064.0, 3107605.0, 131790.0, 11156.0, 1767.0, 487.0, 217.0, 95.0, 56.0, 22.0, 9.0, 7.0, 7.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.173583984375, -17.17529296875, -16.177001953125, -15.1787109375, -14.180419921875, -13.18212890625, -12.183837890625, -11.185546875, -10.187255859375, -9.18896484375, -8.190673828125, -7.1923828125, -6.194091796875, -5.19580078125, -4.197509765625, -3.19921875, -2.200927734375, -1.20263671875, -0.204345703125, 0.7939453125, 1.792236328125, 2.79052734375, 3.788818359375, 4.787109375, 5.785400390625, 6.78369140625, 7.781982421875, 8.7802734375, 9.778564453125, 10.77685546875, 11.775146484375, 12.7734375, 13.771728515625, 14.77001953125, 15.768310546875, 16.7666015625, 17.764892578125, 18.76318359375, 19.761474609375, 20.759765625, 21.758056640625, 22.75634765625, 23.754638671875, 24.7529296875, 25.751220703125, 26.74951171875, 27.747802734375, 28.74609375, 29.744384765625, 30.74267578125, 31.740966796875, 32.7392578125, 33.737548828125, 34.73583984375, 35.734130859375, 36.732421875, 37.730712890625, 38.72900390625, 39.727294921875, 40.7255859375, 41.723876953125, 42.72216796875, 43.720458984375, 44.71875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 11.0, 30.0, 64.0, 126.0, 212.0, 215.0, 174.0, 105.0, 50.0, 12.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-170.8758087158203, -167.1961669921875, -163.5165252685547, -159.83688354492188, -156.1572265625, -152.4775848388672, -148.79794311523438, -145.11830139160156, -141.43865966796875, -137.75901794433594, -134.07937622070312, -130.3997344970703, -126.72008514404297, -123.04044342041016, -119.36079406738281, -115.68115234375, -112.00151062011719, -108.32186889648438, -104.64222717285156, -100.96257781982422, -97.2829360961914, -93.6032943725586, -89.92364501953125, -86.24400329589844, -82.56436157226562, -78.88471984863281, -75.205078125, -71.52542877197266, -67.84578704833984, -64.16614532470703, -60.48649978637695, -56.806854248046875, -53.12721252441406, -49.44757080078125, -45.76792526245117, -42.088279724121094, -38.40863800048828, -34.72899627685547, -31.04935073852539, -27.369707107543945, -23.6900634765625, -20.010419845581055, -16.33077621459961, -12.651132583618164, -8.971488952636719, -5.291845321655273, -1.6122016906738281, 2.067441940307617, 5.7470855712890625, 9.426729202270508, 13.106372833251953, 16.7860164642334, 20.465660095214844, 24.14530372619629, 27.824947357177734, 31.50459098815918, 35.184234619140625, 38.86387634277344, 42.543521881103516, 46.223167419433594, 49.902809143066406, 53.58245086669922, 57.2620964050293, 60.941741943359375, 64.62138366699219]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 15.0, 8.0, 9.0, 13.0, 9.0, 25.0, 22.0, 16.0, 28.0, 21.0, 30.0, 35.0, 41.0, 36.0, 43.0, 51.0, 37.0, 41.0, 49.0, 49.0, 44.0, 37.0, 42.0, 47.0, 39.0, 25.0, 29.0, 16.0, 20.0, 24.0, 15.0, 15.0, 14.0, 14.0, 13.0, 8.0, 5.0, 10.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.59796142578125, -32.361366271972656, -31.12476921081543, -29.888172149658203, -28.651575088500977, -27.41497802734375, -26.178382873535156, -24.94178581237793, -23.705188751220703, -22.468591690063477, -21.231996536254883, -19.995399475097656, -18.75880241394043, -17.522205352783203, -16.28561019897461, -15.049013137817383, -13.812417984008789, -12.575821876525879, -11.339224815368652, -10.102628707885742, -8.866031646728516, -7.6294355392456055, -6.392839431762695, -5.156242370605469, -3.9196462631225586, -2.6830496788024902, -1.446453332901001, -0.20985698699951172, 1.0267395973205566, 2.263336181640625, 3.499932289123535, 4.736529350280762, 5.973125457763672, 7.20972204208374, 8.446318626403809, 9.682914733886719, 10.919511795043945, 12.156107902526855, 13.392704010009766, 14.629301071166992, 15.865897178649902, 17.102493286132812, 18.33909034729004, 19.575687408447266, 20.81228256225586, 22.048879623413086, 23.285476684570312, 24.522071838378906, 25.758668899536133, 26.99526596069336, 28.231861114501953, 29.46845817565918, 30.705055236816406, 31.941650390625, 33.178245544433594, 34.41484451293945, 35.65143966674805, 36.88803482055664, 38.1246337890625, 39.361228942871094, 40.59782409667969, 41.83442306518555, 43.07101821899414, 44.3076171875, 45.544212341308594]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 9.0, 16.0, 7.0, 12.0, 14.0, 9.0, 25.0, 20.0, 20.0, 30.0, 26.0, 33.0, 36.0, 35.0, 33.0, 50.0, 55.0, 51.0, 42.0, 42.0, 49.0, 46.0, 29.0, 35.0, 35.0, 34.0, 28.0, 23.0, 26.0, 32.0, 24.0, 19.0, 9.0, 6.0, 11.0, 6.0, 0.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.5, -4.3609619140625, -4.221923828125, -4.0828857421875, -3.94384765625, -3.8048095703125, -3.665771484375, -3.5267333984375, -3.3876953125, -3.2486572265625, -3.109619140625, -2.9705810546875, -2.83154296875, -2.6925048828125, -2.553466796875, -2.4144287109375, -2.275390625, -2.1363525390625, -1.997314453125, -1.8582763671875, -1.71923828125, -1.5802001953125, -1.441162109375, -1.3021240234375, -1.1630859375, -1.0240478515625, -0.885009765625, -0.7459716796875, -0.60693359375, -0.4678955078125, -0.328857421875, -0.1898193359375, -0.05078125, 0.0882568359375, 0.227294921875, 0.3663330078125, 0.50537109375, 0.6444091796875, 0.783447265625, 0.9224853515625, 1.0615234375, 1.2005615234375, 1.339599609375, 1.4786376953125, 1.61767578125, 1.7567138671875, 1.895751953125, 2.0347900390625, 2.173828125, 2.3128662109375, 2.451904296875, 2.5909423828125, 2.72998046875, 2.8690185546875, 3.008056640625, 3.1470947265625, 3.2861328125, 3.4251708984375, 3.564208984375, 3.7032470703125, 3.84228515625, 3.9813232421875, 4.120361328125, 4.2593994140625, 4.3984375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 8.0, 7.0, 12.0, 16.0, 15.0, 21.0, 32.0, 40.0, 79.0, 108.0, 155.0, 199.0, 289.0, 423.0, 596.0, 819.0, 1259.0, 1848.0, 2673.0, 4014.0, 5853.0, 9052.0, 14179.0, 21880.0, 35001.0, 55992.0, 90653.0, 140302.0, 180540.0, 166208.0, 117200.0, 73374.0, 45195.0, 28083.0, 17756.0, 11576.0, 7408.0, 4989.0, 3442.0, 2232.0, 1579.0, 1044.0, 734.0, 479.0, 339.0, 229.0, 188.0, 123.0, 89.0, 79.0, 37.0, 29.0, 24.0, 19.0, 17.0, 6.0, 6.0, 6.0, 5.0, 2.0, 3.0], "bins": [-0.1468505859375, -0.1422290802001953, -0.13760757446289062, -0.13298606872558594, -0.12836456298828125, -0.12374305725097656, -0.11912155151367188, -0.11450004577636719, -0.1098785400390625, -0.10525703430175781, -0.10063552856445312, -0.09601402282714844, -0.09139251708984375, -0.08677101135253906, -0.08214950561523438, -0.07752799987792969, -0.072906494140625, -0.06828498840332031, -0.06366348266601562, -0.05904197692871094, -0.05442047119140625, -0.04979896545410156, -0.045177459716796875, -0.04055595397949219, -0.0359344482421875, -0.03131294250488281, -0.026691436767578125, -0.022069931030273438, -0.01744842529296875, -0.012826919555664062, -0.008205413818359375, -0.0035839080810546875, 0.00103759765625, 0.0056591033935546875, 0.010280609130859375, 0.014902114868164062, 0.01952362060546875, 0.024145126342773438, 0.028766632080078125, 0.03338813781738281, 0.0380096435546875, 0.04263114929199219, 0.047252655029296875, 0.05187416076660156, 0.05649566650390625, 0.06111717224121094, 0.06573867797851562, 0.07036018371582031, 0.074981689453125, 0.07960319519042969, 0.08422470092773438, 0.08884620666503906, 0.09346771240234375, 0.09808921813964844, 0.10271072387695312, 0.10733222961425781, 0.1119537353515625, 0.11657524108886719, 0.12119674682617188, 0.12581825256347656, 0.13043975830078125, 0.13506126403808594, 0.13968276977539062, 0.1443042755126953, 0.14892578125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 7.0, 8.0, 13.0, 20.0, 17.0, 18.0, 16.0, 22.0, 28.0, 29.0, 31.0, 31.0, 35.0, 30.0, 36.0, 34.0, 44.0, 41.0, 1082.0, 32.0, 30.0, 44.0, 39.0, 36.0, 28.0, 34.0, 45.0, 25.0, 20.0, 19.0, 25.0, 20.0, 14.0, 7.0, 10.0, 12.0, 6.0, 8.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.751953125, -2.66668701171875, -2.5814208984375, -2.49615478515625, -2.410888671875, -2.32562255859375, -2.2403564453125, -2.15509033203125, -2.06982421875, -1.98455810546875, -1.8992919921875, -1.81402587890625, -1.728759765625, -1.64349365234375, -1.5582275390625, -1.47296142578125, -1.3876953125, -1.30242919921875, -1.2171630859375, -1.13189697265625, -1.046630859375, -0.96136474609375, -0.8760986328125, -0.79083251953125, -0.70556640625, -0.62030029296875, -0.5350341796875, -0.44976806640625, -0.364501953125, -0.27923583984375, -0.1939697265625, -0.10870361328125, -0.0234375, 0.06182861328125, 0.1470947265625, 0.23236083984375, 0.317626953125, 0.40289306640625, 0.4881591796875, 0.57342529296875, 0.65869140625, 0.74395751953125, 0.8292236328125, 0.91448974609375, 0.999755859375, 1.08502197265625, 1.1702880859375, 1.25555419921875, 1.3408203125, 1.42608642578125, 1.5113525390625, 1.59661865234375, 1.681884765625, 1.76715087890625, 1.8524169921875, 1.93768310546875, 2.02294921875, 2.10821533203125, 2.1934814453125, 2.27874755859375, 2.364013671875, 2.44927978515625, 2.5345458984375, 2.61981201171875, 2.705078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 18.0, 27.0, 35.0, 45.0, 86.0, 120.0, 192.0, 297.0, 472.0, 713.0, 1059.0, 1594.0, 2523.0, 3790.0, 5831.0, 9141.0, 14327.0, 23379.0, 38493.0, 64896.0, 107350.0, 163102.0, 1241628.0, 157574.0, 102369.0, 61097.0, 36349.0, 22070.0, 13637.0, 8675.0, 5691.0, 3693.0, 2327.0, 1590.0, 1004.0, 666.0, 439.0, 299.0, 171.0, 123.0, 86.0, 48.0, 46.0, 13.0, 19.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.1445446014404297, -0.13979721069335938, -0.13504981994628906, -0.13030242919921875, -0.12555503845214844, -0.12080764770507812, -0.11606025695800781, -0.1113128662109375, -0.10656547546386719, -0.10181808471679688, -0.09707069396972656, -0.09232330322265625, -0.08757591247558594, -0.08282852172851562, -0.07808113098144531, -0.073333740234375, -0.06858634948730469, -0.06383895874023438, -0.05909156799316406, -0.05434417724609375, -0.04959678649902344, -0.044849395751953125, -0.04010200500488281, -0.0353546142578125, -0.030607223510742188, -0.025859832763671875, -0.021112442016601562, -0.01636505126953125, -0.011617660522460938, -0.006870269775390625, -0.0021228790283203125, 0.00262451171875, 0.0073719024658203125, 0.012119293212890625, 0.016866683959960938, 0.02161407470703125, 0.026361465454101562, 0.031108856201171875, 0.03585624694824219, 0.0406036376953125, 0.04535102844238281, 0.050098419189453125, 0.05484580993652344, 0.05959320068359375, 0.06434059143066406, 0.06908798217773438, 0.07383537292480469, 0.078582763671875, 0.08333015441894531, 0.08807754516601562, 0.09282493591308594, 0.09757232666015625, 0.10231971740722656, 0.10706710815429688, 0.11181449890136719, 0.1165618896484375, 0.12130928039550781, 0.12605667114257812, 0.13080406188964844, 0.13555145263671875, 0.14029884338378906, 0.14504623413085938, 0.1497936248779297, 0.154541015625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 12.0, 4.0, 17.0, 13.0, 14.0, 29.0, 48.0, 60.0, 62.0, 74.0, 89.0, 92.0, 102.0, 88.0, 77.0, 55.0, 32.0, 35.0, 19.0, 20.0, 14.0, 11.0, 14.0, 8.0, 2.0, 7.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009293556213378906, -0.0008981302380561829, -0.0008669048547744751, -0.0008356794714927673, -0.0008044540882110596, -0.0007732287049293518, -0.000742003321647644, -0.0007107779383659363, -0.0006795525550842285, -0.0006483271718025208, -0.000617101788520813, -0.0005858764052391052, -0.0005546510219573975, -0.0005234256386756897, -0.0004922002553939819, -0.00046097487211227417, -0.0004297494888305664, -0.00039852410554885864, -0.0003672987222671509, -0.0003360733389854431, -0.00030484795570373535, -0.0002736225724220276, -0.00024239718914031982, -0.00021117180585861206, -0.0001799464225769043, -0.00014872103929519653, -0.00011749565601348877, -8.6270272731781e-05, -5.504488945007324e-05, -2.381950616836548e-05, 7.405877113342285e-06, 3.863126039505005e-05, 6.985664367675781e-05, 0.00010108202695846558, 0.00013230741024017334, 0.0001635327935218811, 0.00019475817680358887, 0.00022598356008529663, 0.0002572089433670044, 0.00028843432664871216, 0.0003196597099304199, 0.0003508850932121277, 0.00038211047649383545, 0.0004133358597755432, 0.000444561243057251, 0.00047578662633895874, 0.0005070120096206665, 0.0005382373929023743, 0.000569462776184082, 0.0006006881594657898, 0.0006319135427474976, 0.0006631389260292053, 0.0006943643093109131, 0.0007255896925926208, 0.0007568150758743286, 0.0007880404591560364, 0.0008192658424377441, 0.0008504912257194519, 0.0008817166090011597, 0.0009129419922828674, 0.0009441673755645752, 0.000975392758846283, 0.0010066181421279907, 0.0010378435254096985, 0.0010690689086914062]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 16.0, 13.0, 11.0, 23.0, 26.0, 32.0, 62.0, 93.0, 108.0, 203.0, 382.0, 819.0, 30889.0, 1001696.0, 12579.0, 689.0, 325.0, 183.0, 123.0, 93.0, 50.0, 32.0, 33.0, 20.0, 17.0, 6.0, 11.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016693115234375, -0.01622188091278076, -0.015750646591186523, -0.015279412269592285, -0.014808177947998047, -0.014336943626403809, -0.01386570930480957, -0.013394474983215332, -0.012923240661621094, -0.012452006340026855, -0.011980772018432617, -0.011509537696838379, -0.01103830337524414, -0.010567069053649902, -0.010095834732055664, -0.009624600410461426, -0.009153366088867188, -0.00868213176727295, -0.008210897445678711, -0.007739663124084473, -0.007268428802490234, -0.006797194480895996, -0.006325960159301758, -0.0058547258377075195, -0.005383491516113281, -0.004912257194519043, -0.004441022872924805, -0.003969788551330566, -0.003498554229736328, -0.00302731990814209, -0.0025560855865478516, -0.0020848512649536133, -0.001613616943359375, -0.0011423826217651367, -0.0006711483001708984, -0.00019991397857666016, 0.0002713203430175781, 0.0007425546646118164, 0.0012137889862060547, 0.001685023307800293, 0.0021562576293945312, 0.0026274919509887695, 0.003098726272583008, 0.003569960594177246, 0.004041194915771484, 0.004512429237365723, 0.004983663558959961, 0.005454897880554199, 0.0059261322021484375, 0.006397366523742676, 0.006868600845336914, 0.007339835166931152, 0.007811069488525391, 0.008282303810119629, 0.008753538131713867, 0.009224772453308105, 0.009696006774902344, 0.010167241096496582, 0.01063847541809082, 0.011109709739685059, 0.011580944061279297, 0.012052178382873535, 0.012523412704467773, 0.012994647026062012, 0.01346588134765625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 18.0, 49.0, 111.0, 185.0, 260.0, 203.0, 119.0, 37.0, 15.0, 8.0, 1.0, 1.0], "bins": [-0.0021879717241972685, -0.002149266889318824, -0.002110562054440379, -0.002071856986731291, -0.002033152151852846, -0.0019944473169744015, -0.001955742482095957, -0.0019170376472175121, -0.0018783326959237456, -0.001839627861045301, -0.0018009229097515345, -0.0017622180748730898, -0.0017235132399946451, -0.0016848082887008786, -0.001646103453822434, -0.0016073985025286674, -0.0015686936676502228, -0.001529988832771778, -0.0014912838814780116, -0.001452579046599567, -0.0014138742117211223, -0.0013751692604273558, -0.001336464425548911, -0.0012977595906704664, -0.0012590547557920218, -0.001220349920913577, -0.0011816449696198106, -0.001142940134741366, -0.0011042352998629212, -0.0010655303485691547, -0.00102682551369071, -0.0009881206788122654, -0.0009494158439338207, -0.0009107109508477151, -0.0008720061159692705, -0.0008333012228831649, -0.0007945963297970593, -0.0007558914367109537, -0.000717186601832509, -0.0006784817087464035, -0.0006397768156602979, -0.0006010719225741923, -0.0005623670876957476, -0.000523662194609642, -0.00048495730152353644, -0.0004462524375412613, -0.0004075475735589862, -0.0003688426804728806, -0.0003301378164906055, -0.00029143295250833035, -0.00025272805942222476, -0.00021402319543994963, -0.00017531831690575927, -0.00013661343837156892, -9.790857438929379e-05, -5.9203681303188205e-05, -2.0498817320913076e-05, 1.8206057575298473e-05, 5.691093247151002e-05, 9.561580372974277e-05, 0.00013432068226393312, 0.00017302556079812348, 0.0002117304247803986, 0.0002504353178665042, 0.0002891401818487793]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 9.0, 6.0, 14.0, 9.0, 14.0, 17.0, 19.0, 15.0, 26.0, 35.0, 28.0, 26.0, 36.0, 43.0, 29.0, 36.0, 41.0, 45.0, 35.0, 41.0, 40.0, 36.0, 32.0, 40.0, 35.0, 37.0, 31.0, 36.0, 26.0, 18.0, 33.0, 17.0, 13.0, 10.0, 13.0, 8.0, 15.0, 11.0, 6.0, 5.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0003782510757446289, -0.00036605354398489, -0.00035385601222515106, -0.00034165848046541214, -0.0003294609487056732, -0.0003172634169459343, -0.0003050658851861954, -0.00029286835342645645, -0.00028067082166671753, -0.0002684732899069786, -0.0002562757581472397, -0.00024407822638750076, -0.00023188069462776184, -0.00021968316286802292, -0.000207485631108284, -0.00019528809934854507, -0.00018309056758880615, -0.00017089303582906723, -0.0001586955040693283, -0.00014649797230958939, -0.00013430044054985046, -0.00012210290879011154, -0.00010990537703037262, -9.77078452706337e-05, -8.551031351089478e-05, -7.331278175115585e-05, -6.111524999141693e-05, -4.891771823167801e-05, -3.672018647193909e-05, -2.4522654712200165e-05, -1.2325122952461243e-05, -1.2759119272232056e-07, 1.2069940567016602e-05, 2.4267472326755524e-05, 3.6465004086494446e-05, 4.866253584623337e-05, 6.086006760597229e-05, 7.305759936571121e-05, 8.525513112545013e-05, 9.745266288518906e-05, 0.00010965019464492798, 0.0001218477264046669, 0.00013404525816440582, 0.00014624278992414474, 0.00015844032168388367, 0.0001706378534436226, 0.0001828353852033615, 0.00019503291696310043, 0.00020723044872283936, 0.00021942798048257828, 0.0002316255122423172, 0.00024382304400205612, 0.00025602057576179504, 0.00026821810752153397, 0.0002804156392812729, 0.0002926131710410118, 0.00030481070280075073, 0.00031700823456048965, 0.0003292057663202286, 0.0003414032980799675, 0.0003536008298397064, 0.00036579836159944534, 0.00037799589335918427, 0.0003901934251189232, 0.0004023909568786621]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 9.0, 16.0, 7.0, 12.0, 14.0, 9.0, 25.0, 20.0, 20.0, 30.0, 26.0, 33.0, 36.0, 35.0, 33.0, 50.0, 55.0, 51.0, 42.0, 43.0, 48.0, 46.0, 29.0, 35.0, 35.0, 34.0, 28.0, 23.0, 26.0, 32.0, 24.0, 19.0, 9.0, 6.0, 11.0, 6.0, 0.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.5, -4.3609619140625, -4.221923828125, -4.0828857421875, -3.94384765625, -3.8048095703125, -3.665771484375, -3.5267333984375, -3.3876953125, -3.2486572265625, -3.109619140625, -2.9705810546875, -2.83154296875, -2.6925048828125, -2.553466796875, -2.4144287109375, -2.275390625, -2.1363525390625, -1.997314453125, -1.8582763671875, -1.71923828125, -1.5802001953125, -1.441162109375, -1.3021240234375, -1.1630859375, -1.0240478515625, -0.885009765625, -0.7459716796875, -0.60693359375, -0.4678955078125, -0.328857421875, -0.1898193359375, -0.05078125, 0.0882568359375, 0.227294921875, 0.3663330078125, 0.50537109375, 0.6444091796875, 0.783447265625, 0.9224853515625, 1.0615234375, 1.2005615234375, 1.339599609375, 1.4786376953125, 1.61767578125, 1.7567138671875, 1.895751953125, 2.0347900390625, 2.173828125, 2.3128662109375, 2.451904296875, 2.5909423828125, 2.72998046875, 2.8690185546875, 3.008056640625, 3.1470947265625, 3.2861328125, 3.4251708984375, 3.564208984375, 3.7032470703125, 3.84228515625, 3.9813232421875, 4.120361328125, 4.2593994140625, 4.3984375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 9.0, 13.0, 21.0, 28.0, 31.0, 37.0, 72.0, 101.0, 162.0, 252.0, 416.0, 778.0, 1289.0, 2503.0, 5160.0, 11472.0, 28692.0, 81374.0, 264880.0, 424808.0, 145113.0, 47743.0, 18017.0, 7584.0, 3634.0, 1840.0, 996.0, 566.0, 343.0, 217.0, 134.0, 91.0, 64.0, 34.0, 21.0, 17.0, 11.0, 7.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.524688720703125, -2.44390869140625, -2.363128662109375, -2.2823486328125, -2.201568603515625, -2.12078857421875, -2.040008544921875, -1.959228515625, -1.878448486328125, -1.79766845703125, -1.716888427734375, -1.6361083984375, -1.555328369140625, -1.47454833984375, -1.393768310546875, -1.31298828125, -1.232208251953125, -1.15142822265625, -1.070648193359375, -0.9898681640625, -0.909088134765625, -0.82830810546875, -0.747528076171875, -0.666748046875, -0.585968017578125, -0.50518798828125, -0.424407958984375, -0.3436279296875, -0.262847900390625, -0.18206787109375, -0.101287841796875, -0.0205078125, 0.060272216796875, 0.14105224609375, 0.221832275390625, 0.3026123046875, 0.383392333984375, 0.46417236328125, 0.544952392578125, 0.625732421875, 0.706512451171875, 0.78729248046875, 0.868072509765625, 0.9488525390625, 1.029632568359375, 1.11041259765625, 1.191192626953125, 1.27197265625, 1.352752685546875, 1.43353271484375, 1.514312744140625, 1.5950927734375, 1.675872802734375, 1.75665283203125, 1.837432861328125, 1.918212890625, 1.998992919921875, 2.07977294921875, 2.160552978515625, 2.2413330078125, 2.322113037109375, 2.40289306640625, 2.483673095703125, 2.564453125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 14.0, 12.0, 16.0, 16.0, 34.0, 26.0, 34.0, 50.0, 49.0, 40.0, 62.0, 102.0, 1798.0, 326.0, 75.0, 56.0, 44.0, 54.0, 44.0, 42.0, 35.0, 23.0, 17.0, 23.0, 21.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.671875, -18.024169921875, -17.37646484375, -16.728759765625, -16.0810546875, -15.433349609375, -14.78564453125, -14.137939453125, -13.490234375, -12.842529296875, -12.19482421875, -11.547119140625, -10.8994140625, -10.251708984375, -9.60400390625, -8.956298828125, -8.30859375, -7.660888671875, -7.01318359375, -6.365478515625, -5.7177734375, -5.070068359375, -4.42236328125, -3.774658203125, -3.126953125, -2.479248046875, -1.83154296875, -1.183837890625, -0.5361328125, 0.111572265625, 0.75927734375, 1.406982421875, 2.0546875, 2.702392578125, 3.35009765625, 3.997802734375, 4.6455078125, 5.293212890625, 5.94091796875, 6.588623046875, 7.236328125, 7.884033203125, 8.53173828125, 9.179443359375, 9.8271484375, 10.474853515625, 11.12255859375, 11.770263671875, 12.41796875, 13.065673828125, 13.71337890625, 14.361083984375, 15.0087890625, 15.656494140625, 16.30419921875, 16.951904296875, 17.599609375, 18.247314453125, 18.89501953125, 19.542724609375, 20.1904296875, 20.838134765625, 21.48583984375, 22.133544921875, 22.78125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 6.0, 9.0, 10.0, 24.0, 23.0, 17.0, 32.0, 45.0, 56.0, 75.0, 138.0, 233.0, 431.0, 1525.0, 263744.0, 2875880.0, 2277.0, 533.0, 230.0, 124.0, 94.0, 47.0, 33.0, 37.0, 18.0, 17.0, 18.0, 10.0, 10.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.59375, -36.5224609375, -35.451171875, -34.3798828125, -33.30859375, -32.2373046875, -31.166015625, -30.0947265625, -29.0234375, -27.9521484375, -26.880859375, -25.8095703125, -24.73828125, -23.6669921875, -22.595703125, -21.5244140625, -20.453125, -19.3818359375, -18.310546875, -17.2392578125, -16.16796875, -15.0966796875, -14.025390625, -12.9541015625, -11.8828125, -10.8115234375, -9.740234375, -8.6689453125, -7.59765625, -6.5263671875, -5.455078125, -4.3837890625, -3.3125, -2.2412109375, -1.169921875, -0.0986328125, 0.97265625, 2.0439453125, 3.115234375, 4.1865234375, 5.2578125, 6.3291015625, 7.400390625, 8.4716796875, 9.54296875, 10.6142578125, 11.685546875, 12.7568359375, 13.828125, 14.8994140625, 15.970703125, 17.0419921875, 18.11328125, 19.1845703125, 20.255859375, 21.3271484375, 22.3984375, 23.4697265625, 24.541015625, 25.6123046875, 26.68359375, 27.7548828125, 28.826171875, 29.8974609375, 30.96875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [986.0, 31.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.918238639831543, 2.3808555603027344, 10.679949760437012, 18.979042053222656, 27.27813720703125, 35.577232360839844, 43.87632369995117, 52.175418853759766, 60.47451400756836, 68.77360534667969, 77.07270050048828, 85.37179565429688, 93.67089080810547, 101.96998596191406, 110.26907348632812, 118.56817626953125, 126.86727142333984, 135.16636657714844, 143.4654541015625, 151.76455688476562, 160.0636444091797, 168.3627471923828, 176.66183471679688, 184.9609375, 193.26002502441406, 201.55911254882812, 209.85821533203125, 218.1573028564453, 226.45640563964844, 234.7554931640625, 243.05459594726562, 251.3536834716797, 259.6528015136719, 267.951904296875, 276.2509765625, 284.5500793457031, 292.84918212890625, 301.1482849121094, 309.4473571777344, 317.7464599609375, 326.0455627441406, 334.34466552734375, 342.64373779296875, 350.9428405761719, 359.241943359375, 367.5410461425781, 375.8401184082031, 384.13922119140625, 392.43829345703125, 400.7373962402344, 409.0364685058594, 417.3355712890625, 425.6346740722656, 433.93377685546875, 442.23284912109375, 450.5319519042969, 458.8310546875, 467.1301574707031, 475.4292297363281, 483.72833251953125, 492.0274353027344, 500.3265380859375, 508.6256103515625, 516.9246826171875, 525.2238159179688]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 12.0, 16.0, 12.0, 15.0, 20.0, 21.0, 20.0, 31.0, 27.0, 22.0, 30.0, 53.0, 36.0, 44.0, 31.0, 50.0, 40.0, 39.0, 42.0, 51.0, 38.0, 46.0, 34.0, 31.0, 30.0, 39.0, 14.0, 24.0, 18.0, 22.0, 15.0, 11.0, 9.0, 7.0, 12.0, 8.0, 6.0, 9.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.399940490722656, -43.87556076049805, -42.35118103027344, -40.82680130004883, -39.30242156982422, -37.77804183959961, -36.253662109375, -34.729278564453125, -33.20490264892578, -31.680522918701172, -30.156143188476562, -28.631763458251953, -27.107383728027344, -25.583003997802734, -24.058622360229492, -22.534242630004883, -21.00986099243164, -19.48548126220703, -17.961101531982422, -16.436721801757812, -14.912341117858887, -13.387961387634277, -11.863580703735352, -10.339200973510742, -8.814821243286133, -7.290441513061523, -5.766061305999756, -4.241681098937988, -2.717301368713379, -1.1929216384887695, 0.33145904541015625, 1.8558387756347656, 3.380218505859375, 4.904598236083984, 6.428978443145752, 7.9533586502075195, 9.477738380432129, 11.002118110656738, 12.526498794555664, 14.050878524780273, 15.575258255004883, 17.099637985229492, 18.6240177154541, 20.148399353027344, 21.672779083251953, 23.197158813476562, 24.721538543701172, 26.24591827392578, 27.77029800415039, 29.294677734375, 30.81905746459961, 32.34343719482422, 33.86781692504883, 35.39219665527344, 36.91658020019531, 38.440956115722656, 39.96533966064453, 41.48971939086914, 43.01409912109375, 44.53847885131836, 46.06285858154297, 47.58723831176758, 49.11161804199219, 50.63600158691406, 52.160377502441406]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 8.0, 13.0, 11.0, 8.0, 18.0, 11.0, 16.0, 29.0, 19.0, 32.0, 24.0, 34.0, 37.0, 35.0, 39.0, 43.0, 54.0, 58.0, 35.0, 45.0, 48.0, 41.0, 31.0, 36.0, 40.0, 29.0, 29.0, 24.0, 34.0, 24.0, 24.0, 16.0, 6.0, 11.0, 7.0, 5.0, 3.0, 6.0, 4.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.734375, -4.592041015625, -4.44970703125, -4.307373046875, -4.1650390625, -4.022705078125, -3.88037109375, -3.738037109375, -3.595703125, -3.453369140625, -3.31103515625, -3.168701171875, -3.0263671875, -2.884033203125, -2.74169921875, -2.599365234375, -2.45703125, -2.314697265625, -2.17236328125, -2.030029296875, -1.8876953125, -1.745361328125, -1.60302734375, -1.460693359375, -1.318359375, -1.176025390625, -1.03369140625, -0.891357421875, -0.7490234375, -0.606689453125, -0.46435546875, -0.322021484375, -0.1796875, -0.037353515625, 0.10498046875, 0.247314453125, 0.3896484375, 0.531982421875, 0.67431640625, 0.816650390625, 0.958984375, 1.101318359375, 1.24365234375, 1.385986328125, 1.5283203125, 1.670654296875, 1.81298828125, 1.955322265625, 2.09765625, 2.239990234375, 2.38232421875, 2.524658203125, 2.6669921875, 2.809326171875, 2.95166015625, 3.093994140625, 3.236328125, 3.378662109375, 3.52099609375, 3.663330078125, 3.8056640625, 3.947998046875, 4.09033203125, 4.232666015625, 4.375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 13.0, 7.0, 8.0, 16.0, 15.0, 17.0, 18.0, 19.0, 36.0, 49.0, 56.0, 90.0, 190.0, 491.0, 1333.0, 4896.0, 21710.0, 125699.0, 1524858.0, 2279381.0, 196348.0, 29884.0, 6315.0, 1689.0, 546.0, 212.0, 98.0, 64.0, 40.0, 25.0, 42.0, 19.0, 17.0, 18.0, 12.0, 11.0, 2.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.609375, -12.2039794921875, -11.798583984375, -11.3931884765625, -10.98779296875, -10.5823974609375, -10.177001953125, -9.7716064453125, -9.3662109375, -8.9608154296875, -8.555419921875, -8.1500244140625, -7.74462890625, -7.3392333984375, -6.933837890625, -6.5284423828125, -6.123046875, -5.7176513671875, -5.312255859375, -4.9068603515625, -4.50146484375, -4.0960693359375, -3.690673828125, -3.2852783203125, -2.8798828125, -2.4744873046875, -2.069091796875, -1.6636962890625, -1.25830078125, -0.8529052734375, -0.447509765625, -0.0421142578125, 0.36328125, 0.7686767578125, 1.174072265625, 1.5794677734375, 1.98486328125, 2.3902587890625, 2.795654296875, 3.2010498046875, 3.6064453125, 4.0118408203125, 4.417236328125, 4.8226318359375, 5.22802734375, 5.6334228515625, 6.038818359375, 6.4442138671875, 6.849609375, 7.2550048828125, 7.660400390625, 8.0657958984375, 8.47119140625, 8.8765869140625, 9.281982421875, 9.6873779296875, 10.0927734375, 10.4981689453125, 10.903564453125, 11.3089599609375, 11.71435546875, 12.1197509765625, 12.525146484375, 12.9305419921875, 13.3359375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 7.0, 13.0, 23.0, 31.0, 51.0, 77.0, 117.0, 121.0, 185.0, 253.0, 380.0, 470.0, 576.0, 502.0, 389.0, 253.0, 174.0, 136.0, 96.0, 59.0, 39.0, 32.0, 19.0, 21.0, 7.0, 4.0, 2.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.4375, -13.04736328125, -12.6572265625, -12.26708984375, -11.876953125, -11.48681640625, -11.0966796875, -10.70654296875, -10.31640625, -9.92626953125, -9.5361328125, -9.14599609375, -8.755859375, -8.36572265625, -7.9755859375, -7.58544921875, -7.1953125, -6.80517578125, -6.4150390625, -6.02490234375, -5.634765625, -5.24462890625, -4.8544921875, -4.46435546875, -4.07421875, -3.68408203125, -3.2939453125, -2.90380859375, -2.513671875, -2.12353515625, -1.7333984375, -1.34326171875, -0.953125, -0.56298828125, -0.1728515625, 0.21728515625, 0.607421875, 0.99755859375, 1.3876953125, 1.77783203125, 2.16796875, 2.55810546875, 2.9482421875, 3.33837890625, 3.728515625, 4.11865234375, 4.5087890625, 4.89892578125, 5.2890625, 5.67919921875, 6.0693359375, 6.45947265625, 6.849609375, 7.23974609375, 7.6298828125, 8.02001953125, 8.41015625, 8.80029296875, 9.1904296875, 9.58056640625, 9.970703125, 10.36083984375, 10.7509765625, 11.14111328125, 11.53125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 9.0, 8.0, 14.0, 23.0, 22.0, 33.0, 54.0, 75.0, 125.0, 231.0, 351.0, 652.0, 1349.0, 3391.0, 9851.0, 36246.0, 163262.0, 1028716.0, 2443416.0, 399770.0, 77870.0, 18779.0, 5659.0, 2085.0, 949.0, 528.0, 295.0, 187.0, 99.0, 69.0, 52.0, 26.0, 14.0, 19.0, 12.0, 7.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.1917724609375, -14.672607421875, -14.1534423828125, -13.63427734375, -13.1151123046875, -12.595947265625, -12.0767822265625, -11.5576171875, -11.0384521484375, -10.519287109375, -10.0001220703125, -9.48095703125, -8.9617919921875, -8.442626953125, -7.9234619140625, -7.404296875, -6.8851318359375, -6.365966796875, -5.8468017578125, -5.32763671875, -4.8084716796875, -4.289306640625, -3.7701416015625, -3.2509765625, -2.7318115234375, -2.212646484375, -1.6934814453125, -1.17431640625, -0.6551513671875, -0.135986328125, 0.3831787109375, 0.90234375, 1.4215087890625, 1.940673828125, 2.4598388671875, 2.97900390625, 3.4981689453125, 4.017333984375, 4.5364990234375, 5.0556640625, 5.5748291015625, 6.093994140625, 6.6131591796875, 7.13232421875, 7.6514892578125, 8.170654296875, 8.6898193359375, 9.208984375, 9.7281494140625, 10.247314453125, 10.7664794921875, 11.28564453125, 11.8048095703125, 12.323974609375, 12.8431396484375, 13.3623046875, 13.8814697265625, 14.400634765625, 14.9197998046875, 15.43896484375, 15.9581298828125, 16.477294921875, 16.9964599609375, 17.515625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 16.0, 23.0, 41.0, 49.0, 87.0, 95.0, 114.0, 106.0, 127.0, 77.0, 81.0, 51.0, 41.0, 25.0, 17.0, 16.0, 10.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65876007080078, -30.797504425048828, -28.936248779296875, -27.074993133544922, -25.21373748779297, -23.352481842041016, -21.491226196289062, -19.62997055053711, -17.768714904785156, -15.907459259033203, -14.04620361328125, -12.184947967529297, -10.323692321777344, -8.462437629699707, -6.601181983947754, -4.739926338195801, -2.878671646118164, -1.0174161195755005, 0.8438394069671631, 2.705094814300537, 4.56635046005249, 6.427605628967285, 8.288861274719238, 10.150116920471191, 12.011372566223145, 13.872628211975098, 15.73388385772705, 17.595138549804688, 19.45639419555664, 21.317649841308594, 23.178905487060547, 25.0401611328125, 26.901416778564453, 28.762672424316406, 30.62392807006836, 32.48518371582031, 34.346439361572266, 36.20769500732422, 38.06895065307617, 39.930206298828125, 41.79146194458008, 43.65271759033203, 45.513973236083984, 47.37522888183594, 49.23648452758789, 51.097740173339844, 52.9589958190918, 54.82025146484375, 56.68150329589844, 58.54275894165039, 60.404014587402344, 62.2652702331543, 64.12652587890625, 65.98777770996094, 67.84903717041016, 69.71028900146484, 71.57154846191406, 73.43280029296875, 75.29405975341797, 77.15531158447266, 79.01657104492188, 80.87782287597656, 82.73908233642578, 84.60033416748047, 86.46159362792969]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 2.0, 3.0, 10.0, 11.0, 19.0, 14.0, 17.0, 17.0, 22.0, 23.0, 29.0, 36.0, 39.0, 30.0, 37.0, 34.0, 50.0, 41.0, 30.0, 52.0, 43.0, 21.0, 30.0, 38.0, 40.0, 29.0, 42.0, 32.0, 26.0, 28.0, 24.0, 27.0, 28.0, 7.0, 9.0, 11.0, 10.0, 13.0, 6.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0], "bins": [-44.38105773925781, -43.23212432861328, -42.08319091796875, -40.93425369262695, -39.78532028198242, -38.63638687133789, -37.487449645996094, -36.33851623535156, -35.18958282470703, -34.0406494140625, -32.89171600341797, -31.742778778076172, -30.59384536743164, -29.44491195678711, -28.295976638793945, -27.14704132080078, -25.99810791015625, -24.84917449951172, -23.700239181518555, -22.55130386352539, -21.40237045288086, -20.253437042236328, -19.104501724243164, -17.95556640625, -16.80663299560547, -15.657698631286621, -14.508764266967773, -13.359829902648926, -12.210895538330078, -11.06196117401123, -9.913026809692383, -8.764092445373535, -7.6151580810546875, -6.46622371673584, -5.317289352416992, -4.1683549880981445, -3.019420623779297, -1.8704862594604492, -0.7215518951416016, 0.4273824691772461, 1.5763168334960938, 2.7252511978149414, 3.874185562133789, 5.023119926452637, 6.172054290771484, 7.320988655090332, 8.46992301940918, 9.618857383728027, 10.767791748046875, 11.916726112365723, 13.06566047668457, 14.214594841003418, 15.363529205322266, 16.512462615966797, 17.66139793395996, 18.810333251953125, 19.959266662597656, 21.108200073242188, 22.25713539123535, 23.406070709228516, 24.555004119873047, 25.703937530517578, 26.852872848510742, 28.001808166503906, 29.150741577148438]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 8.0, 4.0, 5.0, 13.0, 15.0, 21.0, 21.0, 22.0, 26.0, 21.0, 27.0, 25.0, 43.0, 36.0, 36.0, 50.0, 42.0, 40.0, 51.0, 62.0, 44.0, 41.0, 30.0, 41.0, 28.0, 31.0, 39.0, 28.0, 26.0, 22.0, 23.0, 11.0, 17.0, 10.0, 6.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.31640625, -5.16583251953125, -5.0152587890625, -4.86468505859375, -4.714111328125, -4.56353759765625, -4.4129638671875, -4.26239013671875, -4.11181640625, -3.96124267578125, -3.8106689453125, -3.66009521484375, -3.509521484375, -3.35894775390625, -3.2083740234375, -3.05780029296875, -2.9072265625, -2.75665283203125, -2.6060791015625, -2.45550537109375, -2.304931640625, -2.15435791015625, -2.0037841796875, -1.85321044921875, -1.70263671875, -1.55206298828125, -1.4014892578125, -1.25091552734375, -1.100341796875, -0.94976806640625, -0.7991943359375, -0.64862060546875, -0.498046875, -0.34747314453125, -0.1968994140625, -0.04632568359375, 0.104248046875, 0.25482177734375, 0.4053955078125, 0.55596923828125, 0.70654296875, 0.85711669921875, 1.0076904296875, 1.15826416015625, 1.308837890625, 1.45941162109375, 1.6099853515625, 1.76055908203125, 1.9111328125, 2.06170654296875, 2.2122802734375, 2.36285400390625, 2.513427734375, 2.66400146484375, 2.8145751953125, 2.96514892578125, 3.11572265625, 3.26629638671875, 3.4168701171875, 3.56744384765625, 3.718017578125, 3.86859130859375, 4.0191650390625, 4.16973876953125, 4.3203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 9.0, 18.0, 22.0, 35.0, 43.0, 76.0, 113.0, 149.0, 280.0, 449.0, 624.0, 1065.0, 1685.0, 2879.0, 4892.0, 8642.0, 15116.0, 28058.0, 53788.0, 102781.0, 182174.0, 239235.0, 182507.0, 104626.0, 54287.0, 28721.0, 15493.0, 8529.0, 4794.0, 2824.0, 1807.0, 1013.0, 668.0, 401.0, 261.0, 165.0, 106.0, 68.0, 49.0, 35.0, 22.0, 15.0, 12.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183349609375, -0.17691802978515625, -0.1704864501953125, -0.16405487060546875, -0.157623291015625, -0.15119171142578125, -0.1447601318359375, -0.13832855224609375, -0.13189697265625, -0.12546539306640625, -0.1190338134765625, -0.11260223388671875, -0.106170654296875, -0.09973907470703125, -0.0933074951171875, -0.08687591552734375, -0.0804443359375, -0.07401275634765625, -0.0675811767578125, -0.06114959716796875, -0.054718017578125, -0.04828643798828125, -0.0418548583984375, -0.03542327880859375, -0.02899169921875, -0.02256011962890625, -0.0161285400390625, -0.00969696044921875, -0.003265380859375, 0.00316619873046875, 0.0095977783203125, 0.01602935791015625, 0.0224609375, 0.02889251708984375, 0.0353240966796875, 0.04175567626953125, 0.048187255859375, 0.05461883544921875, 0.0610504150390625, 0.06748199462890625, 0.07391357421875, 0.08034515380859375, 0.0867767333984375, 0.09320831298828125, 0.099639892578125, 0.10607147216796875, 0.1125030517578125, 0.11893463134765625, 0.1253662109375, 0.13179779052734375, 0.1382293701171875, 0.14466094970703125, 0.151092529296875, 0.15752410888671875, 0.1639556884765625, 0.17038726806640625, 0.17681884765625, 0.18325042724609375, 0.1896820068359375, 0.19611358642578125, 0.202545166015625, 0.20897674560546875, 0.2154083251953125, 0.22183990478515625, 0.228271484375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 11.0, 6.0, 6.0, 10.0, 7.0, 9.0, 9.0, 15.0, 15.0, 14.0, 19.0, 18.0, 24.0, 21.0, 29.0, 32.0, 30.0, 32.0, 27.0, 45.0, 31.0, 27.0, 43.0, 1066.0, 33.0, 34.0, 43.0, 47.0, 27.0, 44.0, 33.0, 26.0, 36.0, 26.0, 19.0, 20.0, 15.0, 12.0, 13.0, 17.0, 7.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.865234375, -2.77978515625, -2.6943359375, -2.60888671875, -2.5234375, -2.43798828125, -2.3525390625, -2.26708984375, -2.181640625, -2.09619140625, -2.0107421875, -1.92529296875, -1.83984375, -1.75439453125, -1.6689453125, -1.58349609375, -1.498046875, -1.41259765625, -1.3271484375, -1.24169921875, -1.15625, -1.07080078125, -0.9853515625, -0.89990234375, -0.814453125, -0.72900390625, -0.6435546875, -0.55810546875, -0.47265625, -0.38720703125, -0.3017578125, -0.21630859375, -0.130859375, -0.04541015625, 0.0400390625, 0.12548828125, 0.2109375, 0.29638671875, 0.3818359375, 0.46728515625, 0.552734375, 0.63818359375, 0.7236328125, 0.80908203125, 0.89453125, 0.97998046875, 1.0654296875, 1.15087890625, 1.236328125, 1.32177734375, 1.4072265625, 1.49267578125, 1.578125, 1.66357421875, 1.7490234375, 1.83447265625, 1.919921875, 2.00537109375, 2.0908203125, 2.17626953125, 2.26171875, 2.34716796875, 2.4326171875, 2.51806640625, 2.603515625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 2.0, 7.0, 18.0, 16.0, 34.0, 58.0, 91.0, 144.0, 207.0, 345.0, 454.0, 729.0, 1016.0, 1514.0, 2221.0, 3261.0, 4775.0, 7075.0, 10824.0, 16616.0, 26027.0, 42009.0, 68650.0, 109393.0, 156406.0, 1225227.0, 148156.0, 100524.0, 62691.0, 38743.0, 24117.0, 15391.0, 9978.0, 6722.0, 4370.0, 2959.0, 2086.0, 1427.0, 925.0, 672.0, 420.0, 309.0, 197.0, 122.0, 83.0, 53.0, 29.0, 15.0, 16.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.1575164794921875, -0.152801513671875, -0.1480865478515625, -0.14337158203125, -0.1386566162109375, -0.133941650390625, -0.1292266845703125, -0.12451171875, -0.1197967529296875, -0.115081787109375, -0.1103668212890625, -0.10565185546875, -0.1009368896484375, -0.096221923828125, -0.0915069580078125, -0.0867919921875, -0.0820770263671875, -0.077362060546875, -0.0726470947265625, -0.06793212890625, -0.0632171630859375, -0.058502197265625, -0.0537872314453125, -0.049072265625, -0.0443572998046875, -0.039642333984375, -0.0349273681640625, -0.03021240234375, -0.0254974365234375, -0.020782470703125, -0.0160675048828125, -0.0113525390625, -0.0066375732421875, -0.001922607421875, 0.0027923583984375, 0.00750732421875, 0.0122222900390625, 0.016937255859375, 0.0216522216796875, 0.0263671875, 0.0310821533203125, 0.035797119140625, 0.0405120849609375, 0.04522705078125, 0.0499420166015625, 0.054656982421875, 0.0593719482421875, 0.0640869140625, 0.0688018798828125, 0.073516845703125, 0.0782318115234375, 0.08294677734375, 0.0876617431640625, 0.092376708984375, 0.0970916748046875, 0.101806640625, 0.1065216064453125, 0.111236572265625, 0.1159515380859375, 0.12066650390625, 0.1253814697265625, 0.130096435546875, 0.1348114013671875, 0.1395263671875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 17.0, 11.0, 10.0, 16.0, 18.0, 29.0, 32.0, 16.0, 26.0, 47.0, 48.0, 43.0, 43.0, 63.0, 58.0, 52.0, 55.0, 54.0, 39.0, 58.0, 42.0, 33.0, 33.0, 21.0, 25.0, 16.0, 11.0, 12.0, 7.0, 6.0, 6.0, 2.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007658004760742188, -0.0007423609495162964, -0.000718921422958374, -0.0006954818964004517, -0.0006720423698425293, -0.0006486028432846069, -0.0006251633167266846, -0.0006017237901687622, -0.0005782842636108398, -0.0005548447370529175, -0.0005314052104949951, -0.0005079656839370728, -0.0004845261573791504, -0.00046108663082122803, -0.00043764710426330566, -0.0004142075777053833, -0.00039076805114746094, -0.0003673285245895386, -0.0003438889980316162, -0.00032044947147369385, -0.0002970099449157715, -0.0002735704183578491, -0.00025013089179992676, -0.0002266913652420044, -0.00020325183868408203, -0.00017981231212615967, -0.0001563727855682373, -0.00013293325901031494, -0.00010949373245239258, -8.605420589447021e-05, -6.261467933654785e-05, -3.917515277862549e-05, -1.5735626220703125e-05, 7.703900337219238e-06, 3.11434268951416e-05, 5.4582953453063965e-05, 7.802248001098633e-05, 0.00010146200656890869, 0.00012490153312683105, 0.00014834105968475342, 0.00017178058624267578, 0.00019522011280059814, 0.0002186596393585205, 0.00024209916591644287, 0.00026553869247436523, 0.0002889782190322876, 0.00031241774559020996, 0.0003358572721481323, 0.0003592967987060547, 0.00038273632526397705, 0.0004061758518218994, 0.0004296153783798218, 0.00045305490493774414, 0.0004764944314956665, 0.0004999339580535889, 0.0005233734846115112, 0.0005468130111694336, 0.000570252537727356, 0.0005936920642852783, 0.0006171315908432007, 0.000640571117401123, 0.0006640106439590454, 0.0006874501705169678, 0.0007108896970748901, 0.0007343292236328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 10.0, 10.0, 8.0, 16.0, 16.0, 22.0, 43.0, 33.0, 59.0, 74.0, 84.0, 157.0, 201.0, 314.0, 515.0, 2866.0, 225090.0, 806103.0, 10921.0, 774.0, 381.0, 230.0, 161.0, 94.0, 77.0, 65.0, 39.0, 38.0, 35.0, 21.0, 21.0, 15.0, 12.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.01200103759765625, -0.011616230010986328, -0.011231422424316406, -0.010846614837646484, -0.010461807250976562, -0.01007699966430664, -0.009692192077636719, -0.009307384490966797, -0.008922576904296875, -0.008537769317626953, -0.008152961730957031, -0.007768154144287109, -0.0073833465576171875, -0.006998538970947266, -0.006613731384277344, -0.006228923797607422, -0.0058441162109375, -0.005459308624267578, -0.005074501037597656, -0.004689693450927734, -0.0043048858642578125, -0.003920078277587891, -0.0035352706909179688, -0.003150463104248047, -0.002765655517578125, -0.002380847930908203, -0.0019960403442382812, -0.0016112327575683594, -0.0012264251708984375, -0.0008416175842285156, -0.00045680999755859375, -7.200241088867188e-05, 0.00031280517578125, 0.0006976127624511719, 0.0010824203491210938, 0.0014672279357910156, 0.0018520355224609375, 0.0022368431091308594, 0.0026216506958007812, 0.003006458282470703, 0.003391265869140625, 0.003776073455810547, 0.004160881042480469, 0.004545688629150391, 0.0049304962158203125, 0.005315303802490234, 0.005700111389160156, 0.006084918975830078, 0.0064697265625, 0.006854534149169922, 0.007239341735839844, 0.007624149322509766, 0.008008956909179688, 0.00839376449584961, 0.008778572082519531, 0.009163379669189453, 0.009548187255859375, 0.009932994842529297, 0.010317802429199219, 0.01070261001586914, 0.011087417602539062, 0.011472225189208984, 0.011857032775878906, 0.012241840362548828, 0.01262664794921875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 19.0, 59.0, 127.0, 235.0, 257.0, 158.0, 95.0, 31.0, 14.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0022775267716497183, -0.002234741346910596, -0.0021919559221714735, -0.002149170497432351, -0.0021063850726932287, -0.00206359988078475, -0.0020208144560456276, -0.001978029031306505, -0.0019352436065673828, -0.0018924581818282604, -0.001849672757089138, -0.0018068874487653375, -0.001764102024026215, -0.0017213165992870927, -0.0016785311745479703, -0.0016357458662241697, -0.0015929604414850473, -0.001550175016745925, -0.0015073895920068026, -0.001464604283683002, -0.0014218188589438796, -0.0013790334342047572, -0.0013362480094656348, -0.0012934627011418343, -0.00125067715998739, -0.0012078917352482677, -0.0011651063105091453, -0.0011223210021853447, -0.0010795355774462223, -0.0010367501527071, -0.0009939647279679775, -0.000951179361436516, -0.0009083939366973937, -0.0008656085119582713, -0.0008228231454268098, -0.0007800377206876874, -0.0007372523541562259, -0.0006944669294171035, -0.000651681562885642, -0.0006088961381465197, -0.0005661107134073973, -0.0005233252886682749, -0.0004805399221368134, -0.000437754497397691, -0.00039496913086622953, -0.00035218370612710714, -0.0003093983104918152, -0.0002666129148565233, -0.0002238275483250618, -0.00018104215268976986, -0.00013825675705447793, -9.547134686727077e-05, -5.2685951231978834e-05, -9.9005555966869e-06, 3.288485459052026e-05, 7.56702502258122e-05, 0.00011845564586110413, 0.00016124104149639606, 0.000204026437131688, 0.00024681183276697993, 0.0002895972575061023, 0.0003323826240375638, 0.0003751680487766862, 0.0004179534444119781, 0.00046073884004727006]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 10.0, 7.0, 14.0, 9.0, 16.0, 18.0, 13.0, 15.0, 25.0, 18.0, 25.0, 25.0, 24.0, 31.0, 28.0, 33.0, 44.0, 40.0, 25.0, 28.0, 38.0, 47.0, 39.0, 32.0, 33.0, 43.0, 34.0, 38.0, 30.0, 35.0, 20.0, 23.0, 21.0, 12.0, 23.0, 18.0, 14.0, 4.0, 7.0, 9.0, 7.0, 6.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0003566145896911621, -0.0003436431288719177, -0.00033067166805267334, -0.00031770020723342896, -0.00030472874641418457, -0.0002917572855949402, -0.0002787858247756958, -0.0002658143639564514, -0.00025284290313720703, -0.00023987144231796265, -0.00022689998149871826, -0.00021392852067947388, -0.0002009570598602295, -0.0001879855990409851, -0.00017501413822174072, -0.00016204267740249634, -0.00014907121658325195, -0.00013609975576400757, -0.00012312829494476318, -0.0001101568341255188, -9.718537330627441e-05, -8.421391248703003e-05, -7.124245166778564e-05, -5.827099084854126e-05, -4.5299530029296875e-05, -3.232806921005249e-05, -1.9356608390808105e-05, -6.385147571563721e-06, 6.586313247680664e-06, 1.955777406692505e-05, 3.2529234886169434e-05, 4.550069570541382e-05, 5.84721565246582e-05, 7.144361734390259e-05, 8.441507816314697e-05, 9.738653898239136e-05, 0.00011035799980163574, 0.00012332946062088013, 0.0001363009214401245, 0.0001492723822593689, 0.00016224384307861328, 0.00017521530389785767, 0.00018818676471710205, 0.00020115822553634644, 0.00021412968635559082, 0.0002271011471748352, 0.0002400726079940796, 0.000253044068813324, 0.00026601552963256836, 0.00027898699045181274, 0.00029195845127105713, 0.0003049299120903015, 0.0003179013729095459, 0.0003308728337287903, 0.00034384429454803467, 0.00035681575536727905, 0.00036978721618652344, 0.0003827586770057678, 0.0003957301378250122, 0.0004087015986442566, 0.000421673059463501, 0.00043464452028274536, 0.00044761598110198975, 0.00046058744192123413, 0.0004735589027404785]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 8.0, 4.0, 5.0, 13.0, 15.0, 21.0, 21.0, 22.0, 26.0, 21.0, 27.0, 25.0, 43.0, 36.0, 36.0, 50.0, 42.0, 41.0, 50.0, 62.0, 44.0, 41.0, 30.0, 41.0, 28.0, 31.0, 39.0, 28.0, 26.0, 22.0, 23.0, 11.0, 17.0, 10.0, 6.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.31640625, -5.16583251953125, -5.0152587890625, -4.86468505859375, -4.714111328125, -4.56353759765625, -4.4129638671875, -4.26239013671875, -4.11181640625, -3.96124267578125, -3.8106689453125, -3.66009521484375, -3.509521484375, -3.35894775390625, -3.2083740234375, -3.05780029296875, -2.9072265625, -2.75665283203125, -2.6060791015625, -2.45550537109375, -2.304931640625, -2.15435791015625, -2.0037841796875, -1.85321044921875, -1.70263671875, -1.55206298828125, -1.4014892578125, -1.25091552734375, -1.100341796875, -0.94976806640625, -0.7991943359375, -0.64862060546875, -0.498046875, -0.34747314453125, -0.1968994140625, -0.04632568359375, 0.104248046875, 0.25482177734375, 0.4053955078125, 0.55596923828125, 0.70654296875, 0.85711669921875, 1.0076904296875, 1.15826416015625, 1.308837890625, 1.45941162109375, 1.6099853515625, 1.76055908203125, 1.9111328125, 2.06170654296875, 2.2122802734375, 2.36285400390625, 2.513427734375, 2.66400146484375, 2.8145751953125, 2.96514892578125, 3.11572265625, 3.26629638671875, 3.4168701171875, 3.56744384765625, 3.718017578125, 3.86859130859375, 4.0191650390625, 4.16973876953125, 4.3203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 9.0, 8.0, 9.0, 15.0, 24.0, 29.0, 28.0, 62.0, 74.0, 93.0, 137.0, 173.0, 212.0, 283.0, 432.0, 580.0, 840.0, 1141.0, 1675.0, 2411.0, 3670.0, 5656.0, 9421.0, 17765.0, 40749.0, 117963.0, 431498.0, 271993.0, 76256.0, 28828.0, 13780.0, 7804.0, 4685.0, 3034.0, 2012.0, 1414.0, 1052.0, 697.0, 532.0, 380.0, 300.0, 212.0, 155.0, 115.0, 83.0, 70.0, 57.0, 38.0, 20.0, 21.0, 16.0, 14.0, 11.0, 11.0, 4.0, 5.0, 1.0, 2.0], "bins": [-3.912109375, -3.792877197265625, -3.67364501953125, -3.554412841796875, -3.4351806640625, -3.315948486328125, -3.19671630859375, -3.077484130859375, -2.958251953125, -2.839019775390625, -2.71978759765625, -2.600555419921875, -2.4813232421875, -2.362091064453125, -2.24285888671875, -2.123626708984375, -2.00439453125, -1.885162353515625, -1.76593017578125, -1.646697998046875, -1.5274658203125, -1.408233642578125, -1.28900146484375, -1.169769287109375, -1.050537109375, -0.931304931640625, -0.81207275390625, -0.692840576171875, -0.5736083984375, -0.454376220703125, -0.33514404296875, -0.215911865234375, -0.0966796875, 0.022552490234375, 0.14178466796875, 0.261016845703125, 0.3802490234375, 0.499481201171875, 0.61871337890625, 0.737945556640625, 0.857177734375, 0.976409912109375, 1.09564208984375, 1.214874267578125, 1.3341064453125, 1.453338623046875, 1.57257080078125, 1.691802978515625, 1.81103515625, 1.930267333984375, 2.04949951171875, 2.168731689453125, 2.2879638671875, 2.407196044921875, 2.52642822265625, 2.645660400390625, 2.764892578125, 2.884124755859375, 3.00335693359375, 3.122589111328125, 3.2418212890625, 3.361053466796875, 3.48028564453125, 3.599517822265625, 3.71875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 16.0, 7.0, 7.0, 19.0, 18.0, 18.0, 22.0, 26.0, 21.0, 28.0, 42.0, 42.0, 38.0, 63.0, 60.0, 85.0, 167.0, 1589.0, 198.0, 87.0, 63.0, 51.0, 46.0, 48.0, 38.0, 33.0, 24.0, 21.0, 18.0, 21.0, 20.0, 12.0, 12.0, 12.0, 8.0, 11.0, 15.0, 3.0, 6.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.78125, -14.312744140625, -13.84423828125, -13.375732421875, -12.9072265625, -12.438720703125, -11.97021484375, -11.501708984375, -11.033203125, -10.564697265625, -10.09619140625, -9.627685546875, -9.1591796875, -8.690673828125, -8.22216796875, -7.753662109375, -7.28515625, -6.816650390625, -6.34814453125, -5.879638671875, -5.4111328125, -4.942626953125, -4.47412109375, -4.005615234375, -3.537109375, -3.068603515625, -2.60009765625, -2.131591796875, -1.6630859375, -1.194580078125, -0.72607421875, -0.257568359375, 0.2109375, 0.679443359375, 1.14794921875, 1.616455078125, 2.0849609375, 2.553466796875, 3.02197265625, 3.490478515625, 3.958984375, 4.427490234375, 4.89599609375, 5.364501953125, 5.8330078125, 6.301513671875, 6.77001953125, 7.238525390625, 7.70703125, 8.175537109375, 8.64404296875, 9.112548828125, 9.5810546875, 10.049560546875, 10.51806640625, 10.986572265625, 11.455078125, 11.923583984375, 12.39208984375, 12.860595703125, 13.3291015625, 13.797607421875, 14.26611328125, 14.734619140625, 15.203125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 11.0, 7.0, 17.0, 17.0, 22.0, 25.0, 48.0, 61.0, 80.0, 145.0, 254.0, 567.0, 2438.0, 47666.0, 3069659.0, 21855.0, 1717.0, 483.0, 246.0, 115.0, 68.0, 54.0, 51.0, 22.0, 27.0, 13.0, 9.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.376953125, -39.00390625, -37.630859375, -36.2578125, -34.884765625, -33.51171875, -32.138671875, -30.765625, -29.392578125, -28.01953125, -26.646484375, -25.2734375, -23.900390625, -22.52734375, -21.154296875, -19.78125, -18.408203125, -17.03515625, -15.662109375, -14.2890625, -12.916015625, -11.54296875, -10.169921875, -8.796875, -7.423828125, -6.05078125, -4.677734375, -3.3046875, -1.931640625, -0.55859375, 0.814453125, 2.1875, 3.560546875, 4.93359375, 6.306640625, 7.6796875, 9.052734375, 10.42578125, 11.798828125, 13.171875, 14.544921875, 15.91796875, 17.291015625, 18.6640625, 20.037109375, 21.41015625, 22.783203125, 24.15625, 25.529296875, 26.90234375, 28.275390625, 29.6484375, 31.021484375, 32.39453125, 33.767578125, 35.140625, 36.513671875, 37.88671875, 39.259765625, 40.6328125, 42.005859375, 43.37890625, 44.751953125, 46.125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 60.0, 746.0, 202.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.9249210357666, -25.482179641723633, -20.039438247680664, -14.596696853637695, -9.153955459594727, -3.711214065551758, 1.731527328491211, 7.17426872253418, 12.617010116577148, 18.059751510620117, 23.502492904663086, 28.945234298706055, 34.387977600097656, 39.830718994140625, 45.273460388183594, 50.71620178222656, 56.15894317626953, 61.6016845703125, 67.04442596435547, 72.48716735839844, 77.9299087524414, 83.37265014648438, 88.81539154052734, 94.25813293457031, 99.70087432861328, 105.14361572265625, 110.58635711669922, 116.02909851074219, 121.47183990478516, 126.91458129882812, 132.35733032226562, 137.80006408691406, 143.2427978515625, 148.685546875, 154.12828063964844, 159.57101440429688, 165.01376342773438, 170.45651245117188, 175.8992462158203, 181.34197998046875, 186.78472900390625, 192.22747802734375, 197.6702117919922, 203.11294555664062, 208.55569458007812, 213.99844360351562, 219.44117736816406, 224.8839111328125, 230.32666015625, 235.7694091796875, 241.21214294433594, 246.65487670898438, 252.09762573242188, 257.5403747558594, 262.98309326171875, 268.42584228515625, 273.86859130859375, 279.31134033203125, 284.75408935546875, 290.1968078613281, 295.6395568847656, 301.0823059082031, 306.5250244140625, 311.9677734375, 317.4105224609375]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 2.0, 2.0, 6.0, 7.0, 6.0, 12.0, 14.0, 12.0, 13.0, 16.0, 22.0, 18.0, 30.0, 19.0, 33.0, 35.0, 34.0, 39.0, 34.0, 42.0, 50.0, 31.0, 45.0, 36.0, 44.0, 24.0, 49.0, 42.0, 36.0, 35.0, 34.0, 28.0, 16.0, 25.0, 13.0, 15.0, 14.0, 13.0, 13.0, 7.0, 6.0, 8.0, 10.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.25762176513672, -42.87405776977539, -41.49049758911133, -40.10693359375, -38.72337341308594, -37.33980941772461, -35.95624542236328, -34.57268524169922, -33.189125061035156, -31.80556297302246, -30.422000885009766, -29.038436889648438, -27.654876708984375, -26.271312713623047, -24.88775062561035, -23.504188537597656, -22.120624542236328, -20.737062454223633, -19.353500366210938, -17.96993637084961, -16.586376190185547, -15.202813148498535, -13.819250106811523, -12.435688018798828, -11.052125930786133, -9.668563842773438, -8.285001754760742, -6.9014387130737305, -5.517876625061035, -4.13431453704834, -2.750751495361328, -1.3671894073486328, 0.0163726806640625, 1.399935007095337, 2.7834973335266113, 4.167059898376465, 5.55062198638916, 6.9341840744018555, 8.317747116088867, 9.701309204101562, 11.084871292114258, 12.468433380126953, 13.851995468139648, 15.23555850982666, 16.619121551513672, 18.002681732177734, 19.386245727539062, 20.769807815551758, 22.153369903564453, 23.53693199157715, 24.920494079589844, 26.304058074951172, 27.687618255615234, 29.071182250976562, 30.454744338989258, 31.838306427001953, 33.22187042236328, 34.60543441772461, 35.98899459838867, 37.37255859375, 38.75611877441406, 40.13968276977539, 41.52324676513672, 42.90680694580078, 44.290367126464844]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 4.0, 4.0, 8.0, 12.0, 13.0, 22.0, 16.0, 16.0, 30.0, 19.0, 33.0, 37.0, 42.0, 37.0, 44.0, 47.0, 54.0, 42.0, 49.0, 45.0, 49.0, 47.0, 28.0, 41.0, 42.0, 31.0, 29.0, 29.0, 24.0, 20.0, 18.0, 13.0, 14.0, 6.0, 8.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.66796875, -5.50616455078125, -5.3443603515625, -5.18255615234375, -5.020751953125, -4.85894775390625, -4.6971435546875, -4.53533935546875, -4.37353515625, -4.21173095703125, -4.0499267578125, -3.88812255859375, -3.726318359375, -3.56451416015625, -3.4027099609375, -3.24090576171875, -3.0791015625, -2.91729736328125, -2.7554931640625, -2.59368896484375, -2.431884765625, -2.27008056640625, -2.1082763671875, -1.94647216796875, -1.78466796875, -1.62286376953125, -1.4610595703125, -1.29925537109375, -1.137451171875, -0.97564697265625, -0.8138427734375, -0.65203857421875, -0.490234375, -0.32843017578125, -0.1666259765625, -0.00482177734375, 0.156982421875, 0.31878662109375, 0.4805908203125, 0.64239501953125, 0.80419921875, 0.96600341796875, 1.1278076171875, 1.28961181640625, 1.451416015625, 1.61322021484375, 1.7750244140625, 1.93682861328125, 2.0986328125, 2.26043701171875, 2.4222412109375, 2.58404541015625, 2.745849609375, 2.90765380859375, 3.0694580078125, 3.23126220703125, 3.39306640625, 3.55487060546875, 3.7166748046875, 3.87847900390625, 4.040283203125, 4.20208740234375, 4.3638916015625, 4.52569580078125, 4.6875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 14.0, 14.0, 22.0, 23.0, 39.0, 57.0, 86.0, 122.0, 224.0, 361.0, 582.0, 971.0, 1676.0, 3203.0, 5639.0, 10638.0, 21598.0, 46006.0, 114560.0, 363910.0, 1140758.0, 1517211.0, 643523.0, 192558.0, 69624.0, 30076.0, 14292.0, 7349.0, 3905.0, 2136.0, 1244.0, 710.0, 440.0, 237.0, 154.0, 123.0, 55.0, 50.0, 37.0, 14.0, 13.0, 5.0, 8.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.37109375, -5.19342041015625, -5.0157470703125, -4.83807373046875, -4.660400390625, -4.48272705078125, -4.3050537109375, -4.12738037109375, -3.94970703125, -3.77203369140625, -3.5943603515625, -3.41668701171875, -3.239013671875, -3.06134033203125, -2.8836669921875, -2.70599365234375, -2.5283203125, -2.35064697265625, -2.1729736328125, -1.99530029296875, -1.817626953125, -1.63995361328125, -1.4622802734375, -1.28460693359375, -1.10693359375, -0.92926025390625, -0.7515869140625, -0.57391357421875, -0.396240234375, -0.21856689453125, -0.0408935546875, 0.13677978515625, 0.314453125, 0.49212646484375, 0.6697998046875, 0.84747314453125, 1.025146484375, 1.20281982421875, 1.3804931640625, 1.55816650390625, 1.73583984375, 1.91351318359375, 2.0911865234375, 2.26885986328125, 2.446533203125, 2.62420654296875, 2.8018798828125, 2.97955322265625, 3.1572265625, 3.33489990234375, 3.5125732421875, 3.69024658203125, 3.867919921875, 4.04559326171875, 4.2232666015625, 4.40093994140625, 4.57861328125, 4.75628662109375, 4.9339599609375, 5.11163330078125, 5.289306640625, 5.46697998046875, 5.6446533203125, 5.82232666015625, 6.0]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 9.0, 12.0, 12.0, 28.0, 44.0, 57.0, 89.0, 128.0, 177.0, 282.0, 399.0, 540.0, 632.0, 521.0, 372.0, 252.0, 150.0, 118.0, 87.0, 45.0, 28.0, 24.0, 24.0, 13.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.6141357421875, -17.165771484375, -16.7174072265625, -16.26904296875, -15.8206787109375, -15.372314453125, -14.9239501953125, -14.4755859375, -14.0272216796875, -13.578857421875, -13.1304931640625, -12.68212890625, -12.2337646484375, -11.785400390625, -11.3370361328125, -10.888671875, -10.4403076171875, -9.991943359375, -9.5435791015625, -9.09521484375, -8.6468505859375, -8.198486328125, -7.7501220703125, -7.3017578125, -6.8533935546875, -6.405029296875, -5.9566650390625, -5.50830078125, -5.0599365234375, -4.611572265625, -4.1632080078125, -3.71484375, -3.2664794921875, -2.818115234375, -2.3697509765625, -1.92138671875, -1.4730224609375, -1.024658203125, -0.5762939453125, -0.1279296875, 0.3204345703125, 0.768798828125, 1.2171630859375, 1.66552734375, 2.1138916015625, 2.562255859375, 3.0106201171875, 3.458984375, 3.9073486328125, 4.355712890625, 4.8040771484375, 5.25244140625, 5.7008056640625, 6.149169921875, 6.5975341796875, 7.0458984375, 7.4942626953125, 7.942626953125, 8.3909912109375, 8.83935546875, 9.2877197265625, 9.736083984375, 10.1844482421875, 10.6328125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 3.0, 8.0, 22.0, 25.0, 40.0, 54.0, 85.0, 138.0, 233.0, 387.0, 908.0, 2220.0, 8374.0, 41256.0, 271784.0, 2644877.0, 1080675.0, 115611.0, 20146.0, 4659.0, 1427.0, 562.0, 293.0, 178.0, 113.0, 67.0, 40.0, 31.0, 21.0, 14.0, 11.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -14.9007568359375, -14.246826171875, -13.5928955078125, -12.93896484375, -12.2850341796875, -11.631103515625, -10.9771728515625, -10.3232421875, -9.6693115234375, -9.015380859375, -8.3614501953125, -7.70751953125, -7.0535888671875, -6.399658203125, -5.7457275390625, -5.091796875, -4.4378662109375, -3.783935546875, -3.1300048828125, -2.47607421875, -1.8221435546875, -1.168212890625, -0.5142822265625, 0.1396484375, 0.7935791015625, 1.447509765625, 2.1014404296875, 2.75537109375, 3.4093017578125, 4.063232421875, 4.7171630859375, 5.37109375, 6.0250244140625, 6.678955078125, 7.3328857421875, 7.98681640625, 8.6407470703125, 9.294677734375, 9.9486083984375, 10.6025390625, 11.2564697265625, 11.910400390625, 12.5643310546875, 13.21826171875, 13.8721923828125, 14.526123046875, 15.1800537109375, 15.833984375, 16.4879150390625, 17.141845703125, 17.7957763671875, 18.44970703125, 19.1036376953125, 19.757568359375, 20.4114990234375, 21.0654296875, 21.7193603515625, 22.373291015625, 23.0272216796875, 23.68115234375, 24.3350830078125, 24.989013671875, 25.6429443359375, 26.296875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 25.0, 49.0, 110.0, 164.0, 196.0, 175.0, 160.0, 74.0, 30.0, 18.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.703857421875, -172.17605590820312, -168.6482696533203, -165.12046813964844, -161.59266662597656, -158.06488037109375, -154.53707885742188, -151.00927734375, -147.4814910888672, -143.9536895751953, -140.4259033203125, -136.89810180664062, -133.37030029296875, -129.84251403808594, -126.31471252441406, -122.78691101074219, -119.25910949707031, -115.73131561279297, -112.2035140991211, -108.67572021484375, -105.1479263305664, -101.62012481689453, -98.09233093261719, -94.56452941894531, -91.0367431640625, -87.50894927978516, -83.98114776611328, -80.45335388183594, -76.9255599975586, -73.39775848388672, -69.86996459960938, -66.3421630859375, -62.814369201660156, -59.28657150268555, -55.7587776184082, -52.230979919433594, -48.703182220458984, -45.175384521484375, -41.64759063720703, -38.11979293823242, -34.59199523925781, -31.064199447631836, -27.536401748657227, -24.00860595703125, -20.48080825805664, -16.953012466430664, -13.425216674804688, -9.897418975830078, -6.369625091552734, -2.8418285846710205, 0.6859679222106934, 4.213764190673828, 7.741560935974121, 11.269357681274414, 14.79715347290039, 18.324951171875, 21.852746963500977, 25.380542755126953, 28.908340454101562, 32.436134338378906, 35.963932037353516, 39.491729736328125, 43.01952362060547, 46.547325134277344, 50.07511901855469]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 8.0, 13.0, 14.0, 11.0, 11.0, 23.0, 29.0, 29.0, 34.0, 24.0, 33.0, 44.0, 43.0, 37.0, 37.0, 45.0, 47.0, 51.0, 54.0, 42.0, 41.0, 51.0, 34.0, 39.0, 36.0, 25.0, 24.0, 26.0, 22.0, 16.0, 9.0, 8.0, 11.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.245849609375, -47.93264389038086, -46.61943435668945, -45.30622863769531, -43.99302291870117, -42.67981719970703, -41.366607666015625, -40.053401947021484, -38.740196228027344, -37.4269905090332, -36.1137809753418, -34.800575256347656, -33.487369537353516, -32.174163818359375, -30.86095428466797, -29.547748565673828, -28.234540939331055, -26.92133331298828, -25.60812759399414, -24.294919967651367, -22.981714248657227, -21.668506622314453, -20.355300903320312, -19.04209327697754, -17.728885650634766, -16.415678024291992, -15.102472305297852, -13.789264678955078, -12.476058959960938, -11.162851333618164, -9.849644660949707, -8.53643798828125, -7.223232269287109, -5.910025596618652, -4.596818923950195, -3.28361177444458, -1.970405101776123, -0.657198429107666, 0.6560087203979492, 1.9692153930664062, 3.2824220657348633, 4.59562873840332, 5.908835411071777, 7.222042560577393, 8.535249710083008, 9.848455429077148, 11.161663055419922, 12.474869728088379, 13.788076400756836, 15.101283073425293, 16.41448974609375, 17.727697372436523, 19.040903091430664, 20.354110717773438, 21.667316436767578, 22.98052406311035, 24.293731689453125, 25.6069393157959, 26.92014503479004, 28.233352661132812, 29.546558380126953, 30.859766006469727, 32.1729736328125, 33.48617935180664, 34.79938507080078]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 6.0, 15.0, 14.0, 15.0, 18.0, 16.0, 20.0, 26.0, 23.0, 33.0, 48.0, 31.0, 38.0, 32.0, 46.0, 39.0, 53.0, 43.0, 49.0, 40.0, 52.0, 30.0, 38.0, 27.0, 31.0, 29.0, 33.0, 22.0, 29.0, 18.0, 13.0, 12.0, 13.0, 9.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.43359375, -5.27459716796875, -5.1156005859375, -4.95660400390625, -4.797607421875, -4.63861083984375, -4.4796142578125, -4.32061767578125, -4.16162109375, -4.00262451171875, -3.8436279296875, -3.68463134765625, -3.525634765625, -3.36663818359375, -3.2076416015625, -3.04864501953125, -2.8896484375, -2.73065185546875, -2.5716552734375, -2.41265869140625, -2.253662109375, -2.09466552734375, -1.9356689453125, -1.77667236328125, -1.61767578125, -1.45867919921875, -1.2996826171875, -1.14068603515625, -0.981689453125, -0.82269287109375, -0.6636962890625, -0.50469970703125, -0.345703125, -0.18670654296875, -0.0277099609375, 0.13128662109375, 0.290283203125, 0.44927978515625, 0.6082763671875, 0.76727294921875, 0.92626953125, 1.08526611328125, 1.2442626953125, 1.40325927734375, 1.562255859375, 1.72125244140625, 1.8802490234375, 2.03924560546875, 2.1982421875, 2.35723876953125, 2.5162353515625, 2.67523193359375, 2.834228515625, 2.99322509765625, 3.1522216796875, 3.31121826171875, 3.47021484375, 3.62921142578125, 3.7882080078125, 3.94720458984375, 4.106201171875, 4.26519775390625, 4.4241943359375, 4.58319091796875, 4.7421875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 12.0, 12.0, 25.0, 28.0, 49.0, 81.0, 129.0, 158.0, 253.0, 417.0, 588.0, 1008.0, 1487.0, 2348.0, 3630.0, 5779.0, 9039.0, 14882.0, 24656.0, 40857.0, 70548.0, 119813.0, 184339.0, 204669.0, 145408.0, 88125.0, 51291.0, 30233.0, 18434.0, 11192.0, 6929.0, 4313.0, 2805.0, 1744.0, 1177.0, 718.0, 433.0, 323.0, 221.0, 144.0, 88.0, 57.0, 33.0, 27.0, 16.0, 14.0, 11.0, 1.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.183837890625, -0.1777515411376953, -0.17166519165039062, -0.16557884216308594, -0.15949249267578125, -0.15340614318847656, -0.14731979370117188, -0.1412334442138672, -0.1351470947265625, -0.1290607452392578, -0.12297439575195312, -0.11688804626464844, -0.11080169677734375, -0.10471534729003906, -0.09862899780273438, -0.09254264831542969, -0.086456298828125, -0.08036994934082031, -0.07428359985351562, -0.06819725036621094, -0.06211090087890625, -0.05602455139160156, -0.049938201904296875, -0.04385185241699219, -0.0377655029296875, -0.03167915344238281, -0.025592803955078125, -0.019506454467773438, -0.01342010498046875, -0.0073337554931640625, -0.001247406005859375, 0.0048389434814453125, 0.01092529296875, 0.017011642456054688, 0.023097991943359375, 0.029184341430664062, 0.03527069091796875, 0.04135704040527344, 0.047443389892578125, 0.05352973937988281, 0.0596160888671875, 0.06570243835449219, 0.07178878784179688, 0.07787513732910156, 0.08396148681640625, 0.09004783630371094, 0.09613418579101562, 0.10222053527832031, 0.108306884765625, 0.11439323425292969, 0.12047958374023438, 0.12656593322753906, 0.13265228271484375, 0.13873863220214844, 0.14482498168945312, 0.1509113311767578, 0.1569976806640625, 0.1630840301513672, 0.16917037963867188, 0.17525672912597656, 0.18134307861328125, 0.18742942810058594, 0.19351577758789062, 0.1996021270751953, 0.2056884765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 0.0, 7.0, 7.0, 9.0, 11.0, 13.0, 19.0, 20.0, 15.0, 19.0, 35.0, 27.0, 24.0, 28.0, 35.0, 33.0, 35.0, 51.0, 38.0, 33.0, 1065.0, 40.0, 34.0, 35.0, 42.0, 27.0, 38.0, 41.0, 25.0, 28.0, 30.0, 25.0, 25.0, 23.0, 14.0, 8.0, 12.0, 11.0, 10.0, 11.0, 5.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.597686767578125, -2.50396728515625, -2.410247802734375, -2.3165283203125, -2.222808837890625, -2.12908935546875, -2.035369873046875, -1.941650390625, -1.847930908203125, -1.75421142578125, -1.660491943359375, -1.5667724609375, -1.473052978515625, -1.37933349609375, -1.285614013671875, -1.19189453125, -1.098175048828125, -1.00445556640625, -0.910736083984375, -0.8170166015625, -0.723297119140625, -0.62957763671875, -0.535858154296875, -0.442138671875, -0.348419189453125, -0.25469970703125, -0.160980224609375, -0.0672607421875, 0.026458740234375, 0.12017822265625, 0.213897705078125, 0.3076171875, 0.401336669921875, 0.49505615234375, 0.588775634765625, 0.6824951171875, 0.776214599609375, 0.86993408203125, 0.963653564453125, 1.057373046875, 1.151092529296875, 1.24481201171875, 1.338531494140625, 1.4322509765625, 1.525970458984375, 1.61968994140625, 1.713409423828125, 1.80712890625, 1.900848388671875, 1.99456787109375, 2.088287353515625, 2.1820068359375, 2.275726318359375, 2.36944580078125, 2.463165283203125, 2.556884765625, 2.650604248046875, 2.74432373046875, 2.838043212890625, 2.9317626953125, 3.025482177734375, 3.11920166015625, 3.212921142578125, 3.306640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 11.0, 12.0, 26.0, 41.0, 59.0, 98.0, 153.0, 245.0, 363.0, 593.0, 848.0, 1282.0, 1923.0, 3103.0, 4518.0, 7178.0, 11208.0, 17675.0, 28524.0, 45970.0, 75669.0, 120193.0, 168978.0, 1226675.0, 140940.0, 91341.0, 56209.0, 34441.0, 21319.0, 13367.0, 8390.0, 5461.0, 3582.0, 2357.0, 1503.0, 981.0, 683.0, 435.0, 257.0, 206.0, 132.0, 63.0, 44.0, 29.0, 18.0, 11.0, 5.0, 4.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1505126953125, -0.1453571319580078, -0.14020156860351562, -0.13504600524902344, -0.12989044189453125, -0.12473487854003906, -0.11957931518554688, -0.11442375183105469, -0.1092681884765625, -0.10411262512207031, -0.09895706176757812, -0.09380149841308594, -0.08864593505859375, -0.08349037170410156, -0.07833480834960938, -0.07317924499511719, -0.068023681640625, -0.06286811828613281, -0.057712554931640625, -0.05255699157714844, -0.04740142822265625, -0.04224586486816406, -0.037090301513671875, -0.03193473815917969, -0.0267791748046875, -0.021623611450195312, -0.016468048095703125, -0.011312484741210938, -0.00615692138671875, -0.0010013580322265625, 0.004154205322265625, 0.009309768676757812, 0.01446533203125, 0.019620895385742188, 0.024776458740234375, 0.029932022094726562, 0.03508758544921875, 0.04024314880371094, 0.045398712158203125, 0.05055427551269531, 0.0557098388671875, 0.06086540222167969, 0.06602096557617188, 0.07117652893066406, 0.07633209228515625, 0.08148765563964844, 0.08664321899414062, 0.09179878234863281, 0.096954345703125, 0.10210990905761719, 0.10726547241210938, 0.11242103576660156, 0.11757659912109375, 0.12273216247558594, 0.12788772583007812, 0.1330432891845703, 0.1381988525390625, 0.1433544158935547, 0.14850997924804688, 0.15366554260253906, 0.15882110595703125, 0.16397666931152344, 0.16913223266601562, 0.1742877960205078, 0.179443359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 7.0, 8.0, 7.0, 7.0, 2.0, 15.0, 10.0, 15.0, 13.0, 29.0, 33.0, 40.0, 36.0, 39.0, 51.0, 53.0, 62.0, 55.0, 59.0, 68.0, 50.0, 46.0, 50.0, 49.0, 25.0, 27.0, 27.0, 28.0, 11.0, 11.0, 12.0, 9.0, 5.0, 8.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 4.0], "bins": [-0.0011186599731445312, -0.0010878071188926697, -0.001056954264640808, -0.0010261014103889465, -0.000995248556137085, -0.0009643957018852234, -0.0009335428476333618, -0.0009026899933815002, -0.0008718371391296387, -0.0008409842848777771, -0.0008101314306259155, -0.000779278576374054, -0.0007484257221221924, -0.0007175728678703308, -0.0006867200136184692, -0.0006558671593666077, -0.0006250143051147461, -0.0005941614508628845, -0.000563308596611023, -0.0005324557423591614, -0.0005016028881072998, -0.00047075003385543823, -0.00043989717960357666, -0.0004090443253517151, -0.0003781914710998535, -0.00034733861684799194, -0.00031648576259613037, -0.0002856329083442688, -0.0002547800540924072, -0.00022392719984054565, -0.00019307434558868408, -0.0001622214913368225, -0.00013136863708496094, -0.00010051578283309937, -6.966292858123779e-05, -3.881007432937622e-05, -7.957220077514648e-06, 2.2895634174346924e-05, 5.3748488426208496e-05, 8.460134267807007e-05, 0.00011545419692993164, 0.0001463070511817932, 0.00017715990543365479, 0.00020801275968551636, 0.00023886561393737793, 0.0002697184681892395, 0.0003005713224411011, 0.00033142417669296265, 0.0003622770309448242, 0.0003931298851966858, 0.00042398273944854736, 0.00045483559370040894, 0.0004856884479522705, 0.0005165413022041321, 0.0005473941564559937, 0.0005782470107078552, 0.0006090998649597168, 0.0006399527192115784, 0.0006708055734634399, 0.0007016584277153015, 0.0007325112819671631, 0.0007633641362190247, 0.0007942169904708862, 0.0008250698447227478, 0.0008559226989746094]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0, 5.0, 6.0, 4.0, 11.0, 10.0, 18.0, 18.0, 29.0, 37.0, 43.0, 76.0, 86.0, 144.0, 245.0, 426.0, 995.0, 22678.0, 984636.0, 36743.0, 1135.0, 423.0, 243.0, 134.0, 103.0, 80.0, 56.0, 45.0, 36.0, 20.0, 11.0, 9.0, 7.0, 8.0, 4.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.015877485275268555, -0.01532125473022461, -0.014765024185180664, -0.014208793640136719, -0.013652563095092773, -0.013096332550048828, -0.012540102005004883, -0.011983871459960938, -0.011427640914916992, -0.010871410369873047, -0.010315179824829102, -0.009758949279785156, -0.009202718734741211, -0.008646488189697266, -0.00809025764465332, -0.007534027099609375, -0.00697779655456543, -0.006421566009521484, -0.005865335464477539, -0.005309104919433594, -0.0047528743743896484, -0.004196643829345703, -0.003640413284301758, -0.0030841827392578125, -0.002527952194213867, -0.001971721649169922, -0.0014154911041259766, -0.0008592605590820312, -0.00030303001403808594, 0.0002532005310058594, 0.0008094310760498047, 0.00136566162109375, 0.0019218921661376953, 0.0024781227111816406, 0.003034353256225586, 0.0035905838012695312, 0.0041468143463134766, 0.004703044891357422, 0.005259275436401367, 0.0058155059814453125, 0.006371736526489258, 0.006927967071533203, 0.0074841976165771484, 0.008040428161621094, 0.008596658706665039, 0.009152889251708984, 0.00970911979675293, 0.010265350341796875, 0.01082158088684082, 0.011377811431884766, 0.011934041976928711, 0.012490272521972656, 0.013046503067016602, 0.013602733612060547, 0.014158964157104492, 0.014715194702148438, 0.015271425247192383, 0.015827655792236328, 0.016383886337280273, 0.01694011688232422, 0.017496347427368164, 0.01805257797241211, 0.018608808517456055, 0.0191650390625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 29.0, 480.0, 481.0, 28.0], "bins": [-0.011031245812773705, -0.010853352956473827, -0.01067546010017395, -0.010497568175196648, -0.01031967531889677, -0.010141782462596893, -0.009963889606297016, -0.009785996749997139, -0.009608104825019836, -0.00943021196871996, -0.009252319112420082, -0.00907442718744278, -0.008896534331142902, -0.008718641474843025, -0.008540748618543148, -0.008362855762243271, -0.008184963837265968, -0.008007070980966091, -0.007829178124666214, -0.007651285734027624, -0.007473393343389034, -0.007295500487089157, -0.00711760763078928, -0.00693971524015069, -0.006761821918189526, -0.0065839290618896484, -0.006406036671251059, -0.006228143814951181, -0.0060502514243125916, -0.005872358568012714, -0.005694465711712837, -0.005516573321074247, -0.0053386809304356575, -0.00516078807413578, -0.0049828956834971905, -0.004805002827197313, -0.0046271104365587234, -0.004449217580258846, -0.004271324723958969, -0.004093432333320379, -0.003915539477020502, -0.0037376468535512686, -0.003559754230082035, -0.003381861373782158, -0.003203968983143568, -0.003026076126843691, -0.0028481835033744574, -0.002670290879905224, -0.0024923982564359903, -0.002314505632966757, -0.0021366130094975233, -0.00195872038602829, -0.0017808276461437345, -0.001602935022674501, -0.0014250422827899456, -0.001247149659320712, -0.0010692570358514786, -0.0008913644123822451, -0.0007134717307053506, -0.0005355790490284562, -0.0003576864255592227, -0.00017979380208998919, -1.9010622054338455e-06, 0.00017599156126379967, 0.0003538841556292027]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 9.0, 18.0, 22.0, 21.0, 20.0, 28.0, 27.0, 37.0, 31.0, 35.0, 42.0, 45.0, 37.0, 34.0, 47.0, 65.0, 40.0, 45.0, 56.0, 60.0, 47.0, 44.0, 25.0, 23.0, 29.0, 21.0, 19.0, 16.0, 14.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007114410400390625, -0.0006903428584337234, -0.0006692446768283844, -0.0006481464952230453, -0.0006270483136177063, -0.0006059501320123672, -0.0005848519504070282, -0.0005637537688016891, -0.0005426555871963501, -0.000521557405591011, -0.000500459223985672, -0.00047936104238033295, -0.0004582628607749939, -0.00043716467916965485, -0.0004160664975643158, -0.00039496831595897675, -0.0003738701343536377, -0.00035277195274829865, -0.0003316737711429596, -0.00031057558953762054, -0.0002894774079322815, -0.00026837922632694244, -0.0002472810447216034, -0.00022618286311626434, -0.0002050846815109253, -0.00018398649990558624, -0.0001628883183002472, -0.00014179013669490814, -0.00012069195508956909, -9.959377348423004e-05, -7.849559187889099e-05, -5.739741027355194e-05, -3.629922866821289e-05, -1.520104706287384e-05, 5.89713454246521e-06, 2.699531614780426e-05, 4.809349775314331e-05, 6.919167935848236e-05, 9.028986096382141e-05, 0.00011138804256916046, 0.0001324862241744995, 0.00015358440577983856, 0.0001746825873851776, 0.00019578076899051666, 0.0002168789505958557, 0.00023797713220119476, 0.0002590753138065338, 0.00028017349541187286, 0.0003012716770172119, 0.00032236985862255096, 0.00034346804022789, 0.00036456622183322906, 0.0003856644034385681, 0.00040676258504390717, 0.0004278607666492462, 0.00044895894825458527, 0.0004700571298599243, 0.0004911553114652634, 0.0005122534930706024, 0.0005333516746759415, 0.0005544498562812805, 0.0005755480378866196, 0.0005966462194919586, 0.0006177444010972977, 0.0006388425827026367]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 6.0, 15.0, 14.0, 15.0, 18.0, 16.0, 20.0, 27.0, 22.0, 33.0, 48.0, 31.0, 38.0, 32.0, 46.0, 39.0, 53.0, 43.0, 49.0, 40.0, 52.0, 30.0, 38.0, 27.0, 31.0, 29.0, 33.0, 22.0, 29.0, 18.0, 13.0, 12.0, 13.0, 9.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.43359375, -5.27459716796875, -5.1156005859375, -4.95660400390625, -4.797607421875, -4.63861083984375, -4.4796142578125, -4.32061767578125, -4.16162109375, -4.00262451171875, -3.8436279296875, -3.68463134765625, -3.525634765625, -3.36663818359375, -3.2076416015625, -3.04864501953125, -2.8896484375, -2.73065185546875, -2.5716552734375, -2.41265869140625, -2.253662109375, -2.09466552734375, -1.9356689453125, -1.77667236328125, -1.61767578125, -1.45867919921875, -1.2996826171875, -1.14068603515625, -0.981689453125, -0.82269287109375, -0.6636962890625, -0.50469970703125, -0.345703125, -0.18670654296875, -0.0277099609375, 0.13128662109375, 0.290283203125, 0.44927978515625, 0.6082763671875, 0.76727294921875, 0.92626953125, 1.08526611328125, 1.2442626953125, 1.40325927734375, 1.562255859375, 1.72125244140625, 1.8802490234375, 2.03924560546875, 2.1982421875, 2.35723876953125, 2.5162353515625, 2.67523193359375, 2.834228515625, 2.99322509765625, 3.1522216796875, 3.31121826171875, 3.47021484375, 3.62921142578125, 3.7882080078125, 3.94720458984375, 4.106201171875, 4.26519775390625, 4.4241943359375, 4.58319091796875, 4.7421875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 11.0, 8.0, 13.0, 19.0, 35.0, 33.0, 37.0, 66.0, 91.0, 111.0, 159.0, 228.0, 326.0, 435.0, 660.0, 961.0, 1512.0, 2377.0, 3972.0, 7723.0, 17093.0, 46241.0, 178559.0, 555405.0, 156390.0, 42227.0, 16017.0, 7265.0, 3832.0, 2299.0, 1402.0, 880.0, 636.0, 408.0, 332.0, 237.0, 150.0, 102.0, 79.0, 62.0, 37.0, 24.0, 27.0, 27.0, 11.0, 5.0, 9.0, 6.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0], "bins": [-4.5703125, -4.42950439453125, -4.2886962890625, -4.14788818359375, -4.007080078125, -3.86627197265625, -3.7254638671875, -3.58465576171875, -3.44384765625, -3.30303955078125, -3.1622314453125, -3.02142333984375, -2.880615234375, -2.73980712890625, -2.5989990234375, -2.45819091796875, -2.3173828125, -2.17657470703125, -2.0357666015625, -1.89495849609375, -1.754150390625, -1.61334228515625, -1.4725341796875, -1.33172607421875, -1.19091796875, -1.05010986328125, -0.9093017578125, -0.76849365234375, -0.627685546875, -0.48687744140625, -0.3460693359375, -0.20526123046875, -0.064453125, 0.07635498046875, 0.2171630859375, 0.35797119140625, 0.498779296875, 0.63958740234375, 0.7803955078125, 0.92120361328125, 1.06201171875, 1.20281982421875, 1.3436279296875, 1.48443603515625, 1.625244140625, 1.76605224609375, 1.9068603515625, 2.04766845703125, 2.1884765625, 2.32928466796875, 2.4700927734375, 2.61090087890625, 2.751708984375, 2.89251708984375, 3.0333251953125, 3.17413330078125, 3.31494140625, 3.45574951171875, 3.5965576171875, 3.73736572265625, 3.878173828125, 4.01898193359375, 4.1597900390625, 4.30059814453125, 4.44140625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 12.0, 12.0, 5.0, 14.0, 15.0, 6.0, 21.0, 27.0, 28.0, 21.0, 28.0, 45.0, 46.0, 43.0, 51.0, 54.0, 141.0, 1549.0, 314.0, 121.0, 65.0, 66.0, 47.0, 60.0, 31.0, 27.0, 20.0, 17.0, 28.0, 22.0, 22.0, 20.0, 13.0, 12.0, 13.0, 10.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.083984375, -15.52734375, -14.970703125, -14.4140625, -13.857421875, -13.30078125, -12.744140625, -12.1875, -11.630859375, -11.07421875, -10.517578125, -9.9609375, -9.404296875, -8.84765625, -8.291015625, -7.734375, -7.177734375, -6.62109375, -6.064453125, -5.5078125, -4.951171875, -4.39453125, -3.837890625, -3.28125, -2.724609375, -2.16796875, -1.611328125, -1.0546875, -0.498046875, 0.05859375, 0.615234375, 1.171875, 1.728515625, 2.28515625, 2.841796875, 3.3984375, 3.955078125, 4.51171875, 5.068359375, 5.625, 6.181640625, 6.73828125, 7.294921875, 7.8515625, 8.408203125, 8.96484375, 9.521484375, 10.078125, 10.634765625, 11.19140625, 11.748046875, 12.3046875, 12.861328125, 13.41796875, 13.974609375, 14.53125, 15.087890625, 15.64453125, 16.201171875, 16.7578125, 17.314453125, 17.87109375, 18.427734375, 18.984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 15.0, 19.0, 26.0, 29.0, 42.0, 54.0, 72.0, 133.0, 192.0, 355.0, 734.0, 4517.0, 2466088.0, 668379.0, 3530.0, 692.0, 293.0, 192.0, 115.0, 64.0, 44.0, 25.0, 20.0, 21.0, 17.0, 10.0, 3.0, 9.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -36.98291015625, -35.3720703125, -33.76123046875, -32.150390625, -30.53955078125, -28.9287109375, -27.31787109375, -25.70703125, -24.09619140625, -22.4853515625, -20.87451171875, -19.263671875, -17.65283203125, -16.0419921875, -14.43115234375, -12.8203125, -11.20947265625, -9.5986328125, -7.98779296875, -6.376953125, -4.76611328125, -3.1552734375, -1.54443359375, 0.06640625, 1.67724609375, 3.2880859375, 4.89892578125, 6.509765625, 8.12060546875, 9.7314453125, 11.34228515625, 12.953125, 14.56396484375, 16.1748046875, 17.78564453125, 19.396484375, 21.00732421875, 22.6181640625, 24.22900390625, 25.83984375, 27.45068359375, 29.0615234375, 30.67236328125, 32.283203125, 33.89404296875, 35.5048828125, 37.11572265625, 38.7265625, 40.33740234375, 41.9482421875, 43.55908203125, 45.169921875, 46.78076171875, 48.3916015625, 50.00244140625, 51.61328125, 53.22412109375, 54.8349609375, 56.44580078125, 58.056640625, 59.66748046875, 61.2783203125, 62.88916015625, 64.5]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 16.0, 51.0, 97.0, 185.0, 224.0, 187.0, 126.0, 50.0, 31.0, 15.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.00701332092285, -27.95994758605957, -26.912883758544922, -25.86581802368164, -24.818754196166992, -23.77168846130371, -22.724624633789062, -21.67755889892578, -20.6304931640625, -19.58342742919922, -18.53636360168457, -17.48929786682129, -16.44223403930664, -15.39516830444336, -14.348103523254395, -13.30103874206543, -12.253974914550781, -11.206910133361816, -10.159845352172852, -9.11277961730957, -8.065715789794922, -7.018650531768799, -5.971585273742676, -4.924520492553711, -3.877455711364746, -2.8303909301757812, -1.7833259105682373, -0.7362608909606934, 0.3108038902282715, 1.3578686714172363, 2.4049339294433594, 3.451998710632324, 4.499061584472656, 5.546126365661621, 6.593191146850586, 7.640256404876709, 8.687320709228516, 9.734386444091797, 10.781451225280762, 11.828516006469727, 12.875580787658691, 13.922645568847656, 14.969710350036621, 16.016775131225586, 17.063840866088867, 18.110904693603516, 19.157970428466797, 20.205036163330078, 21.252099990844727, 22.299165725708008, 23.346229553222656, 24.393295288085938, 25.440359115600586, 26.487424850463867, 27.534488677978516, 28.581554412841797, 29.628620147705078, 30.67568588256836, 31.722749710083008, 32.769813537597656, 33.81687927246094, 34.86394500732422, 35.9110107421875, 36.95807647705078, 38.0051383972168]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 10.0, 10.0, 14.0, 6.0, 30.0, 16.0, 26.0, 22.0, 33.0, 18.0, 30.0, 31.0, 38.0, 36.0, 41.0, 38.0, 37.0, 38.0, 34.0, 32.0, 37.0, 36.0, 36.0, 46.0, 37.0, 32.0, 33.0, 36.0, 16.0, 20.0, 18.0, 19.0, 11.0, 9.0, 13.0, 11.0, 10.0, 5.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.002071380615234, -40.70711898803711, -39.412166595458984, -38.11721420288086, -36.82225799560547, -35.527305603027344, -34.23235321044922, -32.937400817871094, -31.64244842529297, -30.347496032714844, -29.05254364013672, -27.75758934020996, -26.462636947631836, -25.16768455505371, -23.872730255126953, -22.577777862548828, -21.282825469970703, -19.987873077392578, -18.692920684814453, -17.397966384887695, -16.10301399230957, -14.808061599731445, -13.513108253479004, -12.218154907226562, -10.923202514648438, -9.628250122070312, -8.333296775817871, -7.038343906402588, -5.743391036987305, -4.4484381675720215, -3.1534852981567383, -1.8585319519042969, -0.5635833740234375, 0.7313694953918457, 2.026322364807129, 3.321275234222412, 4.616228103637695, 5.9111809730529785, 7.206133842468262, 8.501087188720703, 9.796039581298828, 11.090991973876953, 12.385945320129395, 13.680898666381836, 14.975851058959961, 16.270803451538086, 17.565757751464844, 18.86071014404297, 20.155662536621094, 21.45061492919922, 22.745567321777344, 24.0405216217041, 25.335474014282227, 26.63042640686035, 27.92538070678711, 29.220333099365234, 30.51528549194336, 31.810237884521484, 33.10519027709961, 34.400142669677734, 35.695098876953125, 36.99005126953125, 38.285003662109375, 39.5799560546875, 40.874908447265625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 3.0, 11.0, 11.0, 8.0, 13.0, 15.0, 20.0, 15.0, 30.0, 22.0, 29.0, 23.0, 40.0, 30.0, 46.0, 42.0, 38.0, 39.0, 48.0, 46.0, 41.0, 45.0, 45.0, 41.0, 24.0, 26.0, 36.0, 31.0, 27.0, 22.0, 27.0, 23.0, 17.0, 10.0, 10.0, 6.0, 10.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-5.36328125, -5.205810546875, -5.04833984375, -4.890869140625, -4.7333984375, -4.575927734375, -4.41845703125, -4.260986328125, -4.103515625, -3.946044921875, -3.78857421875, -3.631103515625, -3.4736328125, -3.316162109375, -3.15869140625, -3.001220703125, -2.84375, -2.686279296875, -2.52880859375, -2.371337890625, -2.2138671875, -2.056396484375, -1.89892578125, -1.741455078125, -1.583984375, -1.426513671875, -1.26904296875, -1.111572265625, -0.9541015625, -0.796630859375, -0.63916015625, -0.481689453125, -0.32421875, -0.166748046875, -0.00927734375, 0.148193359375, 0.3056640625, 0.463134765625, 0.62060546875, 0.778076171875, 0.935546875, 1.093017578125, 1.25048828125, 1.407958984375, 1.5654296875, 1.722900390625, 1.88037109375, 2.037841796875, 2.1953125, 2.352783203125, 2.51025390625, 2.667724609375, 2.8251953125, 2.982666015625, 3.14013671875, 3.297607421875, 3.455078125, 3.612548828125, 3.77001953125, 3.927490234375, 4.0849609375, 4.242431640625, 4.39990234375, 4.557373046875, 4.71484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 9.0, 12.0, 6.0, 8.0, 7.0, 12.0, 19.0, 20.0, 31.0, 36.0, 42.0, 45.0, 64.0, 100.0, 192.0, 482.0, 1870.0, 10264.0, 96123.0, 2687851.0, 1339079.0, 49692.0, 6234.0, 1188.0, 363.0, 150.0, 80.0, 62.0, 55.0, 39.0, 35.0, 27.0, 24.0, 12.0, 11.0, 13.0, 10.0, 6.0, 2.0, 1.0, 6.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.439453125, -17.80078125, -17.162109375, -16.5234375, -15.884765625, -15.24609375, -14.607421875, -13.96875, -13.330078125, -12.69140625, -12.052734375, -11.4140625, -10.775390625, -10.13671875, -9.498046875, -8.859375, -8.220703125, -7.58203125, -6.943359375, -6.3046875, -5.666015625, -5.02734375, -4.388671875, -3.75, -3.111328125, -2.47265625, -1.833984375, -1.1953125, -0.556640625, 0.08203125, 0.720703125, 1.359375, 1.998046875, 2.63671875, 3.275390625, 3.9140625, 4.552734375, 5.19140625, 5.830078125, 6.46875, 7.107421875, 7.74609375, 8.384765625, 9.0234375, 9.662109375, 10.30078125, 10.939453125, 11.578125, 12.216796875, 12.85546875, 13.494140625, 14.1328125, 14.771484375, 15.41015625, 16.048828125, 16.6875, 17.326171875, 17.96484375, 18.603515625, 19.2421875, 19.880859375, 20.51953125, 21.158203125, 21.796875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 8.0, 10.0, 15.0, 13.0, 30.0, 49.0, 39.0, 68.0, 104.0, 154.0, 247.0, 336.0, 498.0, 584.0, 570.0, 438.0, 288.0, 196.0, 134.0, 92.0, 63.0, 39.0, 25.0, 26.0, 10.0, 7.0, 11.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8359375, -13.3997802734375, -12.963623046875, -12.5274658203125, -12.09130859375, -11.6551513671875, -11.218994140625, -10.7828369140625, -10.3466796875, -9.9105224609375, -9.474365234375, -9.0382080078125, -8.60205078125, -8.1658935546875, -7.729736328125, -7.2935791015625, -6.857421875, -6.4212646484375, -5.985107421875, -5.5489501953125, -5.11279296875, -4.6766357421875, -4.240478515625, -3.8043212890625, -3.3681640625, -2.9320068359375, -2.495849609375, -2.0596923828125, -1.62353515625, -1.1873779296875, -0.751220703125, -0.3150634765625, 0.12109375, 0.5572509765625, 0.993408203125, 1.4295654296875, 1.86572265625, 2.3018798828125, 2.738037109375, 3.1741943359375, 3.6103515625, 4.0465087890625, 4.482666015625, 4.9188232421875, 5.35498046875, 5.7911376953125, 6.227294921875, 6.6634521484375, 7.099609375, 7.5357666015625, 7.971923828125, 8.4080810546875, 8.84423828125, 9.2803955078125, 9.716552734375, 10.1527099609375, 10.5888671875, 11.0250244140625, 11.461181640625, 11.8973388671875, 12.33349609375, 12.7696533203125, 13.205810546875, 13.6419677734375, 14.078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 8.0, 9.0, 15.0, 24.0, 26.0, 45.0, 93.0, 144.0, 303.0, 670.0, 2279.0, 16016.0, 380520.0, 3636826.0, 145857.0, 8681.0, 1646.0, 546.0, 223.0, 125.0, 85.0, 40.0, 38.0, 22.0, 7.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.3349609375, -35.138671875, -33.9423828125, -32.74609375, -31.5498046875, -30.353515625, -29.1572265625, -27.9609375, -26.7646484375, -25.568359375, -24.3720703125, -23.17578125, -21.9794921875, -20.783203125, -19.5869140625, -18.390625, -17.1943359375, -15.998046875, -14.8017578125, -13.60546875, -12.4091796875, -11.212890625, -10.0166015625, -8.8203125, -7.6240234375, -6.427734375, -5.2314453125, -4.03515625, -2.8388671875, -1.642578125, -0.4462890625, 0.75, 1.9462890625, 3.142578125, 4.3388671875, 5.53515625, 6.7314453125, 7.927734375, 9.1240234375, 10.3203125, 11.5166015625, 12.712890625, 13.9091796875, 15.10546875, 16.3017578125, 17.498046875, 18.6943359375, 19.890625, 21.0869140625, 22.283203125, 23.4794921875, 24.67578125, 25.8720703125, 27.068359375, 28.2646484375, 29.4609375, 30.6572265625, 31.853515625, 33.0498046875, 34.24609375, 35.4423828125, 36.638671875, 37.8349609375, 39.03125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 18.0, 49.0, 107.0, 223.0, 275.0, 190.0, 98.0, 32.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.51905822753906, -103.89047241210938, -99.26188659667969, -94.63330078125, -90.00471496582031, -85.37612915039062, -80.74754333496094, -76.11895751953125, -71.49037170410156, -66.86178588867188, -62.23320007324219, -57.6046142578125, -52.97602844238281, -48.347442626953125, -43.71885681152344, -39.09027099609375, -34.46168518066406, -29.833099365234375, -25.204513549804688, -20.575927734375, -15.947341918945312, -11.318756103515625, -6.6901702880859375, -2.06158447265625, 2.5670013427734375, 7.195587158203125, 11.824172973632812, 16.4527587890625, 21.081344604492188, 25.709930419921875, 30.338516235351562, 34.96710205078125, 39.59568786621094, 44.224273681640625, 48.85285949707031, 53.4814453125, 58.11003112792969, 62.738616943359375, 67.36720275878906, 71.99578857421875, 76.62437438964844, 81.25296020507812, 85.88154602050781, 90.5101318359375, 95.13871765136719, 99.76730346679688, 104.39588928222656, 109.02447509765625, 113.65306091308594, 118.28164672851562, 122.91023254394531, 127.538818359375, 132.1674041748047, 136.79598999023438, 141.42457580566406, 146.05316162109375, 150.68174743652344, 155.31033325195312, 159.9389190673828, 164.5675048828125, 169.1960906982422, 173.82467651367188, 178.45326232910156, 183.08184814453125, 187.71043395996094]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 8.0, 5.0, 8.0, 6.0, 7.0, 13.0, 20.0, 23.0, 17.0, 20.0, 25.0, 24.0, 28.0, 44.0, 33.0, 36.0, 40.0, 42.0, 47.0, 46.0, 49.0, 45.0, 47.0, 41.0, 25.0, 35.0, 28.0, 28.0, 29.0, 30.0, 38.0, 15.0, 18.0, 10.0, 13.0, 16.0, 9.0, 8.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.179771423339844, -31.954757690429688, -30.72974395751953, -29.504730224609375, -28.279714584350586, -27.05470085144043, -25.829687118530273, -24.604671478271484, -23.379657745361328, -22.154644012451172, -20.929630279541016, -19.70461654663086, -18.47960090637207, -17.254587173461914, -16.029573440551758, -14.804558753967285, -13.579545974731445, -12.354532241821289, -11.129517555236816, -9.90450382232666, -8.679489135742188, -7.454475402832031, -6.229461669921875, -5.004446983337402, -3.779433250427246, -2.5544190406799316, -1.3294050693511963, -0.10439109802246094, 1.1206231117248535, 2.345637321472168, 3.570651054382324, 4.795665740966797, 6.020679473876953, 7.245693683624268, 8.470707893371582, 9.695721626281738, 10.920736312866211, 12.145750045776367, 13.370763778686523, 14.595778465270996, 15.820792198181152, 17.045806884765625, 18.27082061767578, 19.495834350585938, 20.720848083496094, 21.94586181640625, 23.170875549316406, 24.395891189575195, 25.62090492248535, 26.845918655395508, 28.070932388305664, 29.295948028564453, 30.52096176147461, 31.745975494384766, 32.97098922729492, 34.19600296020508, 35.421016693115234, 36.64603042602539, 37.87104415893555, 39.0960578918457, 40.32107162475586, 41.54608917236328, 42.77110290527344, 43.996116638183594, 45.22113037109375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 7.0, 10.0, 10.0, 12.0, 13.0, 16.0, 21.0, 14.0, 28.0, 28.0, 25.0, 31.0, 43.0, 37.0, 40.0, 37.0, 48.0, 42.0, 37.0, 44.0, 51.0, 28.0, 38.0, 36.0, 51.0, 22.0, 29.0, 24.0, 28.0, 25.0, 20.0, 21.0, 16.0, 9.0, 6.0, 11.0, 5.0, 10.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.41015625, -5.24853515625, -5.0869140625, -4.92529296875, -4.763671875, -4.60205078125, -4.4404296875, -4.27880859375, -4.1171875, -3.95556640625, -3.7939453125, -3.63232421875, -3.470703125, -3.30908203125, -3.1474609375, -2.98583984375, -2.82421875, -2.66259765625, -2.5009765625, -2.33935546875, -2.177734375, -2.01611328125, -1.8544921875, -1.69287109375, -1.53125, -1.36962890625, -1.2080078125, -1.04638671875, -0.884765625, -0.72314453125, -0.5615234375, -0.39990234375, -0.23828125, -0.07666015625, 0.0849609375, 0.24658203125, 0.408203125, 0.56982421875, 0.7314453125, 0.89306640625, 1.0546875, 1.21630859375, 1.3779296875, 1.53955078125, 1.701171875, 1.86279296875, 2.0244140625, 2.18603515625, 2.34765625, 2.50927734375, 2.6708984375, 2.83251953125, 2.994140625, 3.15576171875, 3.3173828125, 3.47900390625, 3.640625, 3.80224609375, 3.9638671875, 4.12548828125, 4.287109375, 4.44873046875, 4.6103515625, 4.77197265625, 4.93359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 14.0, 21.0, 36.0, 58.0, 93.0, 88.0, 154.0, 207.0, 364.0, 552.0, 810.0, 1185.0, 1781.0, 2693.0, 4150.0, 6646.0, 10119.0, 16215.0, 26658.0, 45006.0, 76725.0, 128202.0, 187161.0, 193841.0, 136981.0, 83036.0, 48635.0, 28532.0, 17450.0, 10955.0, 7027.0, 4491.0, 2966.0, 1875.0, 1260.0, 858.0, 540.0, 400.0, 243.0, 175.0, 109.0, 84.0, 46.0, 30.0, 20.0, 18.0, 8.0, 8.0, 9.0, 6.0, 3.0, 2.0], "bins": [-0.2152099609375, -0.2090740203857422, -0.20293807983398438, -0.19680213928222656, -0.19066619873046875, -0.18453025817871094, -0.17839431762695312, -0.1722583770751953, -0.1661224365234375, -0.1599864959716797, -0.15385055541992188, -0.14771461486816406, -0.14157867431640625, -0.13544273376464844, -0.12930679321289062, -0.12317085266113281, -0.117034912109375, -0.11089897155761719, -0.10476303100585938, -0.09862709045410156, -0.09249114990234375, -0.08635520935058594, -0.08021926879882812, -0.07408332824707031, -0.0679473876953125, -0.06181144714355469, -0.055675506591796875, -0.04953956604003906, -0.04340362548828125, -0.03726768493652344, -0.031131744384765625, -0.024995803833007812, -0.01885986328125, -0.012723922729492188, -0.006587982177734375, -0.0004520416259765625, 0.00568389892578125, 0.011819839477539062, 0.017955780029296875, 0.024091720581054688, 0.0302276611328125, 0.03636360168457031, 0.042499542236328125, 0.04863548278808594, 0.05477142333984375, 0.06090736389160156, 0.06704330444335938, 0.07317924499511719, 0.079315185546875, 0.08545112609863281, 0.09158706665039062, 0.09772300720214844, 0.10385894775390625, 0.10999488830566406, 0.11613082885742188, 0.12226676940917969, 0.1284027099609375, 0.1345386505126953, 0.14067459106445312, 0.14681053161621094, 0.15294647216796875, 0.15908241271972656, 0.16521835327148438, 0.1713542938232422, 0.177490234375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 10.0, 3.0, 9.0, 7.0, 9.0, 6.0, 5.0, 14.0, 11.0, 17.0, 14.0, 20.0, 24.0, 26.0, 19.0, 36.0, 23.0, 36.0, 40.0, 42.0, 35.0, 40.0, 33.0, 1053.0, 44.0, 46.0, 39.0, 38.0, 32.0, 31.0, 26.0, 37.0, 29.0, 14.0, 28.0, 17.0, 11.0, 14.0, 8.0, 9.0, 11.0, 7.0, 9.0, 3.0, 7.0, 10.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.798828125, -2.710601806640625, -2.62237548828125, -2.534149169921875, -2.4459228515625, -2.357696533203125, -2.26947021484375, -2.181243896484375, -2.093017578125, -2.004791259765625, -1.91656494140625, -1.828338623046875, -1.7401123046875, -1.651885986328125, -1.56365966796875, -1.475433349609375, -1.38720703125, -1.298980712890625, -1.21075439453125, -1.122528076171875, -1.0343017578125, -0.946075439453125, -0.85784912109375, -0.769622802734375, -0.681396484375, -0.593170166015625, -0.50494384765625, -0.416717529296875, -0.3284912109375, -0.240264892578125, -0.15203857421875, -0.063812255859375, 0.0244140625, 0.112640380859375, 0.20086669921875, 0.289093017578125, 0.3773193359375, 0.465545654296875, 0.55377197265625, 0.641998291015625, 0.730224609375, 0.818450927734375, 0.90667724609375, 0.994903564453125, 1.0831298828125, 1.171356201171875, 1.25958251953125, 1.347808837890625, 1.43603515625, 1.524261474609375, 1.61248779296875, 1.700714111328125, 1.7889404296875, 1.877166748046875, 1.96539306640625, 2.053619384765625, 2.141845703125, 2.230072021484375, 2.31829833984375, 2.406524658203125, 2.4947509765625, 2.582977294921875, 2.67120361328125, 2.759429931640625, 2.84765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 15.0, 28.0, 46.0, 67.0, 121.0, 161.0, 238.0, 333.0, 527.0, 759.0, 1035.0, 1425.0, 2085.0, 2962.0, 4232.0, 6030.0, 8687.0, 13421.0, 20146.0, 31281.0, 49541.0, 77718.0, 117262.0, 158522.0, 1210957.0, 131691.0, 91179.0, 57966.0, 36801.0, 23489.0, 15427.0, 10231.0, 6702.0, 4718.0, 3379.0, 2378.0, 1701.0, 1198.0, 858.0, 580.0, 382.0, 285.0, 195.0, 127.0, 86.0, 55.0, 27.0, 23.0, 12.0, 7.0, 10.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.148193359375, -0.14344024658203125, -0.1386871337890625, -0.13393402099609375, -0.129180908203125, -0.12442779541015625, -0.1196746826171875, -0.11492156982421875, -0.11016845703125, -0.10541534423828125, -0.1006622314453125, -0.09590911865234375, -0.091156005859375, -0.08640289306640625, -0.0816497802734375, -0.07689666748046875, -0.0721435546875, -0.06739044189453125, -0.0626373291015625, -0.05788421630859375, -0.053131103515625, -0.04837799072265625, -0.0436248779296875, -0.03887176513671875, -0.03411865234375, -0.02936553955078125, -0.0246124267578125, -0.01985931396484375, -0.015106201171875, -0.01035308837890625, -0.0055999755859375, -0.00084686279296875, 0.00390625, 0.00865936279296875, 0.0134124755859375, 0.01816558837890625, 0.022918701171875, 0.02767181396484375, 0.0324249267578125, 0.03717803955078125, 0.04193115234375, 0.04668426513671875, 0.0514373779296875, 0.05619049072265625, 0.060943603515625, 0.06569671630859375, 0.0704498291015625, 0.07520294189453125, 0.0799560546875, 0.08470916748046875, 0.0894622802734375, 0.09421539306640625, 0.098968505859375, 0.10372161865234375, 0.1084747314453125, 0.11322784423828125, 0.11798095703125, 0.12273406982421875, 0.1274871826171875, 0.13224029541015625, 0.136993408203125, 0.14174652099609375, 0.1464996337890625, 0.15125274658203125, 0.156005859375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 8.0, 6.0, 7.0, 10.0, 16.0, 10.0, 22.0, 24.0, 28.0, 34.0, 50.0, 50.0, 55.0, 73.0, 77.0, 83.0, 60.0, 70.0, 60.0, 46.0, 30.0, 34.0, 33.0, 20.0, 19.0, 19.0, 10.0, 8.0, 11.0, 7.0, 4.0, 0.0, 6.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010271072387695312, -0.0009954720735549927, -0.0009638369083404541, -0.0009322017431259155, -0.000900566577911377, -0.0008689314126968384, -0.0008372962474822998, -0.0008056610822677612, -0.0007740259170532227, -0.0007423907518386841, -0.0007107555866241455, -0.0006791204214096069, -0.0006474852561950684, -0.0006158500909805298, -0.0005842149257659912, -0.0005525797605514526, -0.0005209445953369141, -0.0004893094301223755, -0.0004576742649078369, -0.00042603909969329834, -0.00039440393447875977, -0.0003627687692642212, -0.0003311336040496826, -0.00029949843883514404, -0.00026786327362060547, -0.0002362281084060669, -0.00020459294319152832, -0.00017295777797698975, -0.00014132261276245117, -0.0001096874475479126, -7.805228233337402e-05, -4.641711711883545e-05, -1.4781951904296875e-05, 1.68532133102417e-05, 4.8488378524780273e-05, 8.012354373931885e-05, 0.00011175870895385742, 0.000143393874168396, 0.00017502903938293457, 0.00020666420459747314, 0.00023829936981201172, 0.0002699345350265503, 0.00030156970024108887, 0.00033320486545562744, 0.000364840030670166, 0.0003964751958847046, 0.00042811036109924316, 0.00045974552631378174, 0.0004913806915283203, 0.0005230158567428589, 0.0005546510219573975, 0.000586286187171936, 0.0006179213523864746, 0.0006495565176010132, 0.0006811916828155518, 0.0007128268480300903, 0.0007444620132446289, 0.0007760971784591675, 0.0008077323436737061, 0.0008393675088882446, 0.0008710026741027832, 0.0009026378393173218, 0.0009342730045318604, 0.0009659081697463989, 0.0009975433349609375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 16.0, 8.0, 14.0, 24.0, 52.0, 47.0, 68.0, 84.0, 157.0, 286.0, 551.0, 3647.0, 579024.0, 460146.0, 3060.0, 560.0, 298.0, 171.0, 113.0, 50.0, 45.0, 36.0, 23.0, 22.0, 11.0, 8.0, 5.0, 6.0, 5.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018524169921875, -0.017944812774658203, -0.017365455627441406, -0.01678609848022461, -0.016206741333007812, -0.015627384185791016, -0.015048027038574219, -0.014468669891357422, -0.013889312744140625, -0.013309955596923828, -0.012730598449707031, -0.012151241302490234, -0.011571884155273438, -0.01099252700805664, -0.010413169860839844, -0.009833812713623047, -0.00925445556640625, -0.008675098419189453, -0.008095741271972656, -0.007516384124755859, -0.0069370269775390625, -0.006357669830322266, -0.005778312683105469, -0.005198955535888672, -0.004619598388671875, -0.004040241241455078, -0.0034608840942382812, -0.0028815269470214844, -0.0023021697998046875, -0.0017228126525878906, -0.0011434555053710938, -0.0005640983581542969, 1.52587890625e-05, 0.0005946159362792969, 0.0011739730834960938, 0.0017533302307128906, 0.0023326873779296875, 0.0029120445251464844, 0.0034914016723632812, 0.004070758819580078, 0.004650115966796875, 0.005229473114013672, 0.005808830261230469, 0.006388187408447266, 0.0069675445556640625, 0.007546901702880859, 0.008126258850097656, 0.008705615997314453, 0.00928497314453125, 0.009864330291748047, 0.010443687438964844, 0.01102304458618164, 0.011602401733398438, 0.012181758880615234, 0.012761116027832031, 0.013340473175048828, 0.013919830322265625, 0.014499187469482422, 0.015078544616699219, 0.015657901763916016, 0.016237258911132812, 0.01681661605834961, 0.017395973205566406, 0.017975330352783203, 0.0185546875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 20.0, 58.0, 224.0, 364.0, 258.0, 73.0, 14.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004354157019406557, -0.004271441604942083, -0.004188726656138897, -0.004106011241674423, -0.0040232958272099495, -0.003940580878406763, -0.0038578654639422894, -0.0037751502823084593, -0.003692435100674629, -0.003609719919040799, -0.0035270045045763254, -0.0034442893229424953, -0.0033615741413086653, -0.003278858959674835, -0.0031961435452103615, -0.0031134283635765314, -0.0030307129491120577, -0.0029479977674782276, -0.002865282353013754, -0.002782567171379924, -0.0026998519897460938, -0.00261713657528162, -0.00253442139364779, -0.00245170621201396, -0.002368990797549486, -0.002286275615915656, -0.0022035602014511824, -0.0021208450198173523, -0.0020381298381835222, -0.001955414656549692, -0.0018726992420852184, -0.0017899840604513884, -0.0017072688788175583, -0.0016245535807684064, -0.0015418383991345763, -0.0014591231010854244, -0.0013764079194515944, -0.0012936926214024425, -0.0012109773233532906, -0.0011282621417194605, -0.0010455469600856304, -0.0009628317202441394, -0.0008801164804026484, -0.0007974011823534966, -0.0007146859425120056, -0.0006319707026705146, -0.0005492554046213627, -0.0004665401647798717, -0.0003838248667307198, -0.0003011096268892288, -0.00021839435794390738, -0.00013567908899858594, -5.2963849157094955e-05, 2.975139068439603e-05, 0.00011246668873354793, 0.0001951819285750389, 0.0002778971684165299, 0.0003606124082580209, 0.0004433276772033423, 0.0005260429461486638, 0.0006087581859901547, 0.0006914734258316457, 0.0007741887238807976, 0.0008569039637222886, 0.0009396192035637796]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 8.0, 7.0, 11.0, 12.0, 14.0, 11.0, 18.0, 18.0, 20.0, 22.0, 33.0, 41.0, 25.0, 20.0, 34.0, 49.0, 33.0, 50.0, 43.0, 42.0, 37.0, 45.0, 45.0, 36.0, 30.0, 34.0, 34.0, 27.0, 21.0, 27.0, 23.0, 23.0, 10.0, 16.0, 17.0, 18.0, 4.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0005303025245666504, -0.0005153492093086243, -0.0005003958940505981, -0.000485442578792572, -0.0004704892635345459, -0.0004555359482765198, -0.00044058263301849365, -0.00042562931776046753, -0.0004106760025024414, -0.0003957226872444153, -0.00038076937198638916, -0.00036581605672836304, -0.0003508627414703369, -0.0003359094262123108, -0.00032095611095428467, -0.00030600279569625854, -0.0002910494804382324, -0.0002760961651802063, -0.0002611428499221802, -0.00024618953466415405, -0.00023123621940612793, -0.0002162829041481018, -0.00020132958889007568, -0.00018637627363204956, -0.00017142295837402344, -0.00015646964311599731, -0.0001415163278579712, -0.00012656301259994507, -0.00011160969734191895, -9.665638208389282e-05, -8.17030668258667e-05, -6.674975156784058e-05, -5.179643630981445e-05, -3.684312105178833e-05, -2.1889805793762207e-05, -6.936490535736084e-06, 8.016824722290039e-06, 2.2970139980316162e-05, 3.7923455238342285e-05, 5.287677049636841e-05, 6.783008575439453e-05, 8.278340101242065e-05, 9.773671627044678e-05, 0.0001126900315284729, 0.00012764334678649902, 0.00014259666204452515, 0.00015754997730255127, 0.0001725032925605774, 0.00018745660781860352, 0.00020240992307662964, 0.00021736323833465576, 0.00023231655359268188, 0.000247269868850708, 0.00026222318410873413, 0.00027717649936676025, 0.0002921298146247864, 0.0003070831298828125, 0.0003220364451408386, 0.00033698976039886475, 0.00035194307565689087, 0.000366896390914917, 0.0003818497061729431, 0.00039680302143096924, 0.00041175633668899536, 0.0004267096519470215]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 7.0, 10.0, 10.0, 12.0, 13.0, 16.0, 21.0, 14.0, 28.0, 28.0, 25.0, 31.0, 43.0, 37.0, 40.0, 37.0, 48.0, 42.0, 37.0, 44.0, 51.0, 28.0, 38.0, 36.0, 51.0, 22.0, 29.0, 24.0, 28.0, 25.0, 20.0, 21.0, 16.0, 9.0, 6.0, 11.0, 5.0, 10.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.41015625, -5.24853515625, -5.0869140625, -4.92529296875, -4.763671875, -4.60205078125, -4.4404296875, -4.27880859375, -4.1171875, -3.95556640625, -3.7939453125, -3.63232421875, -3.470703125, -3.30908203125, -3.1474609375, -2.98583984375, -2.82421875, -2.66259765625, -2.5009765625, -2.33935546875, -2.177734375, -2.01611328125, -1.8544921875, -1.69287109375, -1.53125, -1.36962890625, -1.2080078125, -1.04638671875, -0.884765625, -0.72314453125, -0.5615234375, -0.39990234375, -0.23828125, -0.07666015625, 0.0849609375, 0.24658203125, 0.408203125, 0.56982421875, 0.7314453125, 0.89306640625, 1.0546875, 1.21630859375, 1.3779296875, 1.53955078125, 1.701171875, 1.86279296875, 2.0244140625, 2.18603515625, 2.34765625, 2.50927734375, 2.6708984375, 2.83251953125, 2.994140625, 3.15576171875, 3.3173828125, 3.47900390625, 3.640625, 3.80224609375, 3.9638671875, 4.12548828125, 4.287109375, 4.44873046875, 4.6103515625, 4.77197265625, 4.93359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 12.0, 23.0, 27.0, 41.0, 44.0, 83.0, 93.0, 161.0, 217.0, 288.0, 432.0, 632.0, 889.0, 1207.0, 1881.0, 2926.0, 4695.0, 7711.0, 13581.0, 26861.0, 58364.0, 151678.0, 416735.0, 210360.0, 75949.0, 32941.0, 16330.0, 9041.0, 5314.0, 3257.0, 2108.0, 1468.0, 929.0, 666.0, 463.0, 321.0, 244.0, 174.0, 130.0, 68.0, 53.0, 37.0, 29.0, 30.0, 16.0, 13.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.41796875, -3.313262939453125, -3.20855712890625, -3.103851318359375, -2.9991455078125, -2.894439697265625, -2.78973388671875, -2.685028076171875, -2.580322265625, -2.475616455078125, -2.37091064453125, -2.266204833984375, -2.1614990234375, -2.056793212890625, -1.95208740234375, -1.847381591796875, -1.74267578125, -1.637969970703125, -1.53326416015625, -1.428558349609375, -1.3238525390625, -1.219146728515625, -1.11444091796875, -1.009735107421875, -0.905029296875, -0.800323486328125, -0.69561767578125, -0.590911865234375, -0.4862060546875, -0.381500244140625, -0.27679443359375, -0.172088623046875, -0.0673828125, 0.037322998046875, 0.14202880859375, 0.246734619140625, 0.3514404296875, 0.456146240234375, 0.56085205078125, 0.665557861328125, 0.770263671875, 0.874969482421875, 0.97967529296875, 1.084381103515625, 1.1890869140625, 1.293792724609375, 1.39849853515625, 1.503204345703125, 1.60791015625, 1.712615966796875, 1.81732177734375, 1.922027587890625, 2.0267333984375, 2.131439208984375, 2.23614501953125, 2.340850830078125, 2.445556640625, 2.550262451171875, 2.65496826171875, 2.759674072265625, 2.8643798828125, 2.969085693359375, 3.07379150390625, 3.178497314453125, 3.283203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 7.0, 5.0, 14.0, 21.0, 16.0, 20.0, 28.0, 22.0, 35.0, 31.0, 48.0, 39.0, 63.0, 68.0, 111.0, 231.0, 1663.0, 150.0, 64.0, 59.0, 46.0, 36.0, 45.0, 34.0, 26.0, 22.0, 22.0, 21.0, 21.0, 10.0, 14.0, 10.0, 7.0, 7.0, 12.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -17.08447265625, -16.4345703125, -15.78466796875, -15.134765625, -14.48486328125, -13.8349609375, -13.18505859375, -12.53515625, -11.88525390625, -11.2353515625, -10.58544921875, -9.935546875, -9.28564453125, -8.6357421875, -7.98583984375, -7.3359375, -6.68603515625, -6.0361328125, -5.38623046875, -4.736328125, -4.08642578125, -3.4365234375, -2.78662109375, -2.13671875, -1.48681640625, -0.8369140625, -0.18701171875, 0.462890625, 1.11279296875, 1.7626953125, 2.41259765625, 3.0625, 3.71240234375, 4.3623046875, 5.01220703125, 5.662109375, 6.31201171875, 6.9619140625, 7.61181640625, 8.26171875, 8.91162109375, 9.5615234375, 10.21142578125, 10.861328125, 11.51123046875, 12.1611328125, 12.81103515625, 13.4609375, 14.11083984375, 14.7607421875, 15.41064453125, 16.060546875, 16.71044921875, 17.3603515625, 18.01025390625, 18.66015625, 19.31005859375, 19.9599609375, 20.60986328125, 21.259765625, 21.90966796875, 22.5595703125, 23.20947265625, 23.859375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 16.0, 34.0, 44.0, 69.0, 125.0, 359.0, 1357.0, 243383.0, 2897543.0, 1957.0, 420.0, 186.0, 81.0, 52.0, 23.0, 15.0, 9.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.8125, -78.791015625, -75.76953125, -72.748046875, -69.7265625, -66.705078125, -63.68359375, -60.662109375, -57.640625, -54.619140625, -51.59765625, -48.576171875, -45.5546875, -42.533203125, -39.51171875, -36.490234375, -33.46875, -30.447265625, -27.42578125, -24.404296875, -21.3828125, -18.361328125, -15.33984375, -12.318359375, -9.296875, -6.275390625, -3.25390625, -0.232421875, 2.7890625, 5.810546875, 8.83203125, 11.853515625, 14.875, 17.896484375, 20.91796875, 23.939453125, 26.9609375, 29.982421875, 33.00390625, 36.025390625, 39.046875, 42.068359375, 45.08984375, 48.111328125, 51.1328125, 54.154296875, 57.17578125, 60.197265625, 63.21875, 66.240234375, 69.26171875, 72.283203125, 75.3046875, 78.326171875, 81.34765625, 84.369140625, 87.390625, 90.412109375, 93.43359375, 96.455078125, 99.4765625, 102.498046875, 105.51953125, 108.541015625, 111.5625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 814.0, 205.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.352294921875, -50.90937423706055, -24.466453552246094, 1.976470947265625, 28.419387817382812, 54.8623046875, 81.30523681640625, 107.74815368652344, 134.19107055664062, 160.6339874267578, 187.076904296875, 213.51983642578125, 239.96275329589844, 266.4056701660156, 292.8486022949219, 319.29150390625, 345.73443603515625, 372.1773681640625, 398.6202697753906, 425.0632019042969, 451.506103515625, 477.94903564453125, 504.3919677734375, 530.8348999023438, 557.27783203125, 583.7207641601562, 610.1636962890625, 636.6065673828125, 663.0494995117188, 689.492431640625, 715.9353637695312, 742.3782958984375, 768.8211669921875, 795.2640991210938, 821.70703125, 848.14990234375, 874.5928344726562, 901.0357666015625, 927.4786987304688, 953.921630859375, 980.364501953125, 1006.8074340820312, 1033.2503662109375, 1059.6932373046875, 1086.13623046875, 1112.5791015625, 1139.02197265625, 1165.4649658203125, 1191.907958984375, 1218.350830078125, 1244.7938232421875, 1271.2366943359375, 1297.6796875, 1324.12255859375, 1350.5654296875, 1377.0084228515625, 1403.4512939453125, 1429.8941650390625, 1456.337158203125, 1482.780029296875, 1509.2230224609375, 1535.6658935546875, 1562.10888671875, 1588.5517578125, 1614.99462890625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 7.0, 13.0, 3.0, 7.0, 12.0, 10.0, 17.0, 21.0, 18.0, 31.0, 31.0, 32.0, 48.0, 41.0, 42.0, 34.0, 41.0, 50.0, 54.0, 52.0, 42.0, 41.0, 40.0, 44.0, 40.0, 22.0, 32.0, 21.0, 23.0, 24.0, 19.0, 16.0, 13.0, 8.0, 8.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-60.052040100097656, -58.12053680419922, -56.189029693603516, -54.25752639770508, -52.32602310180664, -50.39451599121094, -48.4630126953125, -46.53150939941406, -44.600006103515625, -42.66850280761719, -40.736995697021484, -38.80549240112305, -36.87398910522461, -34.942481994628906, -33.01097869873047, -31.07947540283203, -29.147968292236328, -27.216463088989258, -25.28495979309082, -23.35345458984375, -21.421951293945312, -19.490446090698242, -17.558940887451172, -15.627436637878418, -13.695932388305664, -11.76442813873291, -9.832923889160156, -7.901418685913086, -5.969914436340332, -4.038410186767578, -2.106904983520508, -0.1754007339477539, 1.7560997009277344, 3.6876041889190674, 5.6191086769104, 7.5506134033203125, 9.482117652893066, 11.41362190246582, 13.34512710571289, 15.276631355285645, 17.2081356048584, 19.13964080810547, 21.071144104003906, 23.002649307250977, 24.934154510498047, 26.865657806396484, 28.797163009643555, 30.728668212890625, 32.66017150878906, 34.5916748046875, 36.5231819152832, 38.45468521118164, 40.38618850708008, 42.31769561767578, 44.24919891357422, 46.180702209472656, 48.112205505371094, 50.04370880126953, 51.975215911865234, 53.90671920776367, 55.83822250366211, 57.76972961425781, 59.70123291015625, 61.63273620605469, 63.56424331665039]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 8.0, 8.0, 6.0, 10.0, 7.0, 12.0, 8.0, 11.0, 18.0, 31.0, 23.0, 26.0, 25.0, 30.0, 39.0, 39.0, 29.0, 44.0, 34.0, 51.0, 49.0, 35.0, 50.0, 43.0, 38.0, 33.0, 39.0, 31.0, 24.0, 32.0, 24.0, 27.0, 15.0, 22.0, 19.0, 13.0, 11.0, 11.0, 10.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.92578125, -5.7506103515625, -5.575439453125, -5.4002685546875, -5.22509765625, -5.0499267578125, -4.874755859375, -4.6995849609375, -4.5244140625, -4.3492431640625, -4.174072265625, -3.9989013671875, -3.82373046875, -3.6485595703125, -3.473388671875, -3.2982177734375, -3.123046875, -2.9478759765625, -2.772705078125, -2.5975341796875, -2.42236328125, -2.2471923828125, -2.072021484375, -1.8968505859375, -1.7216796875, -1.5465087890625, -1.371337890625, -1.1961669921875, -1.02099609375, -0.8458251953125, -0.670654296875, -0.4954833984375, -0.3203125, -0.1451416015625, 0.030029296875, 0.2052001953125, 0.38037109375, 0.5555419921875, 0.730712890625, 0.9058837890625, 1.0810546875, 1.2562255859375, 1.431396484375, 1.6065673828125, 1.78173828125, 1.9569091796875, 2.132080078125, 2.3072509765625, 2.482421875, 2.6575927734375, 2.832763671875, 3.0079345703125, 3.18310546875, 3.3582763671875, 3.533447265625, 3.7086181640625, 3.8837890625, 4.0589599609375, 4.234130859375, 4.4093017578125, 4.58447265625, 4.7596435546875, 4.934814453125, 5.1099853515625, 5.28515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 5.0, 7.0, 4.0, 3.0, 9.0, 5.0, 7.0, 17.0, 24.0, 22.0, 35.0, 65.0, 68.0, 141.0, 208.0, 348.0, 581.0, 1234.0, 2526.0, 5502.0, 12741.0, 31814.0, 97446.0, 437358.0, 1608510.0, 1477141.0, 380745.0, 88848.0, 28495.0, 11013.0, 4700.0, 2174.0, 1069.0, 583.0, 306.0, 165.0, 105.0, 78.0, 51.0, 41.0, 25.0, 20.0, 17.0, 4.0, 6.0, 8.0, 2.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.96875, -8.712158203125, -8.45556640625, -8.198974609375, -7.9423828125, -7.685791015625, -7.42919921875, -7.172607421875, -6.916015625, -6.659423828125, -6.40283203125, -6.146240234375, -5.8896484375, -5.633056640625, -5.37646484375, -5.119873046875, -4.86328125, -4.606689453125, -4.35009765625, -4.093505859375, -3.8369140625, -3.580322265625, -3.32373046875, -3.067138671875, -2.810546875, -2.553955078125, -2.29736328125, -2.040771484375, -1.7841796875, -1.527587890625, -1.27099609375, -1.014404296875, -0.7578125, -0.501220703125, -0.24462890625, 0.011962890625, 0.2685546875, 0.525146484375, 0.78173828125, 1.038330078125, 1.294921875, 1.551513671875, 1.80810546875, 2.064697265625, 2.3212890625, 2.577880859375, 2.83447265625, 3.091064453125, 3.34765625, 3.604248046875, 3.86083984375, 4.117431640625, 4.3740234375, 4.630615234375, 4.88720703125, 5.143798828125, 5.400390625, 5.656982421875, 5.91357421875, 6.170166015625, 6.4267578125, 6.683349609375, 6.93994140625, 7.196533203125, 7.453125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 8.0, 3.0, 9.0, 10.0, 14.0, 20.0, 35.0, 35.0, 53.0, 65.0, 118.0, 172.0, 283.0, 442.0, 603.0, 592.0, 480.0, 368.0, 223.0, 169.0, 100.0, 84.0, 47.0, 33.0, 36.0, 24.0, 10.0, 14.0, 10.0, 5.0, 2.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40625, -12.9478759765625, -12.489501953125, -12.0311279296875, -11.57275390625, -11.1143798828125, -10.656005859375, -10.1976318359375, -9.7392578125, -9.2808837890625, -8.822509765625, -8.3641357421875, -7.90576171875, -7.4473876953125, -6.989013671875, -6.5306396484375, -6.072265625, -5.6138916015625, -5.155517578125, -4.6971435546875, -4.23876953125, -3.7803955078125, -3.322021484375, -2.8636474609375, -2.4052734375, -1.9468994140625, -1.488525390625, -1.0301513671875, -0.57177734375, -0.1134033203125, 0.344970703125, 0.8033447265625, 1.26171875, 1.7200927734375, 2.178466796875, 2.6368408203125, 3.09521484375, 3.5535888671875, 4.011962890625, 4.4703369140625, 4.9287109375, 5.3870849609375, 5.845458984375, 6.3038330078125, 6.76220703125, 7.2205810546875, 7.678955078125, 8.1373291015625, 8.595703125, 9.0540771484375, 9.512451171875, 9.9708251953125, 10.42919921875, 10.8875732421875, 11.345947265625, 11.8043212890625, 12.2626953125, 12.7210693359375, 13.179443359375, 13.6378173828125, 14.09619140625, 14.5545654296875, 15.012939453125, 15.4713134765625, 15.9296875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 11.0, 13.0, 14.0, 28.0, 24.0, 56.0, 69.0, 113.0, 147.0, 261.0, 446.0, 1039.0, 2667.0, 10491.0, 58029.0, 565006.0, 3105035.0, 393084.0, 44936.0, 8522.0, 2272.0, 939.0, 411.0, 201.0, 145.0, 86.0, 58.0, 49.0, 31.0, 20.0, 16.0, 16.0, 14.0, 4.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.5, -24.7802734375, -24.060546875, -23.3408203125, -22.62109375, -21.9013671875, -21.181640625, -20.4619140625, -19.7421875, -19.0224609375, -18.302734375, -17.5830078125, -16.86328125, -16.1435546875, -15.423828125, -14.7041015625, -13.984375, -13.2646484375, -12.544921875, -11.8251953125, -11.10546875, -10.3857421875, -9.666015625, -8.9462890625, -8.2265625, -7.5068359375, -6.787109375, -6.0673828125, -5.34765625, -4.6279296875, -3.908203125, -3.1884765625, -2.46875, -1.7490234375, -1.029296875, -0.3095703125, 0.41015625, 1.1298828125, 1.849609375, 2.5693359375, 3.2890625, 4.0087890625, 4.728515625, 5.4482421875, 6.16796875, 6.8876953125, 7.607421875, 8.3271484375, 9.046875, 9.7666015625, 10.486328125, 11.2060546875, 11.92578125, 12.6455078125, 13.365234375, 14.0849609375, 14.8046875, 15.5244140625, 16.244140625, 16.9638671875, 17.68359375, 18.4033203125, 19.123046875, 19.8427734375, 20.5625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 19.0, 43.0, 128.0, 231.0, 260.0, 175.0, 101.0, 41.0, 10.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.78533935546875, -224.9287109375, -220.07208251953125, -215.2154541015625, -210.35882568359375, -205.502197265625, -200.64556884765625, -195.78895568847656, -190.9323272705078, -186.07569885253906, -181.2190704345703, -176.36244201660156, -171.5058135986328, -166.64920043945312, -161.79257202148438, -156.93594360351562, -152.07931518554688, -147.22268676757812, -142.36605834960938, -137.50942993164062, -132.65280151367188, -127.79618072509766, -122.9395523071289, -118.08293151855469, -113.22628784179688, -108.36965942382812, -103.51303100585938, -98.65640258789062, -93.7997817993164, -88.94315338134766, -84.0865249633789, -79.22990417480469, -74.3732681274414, -69.51663970947266, -64.6600112915039, -59.80338668823242, -54.94676208496094, -50.09013366699219, -45.23350524902344, -40.37688064575195, -35.5202522277832, -30.663625717163086, -25.80699920654297, -20.95037078857422, -16.0937442779541, -11.237117767333984, -6.380489349365234, -1.52386474609375, 3.332763671875, 8.189390182495117, 13.04601764678955, 17.902645111083984, 22.7592716217041, 27.61589813232422, 32.47252655029297, 37.32915115356445, 42.1857795715332, 47.04240798950195, 51.89903259277344, 56.75566101074219, 61.61228942871094, 66.46891784667969, 71.32554626464844, 76.18216705322266, 81.0387954711914]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 3.0, 11.0, 4.0, 6.0, 7.0, 10.0, 14.0, 17.0, 21.0, 29.0, 16.0, 25.0, 28.0, 31.0, 51.0, 46.0, 38.0, 38.0, 54.0, 44.0, 40.0, 38.0, 46.0, 29.0, 40.0, 24.0, 26.0, 42.0, 33.0, 31.0, 19.0, 26.0, 13.0, 23.0, 14.0, 8.0, 8.0, 6.0, 5.0, 5.0, 7.0, 6.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-43.00959014892578, -41.74808120727539, -40.486576080322266, -39.225067138671875, -37.96356201171875, -36.70205307006836, -35.440547943115234, -34.179039001464844, -32.91753387451172, -31.65602684020996, -30.394519805908203, -29.133012771606445, -27.871505737304688, -26.60999870300293, -25.348491668701172, -24.08698272705078, -22.825475692749023, -21.563968658447266, -20.302461624145508, -19.04095458984375, -17.779447555541992, -16.517940521240234, -15.25643253326416, -13.994925498962402, -12.733418464660645, -11.471911430358887, -10.210404396057129, -8.948896408081055, -7.687389850616455, -6.425882816314697, -5.164375305175781, -3.9028682708740234, -2.6413612365722656, -1.3798540830612183, -0.1183469295501709, 1.143160343170166, 2.404667377471924, 3.6661744117736816, 4.927681922912598, 6.1891889572143555, 7.450695991516113, 8.712203025817871, 9.973710060119629, 11.235218048095703, 12.496725082397461, 13.758232116699219, 15.019739151000977, 16.281246185302734, 17.542753219604492, 18.80426025390625, 20.065767288208008, 21.327274322509766, 22.588781356811523, 23.85028839111328, 25.111797332763672, 26.373302459716797, 27.634811401367188, 28.896318435668945, 30.157825469970703, 31.41933250427246, 32.68083953857422, 33.94234848022461, 35.203853607177734, 36.465362548828125, 37.72686767578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 2.0, 7.0, 8.0, 16.0, 12.0, 15.0, 20.0, 21.0, 24.0, 29.0, 31.0, 33.0, 29.0, 38.0, 33.0, 38.0, 55.0, 48.0, 46.0, 57.0, 44.0, 47.0, 35.0, 23.0, 42.0, 28.0, 33.0, 29.0, 21.0, 27.0, 18.0, 13.0, 11.0, 14.0, 5.0, 12.0, 7.0, 6.0, 6.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.13671875, -5.95758056640625, -5.7784423828125, -5.59930419921875, -5.420166015625, -5.24102783203125, -5.0618896484375, -4.88275146484375, -4.70361328125, -4.52447509765625, -4.3453369140625, -4.16619873046875, -3.987060546875, -3.80792236328125, -3.6287841796875, -3.44964599609375, -3.2705078125, -3.09136962890625, -2.9122314453125, -2.73309326171875, -2.553955078125, -2.37481689453125, -2.1956787109375, -2.01654052734375, -1.83740234375, -1.65826416015625, -1.4791259765625, -1.29998779296875, -1.120849609375, -0.94171142578125, -0.7625732421875, -0.58343505859375, -0.404296875, -0.22515869140625, -0.0460205078125, 0.13311767578125, 0.312255859375, 0.49139404296875, 0.6705322265625, 0.84967041015625, 1.02880859375, 1.20794677734375, 1.3870849609375, 1.56622314453125, 1.745361328125, 1.92449951171875, 2.1036376953125, 2.28277587890625, 2.4619140625, 2.64105224609375, 2.8201904296875, 2.99932861328125, 3.178466796875, 3.35760498046875, 3.5367431640625, 3.71588134765625, 3.89501953125, 4.07415771484375, 4.2532958984375, 4.43243408203125, 4.611572265625, 4.79071044921875, 4.9698486328125, 5.14898681640625, 5.328125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 13.0, 20.0, 28.0, 43.0, 79.0, 89.0, 135.0, 226.0, 323.0, 420.0, 674.0, 1034.0, 1442.0, 1994.0, 3152.0, 4689.0, 7120.0, 11028.0, 17243.0, 27788.0, 45949.0, 75751.0, 122043.0, 174978.0, 184441.0, 138426.0, 87448.0, 53084.0, 32240.0, 19760.0, 12540.0, 8069.0, 5323.0, 3515.0, 2310.0, 1596.0, 1117.0, 781.0, 509.0, 362.0, 257.0, 165.0, 104.0, 77.0, 55.0, 33.0, 25.0, 14.0, 9.0, 7.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0], "bins": [-0.199951171875, -0.19373130798339844, -0.18751144409179688, -0.1812915802001953, -0.17507171630859375, -0.1688518524169922, -0.16263198852539062, -0.15641212463378906, -0.1501922607421875, -0.14397239685058594, -0.13775253295898438, -0.1315326690673828, -0.12531280517578125, -0.11909294128417969, -0.11287307739257812, -0.10665321350097656, -0.100433349609375, -0.09421348571777344, -0.08799362182617188, -0.08177375793457031, -0.07555389404296875, -0.06933403015136719, -0.06311416625976562, -0.05689430236816406, -0.0506744384765625, -0.04445457458496094, -0.038234710693359375, -0.03201484680175781, -0.02579498291015625, -0.019575119018554688, -0.013355255126953125, -0.0071353912353515625, -0.00091552734375, 0.0053043365478515625, 0.011524200439453125, 0.017744064331054688, 0.02396392822265625, 0.030183792114257812, 0.036403656005859375, 0.04262351989746094, 0.0488433837890625, 0.05506324768066406, 0.061283111572265625, 0.06750297546386719, 0.07372283935546875, 0.07994270324707031, 0.08616256713867188, 0.09238243103027344, 0.098602294921875, 0.10482215881347656, 0.11104202270507812, 0.11726188659667969, 0.12348175048828125, 0.1297016143798828, 0.13592147827148438, 0.14214134216308594, 0.1483612060546875, 0.15458106994628906, 0.16080093383789062, 0.1670207977294922, 0.17324066162109375, 0.1794605255126953, 0.18568038940429688, 0.19190025329589844, 0.1981201171875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 9.0, 4.0, 7.0, 5.0, 15.0, 17.0, 16.0, 20.0, 28.0, 27.0, 36.0, 42.0, 39.0, 52.0, 41.0, 40.0, 49.0, 1069.0, 48.0, 68.0, 48.0, 42.0, 39.0, 47.0, 31.0, 34.0, 23.0, 18.0, 15.0, 22.0, 17.0, 9.0, 10.0, 11.0, 7.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4453125, -4.318572998046875, -4.19183349609375, -4.065093994140625, -3.9383544921875, -3.811614990234375, -3.68487548828125, -3.558135986328125, -3.431396484375, -3.304656982421875, -3.17791748046875, -3.051177978515625, -2.9244384765625, -2.797698974609375, -2.67095947265625, -2.544219970703125, -2.41748046875, -2.290740966796875, -2.16400146484375, -2.037261962890625, -1.9105224609375, -1.783782958984375, -1.65704345703125, -1.530303955078125, -1.403564453125, -1.276824951171875, -1.15008544921875, -1.023345947265625, -0.8966064453125, -0.769866943359375, -0.64312744140625, -0.516387939453125, -0.3896484375, -0.262908935546875, -0.13616943359375, -0.009429931640625, 0.1173095703125, 0.244049072265625, 0.37078857421875, 0.497528076171875, 0.624267578125, 0.751007080078125, 0.87774658203125, 1.004486083984375, 1.1312255859375, 1.257965087890625, 1.38470458984375, 1.511444091796875, 1.63818359375, 1.764923095703125, 1.89166259765625, 2.018402099609375, 2.1451416015625, 2.271881103515625, 2.39862060546875, 2.525360107421875, 2.652099609375, 2.778839111328125, 2.90557861328125, 3.032318115234375, 3.1590576171875, 3.285797119140625, 3.41253662109375, 3.539276123046875, 3.666015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 2.0, 5.0, 6.0, 5.0, 16.0, 18.0, 32.0, 50.0, 67.0, 90.0, 154.0, 226.0, 431.0, 684.0, 953.0, 1517.0, 2518.0, 3931.0, 6319.0, 10213.0, 17493.0, 30721.0, 56139.0, 103474.0, 173920.0, 1271081.0, 176987.0, 105894.0, 57614.0, 31114.0, 17842.0, 10394.0, 6234.0, 4016.0, 2591.0, 1570.0, 1015.0, 685.0, 396.0, 249.0, 161.0, 109.0, 80.0, 38.0, 38.0, 12.0, 17.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2369384765625, -0.2300739288330078, -0.22320938110351562, -0.21634483337402344, -0.20948028564453125, -0.20261573791503906, -0.19575119018554688, -0.1888866424560547, -0.1820220947265625, -0.1751575469970703, -0.16829299926757812, -0.16142845153808594, -0.15456390380859375, -0.14769935607910156, -0.14083480834960938, -0.1339702606201172, -0.127105712890625, -0.12024116516113281, -0.11337661743164062, -0.10651206970214844, -0.09964752197265625, -0.09278297424316406, -0.08591842651367188, -0.07905387878417969, -0.0721893310546875, -0.06532478332519531, -0.058460235595703125, -0.05159568786621094, -0.04473114013671875, -0.03786659240722656, -0.031002044677734375, -0.024137496948242188, -0.01727294921875, -0.010408401489257812, -0.003543853759765625, 0.0033206939697265625, 0.01018524169921875, 0.017049789428710938, 0.023914337158203125, 0.030778884887695312, 0.0376434326171875, 0.04450798034667969, 0.051372528076171875, 0.05823707580566406, 0.06510162353515625, 0.07196617126464844, 0.07883071899414062, 0.08569526672363281, 0.092559814453125, 0.09942436218261719, 0.10628890991210938, 0.11315345764160156, 0.12001800537109375, 0.12688255310058594, 0.13374710083007812, 0.1406116485595703, 0.1474761962890625, 0.1543407440185547, 0.16120529174804688, 0.16806983947753906, 0.17493438720703125, 0.18179893493652344, 0.18866348266601562, 0.1955280303955078, 0.202392578125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 6.0, 3.0, 5.0, 8.0, 9.0, 18.0, 8.0, 17.0, 19.0, 24.0, 34.0, 31.0, 39.0, 51.0, 48.0, 71.0, 61.0, 69.0, 69.0, 54.0, 54.0, 46.0, 56.0, 44.0, 30.0, 31.0, 17.0, 21.0, 10.0, 7.0, 5.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0010089874267578125, -0.0009813979268074036, -0.0009538084268569946, -0.0009262189269065857, -0.0008986294269561768, -0.0008710399270057678, -0.0008434504270553589, -0.00081586092710495, -0.000788271427154541, -0.0007606819272041321, -0.0007330924272537231, -0.0007055029273033142, -0.0006779134273529053, -0.0006503239274024963, -0.0006227344274520874, -0.0005951449275016785, -0.0005675554275512695, -0.0005399659276008606, -0.0005123764276504517, -0.0004847869277000427, -0.0004571974277496338, -0.00042960792779922485, -0.0004020184278488159, -0.000374428927898407, -0.00034683942794799805, -0.0003192499279975891, -0.0002916604280471802, -0.00026407092809677124, -0.0002364814281463623, -0.00020889192819595337, -0.00018130242824554443, -0.0001537129282951355, -0.00012612342834472656, -9.853392839431763e-05, -7.094442844390869e-05, -4.3354928493499756e-05, -1.576542854309082e-05, 1.1824071407318115e-05, 3.941357135772705e-05, 6.700307130813599e-05, 9.459257125854492e-05, 0.00012218207120895386, 0.0001497715711593628, 0.00017736107110977173, 0.00020495057106018066, 0.0002325400710105896, 0.00026012957096099854, 0.00028771907091140747, 0.0003153085708618164, 0.00034289807081222534, 0.0003704875707626343, 0.0003980770707130432, 0.00042566657066345215, 0.0004532560706138611, 0.00048084557056427, 0.000508435070514679, 0.0005360245704650879, 0.0005636140704154968, 0.0005912035703659058, 0.0006187930703163147, 0.0006463825702667236, 0.0006739720702171326, 0.0007015615701675415, 0.0007291510701179504, 0.0007567405700683594]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 7.0, 10.0, 7.0, 19.0, 21.0, 31.0, 44.0, 57.0, 96.0, 130.0, 197.0, 406.0, 1296.0, 33110.0, 947216.0, 63008.0, 1776.0, 443.0, 210.0, 128.0, 78.0, 69.0, 40.0, 35.0, 23.0, 11.0, 19.0, 8.0, 10.0, 6.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01247406005859375, -0.011966347694396973, -0.011458635330200195, -0.010950922966003418, -0.01044321060180664, -0.009935498237609863, -0.009427785873413086, -0.008920073509216309, -0.008412361145019531, -0.007904648780822754, -0.0073969364166259766, -0.006889224052429199, -0.006381511688232422, -0.0058737993240356445, -0.005366086959838867, -0.00485837459564209, -0.0043506622314453125, -0.003842949867248535, -0.003335237503051758, -0.0028275251388549805, -0.002319812774658203, -0.0018121004104614258, -0.0013043880462646484, -0.0007966756820678711, -0.00028896331787109375, 0.0002187490463256836, 0.0007264614105224609, 0.0012341737747192383, 0.0017418861389160156, 0.002249598503112793, 0.0027573108673095703, 0.0032650232315063477, 0.003772735595703125, 0.004280447959899902, 0.00478816032409668, 0.005295872688293457, 0.005803585052490234, 0.006311297416687012, 0.006819009780883789, 0.007326722145080566, 0.007834434509277344, 0.008342146873474121, 0.008849859237670898, 0.009357571601867676, 0.009865283966064453, 0.01037299633026123, 0.010880708694458008, 0.011388421058654785, 0.011896133422851562, 0.01240384578704834, 0.012911558151245117, 0.013419270515441895, 0.013926982879638672, 0.01443469524383545, 0.014942407608032227, 0.015450119972229004, 0.01595783233642578, 0.01646554470062256, 0.016973257064819336, 0.017480969429016113, 0.01798868179321289, 0.018496394157409668, 0.019004106521606445, 0.019511818885803223, 0.02001953125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 38.0, 348.0, 509.0, 109.0, 8.0], "bins": [-0.008204471319913864, -0.008070535026490688, -0.007936597801744938, -0.007802661508321762, -0.007668725214898586, -0.007534788455814123, -0.00740085169672966, -0.007266915403306484, -0.007132978644222021, -0.006999041885137558, -0.006865105591714382, -0.006731168832629919, -0.006597232073545456, -0.00646329578012228, -0.006329359021037817, -0.006195422727614641, -0.006061485968530178, -0.005927549209445715, -0.005793612916022539, -0.005659676156938076, -0.0055257398635149, -0.005391803104430437, -0.005257866345345974, -0.005123930051922798, -0.004989993292838335, -0.004856056533753872, -0.004722120240330696, -0.004588183481246233, -0.00445424672216177, -0.004320310428738594, -0.004186373669654131, -0.004052437376230955, -0.003918501082807779, -0.00378456455655396, -0.0036506280303001404, -0.0035166912712156773, -0.003382754744961858, -0.0032488182187080383, -0.003114881459623575, -0.0029809449333697557, -0.0028470084071159363, -0.002713071880862117, -0.0025791353546082973, -0.0024451985955238342, -0.0023112620692700148, -0.0021773255430161953, -0.002043388783931732, -0.0019094522576779127, -0.0017755156150087714, -0.0016415789723396301, -0.0015076424460858107, -0.0013737059198319912, -0.00123976927716285, -0.0011058326344937086, -0.0009718961082398891, -0.0008379595237784088, -0.0007040229393169284, -0.000570086354855448, -0.00043614977039396763, -0.00030221318593248725, -0.00016827660147100687, -3.434001700952649e-05, 9.959656745195389e-05, 0.00023353315191343427, 0.0003674697072710842]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 1.0, 4.0, 4.0, 10.0, 5.0, 11.0, 11.0, 11.0, 20.0, 23.0, 21.0, 36.0, 31.0, 40.0, 30.0, 38.0, 48.0, 62.0, 36.0, 39.0, 50.0, 54.0, 54.0, 39.0, 53.0, 37.0, 38.0, 27.0, 38.0, 27.0, 19.0, 20.0, 13.0, 8.0, 13.0, 10.0, 8.0, 11.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005189776420593262, -0.0005028657615184784, -0.0004867538809776306, -0.00047064200043678284, -0.00045453011989593506, -0.0004384182393550873, -0.0004223063588142395, -0.0004061944782733917, -0.00039008259773254395, -0.00037397071719169617, -0.0003578588366508484, -0.0003417469561100006, -0.00032563507556915283, -0.00030952319502830505, -0.0002934113144874573, -0.0002772994339466095, -0.0002611875534057617, -0.00024507567286491394, -0.00022896379232406616, -0.00021285191178321838, -0.0001967400312423706, -0.00018062815070152283, -0.00016451627016067505, -0.00014840438961982727, -0.0001322925090789795, -0.00011618062853813171, -0.00010006874799728394, -8.395686745643616e-05, -6.784498691558838e-05, -5.17331063747406e-05, -3.562122583389282e-05, -1.9509345293045044e-05, -3.3974647521972656e-06, 1.2714415788650513e-05, 2.882629632949829e-05, 4.493817687034607e-05, 6.105005741119385e-05, 7.716193795204163e-05, 9.32738184928894e-05, 0.00010938569903373718, 0.00012549757957458496, 0.00014160946011543274, 0.00015772134065628052, 0.0001738332211971283, 0.00018994510173797607, 0.00020605698227882385, 0.00022216886281967163, 0.0002382807433605194, 0.0002543926239013672, 0.00027050450444221497, 0.00028661638498306274, 0.0003027282655239105, 0.0003188401460647583, 0.0003349520266056061, 0.00035106390714645386, 0.00036717578768730164, 0.0003832876682281494, 0.0003993995487689972, 0.00041551142930984497, 0.00043162330985069275, 0.00044773519039154053, 0.0004638470709323883, 0.0004799589514732361, 0.0004960708320140839, 0.0005121827125549316]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 2.0, 7.0, 8.0, 16.0, 12.0, 15.0, 20.0, 21.0, 24.0, 29.0, 31.0, 33.0, 29.0, 38.0, 33.0, 38.0, 55.0, 48.0, 46.0, 57.0, 44.0, 47.0, 35.0, 23.0, 42.0, 28.0, 33.0, 29.0, 21.0, 27.0, 18.0, 13.0, 11.0, 14.0, 5.0, 12.0, 7.0, 6.0, 6.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.13671875, -5.95758056640625, -5.7784423828125, -5.59930419921875, -5.420166015625, -5.24102783203125, -5.0618896484375, -4.88275146484375, -4.70361328125, -4.52447509765625, -4.3453369140625, -4.16619873046875, -3.987060546875, -3.80792236328125, -3.6287841796875, -3.44964599609375, -3.2705078125, -3.09136962890625, -2.9122314453125, -2.73309326171875, -2.553955078125, -2.37481689453125, -2.1956787109375, -2.01654052734375, -1.83740234375, -1.65826416015625, -1.4791259765625, -1.29998779296875, -1.120849609375, -0.94171142578125, -0.7625732421875, -0.58343505859375, -0.404296875, -0.22515869140625, -0.0460205078125, 0.13311767578125, 0.312255859375, 0.49139404296875, 0.6705322265625, 0.84967041015625, 1.02880859375, 1.20794677734375, 1.3870849609375, 1.56622314453125, 1.745361328125, 1.92449951171875, 2.1036376953125, 2.28277587890625, 2.4619140625, 2.64105224609375, 2.8201904296875, 2.99932861328125, 3.178466796875, 3.35760498046875, 3.5367431640625, 3.71588134765625, 3.89501953125, 4.07415771484375, 4.2532958984375, 4.43243408203125, 4.611572265625, 4.79071044921875, 4.9698486328125, 5.14898681640625, 5.328125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 10.0, 16.0, 14.0, 26.0, 42.0, 57.0, 67.0, 121.0, 160.0, 247.0, 344.0, 467.0, 698.0, 1003.0, 1577.0, 2474.0, 3700.0, 6010.0, 9479.0, 15745.0, 26281.0, 46757.0, 91435.0, 226742.0, 336484.0, 131250.0, 61493.0, 33608.0, 19740.0, 11788.0, 7347.0, 4630.0, 2916.0, 1853.0, 1194.0, 859.0, 611.0, 387.0, 298.0, 191.0, 146.0, 87.0, 59.0, 52.0, 29.0, 15.0, 17.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.28515625, -3.183197021484375, -3.08123779296875, -2.979278564453125, -2.8773193359375, -2.775360107421875, -2.67340087890625, -2.571441650390625, -2.469482421875, -2.367523193359375, -2.26556396484375, -2.163604736328125, -2.0616455078125, -1.959686279296875, -1.85772705078125, -1.755767822265625, -1.65380859375, -1.551849365234375, -1.44989013671875, -1.347930908203125, -1.2459716796875, -1.144012451171875, -1.04205322265625, -0.940093994140625, -0.838134765625, -0.736175537109375, -0.63421630859375, -0.532257080078125, -0.4302978515625, -0.328338623046875, -0.22637939453125, -0.124420166015625, -0.0224609375, 0.079498291015625, 0.18145751953125, 0.283416748046875, 0.3853759765625, 0.487335205078125, 0.58929443359375, 0.691253662109375, 0.793212890625, 0.895172119140625, 0.99713134765625, 1.099090576171875, 1.2010498046875, 1.303009033203125, 1.40496826171875, 1.506927490234375, 1.60888671875, 1.710845947265625, 1.81280517578125, 1.914764404296875, 2.0167236328125, 2.118682861328125, 2.22064208984375, 2.322601318359375, 2.424560546875, 2.526519775390625, 2.62847900390625, 2.730438232421875, 2.8323974609375, 2.934356689453125, 3.03631591796875, 3.138275146484375, 3.240234375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 8.0, 9.0, 4.0, 13.0, 9.0, 12.0, 18.0, 17.0, 23.0, 24.0, 34.0, 34.0, 39.0, 36.0, 43.0, 53.0, 47.0, 85.0, 157.0, 1650.0, 182.0, 91.0, 60.0, 53.0, 41.0, 43.0, 35.0, 26.0, 20.0, 27.0, 26.0, 24.0, 18.0, 12.0, 11.0, 12.0, 6.0, 10.0, 5.0, 7.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.40625, -17.803466796875, -17.20068359375, -16.597900390625, -15.9951171875, -15.392333984375, -14.78955078125, -14.186767578125, -13.583984375, -12.981201171875, -12.37841796875, -11.775634765625, -11.1728515625, -10.570068359375, -9.96728515625, -9.364501953125, -8.76171875, -8.158935546875, -7.55615234375, -6.953369140625, -6.3505859375, -5.747802734375, -5.14501953125, -4.542236328125, -3.939453125, -3.336669921875, -2.73388671875, -2.131103515625, -1.5283203125, -0.925537109375, -0.32275390625, 0.280029296875, 0.8828125, 1.485595703125, 2.08837890625, 2.691162109375, 3.2939453125, 3.896728515625, 4.49951171875, 5.102294921875, 5.705078125, 6.307861328125, 6.91064453125, 7.513427734375, 8.1162109375, 8.718994140625, 9.32177734375, 9.924560546875, 10.52734375, 11.130126953125, 11.73291015625, 12.335693359375, 12.9384765625, 13.541259765625, 14.14404296875, 14.746826171875, 15.349609375, 15.952392578125, 16.55517578125, 17.157958984375, 17.7607421875, 18.363525390625, 18.96630859375, 19.569091796875, 20.171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 15.0, 10.0, 22.0, 24.0, 26.0, 54.0, 69.0, 87.0, 113.0, 172.0, 253.0, 461.0, 1529.0, 19974.0, 3085578.0, 34077.0, 1837.0, 483.0, 269.0, 182.0, 111.0, 84.0, 74.0, 52.0, 48.0, 17.0, 23.0, 15.0, 6.0, 14.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.09375, -42.29833984375, -40.5029296875, -38.70751953125, -36.912109375, -35.11669921875, -33.3212890625, -31.52587890625, -29.73046875, -27.93505859375, -26.1396484375, -24.34423828125, -22.548828125, -20.75341796875, -18.9580078125, -17.16259765625, -15.3671875, -13.57177734375, -11.7763671875, -9.98095703125, -8.185546875, -6.39013671875, -4.5947265625, -2.79931640625, -1.00390625, 0.79150390625, 2.5869140625, 4.38232421875, 6.177734375, 7.97314453125, 9.7685546875, 11.56396484375, 13.359375, 15.15478515625, 16.9501953125, 18.74560546875, 20.541015625, 22.33642578125, 24.1318359375, 25.92724609375, 27.72265625, 29.51806640625, 31.3134765625, 33.10888671875, 34.904296875, 36.69970703125, 38.4951171875, 40.29052734375, 42.0859375, 43.88134765625, 45.6767578125, 47.47216796875, 49.267578125, 51.06298828125, 52.8583984375, 54.65380859375, 56.44921875, 58.24462890625, 60.0400390625, 61.83544921875, 63.630859375, 65.42626953125, 67.2216796875, 69.01708984375, 70.8125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 10.0, 43.0, 207.0, 510.0, 200.0, 33.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.089519500732422, -26.931842803955078, -23.774166107177734, -20.61648941040039, -17.458812713623047, -14.301136016845703, -11.14345932006836, -7.985782623291016, -4.828105926513672, -1.6704292297363281, 1.4872474670410156, 4.644924163818359, 7.802600860595703, 10.960277557373047, 14.11795425415039, 17.275630950927734, 20.433307647705078, 23.590984344482422, 26.748661041259766, 29.90633773803711, 33.06401443481445, 36.2216911315918, 39.37936782836914, 42.537044525146484, 45.69472122192383, 48.85239791870117, 52.010074615478516, 55.16775131225586, 58.3254280090332, 61.48310470581055, 64.64077758789062, 67.7984619140625, 70.95613098144531, 74.11380767822266, 77.271484375, 80.42916107177734, 83.58683776855469, 86.74451446533203, 89.90219116210938, 93.05986785888672, 96.21754455566406, 99.3752212524414, 102.53289794921875, 105.6905746459961, 108.84825134277344, 112.00592803955078, 115.16360473632812, 118.32128143310547, 121.47895812988281, 124.63663482666016, 127.7943115234375, 130.95199584960938, 134.1096649169922, 137.267333984375, 140.42501831054688, 143.58270263671875, 146.74037170410156, 149.89804077148438, 153.05572509765625, 156.21340942382812, 159.37107849121094, 162.52874755859375, 165.68643188476562, 168.8441162109375, 172.0017852783203]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 2.0, 8.0, 12.0, 12.0, 19.0, 17.0, 17.0, 12.0, 14.0, 22.0, 20.0, 28.0, 32.0, 27.0, 34.0, 34.0, 44.0, 48.0, 40.0, 26.0, 33.0, 33.0, 48.0, 37.0, 41.0, 32.0, 29.0, 38.0, 34.0, 34.0, 30.0, 17.0, 22.0, 17.0, 9.0, 7.0, 15.0, 3.0, 10.0, 8.0, 11.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-48.972808837890625, -47.49761962890625, -46.02243423461914, -44.547245025634766, -43.072059631347656, -41.59687042236328, -40.121681213378906, -38.6464958190918, -37.17131042480469, -35.69612121582031, -34.2209358215332, -32.74574661254883, -31.27056121826172, -29.795372009277344, -28.3201847076416, -26.84499740600586, -25.369808197021484, -23.894620895385742, -22.41943359375, -20.944244384765625, -19.469058990478516, -17.99386978149414, -16.5186824798584, -15.043495178222656, -13.568307876586914, -12.093120574951172, -10.61793327331543, -9.142745018005371, -7.667557716369629, -6.192370414733887, -4.717182159423828, -3.241994857788086, -1.7668075561523438, -0.29162001609802246, 1.1835675239562988, 2.658755302429199, 4.133942604064941, 5.609129905700684, 7.084318161010742, 8.559505462646484, 10.034692764282227, 11.509880065917969, 12.985067367553711, 14.46025562286377, 15.935442924499512, 17.410629272460938, 18.885818481445312, 20.361005783081055, 21.836193084716797, 23.31138038635254, 24.78656768798828, 26.261756896972656, 27.736942291259766, 29.21213150024414, 30.687318801879883, 32.162506103515625, 33.6376953125, 35.112884521484375, 36.588069915771484, 38.06325912475586, 39.53844451904297, 41.013633728027344, 42.48882293701172, 43.96400833129883, 45.43919372558594]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 2.0, 7.0, 9.0, 9.0, 8.0, 9.0, 23.0, 18.0, 22.0, 18.0, 29.0, 30.0, 27.0, 25.0, 32.0, 25.0, 44.0, 46.0, 40.0, 49.0, 43.0, 61.0, 41.0, 37.0, 41.0, 38.0, 42.0, 22.0, 25.0, 28.0, 23.0, 17.0, 16.0, 22.0, 22.0, 5.0, 8.0, 8.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9765625, -5.796142578125, -5.61572265625, -5.435302734375, -5.2548828125, -5.074462890625, -4.89404296875, -4.713623046875, -4.533203125, -4.352783203125, -4.17236328125, -3.991943359375, -3.8115234375, -3.631103515625, -3.45068359375, -3.270263671875, -3.08984375, -2.909423828125, -2.72900390625, -2.548583984375, -2.3681640625, -2.187744140625, -2.00732421875, -1.826904296875, -1.646484375, -1.466064453125, -1.28564453125, -1.105224609375, -0.9248046875, -0.744384765625, -0.56396484375, -0.383544921875, -0.203125, -0.022705078125, 0.15771484375, 0.338134765625, 0.5185546875, 0.698974609375, 0.87939453125, 1.059814453125, 1.240234375, 1.420654296875, 1.60107421875, 1.781494140625, 1.9619140625, 2.142333984375, 2.32275390625, 2.503173828125, 2.68359375, 2.864013671875, 3.04443359375, 3.224853515625, 3.4052734375, 3.585693359375, 3.76611328125, 3.946533203125, 4.126953125, 4.307373046875, 4.48779296875, 4.668212890625, 4.8486328125, 5.029052734375, 5.20947265625, 5.389892578125, 5.5703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 4.0, 7.0, 7.0, 5.0, 6.0, 13.0, 11.0, 18.0, 11.0, 15.0, 25.0, 34.0, 31.0, 39.0, 61.0, 112.0, 295.0, 1071.0, 5164.0, 37010.0, 669722.0, 3227088.0, 231374.0, 18305.0, 2715.0, 587.0, 198.0, 94.0, 43.0, 42.0, 31.0, 18.0, 25.0, 17.0, 17.0, 13.0, 14.0, 8.0, 10.0, 10.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.515625, -20.870361328125, -20.22509765625, -19.579833984375, -18.9345703125, -18.289306640625, -17.64404296875, -16.998779296875, -16.353515625, -15.708251953125, -15.06298828125, -14.417724609375, -13.7724609375, -13.127197265625, -12.48193359375, -11.836669921875, -11.19140625, -10.546142578125, -9.90087890625, -9.255615234375, -8.6103515625, -7.965087890625, -7.31982421875, -6.674560546875, -6.029296875, -5.384033203125, -4.73876953125, -4.093505859375, -3.4482421875, -2.802978515625, -2.15771484375, -1.512451171875, -0.8671875, -0.221923828125, 0.42333984375, 1.068603515625, 1.7138671875, 2.359130859375, 3.00439453125, 3.649658203125, 4.294921875, 4.940185546875, 5.58544921875, 6.230712890625, 6.8759765625, 7.521240234375, 8.16650390625, 8.811767578125, 9.45703125, 10.102294921875, 10.74755859375, 11.392822265625, 12.0380859375, 12.683349609375, 13.32861328125, 13.973876953125, 14.619140625, 15.264404296875, 15.90966796875, 16.554931640625, 17.2001953125, 17.845458984375, 18.49072265625, 19.135986328125, 19.78125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 8.0, 26.0, 56.0, 65.0, 140.0, 182.0, 357.0, 663.0, 872.0, 723.0, 393.0, 242.0, 139.0, 83.0, 50.0, 23.0, 21.0, 14.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.203125, -24.53173828125, -23.8603515625, -23.18896484375, -22.517578125, -21.84619140625, -21.1748046875, -20.50341796875, -19.83203125, -19.16064453125, -18.4892578125, -17.81787109375, -17.146484375, -16.47509765625, -15.8037109375, -15.13232421875, -14.4609375, -13.78955078125, -13.1181640625, -12.44677734375, -11.775390625, -11.10400390625, -10.4326171875, -9.76123046875, -9.08984375, -8.41845703125, -7.7470703125, -7.07568359375, -6.404296875, -5.73291015625, -5.0615234375, -4.39013671875, -3.71875, -3.04736328125, -2.3759765625, -1.70458984375, -1.033203125, -0.36181640625, 0.3095703125, 0.98095703125, 1.65234375, 2.32373046875, 2.9951171875, 3.66650390625, 4.337890625, 5.00927734375, 5.6806640625, 6.35205078125, 7.0234375, 7.69482421875, 8.3662109375, 9.03759765625, 9.708984375, 10.38037109375, 11.0517578125, 11.72314453125, 12.39453125, 13.06591796875, 13.7373046875, 14.40869140625, 15.080078125, 15.75146484375, 16.4228515625, 17.09423828125, 17.765625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 7.0, 12.0, 15.0, 33.0, 48.0, 87.0, 132.0, 235.0, 515.0, 1261.0, 6114.0, 110035.0, 3712962.0, 348129.0, 11660.0, 1785.0, 631.0, 289.0, 149.0, 90.0, 46.0, 12.0, 16.0, 7.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.9267578125, -32.603515625, -31.2802734375, -29.95703125, -28.6337890625, -27.310546875, -25.9873046875, -24.6640625, -23.3408203125, -22.017578125, -20.6943359375, -19.37109375, -18.0478515625, -16.724609375, -15.4013671875, -14.078125, -12.7548828125, -11.431640625, -10.1083984375, -8.78515625, -7.4619140625, -6.138671875, -4.8154296875, -3.4921875, -2.1689453125, -0.845703125, 0.4775390625, 1.80078125, 3.1240234375, 4.447265625, 5.7705078125, 7.09375, 8.4169921875, 9.740234375, 11.0634765625, 12.38671875, 13.7099609375, 15.033203125, 16.3564453125, 17.6796875, 19.0029296875, 20.326171875, 21.6494140625, 22.97265625, 24.2958984375, 25.619140625, 26.9423828125, 28.265625, 29.5888671875, 30.912109375, 32.2353515625, 33.55859375, 34.8818359375, 36.205078125, 37.5283203125, 38.8515625, 40.1748046875, 41.498046875, 42.8212890625, 44.14453125, 45.4677734375, 46.791015625, 48.1142578125, 49.4375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 13.0, 76.0, 222.0, 374.0, 234.0, 70.0, 20.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.32682037353516, -111.55143737792969, -104.77606201171875, -98.00067901611328, -91.22529602050781, -84.44991302490234, -77.67453002929688, -70.89915466308594, -64.12377166748047, -57.348388671875, -50.5730094909668, -43.797630310058594, -37.022247314453125, -30.246864318847656, -23.471485137939453, -16.69610595703125, -9.920722961425781, -3.1453418731689453, 3.6300392150878906, 10.405420303344727, 17.180801391601562, 23.95618438720703, 30.731563568115234, 37.50694274902344, 44.282325744628906, 51.057708740234375, 57.83308792114258, 64.60846710205078, 71.38385009765625, 78.15923309326172, 84.93461608886719, 91.70999145507812, 98.48538208007812, 105.2607650756836, 112.03614807128906, 118.8115234375, 125.58690643310547, 132.36228942871094, 139.13766479492188, 145.91305541992188, 152.6884307861328, 159.46380615234375, 166.23919677734375, 173.0145721435547, 179.78994750976562, 186.56533813476562, 193.34071350097656, 200.1160888671875, 206.8914794921875, 213.66685485839844, 220.44224548339844, 227.21762084960938, 233.99301147460938, 240.7683868408203, 247.54376220703125, 254.31915283203125, 261.09454345703125, 267.86993408203125, 274.6452941894531, 281.4206848144531, 288.1960754394531, 294.971435546875, 301.746826171875, 308.522216796875, 315.2975769042969]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 18.0, 18.0, 18.0, 16.0, 18.0, 24.0, 27.0, 31.0, 24.0, 38.0, 38.0, 47.0, 46.0, 47.0, 34.0, 54.0, 50.0, 45.0, 55.0, 38.0, 31.0, 44.0, 23.0, 32.0, 26.0, 29.0, 21.0, 16.0, 23.0, 14.0, 9.0, 6.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.972686767578125, -40.52600860595703, -39.07933044433594, -37.63264846801758, -36.185970306396484, -34.73929214477539, -33.29261016845703, -31.845932006835938, -30.399253845214844, -28.95257568359375, -27.505895614624023, -26.059215545654297, -24.612537384033203, -23.16585922241211, -21.719179153442383, -20.272499084472656, -18.825820922851562, -17.37914276123047, -15.932462692260742, -14.485783576965332, -13.039104461669922, -11.592425346374512, -10.145746231079102, -8.699067115783691, -7.252388000488281, -5.805708885192871, -4.359029769897461, -2.912350654602051, -1.4656715393066406, -0.01899242401123047, 1.4276866912841797, 2.87436580657959, 4.321044921875, 5.76772403717041, 7.21440315246582, 8.66108226776123, 10.10776138305664, 11.55444049835205, 13.001119613647461, 14.447798728942871, 15.894477844238281, 17.341156005859375, 18.7878360748291, 20.234516143798828, 21.681194305419922, 23.127872467041016, 24.574552536010742, 26.02123260498047, 27.467910766601562, 28.914588928222656, 30.361268997192383, 31.80794906616211, 33.2546272277832, 34.7013053894043, 36.147987365722656, 37.59466552734375, 39.041343688964844, 40.48802185058594, 41.93470001220703, 43.38138198852539, 44.828060150146484, 46.27473831176758, 47.72142028808594, 49.16809844970703, 50.614776611328125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 11.0, 11.0, 9.0, 11.0, 15.0, 13.0, 19.0, 30.0, 29.0, 38.0, 26.0, 40.0, 39.0, 41.0, 57.0, 55.0, 58.0, 44.0, 51.0, 33.0, 57.0, 33.0, 44.0, 46.0, 30.0, 29.0, 18.0, 21.0, 13.0, 15.0, 13.0, 12.0, 8.0, 12.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27734375, -6.06646728515625, -5.8555908203125, -5.64471435546875, -5.433837890625, -5.22296142578125, -5.0120849609375, -4.80120849609375, -4.59033203125, -4.37945556640625, -4.1685791015625, -3.95770263671875, -3.746826171875, -3.53594970703125, -3.3250732421875, -3.11419677734375, -2.9033203125, -2.69244384765625, -2.4815673828125, -2.27069091796875, -2.059814453125, -1.84893798828125, -1.6380615234375, -1.42718505859375, -1.21630859375, -1.00543212890625, -0.7945556640625, -0.58367919921875, -0.372802734375, -0.16192626953125, 0.0489501953125, 0.25982666015625, 0.470703125, 0.68157958984375, 0.8924560546875, 1.10333251953125, 1.314208984375, 1.52508544921875, 1.7359619140625, 1.94683837890625, 2.15771484375, 2.36859130859375, 2.5794677734375, 2.79034423828125, 3.001220703125, 3.21209716796875, 3.4229736328125, 3.63385009765625, 3.8447265625, 4.05560302734375, 4.2664794921875, 4.47735595703125, 4.688232421875, 4.89910888671875, 5.1099853515625, 5.32086181640625, 5.53173828125, 5.74261474609375, 5.9534912109375, 6.16436767578125, 6.375244140625, 6.58612060546875, 6.7969970703125, 7.00787353515625, 7.21875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 14.0, 16.0, 25.0, 44.0, 61.0, 97.0, 121.0, 267.0, 349.0, 535.0, 852.0, 1439.0, 2131.0, 3274.0, 5096.0, 8097.0, 13212.0, 21970.0, 37884.0, 67483.0, 122632.0, 197775.0, 218365.0, 147900.0, 83940.0, 46302.0, 26438.0, 15702.0, 9671.0, 6020.0, 3918.0, 2460.0, 1657.0, 1039.0, 688.0, 370.0, 244.0, 152.0, 106.0, 63.0, 52.0, 28.0, 22.0, 11.0, 12.0, 6.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.23501014709472656, -0.22722244262695312, -0.2194347381591797, -0.21164703369140625, -0.2038593292236328, -0.19607162475585938, -0.18828392028808594, -0.1804962158203125, -0.17270851135253906, -0.16492080688476562, -0.1571331024169922, -0.14934539794921875, -0.1415576934814453, -0.13376998901367188, -0.12598228454589844, -0.118194580078125, -0.11040687561035156, -0.10261917114257812, -0.09483146667480469, -0.08704376220703125, -0.07925605773925781, -0.07146835327148438, -0.06368064880371094, -0.0558929443359375, -0.04810523986816406, -0.040317535400390625, -0.03252983093261719, -0.02474212646484375, -0.016954421997070312, -0.009166717529296875, -0.0013790130615234375, 0.00640869140625, 0.014196395874023438, 0.021984100341796875, 0.029771804809570312, 0.03755950927734375, 0.04534721374511719, 0.053134918212890625, 0.06092262268066406, 0.0687103271484375, 0.07649803161621094, 0.08428573608398438, 0.09207344055175781, 0.09986114501953125, 0.10764884948730469, 0.11543655395507812, 0.12322425842285156, 0.131011962890625, 0.13879966735839844, 0.14658737182617188, 0.1543750762939453, 0.16216278076171875, 0.1699504852294922, 0.17773818969726562, 0.18552589416503906, 0.1933135986328125, 0.20110130310058594, 0.20888900756835938, 0.2166767120361328, 0.22446441650390625, 0.2322521209716797, 0.24003982543945312, 0.24782752990722656, 0.255615234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 10.0, 9.0, 10.0, 20.0, 19.0, 16.0, 17.0, 26.0, 30.0, 33.0, 33.0, 32.0, 30.0, 34.0, 33.0, 42.0, 40.0, 1057.0, 36.0, 43.0, 33.0, 48.0, 47.0, 41.0, 30.0, 30.0, 21.0, 33.0, 25.0, 17.0, 11.0, 17.0, 13.0, 14.0, 6.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.234375, -3.128662109375, -3.02294921875, -2.917236328125, -2.8115234375, -2.705810546875, -2.60009765625, -2.494384765625, -2.388671875, -2.282958984375, -2.17724609375, -2.071533203125, -1.9658203125, -1.860107421875, -1.75439453125, -1.648681640625, -1.54296875, -1.437255859375, -1.33154296875, -1.225830078125, -1.1201171875, -1.014404296875, -0.90869140625, -0.802978515625, -0.697265625, -0.591552734375, -0.48583984375, -0.380126953125, -0.2744140625, -0.168701171875, -0.06298828125, 0.042724609375, 0.1484375, 0.254150390625, 0.35986328125, 0.465576171875, 0.5712890625, 0.677001953125, 0.78271484375, 0.888427734375, 0.994140625, 1.099853515625, 1.20556640625, 1.311279296875, 1.4169921875, 1.522705078125, 1.62841796875, 1.734130859375, 1.83984375, 1.945556640625, 2.05126953125, 2.156982421875, 2.2626953125, 2.368408203125, 2.47412109375, 2.579833984375, 2.685546875, 2.791259765625, 2.89697265625, 3.002685546875, 3.1083984375, 3.214111328125, 3.31982421875, 3.425537109375, 3.53125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 12.0, 27.0, 34.0, 53.0, 62.0, 105.0, 139.0, 221.0, 341.0, 534.0, 796.0, 1194.0, 1727.0, 2552.0, 3809.0, 5684.0, 8591.0, 13200.0, 20685.0, 32680.0, 52196.0, 84277.0, 128880.0, 841873.0, 542253.0, 128636.0, 83669.0, 51872.0, 32294.0, 20106.0, 12924.0, 8465.0, 5580.0, 3795.0, 2584.0, 1741.0, 1202.0, 792.0, 541.0, 334.0, 232.0, 146.0, 98.0, 68.0, 46.0, 36.0, 23.0, 9.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1684551239013672, -0.16283798217773438, -0.15722084045410156, -0.15160369873046875, -0.14598655700683594, -0.14036941528320312, -0.1347522735595703, -0.1291351318359375, -0.12351799011230469, -0.11790084838867188, -0.11228370666503906, -0.10666656494140625, -0.10104942321777344, -0.09543228149414062, -0.08981513977050781, -0.084197998046875, -0.07858085632324219, -0.07296371459960938, -0.06734657287597656, -0.06172943115234375, -0.05611228942871094, -0.050495147705078125, -0.04487800598144531, -0.0392608642578125, -0.03364372253417969, -0.028026580810546875, -0.022409439086914062, -0.01679229736328125, -0.011175155639648438, -0.005558013916015625, 5.91278076171875e-05, 0.00567626953125, 0.011293411254882812, 0.016910552978515625, 0.022527694702148438, 0.02814483642578125, 0.03376197814941406, 0.039379119873046875, 0.04499626159667969, 0.0506134033203125, 0.05623054504394531, 0.061847686767578125, 0.06746482849121094, 0.07308197021484375, 0.07869911193847656, 0.08431625366210938, 0.08993339538574219, 0.095550537109375, 0.10116767883300781, 0.10678482055664062, 0.11240196228027344, 0.11801910400390625, 0.12363624572753906, 0.12925338745117188, 0.1348705291748047, 0.1404876708984375, 0.1461048126220703, 0.15172195434570312, 0.15733909606933594, 0.16295623779296875, 0.16857337951660156, 0.17419052124023438, 0.1798076629638672, 0.1854248046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 4.0, 7.0, 22.0, 19.0, 38.0, 43.0, 50.0, 88.0, 130.0, 113.0, 131.0, 92.0, 81.0, 48.0, 39.0, 23.0, 15.0, 16.0, 3.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0030002593994140625, -0.002918928861618042, -0.0028375983238220215, -0.002756267786026001, -0.0026749372482299805, -0.00259360671043396, -0.0025122761726379395, -0.002430945634841919, -0.0023496150970458984, -0.002268284559249878, -0.0021869540214538574, -0.002105623483657837, -0.0020242929458618164, -0.001942962408065796, -0.0018616318702697754, -0.0017803013324737549, -0.0016989707946777344, -0.0016176402568817139, -0.0015363097190856934, -0.0014549791812896729, -0.0013736486434936523, -0.0012923181056976318, -0.0012109875679016113, -0.0011296570301055908, -0.0010483264923095703, -0.0009669959545135498, -0.0008856654167175293, -0.0008043348789215088, -0.0007230043411254883, -0.0006416738033294678, -0.0005603432655334473, -0.00047901272773742676, -0.00039768218994140625, -0.00031635165214538574, -0.00023502111434936523, -0.00015369057655334473, -7.236003875732422e-05, 8.970499038696289e-06, 9.03010368347168e-05, 0.0001716315746307373, 0.0002529621124267578, 0.0003342926502227783, 0.00041562318801879883, 0.0004969537258148193, 0.0005782842636108398, 0.0006596148014068604, 0.0007409453392028809, 0.0008222758769989014, 0.0009036064147949219, 0.0009849369525909424, 0.0010662674903869629, 0.0011475980281829834, 0.001228928565979004, 0.0013102591037750244, 0.001391589641571045, 0.0014729201793670654, 0.001554250717163086, 0.0016355812549591064, 0.001716911792755127, 0.0017982423305511475, 0.001879572868347168, 0.0019609034061431885, 0.002042233943939209, 0.0021235644817352295, 0.00220489501953125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 7.0, 6.0, 2.0, 12.0, 16.0, 24.0, 37.0, 61.0, 120.0, 251.0, 979.0, 918380.0, 127502.0, 617.0, 233.0, 111.0, 49.0, 48.0, 30.0, 19.0, 7.0, 9.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043243408203125, -0.04163551330566406, -0.040027618408203125, -0.03841972351074219, -0.03681182861328125, -0.03520393371582031, -0.033596038818359375, -0.03198814392089844, -0.0303802490234375, -0.028772354125976562, -0.027164459228515625, -0.025556564331054688, -0.02394866943359375, -0.022340774536132812, -0.020732879638671875, -0.019124984741210938, -0.01751708984375, -0.015909194946289062, -0.014301300048828125, -0.012693405151367188, -0.01108551025390625, -0.009477615356445312, -0.007869720458984375, -0.0062618255615234375, -0.0046539306640625, -0.0030460357666015625, -0.001438140869140625, 0.0001697540283203125, 0.00177764892578125, 0.0033855438232421875, 0.004993438720703125, 0.0066013336181640625, 0.008209228515625, 0.009817123413085938, 0.011425018310546875, 0.013032913208007812, 0.01464080810546875, 0.016248703002929688, 0.017856597900390625, 0.019464492797851562, 0.0210723876953125, 0.022680282592773438, 0.024288177490234375, 0.025896072387695312, 0.02750396728515625, 0.029111862182617188, 0.030719757080078125, 0.03232765197753906, 0.033935546875, 0.03554344177246094, 0.037151336669921875, 0.03875923156738281, 0.04036712646484375, 0.04197502136230469, 0.043582916259765625, 0.04519081115722656, 0.0467987060546875, 0.04840660095214844, 0.050014495849609375, 0.05162239074707031, 0.05323028564453125, 0.05483818054199219, 0.056446075439453125, 0.05805397033691406, 0.059661865234375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 14.0, 330.0, 652.0, 20.0], "bins": [-0.019747210666537285, -0.01942947320640087, -0.019111737608909607, -0.018794000148773193, -0.01847626455128193, -0.018158527091145515, -0.01784079149365425, -0.017523054033517838, -0.017205318436026573, -0.01688758097589016, -0.016569845378398895, -0.01625210791826248, -0.015934372320771217, -0.015616635791957378, -0.01529889926314354, -0.014981161803007126, -0.014663425274193287, -0.014345688745379448, -0.014027952216565609, -0.01371021568775177, -0.013392479158937931, -0.013074742630124092, -0.012757006101310253, -0.012439269572496414, -0.01212153211236, -0.011803795583546162, -0.011486059054732323, -0.011168322525918484, -0.010850585997104645, -0.010532849468290806, -0.010215112939476967, -0.009897375479340553, -0.009579639881849289, -0.00926190335303545, -0.008944166824221611, -0.008626430295407772, -0.008308693766593933, -0.007990957237780094, -0.007673220243304968, -0.007355483714491129, -0.007037746720016003, -0.006720010191202164, -0.006402273662388325, -0.006084537133574486, -0.005766800604760647, -0.005449064075946808, -0.005131327081471682, -0.004813590552657843, -0.004495854489505291, -0.004178117960691452, -0.003860381431877613, -0.0035426446702331305, -0.0032249081414192915, -0.0029071716126054525, -0.00258943485096097, -0.002271698322147131, -0.0019539615605026484, -0.0016362250316888094, -0.0013184883864596486, -0.0010007517412304878, -0.0006830152124166489, -0.0003652786836028099, -4.754203837364912e-05, 0.00027019460685551167, 0.0005879311356693506]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 9.0, 10.0, 11.0, 17.0, 22.0, 30.0, 16.0, 25.0, 27.0, 33.0, 27.0, 27.0, 37.0, 49.0, 34.0, 34.0, 32.0, 32.0, 38.0, 37.0, 36.0, 48.0, 40.0, 42.0, 30.0, 38.0, 28.0, 28.0, 29.0, 13.0, 23.0, 25.0, 14.0, 9.0, 8.0, 9.0, 4.0, 3.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000812828540802002, -0.0007839063182473183, -0.0007549840956926346, -0.0007260618731379509, -0.0006971396505832672, -0.0006682174280285835, -0.0006392952054738998, -0.0006103729829192162, -0.0005814507603645325, -0.0005525285378098488, -0.0005236063152551651, -0.0004946840927004814, -0.00046576187014579773, -0.00043683964759111404, -0.00040791742503643036, -0.0003789952024817467, -0.000350072979927063, -0.0003211507573723793, -0.0002922285348176956, -0.00026330631226301193, -0.00023438408970832825, -0.00020546186715364456, -0.00017653964459896088, -0.0001476174220442772, -0.0001186951994895935, -8.977297693490982e-05, -6.0850754380226135e-05, -3.192853182554245e-05, -3.0063092708587646e-06, 2.591591328382492e-05, 5.4838135838508606e-05, 8.376035839319229e-05, 0.00011268258094787598, 0.00014160480350255966, 0.00017052702605724335, 0.00019944924861192703, 0.00022837147116661072, 0.0002572936937212944, 0.0002862159162759781, 0.0003151381388306618, 0.00034406036138534546, 0.00037298258394002914, 0.00040190480649471283, 0.0004308270290493965, 0.0004597492516040802, 0.0004886714741587639, 0.0005175936967134476, 0.0005465159192681313, 0.0005754381418228149, 0.0006043603643774986, 0.0006332825869321823, 0.000662204809486866, 0.0006911270320415497, 0.0007200492545962334, 0.000748971477150917, 0.0007778936997056007, 0.0008068159222602844, 0.0008357381448149681, 0.0008646603673696518, 0.0008935825899243355, 0.0009225048124790192, 0.0009514270350337029, 0.0009803492575883865, 0.0010092714801430702, 0.001038193702697754]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 11.0, 11.0, 9.0, 11.0, 15.0, 13.0, 19.0, 30.0, 29.0, 38.0, 26.0, 40.0, 39.0, 41.0, 57.0, 55.0, 58.0, 44.0, 51.0, 33.0, 57.0, 33.0, 44.0, 46.0, 30.0, 29.0, 18.0, 21.0, 13.0, 15.0, 13.0, 12.0, 8.0, 12.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27734375, -6.06646728515625, -5.8555908203125, -5.64471435546875, -5.433837890625, -5.22296142578125, -5.0120849609375, -4.80120849609375, -4.59033203125, -4.37945556640625, -4.1685791015625, -3.95770263671875, -3.746826171875, -3.53594970703125, -3.3250732421875, -3.11419677734375, -2.9033203125, -2.69244384765625, -2.4815673828125, -2.27069091796875, -2.059814453125, -1.84893798828125, -1.6380615234375, -1.42718505859375, -1.21630859375, -1.00543212890625, -0.7945556640625, -0.58367919921875, -0.372802734375, -0.16192626953125, 0.0489501953125, 0.25982666015625, 0.470703125, 0.68157958984375, 0.8924560546875, 1.10333251953125, 1.314208984375, 1.52508544921875, 1.7359619140625, 1.94683837890625, 2.15771484375, 2.36859130859375, 2.5794677734375, 2.79034423828125, 3.001220703125, 3.21209716796875, 3.4229736328125, 3.63385009765625, 3.8447265625, 4.05560302734375, 4.2664794921875, 4.47735595703125, 4.688232421875, 4.89910888671875, 5.1099853515625, 5.32086181640625, 5.53173828125, 5.74261474609375, 5.9534912109375, 6.16436767578125, 6.375244140625, 6.58612060546875, 6.7969970703125, 7.00787353515625, 7.21875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 4.0, 9.0, 17.0, 17.0, 36.0, 47.0, 82.0, 116.0, 157.0, 250.0, 425.0, 706.0, 1223.0, 2244.0, 4474.0, 9466.0, 21204.0, 52809.0, 149474.0, 459954.0, 221224.0, 72266.0, 28422.0, 12046.0, 5563.0, 2710.0, 1369.0, 851.0, 486.0, 325.0, 171.0, 130.0, 88.0, 59.0, 43.0, 27.0, 19.0, 13.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.953125, -4.80596923828125, -4.6588134765625, -4.51165771484375, -4.364501953125, -4.21734619140625, -4.0701904296875, -3.92303466796875, -3.77587890625, -3.62872314453125, -3.4815673828125, -3.33441162109375, -3.187255859375, -3.04010009765625, -2.8929443359375, -2.74578857421875, -2.5986328125, -2.45147705078125, -2.3043212890625, -2.15716552734375, -2.010009765625, -1.86285400390625, -1.7156982421875, -1.56854248046875, -1.42138671875, -1.27423095703125, -1.1270751953125, -0.97991943359375, -0.832763671875, -0.68560791015625, -0.5384521484375, -0.39129638671875, -0.244140625, -0.09698486328125, 0.0501708984375, 0.19732666015625, 0.344482421875, 0.49163818359375, 0.6387939453125, 0.78594970703125, 0.93310546875, 1.08026123046875, 1.2274169921875, 1.37457275390625, 1.521728515625, 1.66888427734375, 1.8160400390625, 1.96319580078125, 2.1103515625, 2.25750732421875, 2.4046630859375, 2.55181884765625, 2.698974609375, 2.84613037109375, 2.9932861328125, 3.14044189453125, 3.28759765625, 3.43475341796875, 3.5819091796875, 3.72906494140625, 3.876220703125, 4.02337646484375, 4.1705322265625, 4.31768798828125, 4.46484375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 12.0, 10.0, 12.0, 25.0, 17.0, 23.0, 28.0, 34.0, 35.0, 55.0, 54.0, 62.0, 86.0, 188.0, 1710.0, 173.0, 85.0, 63.0, 64.0, 46.0, 48.0, 46.0, 33.0, 25.0, 28.0, 19.0, 16.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.09375, -24.34619140625, -23.5986328125, -22.85107421875, -22.103515625, -21.35595703125, -20.6083984375, -19.86083984375, -19.11328125, -18.36572265625, -17.6181640625, -16.87060546875, -16.123046875, -15.37548828125, -14.6279296875, -13.88037109375, -13.1328125, -12.38525390625, -11.6376953125, -10.89013671875, -10.142578125, -9.39501953125, -8.6474609375, -7.89990234375, -7.15234375, -6.40478515625, -5.6572265625, -4.90966796875, -4.162109375, -3.41455078125, -2.6669921875, -1.91943359375, -1.171875, -0.42431640625, 0.3232421875, 1.07080078125, 1.818359375, 2.56591796875, 3.3134765625, 4.06103515625, 4.80859375, 5.55615234375, 6.3037109375, 7.05126953125, 7.798828125, 8.54638671875, 9.2939453125, 10.04150390625, 10.7890625, 11.53662109375, 12.2841796875, 13.03173828125, 13.779296875, 14.52685546875, 15.2744140625, 16.02197265625, 16.76953125, 17.51708984375, 18.2646484375, 19.01220703125, 19.759765625, 20.50732421875, 21.2548828125, 22.00244140625, 22.75]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 14.0, 10.0, 19.0, 43.0, 79.0, 140.0, 253.0, 718.0, 8635.0, 3130730.0, 3974.0, 570.0, 230.0, 120.0, 70.0, 44.0, 29.0, 17.0, 11.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.6875, -89.42578125, -86.1640625, -82.90234375, -79.640625, -76.37890625, -73.1171875, -69.85546875, -66.59375, -63.33203125, -60.0703125, -56.80859375, -53.546875, -50.28515625, -47.0234375, -43.76171875, -40.5, -37.23828125, -33.9765625, -30.71484375, -27.453125, -24.19140625, -20.9296875, -17.66796875, -14.40625, -11.14453125, -7.8828125, -4.62109375, -1.359375, 1.90234375, 5.1640625, 8.42578125, 11.6875, 14.94921875, 18.2109375, 21.47265625, 24.734375, 27.99609375, 31.2578125, 34.51953125, 37.78125, 41.04296875, 44.3046875, 47.56640625, 50.828125, 54.08984375, 57.3515625, 60.61328125, 63.875, 67.13671875, 70.3984375, 73.66015625, 76.921875, 80.18359375, 83.4453125, 86.70703125, 89.96875, 93.23046875, 96.4921875, 99.75390625, 103.015625, 106.27734375, 109.5390625, 112.80078125, 116.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [7.0, 632.0, 378.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.160194396972656, -11.76552963256836, 0.6291351318359375, 13.023799896240234, 25.41846466064453, 37.81312942504883, 50.207794189453125, 62.602455139160156, 74.99712371826172, 87.39178466796875, 99.78645324707031, 112.18112182617188, 124.5757827758789, 136.97044372558594, 149.3651123046875, 161.759765625, 174.15444946289062, 186.5491180419922, 198.94378662109375, 211.33843994140625, 223.7331085205078, 236.12777709960938, 248.52243041992188, 260.9171142578125, 273.311767578125, 285.7064208984375, 298.1011047363281, 310.4957580566406, 322.89044189453125, 335.28509521484375, 347.67974853515625, 360.07440185546875, 372.46905517578125, 384.86370849609375, 397.2583923339844, 409.6530456542969, 422.0477294921875, 434.4423828125, 446.8370361328125, 459.231689453125, 471.6263732910156, 484.0210266113281, 496.41571044921875, 508.81036376953125, 521.2050170898438, 533.5996704101562, 545.994384765625, 558.3890380859375, 570.78369140625, 583.1783447265625, 595.572998046875, 607.9677124023438, 620.3623657226562, 632.7570190429688, 645.1516723632812, 657.5463256835938, 669.9410400390625, 682.335693359375, 694.7303466796875, 707.1250610351562, 719.5197143554688, 731.9143676757812, 744.3090209960938, 756.7036743164062, 769.0983276367188]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 9.0, 9.0, 8.0, 16.0, 12.0, 15.0, 23.0, 19.0, 20.0, 21.0, 26.0, 29.0, 24.0, 25.0, 35.0, 35.0, 34.0, 42.0, 46.0, 35.0, 40.0, 34.0, 34.0, 30.0, 36.0, 38.0, 26.0, 26.0, 27.0, 28.0, 22.0, 18.0, 21.0, 13.0, 13.0, 14.0, 12.0, 10.0, 12.0, 7.0, 9.0, 3.0, 4.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.03321075439453, -47.46977996826172, -45.90634536743164, -44.34291076660156, -42.77947998046875, -41.21604919433594, -39.65261459350586, -38.08917999267578, -36.52574920654297, -34.962318420410156, -33.39888381958008, -31.835451126098633, -30.272018432617188, -28.708585739135742, -27.145153045654297, -25.58172035217285, -24.018287658691406, -22.45485496520996, -20.891422271728516, -19.32798957824707, -17.764556884765625, -16.20112419128418, -14.637691497802734, -13.074258804321289, -11.510826110839844, -9.947393417358398, -8.383960723876953, -6.820528030395508, -5.2570953369140625, -3.693662643432617, -2.130229949951172, -0.5667972564697266, 0.9966354370117188, 2.560068130493164, 4.123500823974609, 5.686933517456055, 7.2503662109375, 8.813798904418945, 10.37723159790039, 11.940664291381836, 13.504096984863281, 15.067529678344727, 16.630962371826172, 18.194395065307617, 19.757827758789062, 21.321260452270508, 22.884693145751953, 24.4481258392334, 26.011558532714844, 27.57499122619629, 29.138423919677734, 30.70185661315918, 32.265289306640625, 33.82872009277344, 35.392154693603516, 36.955589294433594, 38.519020080566406, 40.08245086669922, 41.6458854675293, 43.209320068359375, 44.77275085449219, 46.336181640625, 47.89961624145508, 49.463050842285156, 51.02648162841797]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 6.0, 14.0, 16.0, 10.0, 9.0, 11.0, 18.0, 23.0, 26.0, 27.0, 23.0, 31.0, 42.0, 37.0, 50.0, 38.0, 49.0, 40.0, 63.0, 42.0, 46.0, 44.0, 48.0, 39.0, 40.0, 41.0, 26.0, 18.0, 12.0, 16.0, 18.0, 12.0, 12.0, 15.0, 7.0, 8.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.21099853515625, -5.9962158203125, -5.78143310546875, -5.566650390625, -5.35186767578125, -5.1370849609375, -4.92230224609375, -4.70751953125, -4.49273681640625, -4.2779541015625, -4.06317138671875, -3.848388671875, -3.63360595703125, -3.4188232421875, -3.20404052734375, -2.9892578125, -2.77447509765625, -2.5596923828125, -2.34490966796875, -2.130126953125, -1.91534423828125, -1.7005615234375, -1.48577880859375, -1.27099609375, -1.05621337890625, -0.8414306640625, -0.62664794921875, -0.411865234375, -0.19708251953125, 0.0177001953125, 0.23248291015625, 0.447265625, 0.66204833984375, 0.8768310546875, 1.09161376953125, 1.306396484375, 1.52117919921875, 1.7359619140625, 1.95074462890625, 2.16552734375, 2.38031005859375, 2.5950927734375, 2.80987548828125, 3.024658203125, 3.23944091796875, 3.4542236328125, 3.66900634765625, 3.8837890625, 4.09857177734375, 4.3133544921875, 4.52813720703125, 4.742919921875, 4.95770263671875, 5.1724853515625, 5.38726806640625, 5.60205078125, 5.81683349609375, 6.0316162109375, 6.24639892578125, 6.461181640625, 6.67596435546875, 6.8907470703125, 7.10552978515625, 7.3203125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 8.0, 6.0, 7.0, 12.0, 8.0, 16.0, 21.0, 17.0, 21.0, 36.0, 39.0, 52.0, 135.0, 329.0, 1098.0, 4448.0, 23880.0, 254945.0, 3048754.0, 803402.0, 47426.0, 7231.0, 1534.0, 436.0, 139.0, 66.0, 45.0, 23.0, 23.0, 17.0, 15.0, 26.0, 11.0, 12.0, 8.0, 7.0, 8.0, 4.0, 0.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.734375, -18.10302734375, -17.4716796875, -16.84033203125, -16.208984375, -15.57763671875, -14.9462890625, -14.31494140625, -13.68359375, -13.05224609375, -12.4208984375, -11.78955078125, -11.158203125, -10.52685546875, -9.8955078125, -9.26416015625, -8.6328125, -8.00146484375, -7.3701171875, -6.73876953125, -6.107421875, -5.47607421875, -4.8447265625, -4.21337890625, -3.58203125, -2.95068359375, -2.3193359375, -1.68798828125, -1.056640625, -0.42529296875, 0.2060546875, 0.83740234375, 1.46875, 2.10009765625, 2.7314453125, 3.36279296875, 3.994140625, 4.62548828125, 5.2568359375, 5.88818359375, 6.51953125, 7.15087890625, 7.7822265625, 8.41357421875, 9.044921875, 9.67626953125, 10.3076171875, 10.93896484375, 11.5703125, 12.20166015625, 12.8330078125, 13.46435546875, 14.095703125, 14.72705078125, 15.3583984375, 15.98974609375, 16.62109375, 17.25244140625, 17.8837890625, 18.51513671875, 19.146484375, 19.77783203125, 20.4091796875, 21.04052734375, 21.671875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 11.0, 11.0, 14.0, 27.0, 33.0, 57.0, 121.0, 180.0, 287.0, 487.0, 692.0, 794.0, 533.0, 291.0, 194.0, 122.0, 69.0, 39.0, 36.0, 32.0, 10.0, 11.0, 13.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.909912109375, -19.28857421875, -18.667236328125, -18.0458984375, -17.424560546875, -16.80322265625, -16.181884765625, -15.560546875, -14.939208984375, -14.31787109375, -13.696533203125, -13.0751953125, -12.453857421875, -11.83251953125, -11.211181640625, -10.58984375, -9.968505859375, -9.34716796875, -8.725830078125, -8.1044921875, -7.483154296875, -6.86181640625, -6.240478515625, -5.619140625, -4.997802734375, -4.37646484375, -3.755126953125, -3.1337890625, -2.512451171875, -1.89111328125, -1.269775390625, -0.6484375, -0.027099609375, 0.59423828125, 1.215576171875, 1.8369140625, 2.458251953125, 3.07958984375, 3.700927734375, 4.322265625, 4.943603515625, 5.56494140625, 6.186279296875, 6.8076171875, 7.428955078125, 8.05029296875, 8.671630859375, 9.29296875, 9.914306640625, 10.53564453125, 11.156982421875, 11.7783203125, 12.399658203125, 13.02099609375, 13.642333984375, 14.263671875, 14.885009765625, 15.50634765625, 16.127685546875, 16.7490234375, 17.370361328125, 17.99169921875, 18.613037109375, 19.234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 12.0, 16.0, 25.0, 36.0, 54.0, 95.0, 164.0, 323.0, 850.0, 6119.0, 438657.0, 3717398.0, 27766.0, 1773.0, 514.0, 219.0, 109.0, 55.0, 30.0, 20.0, 19.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.71875, -57.80615234375, -55.8935546875, -53.98095703125, -52.068359375, -50.15576171875, -48.2431640625, -46.33056640625, -44.41796875, -42.50537109375, -40.5927734375, -38.68017578125, -36.767578125, -34.85498046875, -32.9423828125, -31.02978515625, -29.1171875, -27.20458984375, -25.2919921875, -23.37939453125, -21.466796875, -19.55419921875, -17.6416015625, -15.72900390625, -13.81640625, -11.90380859375, -9.9912109375, -8.07861328125, -6.166015625, -4.25341796875, -2.3408203125, -0.42822265625, 1.484375, 3.39697265625, 5.3095703125, 7.22216796875, 9.134765625, 11.04736328125, 12.9599609375, 14.87255859375, 16.78515625, 18.69775390625, 20.6103515625, 22.52294921875, 24.435546875, 26.34814453125, 28.2607421875, 30.17333984375, 32.0859375, 33.99853515625, 35.9111328125, 37.82373046875, 39.736328125, 41.64892578125, 43.5615234375, 45.47412109375, 47.38671875, 49.29931640625, 51.2119140625, 53.12451171875, 55.037109375, 56.94970703125, 58.8623046875, 60.77490234375, 62.6875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 16.0, 58.0, 155.0, 254.0, 241.0, 161.0, 76.0, 35.0, 13.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.9925079345703, -139.9916229248047, -134.99075317382812, -129.9898681640625, -124.98898315429688, -119.98810577392578, -114.98722839355469, -109.98634338378906, -104.98546600341797, -99.98458862304688, -94.98370361328125, -89.98282623291016, -84.98194885253906, -79.98106384277344, -74.98018646240234, -69.97930908203125, -64.97842407226562, -59.977542877197266, -54.976661682128906, -49.97578430175781, -44.97490310668945, -39.974021911621094, -34.97314453125, -29.97226333618164, -24.97138214111328, -19.970500946044922, -14.969621658325195, -9.968741416931152, -4.967861175537109, 0.03302001953125, 5.033899307250977, 10.034778594970703, 15.03564453125, 20.03652572631836, 25.037405014038086, 30.038284301757812, 35.03916549682617, 40.04004669189453, 45.040924072265625, 50.041805267333984, 55.042686462402344, 60.0435676574707, 65.04444885253906, 70.04532623291016, 75.04620361328125, 80.04708862304688, 85.04796600341797, 90.04884338378906, 95.04972839355469, 100.05060577392578, 105.0514907836914, 110.0523681640625, 115.05325317382812, 120.05413055419922, 125.05500793457031, 130.05589294433594, 135.0567626953125, 140.05764770507812, 145.0585174560547, 150.0594024658203, 155.06028747558594, 160.0611572265625, 165.06204223632812, 170.06292724609375, 175.06381225585938]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 8.0, 7.0, 8.0, 6.0, 13.0, 15.0, 14.0, 16.0, 22.0, 24.0, 30.0, 23.0, 39.0, 39.0, 32.0, 38.0, 45.0, 40.0, 37.0, 45.0, 49.0, 39.0, 36.0, 41.0, 50.0, 34.0, 27.0, 34.0, 27.0, 27.0, 27.0, 17.0, 18.0, 15.0, 12.0, 12.0, 15.0, 3.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-44.84051513671875, -43.42477798461914, -42.00904083251953, -40.59330749511719, -39.17757034301758, -37.76183319091797, -36.34609603881836, -34.93035888671875, -33.514625549316406, -32.0988883972168, -30.68315315246582, -29.26741600036621, -27.851680755615234, -26.435943603515625, -25.020206451416016, -23.604469299316406, -22.188732147216797, -20.772994995117188, -19.35725975036621, -17.9415225982666, -16.525787353515625, -15.110050201416016, -13.694313049316406, -12.278576850891113, -10.86284065246582, -9.447104454040527, -8.031368255615234, -6.615631103515625, -5.199894905090332, -3.784158706665039, -2.3684215545654297, -0.9526853561401367, 0.46305084228515625, 1.8787872791290283, 3.2945237159729004, 4.710260391235352, 6.1259965896606445, 7.5417327880859375, 8.957469940185547, 10.37320613861084, 11.788942337036133, 13.204678535461426, 14.620414733886719, 16.036151885986328, 17.451889038085938, 18.867624282836914, 20.283361434936523, 21.6990966796875, 23.11483383178711, 24.53057098388672, 25.946306228637695, 27.362043380737305, 28.77777862548828, 30.19351577758789, 31.6092529296875, 33.02499008178711, 34.44072723388672, 35.85646438598633, 37.27220153808594, 38.68793487548828, 40.10367202758789, 41.5194091796875, 42.93514633178711, 44.35088348388672, 45.76661682128906]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 11.0, 7.0, 10.0, 11.0, 19.0, 21.0, 14.0, 23.0, 27.0, 27.0, 23.0, 33.0, 36.0, 29.0, 47.0, 40.0, 49.0, 55.0, 46.0, 58.0, 36.0, 41.0, 42.0, 35.0, 35.0, 31.0, 33.0, 24.0, 22.0, 23.0, 21.0, 15.0, 9.0, 10.0, 10.0, 5.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.40667724609375, -5.2000732421875, -4.99346923828125, -4.786865234375, -4.58026123046875, -4.3736572265625, -4.16705322265625, -3.96044921875, -3.75384521484375, -3.5472412109375, -3.34063720703125, -3.134033203125, -2.92742919921875, -2.7208251953125, -2.51422119140625, -2.3076171875, -2.10101318359375, -1.8944091796875, -1.68780517578125, -1.481201171875, -1.27459716796875, -1.0679931640625, -0.86138916015625, -0.65478515625, -0.44818115234375, -0.2415771484375, -0.03497314453125, 0.171630859375, 0.37823486328125, 0.5848388671875, 0.79144287109375, 0.998046875, 1.20465087890625, 1.4112548828125, 1.61785888671875, 1.824462890625, 2.03106689453125, 2.2376708984375, 2.44427490234375, 2.65087890625, 2.85748291015625, 3.0640869140625, 3.27069091796875, 3.477294921875, 3.68389892578125, 3.8905029296875, 4.09710693359375, 4.3037109375, 4.51031494140625, 4.7169189453125, 4.92352294921875, 5.130126953125, 5.33673095703125, 5.5433349609375, 5.74993896484375, 5.95654296875, 6.16314697265625, 6.3697509765625, 6.57635498046875, 6.782958984375, 6.98956298828125, 7.1961669921875, 7.40277099609375, 7.609375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 9.0, 10.0, 13.0, 9.0, 32.0, 55.0, 61.0, 84.0, 148.0, 222.0, 346.0, 540.0, 796.0, 1280.0, 1894.0, 3083.0, 5029.0, 7777.0, 12608.0, 20554.0, 34149.0, 58376.0, 102723.0, 167428.0, 212522.0, 168940.0, 102371.0, 58696.0, 34140.0, 20484.0, 12504.0, 7910.0, 5038.0, 3116.0, 1971.0, 1304.0, 807.0, 522.0, 335.0, 249.0, 147.0, 110.0, 57.0, 30.0, 33.0, 24.0, 10.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2349853515625, -0.2272815704345703, -0.21957778930664062, -0.21187400817871094, -0.20417022705078125, -0.19646644592285156, -0.18876266479492188, -0.1810588836669922, -0.1733551025390625, -0.1656513214111328, -0.15794754028320312, -0.15024375915527344, -0.14253997802734375, -0.13483619689941406, -0.12713241577148438, -0.11942863464355469, -0.111724853515625, -0.10402107238769531, -0.09631729125976562, -0.08861351013183594, -0.08090972900390625, -0.07320594787597656, -0.06550216674804688, -0.05779838562011719, -0.0500946044921875, -0.04239082336425781, -0.034687042236328125, -0.026983261108398438, -0.01927947998046875, -0.011575698852539062, -0.003871917724609375, 0.0038318634033203125, 0.01153564453125, 0.019239425659179688, 0.026943206787109375, 0.03464698791503906, 0.04235076904296875, 0.05005455017089844, 0.057758331298828125, 0.06546211242675781, 0.0731658935546875, 0.08086967468261719, 0.08857345581054688, 0.09627723693847656, 0.10398101806640625, 0.11168479919433594, 0.11938858032226562, 0.1270923614501953, 0.134796142578125, 0.1424999237060547, 0.15020370483398438, 0.15790748596191406, 0.16561126708984375, 0.17331504821777344, 0.18101882934570312, 0.1887226104736328, 0.1964263916015625, 0.2041301727294922, 0.21183395385742188, 0.21953773498535156, 0.22724151611328125, 0.23494529724121094, 0.24264907836914062, 0.2503528594970703, 0.258056640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 4.0, 6.0, 9.0, 9.0, 13.0, 22.0, 10.0, 20.0, 21.0, 19.0, 19.0, 23.0, 35.0, 24.0, 32.0, 33.0, 32.0, 30.0, 36.0, 46.0, 32.0, 1070.0, 31.0, 43.0, 29.0, 34.0, 23.0, 37.0, 37.0, 33.0, 35.0, 22.0, 20.0, 20.0, 19.0, 18.0, 17.0, 9.0, 10.0, 5.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.4375, -3.328643798828125, -3.21978759765625, -3.110931396484375, -3.0020751953125, -2.893218994140625, -2.78436279296875, -2.675506591796875, -2.566650390625, -2.457794189453125, -2.34893798828125, -2.240081787109375, -2.1312255859375, -2.022369384765625, -1.91351318359375, -1.804656982421875, -1.69580078125, -1.586944580078125, -1.47808837890625, -1.369232177734375, -1.2603759765625, -1.151519775390625, -1.04266357421875, -0.933807373046875, -0.824951171875, -0.716094970703125, -0.60723876953125, -0.498382568359375, -0.3895263671875, -0.280670166015625, -0.17181396484375, -0.062957763671875, 0.0458984375, 0.154754638671875, 0.26361083984375, 0.372467041015625, 0.4813232421875, 0.590179443359375, 0.69903564453125, 0.807891845703125, 0.916748046875, 1.025604248046875, 1.13446044921875, 1.243316650390625, 1.3521728515625, 1.461029052734375, 1.56988525390625, 1.678741455078125, 1.78759765625, 1.896453857421875, 2.00531005859375, 2.114166259765625, 2.2230224609375, 2.331878662109375, 2.44073486328125, 2.549591064453125, 2.658447265625, 2.767303466796875, 2.87615966796875, 2.985015869140625, 3.0938720703125, 3.202728271484375, 3.31158447265625, 3.420440673828125, 3.529296875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 12.0, 14.0, 25.0, 29.0, 47.0, 82.0, 126.0, 179.0, 257.0, 407.0, 570.0, 850.0, 1384.0, 1997.0, 2911.0, 4393.0, 6682.0, 10074.0, 15419.0, 24455.0, 38788.0, 61144.0, 96189.0, 139594.0, 1218607.0, 156229.0, 112953.0, 73952.0, 46730.0, 29184.0, 18625.0, 11863.0, 7798.0, 5177.0, 3435.0, 2261.0, 1579.0, 1039.0, 662.0, 471.0, 336.0, 182.0, 157.0, 88.0, 70.0, 46.0, 25.0, 9.0, 12.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1844482421875, -0.17844009399414062, -0.17243194580078125, -0.16642379760742188, -0.1604156494140625, -0.15440750122070312, -0.14839935302734375, -0.14239120483398438, -0.136383056640625, -0.13037490844726562, -0.12436676025390625, -0.11835861206054688, -0.1123504638671875, -0.10634231567382812, -0.10033416748046875, -0.09432601928710938, -0.08831787109375, -0.08230972290039062, -0.07630157470703125, -0.07029342651367188, -0.0642852783203125, -0.058277130126953125, -0.05226898193359375, -0.046260833740234375, -0.040252685546875, -0.034244537353515625, -0.02823638916015625, -0.022228240966796875, -0.0162200927734375, -0.010211944580078125, -0.00420379638671875, 0.001804351806640625, 0.0078125, 0.013820648193359375, 0.01982879638671875, 0.025836944580078125, 0.0318450927734375, 0.037853240966796875, 0.04386138916015625, 0.049869537353515625, 0.055877685546875, 0.061885833740234375, 0.06789398193359375, 0.07390213012695312, 0.0799102783203125, 0.08591842651367188, 0.09192657470703125, 0.09793472290039062, 0.10394287109375, 0.10995101928710938, 0.11595916748046875, 0.12196731567382812, 0.1279754638671875, 0.13398361206054688, 0.13999176025390625, 0.14599990844726562, 0.152008056640625, 0.15801620483398438, 0.16402435302734375, 0.17003250122070312, 0.1760406494140625, 0.18204879760742188, 0.18805694580078125, 0.19406509399414062, 0.2000732421875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 5.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 9.0, 10.0, 14.0, 15.0, 11.0, 14.0, 20.0, 31.0, 38.0, 27.0, 30.0, 40.0, 40.0, 43.0, 62.0, 74.0, 48.0, 50.0, 44.0, 58.0, 38.0, 40.0, 37.0, 21.0, 31.0, 30.0, 14.0, 22.0, 10.0, 18.0, 3.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009603500366210938, -0.0009234398603439331, -0.0008865296840667725, -0.0008496195077896118, -0.0008127093315124512, -0.0007757991552352905, -0.0007388889789581299, -0.0007019788026809692, -0.0006650686264038086, -0.000628158450126648, -0.0005912482738494873, -0.0005543380975723267, -0.000517427921295166, -0.00048051774501800537, -0.0004436075687408447, -0.0004066973924636841, -0.00036978721618652344, -0.0003328770399093628, -0.00029596686363220215, -0.0002590566873550415, -0.00022214651107788086, -0.00018523633480072021, -0.00014832615852355957, -0.00011141598224639893, -7.450580596923828e-05, -3.759562969207764e-05, -6.854534149169922e-07, 3.622472286224365e-05, 7.31348991394043e-05, 0.00011004507541656494, 0.00014695525169372559, 0.00018386542797088623, 0.00022077560424804688, 0.0002576857805252075, 0.00029459595680236816, 0.0003315061330795288, 0.00036841630935668945, 0.0004053264856338501, 0.00044223666191101074, 0.0004791468381881714, 0.000516057014465332, 0.0005529671907424927, 0.0005898773670196533, 0.000626787543296814, 0.0006636977195739746, 0.0007006078958511353, 0.0007375180721282959, 0.0007744282484054565, 0.0008113384246826172, 0.0008482486009597778, 0.0008851587772369385, 0.0009220689535140991, 0.0009589791297912598, 0.0009958893060684204, 0.001032799482345581, 0.0010697096586227417, 0.0011066198348999023, 0.001143530011177063, 0.0011804401874542236, 0.0012173503637313843, 0.001254260540008545, 0.0012911707162857056, 0.0013280808925628662, 0.0013649910688400269, 0.0014019012451171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 11.0, 12.0, 14.0, 23.0, 28.0, 31.0, 42.0, 47.0, 62.0, 123.0, 138.0, 329.0, 662.0, 9598.0, 969671.0, 65545.0, 1207.0, 346.0, 195.0, 106.0, 86.0, 66.0, 45.0, 21.0, 36.0, 17.0, 10.0, 15.0, 9.0, 9.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.03033447265625, -0.02955007553100586, -0.02876567840576172, -0.027981281280517578, -0.027196884155273438, -0.026412487030029297, -0.025628089904785156, -0.024843692779541016, -0.024059295654296875, -0.023274898529052734, -0.022490501403808594, -0.021706104278564453, -0.020921707153320312, -0.020137310028076172, -0.01935291290283203, -0.01856851577758789, -0.01778411865234375, -0.01699972152709961, -0.01621532440185547, -0.015430927276611328, -0.014646530151367188, -0.013862133026123047, -0.013077735900878906, -0.012293338775634766, -0.011508941650390625, -0.010724544525146484, -0.009940147399902344, -0.009155750274658203, -0.008371353149414062, -0.007586956024169922, -0.006802558898925781, -0.006018161773681641, -0.0052337646484375, -0.004449367523193359, -0.0036649703979492188, -0.002880573272705078, -0.0020961761474609375, -0.0013117790222167969, -0.0005273818969726562, 0.0002570152282714844, 0.001041412353515625, 0.0018258094787597656, 0.0026102066040039062, 0.003394603729248047, 0.0041790008544921875, 0.004963397979736328, 0.005747795104980469, 0.006532192230224609, 0.00731658935546875, 0.00810098648071289, 0.008885383605957031, 0.009669780731201172, 0.010454177856445312, 0.011238574981689453, 0.012022972106933594, 0.012807369232177734, 0.013591766357421875, 0.014376163482666016, 0.015160560607910156, 0.015944957733154297, 0.016729354858398438, 0.017513751983642578, 0.01829814910888672, 0.01908254623413086, 0.019866943359375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 755.0, 257.0], "bins": [-0.028724489733576775, -0.02826743572950363, -0.02781037986278534, -0.027353325858712196, -0.026896271854639053, -0.02643921785056591, -0.025982161983847618, -0.025525107979774475, -0.025068053975701332, -0.02461099997162819, -0.024153944104909897, -0.023696890100836754, -0.02323983609676361, -0.022782782092690468, -0.022325726225972176, -0.021868672221899033, -0.02141161821782589, -0.020954564213752747, -0.020497508347034454, -0.02004045434296131, -0.01958340033888817, -0.019126346334815025, -0.018669290468096733, -0.01821223646402359, -0.017755182459950447, -0.017298128455877304, -0.016841072589159012, -0.01638401858508587, -0.015926964581012726, -0.015469909645617008, -0.015012855641543865, -0.014555800706148148, -0.01409874577075243, -0.013641690835356712, -0.01318463683128357, -0.012727581895887852, -0.012270527891814709, -0.011813472956418991, -0.011356418952345848, -0.01089936401695013, -0.010442310012876987, -0.00998525507748127, -0.009528201073408127, -0.00907114613801241, -0.008614092133939266, -0.008157037198543549, -0.007699983194470406, -0.007242928259074688, -0.006785873789340258, -0.006328819319605827, -0.005871764849871397, -0.005414710380136967, -0.004957655910402536, -0.004500601440668106, -0.0040435465052723885, -0.003586492268368602, -0.003129438031464815, -0.002672383561730385, -0.0022153290919959545, -0.0017582745058462024, -0.001301220036111772, -0.0008441654499620199, -0.0003871109802275896, 6.99434895068407e-05, 0.0005269980174489319]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 11.0, 16.0, 10.0, 26.0, 25.0, 30.0, 45.0, 42.0, 43.0, 55.0, 50.0, 51.0, 69.0, 46.0, 61.0, 61.0, 69.0, 53.0, 52.0, 45.0, 36.0, 31.0, 20.0, 16.0, 12.0, 11.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009450316429138184, -0.0009102430194616318, -0.0008754543960094452, -0.0008406657725572586, -0.000805877149105072, -0.0007710885256528854, -0.0007362999022006989, -0.0007015112787485123, -0.0006667226552963257, -0.0006319340318441391, -0.0005971454083919525, -0.0005623567849397659, -0.0005275681614875793, -0.0004927795380353928, -0.0004579909145832062, -0.0004232022911310196, -0.000388413667678833, -0.0003536250442266464, -0.00031883642077445984, -0.00028404779732227325, -0.00024925917387008667, -0.00021447055041790009, -0.0001796819269657135, -0.00014489330351352692, -0.00011010468006134033, -7.531605660915375e-05, -4.052743315696716e-05, -5.738809704780579e-06, 2.9049813747406006e-05, 6.383843719959259e-05, 9.862706065177917e-05, 0.00013341568410396576, 0.00016820430755615234, 0.00020299293100833893, 0.0002377815544605255, 0.0002725701779127121, 0.0003073588013648987, 0.00034214742481708527, 0.00037693604826927185, 0.00041172467172145844, 0.000446513295173645, 0.0004813019186258316, 0.0005160905420780182, 0.0005508791655302048, 0.0005856677889823914, 0.0006204564124345779, 0.0006552450358867645, 0.0006900336593389511, 0.0007248222827911377, 0.0007596109062433243, 0.0007943995296955109, 0.0008291881531476974, 0.000863976776599884, 0.0008987654000520706, 0.0009335540235042572, 0.0009683426469564438, 0.0010031312704086304, 0.001037919893860817, 0.0010727085173130035, 0.0011074971407651901, 0.0011422857642173767, 0.0011770743876695633, 0.0012118630111217499, 0.0012466516345739365, 0.001281440258026123]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 11.0, 7.0, 10.0, 11.0, 19.0, 20.0, 15.0, 23.0, 27.0, 27.0, 23.0, 33.0, 36.0, 29.0, 47.0, 40.0, 49.0, 55.0, 46.0, 58.0, 36.0, 41.0, 42.0, 35.0, 35.0, 31.0, 33.0, 24.0, 22.0, 23.0, 21.0, 15.0, 9.0, 10.0, 10.0, 5.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.40667724609375, -5.2000732421875, -4.99346923828125, -4.786865234375, -4.58026123046875, -4.3736572265625, -4.16705322265625, -3.96044921875, -3.75384521484375, -3.5472412109375, -3.34063720703125, -3.134033203125, -2.92742919921875, -2.7208251953125, -2.51422119140625, -2.3076171875, -2.10101318359375, -1.8944091796875, -1.68780517578125, -1.481201171875, -1.27459716796875, -1.0679931640625, -0.86138916015625, -0.65478515625, -0.44818115234375, -0.2415771484375, -0.03497314453125, 0.171630859375, 0.37823486328125, 0.5848388671875, 0.79144287109375, 0.998046875, 1.20465087890625, 1.4112548828125, 1.61785888671875, 1.824462890625, 2.03106689453125, 2.2376708984375, 2.44427490234375, 2.65087890625, 2.85748291015625, 3.0640869140625, 3.27069091796875, 3.477294921875, 3.68389892578125, 3.8905029296875, 4.09710693359375, 4.3037109375, 4.51031494140625, 4.7169189453125, 4.92352294921875, 5.130126953125, 5.33673095703125, 5.5433349609375, 5.74993896484375, 5.95654296875, 6.16314697265625, 6.3697509765625, 6.57635498046875, 6.782958984375, 6.98956298828125, 7.1961669921875, 7.40277099609375, 7.609375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 11.0, 18.0, 29.0, 37.0, 49.0, 79.0, 133.0, 158.0, 246.0, 427.0, 615.0, 936.0, 1369.0, 2132.0, 3116.0, 4829.0, 7990.0, 14050.0, 29911.0, 84293.0, 337739.0, 392054.0, 96564.0, 32979.0, 15156.0, 8522.0, 5313.0, 3339.0, 2202.0, 1419.0, 947.0, 652.0, 386.0, 276.0, 161.0, 139.0, 86.0, 60.0, 38.0, 30.0, 13.0, 15.0, 8.0, 10.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-5.7578125, -5.5887451171875, -5.419677734375, -5.2506103515625, -5.08154296875, -4.9124755859375, -4.743408203125, -4.5743408203125, -4.4052734375, -4.2362060546875, -4.067138671875, -3.8980712890625, -3.72900390625, -3.5599365234375, -3.390869140625, -3.2218017578125, -3.052734375, -2.8836669921875, -2.714599609375, -2.5455322265625, -2.37646484375, -2.2073974609375, -2.038330078125, -1.8692626953125, -1.7001953125, -1.5311279296875, -1.362060546875, -1.1929931640625, -1.02392578125, -0.8548583984375, -0.685791015625, -0.5167236328125, -0.34765625, -0.1785888671875, -0.009521484375, 0.1595458984375, 0.32861328125, 0.4976806640625, 0.666748046875, 0.8358154296875, 1.0048828125, 1.1739501953125, 1.343017578125, 1.5120849609375, 1.68115234375, 1.8502197265625, 2.019287109375, 2.1883544921875, 2.357421875, 2.5264892578125, 2.695556640625, 2.8646240234375, 3.03369140625, 3.2027587890625, 3.371826171875, 3.5408935546875, 3.7099609375, 3.8790283203125, 4.048095703125, 4.2171630859375, 4.38623046875, 4.5552978515625, 4.724365234375, 4.8934326171875, 5.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 6.0, 7.0, 6.0, 5.0, 6.0, 6.0, 17.0, 22.0, 15.0, 30.0, 34.0, 26.0, 27.0, 29.0, 44.0, 37.0, 54.0, 37.0, 69.0, 95.0, 1403.0, 492.0, 108.0, 66.0, 59.0, 59.0, 31.0, 43.0, 43.0, 34.0, 18.0, 22.0, 20.0, 15.0, 13.0, 10.0, 13.0, 9.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.046875, -17.424560546875, -16.80224609375, -16.179931640625, -15.5576171875, -14.935302734375, -14.31298828125, -13.690673828125, -13.068359375, -12.446044921875, -11.82373046875, -11.201416015625, -10.5791015625, -9.956787109375, -9.33447265625, -8.712158203125, -8.08984375, -7.467529296875, -6.84521484375, -6.222900390625, -5.6005859375, -4.978271484375, -4.35595703125, -3.733642578125, -3.111328125, -2.489013671875, -1.86669921875, -1.244384765625, -0.6220703125, 0.000244140625, 0.62255859375, 1.244873046875, 1.8671875, 2.489501953125, 3.11181640625, 3.734130859375, 4.3564453125, 4.978759765625, 5.60107421875, 6.223388671875, 6.845703125, 7.468017578125, 8.09033203125, 8.712646484375, 9.3349609375, 9.957275390625, 10.57958984375, 11.201904296875, 11.82421875, 12.446533203125, 13.06884765625, 13.691162109375, 14.3134765625, 14.935791015625, 15.55810546875, 16.180419921875, 16.802734375, 17.425048828125, 18.04736328125, 18.669677734375, 19.2919921875, 19.914306640625, 20.53662109375, 21.158935546875, 21.78125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 20.0, 18.0, 27.0, 61.0, 119.0, 226.0, 576.0, 3556.0, 3121108.0, 18394.0, 888.0, 306.0, 186.0, 79.0, 45.0, 28.0, 19.0, 10.0, 5.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.4375, -101.7607421875, -98.083984375, -94.4072265625, -90.73046875, -87.0537109375, -83.376953125, -79.7001953125, -76.0234375, -72.3466796875, -68.669921875, -64.9931640625, -61.31640625, -57.6396484375, -53.962890625, -50.2861328125, -46.609375, -42.9326171875, -39.255859375, -35.5791015625, -31.90234375, -28.2255859375, -24.548828125, -20.8720703125, -17.1953125, -13.5185546875, -9.841796875, -6.1650390625, -2.48828125, 1.1884765625, 4.865234375, 8.5419921875, 12.21875, 15.8955078125, 19.572265625, 23.2490234375, 26.92578125, 30.6025390625, 34.279296875, 37.9560546875, 41.6328125, 45.3095703125, 48.986328125, 52.6630859375, 56.33984375, 60.0166015625, 63.693359375, 67.3701171875, 71.046875, 74.7236328125, 78.400390625, 82.0771484375, 85.75390625, 89.4306640625, 93.107421875, 96.7841796875, 100.4609375, 104.1376953125, 107.814453125, 111.4912109375, 115.16796875, 118.8447265625, 122.521484375, 126.1982421875, 129.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 14.0, 37.0, 62.0, 89.0, 125.0, 157.0, 124.0, 122.0, 84.0, 77.0, 57.0, 26.0, 8.0, 8.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.1987190246582, -44.24102783203125, -43.28334045410156, -42.32564926147461, -41.36796188354492, -40.41027069091797, -39.45258331298828, -38.49489212036133, -37.537200927734375, -36.57950973510742, -35.621822357177734, -34.66413116455078, -33.706443786621094, -32.74875259399414, -31.79106330871582, -30.8333740234375, -29.87568473815918, -28.91799545288086, -27.96030616760254, -27.00261688232422, -26.044925689697266, -25.087236404418945, -24.129547119140625, -23.171857833862305, -22.214168548583984, -21.256479263305664, -20.298789978027344, -19.34109878540039, -18.38340950012207, -17.42572021484375, -16.46803092956543, -15.51034164428711, -14.552652359008789, -13.594963073730469, -12.637272834777832, -11.679583549499512, -10.721893310546875, -9.764204025268555, -8.806514739990234, -7.848824977874756, -6.891135215759277, -5.933445453643799, -4.97575569152832, -4.01806640625, -3.0603766441345215, -2.102686882019043, -1.1449975967407227, -0.18730783462524414, 0.7703819274902344, 1.7280715703964233, 2.6857612133026123, 3.6434507369995117, 4.60114049911499, 5.558830261230469, 6.516519546508789, 7.474209308624268, 8.431899070739746, 9.389588356018066, 10.347278594970703, 11.304967880249023, 12.262657165527344, 13.22034740447998, 14.1780366897583, 15.135726928710938, 16.093416213989258]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 2.0, 10.0, 4.0, 11.0, 9.0, 16.0, 11.0, 10.0, 31.0, 18.0, 27.0, 24.0, 25.0, 27.0, 27.0, 31.0, 42.0, 32.0, 31.0, 45.0, 40.0, 53.0, 37.0, 33.0, 29.0, 30.0, 31.0, 39.0, 29.0, 27.0, 33.0, 28.0, 24.0, 16.0, 15.0, 23.0, 11.0, 16.0, 13.0, 5.0, 8.0, 5.0, 2.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-50.047149658203125, -48.50689697265625, -46.966644287109375, -45.4263916015625, -43.88613510131836, -42.345882415771484, -40.80562973022461, -39.265377044677734, -37.72512435913086, -36.184871673583984, -34.64461898803711, -33.10436248779297, -31.564111709594727, -30.02385711669922, -28.483604431152344, -26.94335174560547, -25.40309715270996, -23.862844467163086, -22.322589874267578, -20.782337188720703, -19.242084503173828, -17.701831817626953, -16.161577224731445, -14.62132453918457, -13.081070899963379, -11.540817260742188, -10.000564575195312, -8.460310935974121, -6.920057773590088, -5.379804611206055, -3.8395509719848633, -2.2992982864379883, -0.7590446472167969, 0.7812086343765259, 2.3214619159698486, 3.861715316772461, 5.401968479156494, 6.942221641540527, 8.482475280761719, 10.022727966308594, 11.562981605529785, 13.103235244750977, 14.643487930297852, 16.18374252319336, 17.723995208740234, 19.26424789428711, 20.804500579833984, 22.34475326538086, 23.885007858276367, 25.425260543823242, 26.96551513671875, 28.505767822265625, 30.0460205078125, 31.586273193359375, 33.12652587890625, 34.666778564453125, 36.207035064697266, 37.74728775024414, 39.287540435791016, 40.827796936035156, 42.36804962158203, 43.908302307128906, 45.44855499267578, 46.988807678222656, 48.52906036376953]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 7.0, 4.0, 8.0, 11.0, 12.0, 7.0, 21.0, 19.0, 16.0, 25.0, 22.0, 19.0, 24.0, 20.0, 42.0, 35.0, 49.0, 40.0, 47.0, 48.0, 47.0, 51.0, 44.0, 44.0, 35.0, 35.0, 25.0, 31.0, 27.0, 23.0, 25.0, 25.0, 23.0, 19.0, 12.0, 11.0, 10.0, 10.0, 9.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.4798583984375, -5.272216796875, -5.0645751953125, -4.85693359375, -4.6492919921875, -4.441650390625, -4.2340087890625, -4.0263671875, -3.8187255859375, -3.611083984375, -3.4034423828125, -3.19580078125, -2.9881591796875, -2.780517578125, -2.5728759765625, -2.365234375, -2.1575927734375, -1.949951171875, -1.7423095703125, -1.53466796875, -1.3270263671875, -1.119384765625, -0.9117431640625, -0.7041015625, -0.4964599609375, -0.288818359375, -0.0811767578125, 0.12646484375, 0.3341064453125, 0.541748046875, 0.7493896484375, 0.95703125, 1.1646728515625, 1.372314453125, 1.5799560546875, 1.78759765625, 1.9952392578125, 2.202880859375, 2.4105224609375, 2.6181640625, 2.8258056640625, 3.033447265625, 3.2410888671875, 3.44873046875, 3.6563720703125, 3.864013671875, 4.0716552734375, 4.279296875, 4.4869384765625, 4.694580078125, 4.9022216796875, 5.10986328125, 5.3175048828125, 5.525146484375, 5.7327880859375, 5.9404296875, 6.1480712890625, 6.355712890625, 6.5633544921875, 6.77099609375, 6.9786376953125, 7.186279296875, 7.3939208984375, 7.6015625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 10.0, 3.0, 12.0, 27.0, 20.0, 43.0, 59.0, 106.0, 209.0, 465.0, 818.0, 1720.0, 3606.0, 8796.0, 23817.0, 88292.0, 514979.0, 2034073.0, 1239750.0, 208065.0, 44157.0, 14519.0, 5636.0, 2462.0, 1273.0, 597.0, 326.0, 161.0, 86.0, 54.0, 27.0, 24.0, 21.0, 7.0, 11.0, 9.0, 6.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.1773681640625, -9.823486328125, -9.4696044921875, -9.11572265625, -8.7618408203125, -8.407958984375, -8.0540771484375, -7.7001953125, -7.3463134765625, -6.992431640625, -6.6385498046875, -6.28466796875, -5.9307861328125, -5.576904296875, -5.2230224609375, -4.869140625, -4.5152587890625, -4.161376953125, -3.8074951171875, -3.45361328125, -3.0997314453125, -2.745849609375, -2.3919677734375, -2.0380859375, -1.6842041015625, -1.330322265625, -0.9764404296875, -0.62255859375, -0.2686767578125, 0.085205078125, 0.4390869140625, 0.79296875, 1.1468505859375, 1.500732421875, 1.8546142578125, 2.20849609375, 2.5623779296875, 2.916259765625, 3.2701416015625, 3.6240234375, 3.9779052734375, 4.331787109375, 4.6856689453125, 5.03955078125, 5.3934326171875, 5.747314453125, 6.1011962890625, 6.455078125, 6.8089599609375, 7.162841796875, 7.5167236328125, 7.87060546875, 8.2244873046875, 8.578369140625, 8.9322509765625, 9.2861328125, 9.6400146484375, 9.993896484375, 10.3477783203125, 10.70166015625, 11.0555419921875, 11.409423828125, 11.7633056640625, 12.1171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 7.0, 14.0, 12.0, 10.0, 9.0, 19.0, 27.0, 28.0, 43.0, 50.0, 78.0, 108.0, 157.0, 228.0, 314.0, 440.0, 520.0, 518.0, 408.0, 300.0, 207.0, 146.0, 106.0, 96.0, 67.0, 34.0, 33.0, 20.0, 17.0, 12.0, 10.0, 14.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.6015625, -13.1875, -12.7734375, -12.359375, -11.9453125, -11.53125, -11.1171875, -10.703125, -10.2890625, -9.875, -9.4609375, -9.046875, -8.6328125, -8.21875, -7.8046875, -7.390625, -6.9765625, -6.5625, -6.1484375, -5.734375, -5.3203125, -4.90625, -4.4921875, -4.078125, -3.6640625, -3.25, -2.8359375, -2.421875, -2.0078125, -1.59375, -1.1796875, -0.765625, -0.3515625, 0.0625, 0.4765625, 0.890625, 1.3046875, 1.71875, 2.1328125, 2.546875, 2.9609375, 3.375, 3.7890625, 4.203125, 4.6171875, 5.03125, 5.4453125, 5.859375, 6.2734375, 6.6875, 7.1015625, 7.515625, 7.9296875, 8.34375, 8.7578125, 9.171875, 9.5859375, 10.0, 10.4140625, 10.828125, 11.2421875, 11.65625, 12.0703125, 12.484375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 11.0, 12.0, 15.0, 17.0, 23.0, 25.0, 48.0, 66.0, 97.0, 119.0, 148.0, 259.0, 496.0, 1394.0, 7078.0, 81096.0, 2894375.0, 1164206.0, 38429.0, 4193.0, 999.0, 423.0, 187.0, 134.0, 114.0, 76.0, 49.0, 60.0, 24.0, 22.0, 17.0, 14.0, 15.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-35.84375, -34.6826171875, -33.521484375, -32.3603515625, -31.19921875, -30.0380859375, -28.876953125, -27.7158203125, -26.5546875, -25.3935546875, -24.232421875, -23.0712890625, -21.91015625, -20.7490234375, -19.587890625, -18.4267578125, -17.265625, -16.1044921875, -14.943359375, -13.7822265625, -12.62109375, -11.4599609375, -10.298828125, -9.1376953125, -7.9765625, -6.8154296875, -5.654296875, -4.4931640625, -3.33203125, -2.1708984375, -1.009765625, 0.1513671875, 1.3125, 2.4736328125, 3.634765625, 4.7958984375, 5.95703125, 7.1181640625, 8.279296875, 9.4404296875, 10.6015625, 11.7626953125, 12.923828125, 14.0849609375, 15.24609375, 16.4072265625, 17.568359375, 18.7294921875, 19.890625, 21.0517578125, 22.212890625, 23.3740234375, 24.53515625, 25.6962890625, 26.857421875, 28.0185546875, 29.1796875, 30.3408203125, 31.501953125, 32.6630859375, 33.82421875, 34.9853515625, 36.146484375, 37.3076171875, 38.46875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 11.0, 22.0, 47.0, 106.0, 198.0, 221.0, 220.0, 102.0, 49.0, 23.0, 11.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.36886596679688, -170.2685089111328, -166.16815185546875, -162.06777954101562, -157.96742248535156, -153.8670654296875, -149.76670837402344, -145.66635131835938, -141.56597900390625, -137.4656219482422, -133.36526489257812, -129.264892578125, -125.16453552246094, -121.06417846679688, -116.96382141113281, -112.86346435546875, -108.76310729980469, -104.66275024414062, -100.56238555908203, -96.46202850341797, -92.36166381835938, -88.26130676269531, -84.16094970703125, -80.06059265136719, -75.9602279663086, -71.85987091064453, -67.75950622558594, -63.659149169921875, -59.55878829956055, -55.45842742919922, -51.358070373535156, -47.25770950317383, -43.15734100341797, -39.05698013305664, -34.95661926269531, -30.85626220703125, -26.755901336669922, -22.655540466308594, -18.5551815032959, -14.454822540283203, -10.354461669921875, -6.254101753234863, -2.1537418365478516, 1.9466180801391602, 6.046977996826172, 10.1473388671875, 14.247697830200195, 18.34805679321289, 22.44841766357422, 26.548778533935547, 30.649137496948242, 34.74949645996094, 38.849857330322266, 42.950218200683594, 47.050575256347656, 51.150936126708984, 55.25129699707031, 59.35165786743164, 63.45201873779297, 67.55237579345703, 71.65274047851562, 75.75309753417969, 79.85345458984375, 83.95381164550781, 88.0541763305664]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 7.0, 3.0, 12.0, 11.0, 12.0, 10.0, 15.0, 17.0, 16.0, 14.0, 16.0, 18.0, 26.0, 25.0, 22.0, 32.0, 36.0, 40.0, 33.0, 30.0, 43.0, 46.0, 32.0, 43.0, 39.0, 34.0, 35.0, 27.0, 32.0, 40.0, 19.0, 30.0, 26.0, 21.0, 24.0, 23.0, 21.0, 18.0, 13.0, 9.0, 6.0, 5.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.1571044921875, -33.83487319946289, -32.51264190673828, -31.19040870666504, -29.86817741394043, -28.54594612121582, -27.223712921142578, -25.90148162841797, -24.57925033569336, -23.25701904296875, -21.93478775024414, -20.6125545501709, -19.29032325744629, -17.96809196472168, -16.645858764648438, -15.323627471923828, -14.001396179199219, -12.67916488647461, -11.356932640075684, -10.034700393676758, -8.712469100952148, -7.390237331390381, -6.068005561828613, -4.7457733154296875, -3.423542022705078, -2.1013102531433105, -0.779078483581543, 0.5431532859802246, 1.8653850555419922, 3.1876168251037598, 4.509848594665527, 5.832080841064453, 7.1543121337890625, 8.476543426513672, 9.798775672912598, 11.121007919311523, 12.443239212036133, 13.765470504760742, 15.087702751159668, 16.409934997558594, 17.732166290283203, 19.054397583007812, 20.376628875732422, 21.698862075805664, 23.021093368530273, 24.343324661254883, 25.665557861328125, 26.987789154052734, 28.310020446777344, 29.632251739501953, 30.954483032226562, 32.27671432495117, 33.59894561767578, 34.921180725097656, 36.243412017822266, 37.565643310546875, 38.887874603271484, 40.210105895996094, 41.5323371887207, 42.85456848144531, 44.17680358886719, 45.4990348815918, 46.821266174316406, 48.143497467041016, 49.465728759765625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 8.0, 9.0, 7.0, 12.0, 10.0, 12.0, 18.0, 20.0, 16.0, 21.0, 21.0, 25.0, 19.0, 23.0, 25.0, 26.0, 40.0, 40.0, 35.0, 46.0, 42.0, 55.0, 39.0, 34.0, 43.0, 28.0, 43.0, 34.0, 34.0, 28.0, 16.0, 25.0, 19.0, 20.0, 18.0, 11.0, 11.0, 15.0, 14.0, 8.0, 4.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.61328125, -5.43310546875, -5.2529296875, -5.07275390625, -4.892578125, -4.71240234375, -4.5322265625, -4.35205078125, -4.171875, -3.99169921875, -3.8115234375, -3.63134765625, -3.451171875, -3.27099609375, -3.0908203125, -2.91064453125, -2.73046875, -2.55029296875, -2.3701171875, -2.18994140625, -2.009765625, -1.82958984375, -1.6494140625, -1.46923828125, -1.2890625, -1.10888671875, -0.9287109375, -0.74853515625, -0.568359375, -0.38818359375, -0.2080078125, -0.02783203125, 0.15234375, 0.33251953125, 0.5126953125, 0.69287109375, 0.873046875, 1.05322265625, 1.2333984375, 1.41357421875, 1.59375, 1.77392578125, 1.9541015625, 2.13427734375, 2.314453125, 2.49462890625, 2.6748046875, 2.85498046875, 3.03515625, 3.21533203125, 3.3955078125, 3.57568359375, 3.755859375, 3.93603515625, 4.1162109375, 4.29638671875, 4.4765625, 4.65673828125, 4.8369140625, 5.01708984375, 5.197265625, 5.37744140625, 5.5576171875, 5.73779296875, 5.91796875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 19.0, 25.0, 32.0, 58.0, 68.0, 123.0, 185.0, 225.0, 333.0, 503.0, 776.0, 1121.0, 1675.0, 2493.0, 3524.0, 5527.0, 8410.0, 12255.0, 18770.0, 29755.0, 46974.0, 76042.0, 120553.0, 171668.0, 180762.0, 133842.0, 85291.0, 52742.0, 33077.0, 20793.0, 13653.0, 9205.0, 5736.0, 3990.0, 2728.0, 1806.0, 1212.0, 825.0, 530.0, 386.0, 275.0, 186.0, 148.0, 87.0, 58.0, 30.0, 28.0, 24.0, 12.0, 4.0, 2.0, 7.0, 2.0, 1.0], "bins": [-0.2340087890625, -0.22714996337890625, -0.2202911376953125, -0.21343231201171875, -0.206573486328125, -0.19971466064453125, -0.1928558349609375, -0.18599700927734375, -0.17913818359375, -0.17227935791015625, -0.1654205322265625, -0.15856170654296875, -0.151702880859375, -0.14484405517578125, -0.1379852294921875, -0.13112640380859375, -0.124267578125, -0.11740875244140625, -0.1105499267578125, -0.10369110107421875, -0.096832275390625, -0.08997344970703125, -0.0831146240234375, -0.07625579833984375, -0.06939697265625, -0.06253814697265625, -0.0556793212890625, -0.04882049560546875, -0.041961669921875, -0.03510284423828125, -0.0282440185546875, -0.02138519287109375, -0.0145263671875, -0.00766754150390625, -0.0008087158203125, 0.00605010986328125, 0.012908935546875, 0.01976776123046875, 0.0266265869140625, 0.03348541259765625, 0.04034423828125, 0.04720306396484375, 0.0540618896484375, 0.06092071533203125, 0.067779541015625, 0.07463836669921875, 0.0814971923828125, 0.08835601806640625, 0.09521484375, 0.10207366943359375, 0.1089324951171875, 0.11579132080078125, 0.122650146484375, 0.12950897216796875, 0.1363677978515625, 0.14322662353515625, 0.15008544921875, 0.15694427490234375, 0.1638031005859375, 0.17066192626953125, 0.177520751953125, 0.18437957763671875, 0.1912384033203125, 0.19809722900390625, 0.2049560546875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 6.0, 6.0, 5.0, 9.0, 18.0, 13.0, 7.0, 15.0, 14.0, 15.0, 24.0, 26.0, 19.0, 29.0, 37.0, 31.0, 38.0, 37.0, 34.0, 30.0, 33.0, 33.0, 1049.0, 35.0, 33.0, 40.0, 30.0, 36.0, 29.0, 36.0, 27.0, 22.0, 22.0, 25.0, 19.0, 25.0, 19.0, 12.0, 10.0, 17.0, 4.0, 12.0, 8.0, 6.0, 6.0, 3.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-3.3515625, -3.245941162109375, -3.14031982421875, -3.034698486328125, -2.9290771484375, -2.823455810546875, -2.71783447265625, -2.612213134765625, -2.506591796875, -2.400970458984375, -2.29534912109375, -2.189727783203125, -2.0841064453125, -1.978485107421875, -1.87286376953125, -1.767242431640625, -1.66162109375, -1.555999755859375, -1.45037841796875, -1.344757080078125, -1.2391357421875, -1.133514404296875, -1.02789306640625, -0.922271728515625, -0.816650390625, -0.711029052734375, -0.60540771484375, -0.499786376953125, -0.3941650390625, -0.288543701171875, -0.18292236328125, -0.077301025390625, 0.0283203125, 0.133941650390625, 0.23956298828125, 0.345184326171875, 0.4508056640625, 0.556427001953125, 0.66204833984375, 0.767669677734375, 0.873291015625, 0.978912353515625, 1.08453369140625, 1.190155029296875, 1.2957763671875, 1.401397705078125, 1.50701904296875, 1.612640380859375, 1.71826171875, 1.823883056640625, 1.92950439453125, 2.035125732421875, 2.1407470703125, 2.246368408203125, 2.35198974609375, 2.457611083984375, 2.563232421875, 2.668853759765625, 2.77447509765625, 2.880096435546875, 2.9857177734375, 3.091339111328125, 3.19696044921875, 3.302581787109375, 3.408203125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 12.0, 18.0, 22.0, 44.0, 97.0, 129.0, 163.0, 303.0, 425.0, 581.0, 848.0, 1294.0, 1841.0, 2696.0, 4031.0, 5861.0, 8853.0, 13127.0, 20538.0, 31773.0, 49924.0, 78791.0, 118039.0, 158997.0, 1210787.0, 132763.0, 90731.0, 57875.0, 36964.0, 23414.0, 15194.0, 9960.0, 6776.0, 4499.0, 3074.0, 2139.0, 1494.0, 1020.0, 672.0, 435.0, 327.0, 227.0, 125.0, 88.0, 57.0, 44.0, 29.0, 12.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.18254661560058594, -0.17649459838867188, -0.1704425811767578, -0.16439056396484375, -0.1583385467529297, -0.15228652954101562, -0.14623451232910156, -0.1401824951171875, -0.13413047790527344, -0.12807846069335938, -0.12202644348144531, -0.11597442626953125, -0.10992240905761719, -0.10387039184570312, -0.09781837463378906, -0.091766357421875, -0.08571434020996094, -0.07966232299804688, -0.07361030578613281, -0.06755828857421875, -0.06150627136230469, -0.055454254150390625, -0.04940223693847656, -0.0433502197265625, -0.03729820251464844, -0.031246185302734375, -0.025194168090820312, -0.01914215087890625, -0.013090133666992188, -0.007038116455078125, -0.0009860992431640625, 0.00506591796875, 0.011117935180664062, 0.017169952392578125, 0.023221969604492188, 0.02927398681640625, 0.03532600402832031, 0.041378021240234375, 0.04743003845214844, 0.0534820556640625, 0.05953407287597656, 0.06558609008789062, 0.07163810729980469, 0.07769012451171875, 0.08374214172363281, 0.08979415893554688, 0.09584617614746094, 0.101898193359375, 0.10795021057128906, 0.11400222778320312, 0.12005424499511719, 0.12610626220703125, 0.1321582794189453, 0.13821029663085938, 0.14426231384277344, 0.1503143310546875, 0.15636634826660156, 0.16241836547851562, 0.1684703826904297, 0.17452239990234375, 0.1805744171142578, 0.18662643432617188, 0.19267845153808594, 0.19873046875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 6.0, 4.0, 9.0, 8.0, 15.0, 13.0, 10.0, 25.0, 26.0, 18.0, 25.0, 36.0, 50.0, 41.0, 49.0, 58.0, 55.0, 50.0, 64.0, 57.0, 43.0, 26.0, 39.0, 40.0, 35.0, 29.0, 27.0, 27.0, 18.0, 16.0, 13.0, 18.0, 7.0, 5.0, 8.0, 5.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0011959075927734375, -0.0011632367968559265, -0.0011305660009384155, -0.0010978952050209045, -0.0010652244091033936, -0.0010325536131858826, -0.0009998828172683716, -0.0009672120213508606, -0.0009345412254333496, -0.0009018704295158386, -0.0008691996335983276, -0.0008365288376808167, -0.0008038580417633057, -0.0007711872458457947, -0.0007385164499282837, -0.0007058456540107727, -0.0006731748580932617, -0.0006405040621757507, -0.0006078332662582397, -0.0005751624703407288, -0.0005424916744232178, -0.0005098208785057068, -0.0004771500825881958, -0.0004444792866706848, -0.00041180849075317383, -0.00037913769483566284, -0.00034646689891815186, -0.00031379610300064087, -0.0002811253070831299, -0.0002484545111656189, -0.0002157837152481079, -0.00018311291933059692, -0.00015044212341308594, -0.00011777132749557495, -8.510053157806396e-05, -5.242973566055298e-05, -1.9758939743041992e-05, 1.2911856174468994e-05, 4.558265209197998e-05, 7.825344800949097e-05, 0.00011092424392700195, 0.00014359503984451294, 0.00017626583576202393, 0.0002089366316795349, 0.0002416074275970459, 0.0002742782235145569, 0.00030694901943206787, 0.00033961981534957886, 0.00037229061126708984, 0.00040496140718460083, 0.0004376322031021118, 0.0004703029990196228, 0.0005029737949371338, 0.0005356445908546448, 0.0005683153867721558, 0.0006009861826896667, 0.0006336569786071777, 0.0006663277745246887, 0.0006989985704421997, 0.0007316693663597107, 0.0007643401622772217, 0.0007970109581947327, 0.0008296817541122437, 0.0008623525500297546, 0.0008950233459472656]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 11.0, 5.0, 8.0, 11.0, 15.0, 21.0, 27.0, 22.0, 27.0, 40.0, 43.0, 40.0, 62.0, 69.0, 97.0, 126.0, 279.0, 587.0, 3130.0, 228594.0, 802391.0, 11031.0, 867.0, 341.0, 171.0, 115.0, 85.0, 55.0, 55.0, 30.0, 32.0, 29.0, 15.0, 15.0, 12.0, 22.0, 12.0, 16.0, 9.0, 5.0, 5.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0165863037109375, -0.0160367488861084, -0.015487194061279297, -0.014937639236450195, -0.014388084411621094, -0.013838529586791992, -0.01328897476196289, -0.012739419937133789, -0.012189865112304688, -0.011640310287475586, -0.011090755462646484, -0.010541200637817383, -0.009991645812988281, -0.00944209098815918, -0.008892536163330078, -0.008342981338500977, -0.007793426513671875, -0.0072438716888427734, -0.006694316864013672, -0.00614476203918457, -0.005595207214355469, -0.005045652389526367, -0.004496097564697266, -0.003946542739868164, -0.0033969879150390625, -0.002847433090209961, -0.0022978782653808594, -0.0017483234405517578, -0.0011987686157226562, -0.0006492137908935547, -9.965896606445312e-05, 0.00044989585876464844, 0.00099945068359375, 0.0015490055084228516, 0.002098560333251953, 0.0026481151580810547, 0.0031976699829101562, 0.003747224807739258, 0.004296779632568359, 0.004846334457397461, 0.0053958892822265625, 0.005945444107055664, 0.006494998931884766, 0.007044553756713867, 0.007594108581542969, 0.00814366340637207, 0.008693218231201172, 0.009242773056030273, 0.009792327880859375, 0.010341882705688477, 0.010891437530517578, 0.01144099235534668, 0.011990547180175781, 0.012540102005004883, 0.013089656829833984, 0.013639211654663086, 0.014188766479492188, 0.014738321304321289, 0.01528787612915039, 0.015837430953979492, 0.016386985778808594, 0.016936540603637695, 0.017486095428466797, 0.0180356502532959, 0.018585205078125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 258.0, 707.0, 45.0], "bins": [-0.015550359152257442, -0.015300635248422623, -0.015050911344587803, -0.014801187440752983, -0.014551463536918163, -0.014301739633083344, -0.014052014797925949, -0.01380229089409113, -0.01355256699025631, -0.01330284308642149, -0.01305311918258667, -0.01280339527875185, -0.01255367137491703, -0.012303946539759636, -0.01205422356724739, -0.011804498732089996, -0.011554775759577751, -0.011305051855742931, -0.011055327951908112, -0.010805604048073292, -0.010555880144238472, -0.010306155309081078, -0.010056432336568832, -0.009806707501411438, -0.009556983597576618, -0.009307259693741798, -0.009057535789906979, -0.008807811886072159, -0.008558087982237339, -0.00830836407840252, -0.008058639243245125, -0.007808915805071592, -0.007559190969914198, -0.007309467066079378, -0.007059743162244558, -0.006810018792748451, -0.0065602948889136314, -0.006310570985078812, -0.006060847081243992, -0.005811123177409172, -0.005561398807913065, -0.005311674904078245, -0.005061951000243425, -0.004812226630747318, -0.0045625027269124985, -0.004312778823077679, -0.004063054919242859, -0.003813331015408039, -0.0035636071115732193, -0.0033138832077383995, -0.003064159071072936, -0.0028144351672381163, -0.002564711030572653, -0.002314987126737833, -0.0020652632229030132, -0.0018155392026528716, -0.0015658150659874082, -0.0013160910457372665, -0.0010663671419024467, -0.0008166431216523051, -0.0005669191014021635, -0.0003171950811520219, -6.747117731720209e-05, 0.00018225284293293953, 0.00043197686318308115]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 12.0, 7.0, 15.0, 25.0, 15.0, 24.0, 23.0, 31.0, 26.0, 32.0, 42.0, 46.0, 50.0, 57.0, 46.0, 56.0, 52.0, 63.0, 63.0, 47.0, 48.0, 30.0, 29.0, 31.0, 30.0, 14.0, 22.0, 15.0, 11.0, 5.0, 15.0, 10.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000784754753112793, -0.0007599294185638428, -0.0007351040840148926, -0.0007102787494659424, -0.0006854534149169922, -0.000660628080368042, -0.0006358027458190918, -0.0006109774112701416, -0.0005861520767211914, -0.0005613267421722412, -0.000536501407623291, -0.0005116760730743408, -0.0004868507385253906, -0.00046202540397644043, -0.00043720006942749023, -0.00041237473487854004, -0.00038754940032958984, -0.00036272406578063965, -0.00033789873123168945, -0.00031307339668273926, -0.00028824806213378906, -0.00026342272758483887, -0.00023859739303588867, -0.00021377205848693848, -0.00018894672393798828, -0.00016412138938903809, -0.0001392960548400879, -0.0001144707202911377, -8.96453857421875e-05, -6.48200511932373e-05, -3.999471664428711e-05, -1.5169382095336914e-05, 9.655952453613281e-06, 3.4481287002563477e-05, 5.930662155151367e-05, 8.413195610046387e-05, 0.00010895729064941406, 0.00013378262519836426, 0.00015860795974731445, 0.00018343329429626465, 0.00020825862884521484, 0.00023308396339416504, 0.00025790929794311523, 0.00028273463249206543, 0.0003075599670410156, 0.0003323853015899658, 0.000357210636138916, 0.0003820359706878662, 0.0004068613052368164, 0.0004316866397857666, 0.0004565119743347168, 0.000481337308883667, 0.0005061626434326172, 0.0005309879779815674, 0.0005558133125305176, 0.0005806386470794678, 0.000605463981628418, 0.0006302893161773682, 0.0006551146507263184, 0.0006799399852752686, 0.0007047653198242188, 0.0007295906543731689, 0.0007544159889221191, 0.0007792413234710693, 0.0008040666580200195]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 9.0, 7.0, 10.0, 12.0, 12.0, 18.0, 20.0, 16.0, 21.0, 20.0, 25.0, 20.0, 23.0, 25.0, 26.0, 39.0, 41.0, 35.0, 46.0, 42.0, 55.0, 39.0, 34.0, 42.0, 29.0, 42.0, 35.0, 34.0, 28.0, 16.0, 25.0, 20.0, 19.0, 18.0, 11.0, 11.0, 15.0, 14.0, 8.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6171875, -5.43695068359375, -5.2567138671875, -5.07647705078125, -4.896240234375, -4.71600341796875, -4.5357666015625, -4.35552978515625, -4.17529296875, -3.99505615234375, -3.8148193359375, -3.63458251953125, -3.454345703125, -3.27410888671875, -3.0938720703125, -2.91363525390625, -2.7333984375, -2.55316162109375, -2.3729248046875, -2.19268798828125, -2.012451171875, -1.83221435546875, -1.6519775390625, -1.47174072265625, -1.29150390625, -1.11126708984375, -0.9310302734375, -0.75079345703125, -0.570556640625, -0.39031982421875, -0.2100830078125, -0.02984619140625, 0.150390625, 0.33062744140625, 0.5108642578125, 0.69110107421875, 0.871337890625, 1.05157470703125, 1.2318115234375, 1.41204833984375, 1.59228515625, 1.77252197265625, 1.9527587890625, 2.13299560546875, 2.313232421875, 2.49346923828125, 2.6737060546875, 2.85394287109375, 3.0341796875, 3.21441650390625, 3.3946533203125, 3.57489013671875, 3.755126953125, 3.93536376953125, 4.1156005859375, 4.29583740234375, 4.47607421875, 4.65631103515625, 4.8365478515625, 5.01678466796875, 5.197021484375, 5.37725830078125, 5.5574951171875, 5.73773193359375, 5.91796875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 9.0, 10.0, 16.0, 15.0, 26.0, 33.0, 51.0, 73.0, 112.0, 172.0, 218.0, 378.0, 551.0, 958.0, 1389.0, 2169.0, 4015.0, 7543.0, 16719.0, 49234.0, 223808.0, 560839.0, 121653.0, 32134.0, 12237.0, 5619.0, 3224.0, 1879.0, 1195.0, 801.0, 479.0, 315.0, 221.0, 167.0, 67.0, 66.0, 37.0, 29.0, 25.0, 14.0, 15.0, 4.0, 9.0, 3.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.7578125, -5.57965087890625, -5.4014892578125, -5.22332763671875, -5.045166015625, -4.86700439453125, -4.6888427734375, -4.51068115234375, -4.33251953125, -4.15435791015625, -3.9761962890625, -3.79803466796875, -3.619873046875, -3.44171142578125, -3.2635498046875, -3.08538818359375, -2.9072265625, -2.72906494140625, -2.5509033203125, -2.37274169921875, -2.194580078125, -2.01641845703125, -1.8382568359375, -1.66009521484375, -1.48193359375, -1.30377197265625, -1.1256103515625, -0.94744873046875, -0.769287109375, -0.59112548828125, -0.4129638671875, -0.23480224609375, -0.056640625, 0.12152099609375, 0.2996826171875, 0.47784423828125, 0.656005859375, 0.83416748046875, 1.0123291015625, 1.19049072265625, 1.36865234375, 1.54681396484375, 1.7249755859375, 1.90313720703125, 2.081298828125, 2.25946044921875, 2.4376220703125, 2.61578369140625, 2.7939453125, 2.97210693359375, 3.1502685546875, 3.32843017578125, 3.506591796875, 3.68475341796875, 3.8629150390625, 4.04107666015625, 4.21923828125, 4.39739990234375, 4.5755615234375, 4.75372314453125, 4.931884765625, 5.11004638671875, 5.2882080078125, 5.46636962890625, 5.64453125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 17.0, 5.0, 21.0, 23.0, 22.0, 30.0, 26.0, 23.0, 36.0, 33.0, 35.0, 47.0, 46.0, 57.0, 98.0, 1520.0, 449.0, 110.0, 64.0, 43.0, 35.0, 41.0, 30.0, 32.0, 35.0, 25.0, 19.0, 19.0, 15.0, 16.0, 10.0, 18.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.234375, -21.598876953125, -20.96337890625, -20.327880859375, -19.6923828125, -19.056884765625, -18.42138671875, -17.785888671875, -17.150390625, -16.514892578125, -15.87939453125, -15.243896484375, -14.6083984375, -13.972900390625, -13.33740234375, -12.701904296875, -12.06640625, -11.430908203125, -10.79541015625, -10.159912109375, -9.5244140625, -8.888916015625, -8.25341796875, -7.617919921875, -6.982421875, -6.346923828125, -5.71142578125, -5.075927734375, -4.4404296875, -3.804931640625, -3.16943359375, -2.533935546875, -1.8984375, -1.262939453125, -0.62744140625, 0.008056640625, 0.6435546875, 1.279052734375, 1.91455078125, 2.550048828125, 3.185546875, 3.821044921875, 4.45654296875, 5.092041015625, 5.7275390625, 6.363037109375, 6.99853515625, 7.634033203125, 8.26953125, 8.905029296875, 9.54052734375, 10.176025390625, 10.8115234375, 11.447021484375, 12.08251953125, 12.718017578125, 13.353515625, 13.989013671875, 14.62451171875, 15.260009765625, 15.8955078125, 16.531005859375, 17.16650390625, 17.802001953125, 18.4375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 24.0, 20.0, 28.0, 27.0, 40.0, 65.0, 102.0, 139.0, 216.0, 338.0, 813.0, 9978.0, 3111454.0, 20230.0, 1063.0, 377.0, 224.0, 165.0, 99.0, 58.0, 58.0, 40.0, 34.0, 16.0, 19.0, 13.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.84375, -50.99560546875, -49.1474609375, -47.29931640625, -45.451171875, -43.60302734375, -41.7548828125, -39.90673828125, -38.05859375, -36.21044921875, -34.3623046875, -32.51416015625, -30.666015625, -28.81787109375, -26.9697265625, -25.12158203125, -23.2734375, -21.42529296875, -19.5771484375, -17.72900390625, -15.880859375, -14.03271484375, -12.1845703125, -10.33642578125, -8.48828125, -6.64013671875, -4.7919921875, -2.94384765625, -1.095703125, 0.75244140625, 2.6005859375, 4.44873046875, 6.296875, 8.14501953125, 9.9931640625, 11.84130859375, 13.689453125, 15.53759765625, 17.3857421875, 19.23388671875, 21.08203125, 22.93017578125, 24.7783203125, 26.62646484375, 28.474609375, 30.32275390625, 32.1708984375, 34.01904296875, 35.8671875, 37.71533203125, 39.5634765625, 41.41162109375, 43.259765625, 45.10791015625, 46.9560546875, 48.80419921875, 50.65234375, 52.50048828125, 54.3486328125, 56.19677734375, 58.044921875, 59.89306640625, 61.7412109375, 63.58935546875, 65.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 41.0, 550.0, 406.0, 17.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.66655731201172, -20.241098403930664, -16.81563949584961, -13.390178680419922, -9.964719772338867, -6.5392608642578125, -3.113800048828125, 0.3116588592529297, 3.7371177673339844, 7.162577152252197, 10.58803653717041, 14.013496398925781, 17.438955307006836, 20.86441421508789, 24.289875030517578, 27.715333938598633, 31.140792846679688, 34.566253662109375, 37.9917106628418, 41.417171478271484, 44.842628479003906, 48.268089294433594, 51.69355010986328, 55.11901092529297, 58.54446792602539, 61.96992874145508, 65.3953857421875, 68.82084655761719, 72.24630737304688, 75.67176818847656, 79.09722900390625, 82.5226821899414, 85.94815063476562, 89.37361145019531, 92.799072265625, 96.22453308105469, 99.64998626708984, 103.07544708251953, 106.50090789794922, 109.9263687133789, 113.35182189941406, 116.77728271484375, 120.20274353027344, 123.62820434570312, 127.05365753173828, 130.4791259765625, 133.90457153320312, 137.3300323486328, 140.7554931640625, 144.1809539794922, 147.60641479492188, 151.03187561035156, 154.45733642578125, 157.88278198242188, 161.30825805664062, 164.73370361328125, 168.1591796875, 171.5846405029297, 175.01010131835938, 178.43556213378906, 181.86102294921875, 185.28646850585938, 188.71194458007812, 192.13739013671875, 195.56285095214844]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 12.0, 11.0, 5.0, 9.0, 12.0, 19.0, 16.0, 21.0, 24.0, 23.0, 28.0, 30.0, 43.0, 31.0, 38.0, 35.0, 43.0, 38.0, 39.0, 32.0, 27.0, 44.0, 37.0, 37.0, 33.0, 33.0, 33.0, 26.0, 25.0, 22.0, 21.0, 21.0, 14.0, 14.0, 11.0, 18.0, 10.0, 10.0, 11.0, 3.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-45.92561721801758, -44.51010513305664, -43.09458923339844, -41.6790771484375, -40.26356506347656, -38.848052978515625, -37.43254089355469, -36.017024993896484, -34.60151290893555, -33.18600082397461, -31.77048683166504, -30.35497283935547, -28.93946075439453, -27.523948669433594, -26.108434677124023, -24.692920684814453, -23.277408599853516, -21.861896514892578, -20.446382522583008, -19.030868530273438, -17.6153564453125, -16.199844360351562, -14.784330368041992, -13.368817329406738, -11.953304290771484, -10.53779125213623, -9.122278213500977, -7.706765174865723, -6.291252136230469, -4.875739097595215, -3.460226058959961, -2.044713020324707, -0.6291961669921875, 0.7863168716430664, 2.2018299102783203, 3.617342948913574, 5.032855987548828, 6.448369026184082, 7.863882064819336, 9.27939510345459, 10.694908142089844, 12.110421180725098, 13.525934219360352, 14.941447257995605, 16.35696029663086, 17.772472381591797, 19.187986373901367, 20.603500366210938, 22.019012451171875, 23.434524536132812, 24.850038528442383, 26.265552520751953, 27.68106460571289, 29.096576690673828, 30.5120906829834, 31.92760467529297, 33.343116760253906, 34.758628845214844, 36.17414093017578, 37.589656829833984, 39.00516891479492, 40.42068099975586, 41.83619689941406, 43.251708984375, 44.66722106933594]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 6.0, 6.0, 8.0, 10.0, 11.0, 17.0, 21.0, 15.0, 13.0, 22.0, 22.0, 31.0, 15.0, 21.0, 41.0, 35.0, 38.0, 34.0, 46.0, 44.0, 41.0, 53.0, 31.0, 36.0, 45.0, 32.0, 35.0, 34.0, 34.0, 23.0, 33.0, 17.0, 23.0, 12.0, 17.0, 17.0, 10.0, 7.0, 13.0, 4.0, 1.0, 7.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.5186767578125, -5.326416015625, -5.1341552734375, -4.94189453125, -4.7496337890625, -4.557373046875, -4.3651123046875, -4.1728515625, -3.9805908203125, -3.788330078125, -3.5960693359375, -3.40380859375, -3.2115478515625, -3.019287109375, -2.8270263671875, -2.634765625, -2.4425048828125, -2.250244140625, -2.0579833984375, -1.86572265625, -1.6734619140625, -1.481201171875, -1.2889404296875, -1.0966796875, -0.9044189453125, -0.712158203125, -0.5198974609375, -0.32763671875, -0.1353759765625, 0.056884765625, 0.2491455078125, 0.44140625, 0.6336669921875, 0.825927734375, 1.0181884765625, 1.21044921875, 1.4027099609375, 1.594970703125, 1.7872314453125, 1.9794921875, 2.1717529296875, 2.364013671875, 2.5562744140625, 2.74853515625, 2.9407958984375, 3.133056640625, 3.3253173828125, 3.517578125, 3.7098388671875, 3.902099609375, 4.0943603515625, 4.28662109375, 4.4788818359375, 4.671142578125, 4.8634033203125, 5.0556640625, 5.2479248046875, 5.440185546875, 5.6324462890625, 5.82470703125, 6.0169677734375, 6.209228515625, 6.4014892578125, 6.59375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 10.0, 8.0, 12.0, 14.0, 14.0, 17.0, 26.0, 18.0, 33.0, 37.0, 57.0, 57.0, 91.0, 139.0, 251.0, 480.0, 919.0, 2075.0, 4502.0, 11113.0, 30767.0, 108962.0, 575347.0, 1995968.0, 1161194.0, 221940.0, 50821.0, 16979.0, 6587.0, 2823.0, 1352.0, 625.0, 341.0, 227.0, 119.0, 75.0, 52.0, 42.0, 45.0, 26.0, 34.0, 17.0, 9.0, 9.0, 10.0, 8.0, 8.0, 3.0, 0.0, 7.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.8359375, -9.5050048828125, -9.174072265625, -8.8431396484375, -8.51220703125, -8.1812744140625, -7.850341796875, -7.5194091796875, -7.1884765625, -6.8575439453125, -6.526611328125, -6.1956787109375, -5.86474609375, -5.5338134765625, -5.202880859375, -4.8719482421875, -4.541015625, -4.2100830078125, -3.879150390625, -3.5482177734375, -3.21728515625, -2.8863525390625, -2.555419921875, -2.2244873046875, -1.8935546875, -1.5626220703125, -1.231689453125, -0.9007568359375, -0.56982421875, -0.2388916015625, 0.092041015625, 0.4229736328125, 0.75390625, 1.0848388671875, 1.415771484375, 1.7467041015625, 2.07763671875, 2.4085693359375, 2.739501953125, 3.0704345703125, 3.4013671875, 3.7322998046875, 4.063232421875, 4.3941650390625, 4.72509765625, 5.0560302734375, 5.386962890625, 5.7178955078125, 6.048828125, 6.3797607421875, 6.710693359375, 7.0416259765625, 7.37255859375, 7.7034912109375, 8.034423828125, 8.3653564453125, 8.6962890625, 9.0272216796875, 9.358154296875, 9.6890869140625, 10.02001953125, 10.3509521484375, 10.681884765625, 11.0128173828125, 11.34375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 8.0, 16.0, 15.0, 20.0, 20.0, 28.0, 48.0, 66.0, 104.0, 138.0, 176.0, 263.0, 381.0, 533.0, 563.0, 484.0, 357.0, 253.0, 196.0, 126.0, 71.0, 58.0, 28.0, 36.0, 24.0, 18.0, 11.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1171875, -13.680419921875, -13.24365234375, -12.806884765625, -12.3701171875, -11.933349609375, -11.49658203125, -11.059814453125, -10.623046875, -10.186279296875, -9.74951171875, -9.312744140625, -8.8759765625, -8.439208984375, -8.00244140625, -7.565673828125, -7.12890625, -6.692138671875, -6.25537109375, -5.818603515625, -5.3818359375, -4.945068359375, -4.50830078125, -4.071533203125, -3.634765625, -3.197998046875, -2.76123046875, -2.324462890625, -1.8876953125, -1.450927734375, -1.01416015625, -0.577392578125, -0.140625, 0.296142578125, 0.73291015625, 1.169677734375, 1.6064453125, 2.043212890625, 2.47998046875, 2.916748046875, 3.353515625, 3.790283203125, 4.22705078125, 4.663818359375, 5.1005859375, 5.537353515625, 5.97412109375, 6.410888671875, 6.84765625, 7.284423828125, 7.72119140625, 8.157958984375, 8.5947265625, 9.031494140625, 9.46826171875, 9.905029296875, 10.341796875, 10.778564453125, 11.21533203125, 11.652099609375, 12.0888671875, 12.525634765625, 12.96240234375, 13.399169921875, 13.8359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 7.0, 14.0, 17.0, 19.0, 24.0, 46.0, 75.0, 73.0, 118.0, 204.0, 340.0, 630.0, 3030.0, 69945.0, 3871502.0, 240499.0, 5920.0, 805.0, 302.0, 212.0, 147.0, 107.0, 72.0, 35.0, 31.0, 30.0, 14.0, 15.0, 13.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.90625, -48.22216796875, -46.5380859375, -44.85400390625, -43.169921875, -41.48583984375, -39.8017578125, -38.11767578125, -36.43359375, -34.74951171875, -33.0654296875, -31.38134765625, -29.697265625, -28.01318359375, -26.3291015625, -24.64501953125, -22.9609375, -21.27685546875, -19.5927734375, -17.90869140625, -16.224609375, -14.54052734375, -12.8564453125, -11.17236328125, -9.48828125, -7.80419921875, -6.1201171875, -4.43603515625, -2.751953125, -1.06787109375, 0.6162109375, 2.30029296875, 3.984375, 5.66845703125, 7.3525390625, 9.03662109375, 10.720703125, 12.40478515625, 14.0888671875, 15.77294921875, 17.45703125, 19.14111328125, 20.8251953125, 22.50927734375, 24.193359375, 25.87744140625, 27.5615234375, 29.24560546875, 30.9296875, 32.61376953125, 34.2978515625, 35.98193359375, 37.666015625, 39.35009765625, 41.0341796875, 42.71826171875, 44.40234375, 46.08642578125, 47.7705078125, 49.45458984375, 51.138671875, 52.82275390625, 54.5068359375, 56.19091796875, 57.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 84.0, 569.0, 333.0, 25.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.63157653808594, -210.79522705078125, -198.95889282226562, -187.12254333496094, -175.28619384765625, -163.44985961914062, -151.61351013183594, -139.77716064453125, -127.9408187866211, -116.10447692871094, -104.26812744140625, -92.4317855834961, -80.59544372558594, -68.75909423828125, -56.922752380371094, -45.086402893066406, -33.25006103515625, -21.413715362548828, -9.577371597290039, 2.25897216796875, 14.095317840576172, 25.931663513183594, 37.76800537109375, 49.60435485839844, 61.440696716308594, 73.27703857421875, 85.11338806152344, 96.9497299194336, 108.78607177734375, 120.62242126464844, 132.45877075195312, 144.29510498046875, 156.13143920898438, 167.96778869628906, 179.8041229248047, 191.64047241210938, 203.47682189941406, 215.31317138671875, 227.14950561523438, 238.98585510253906, 250.82220458984375, 262.6585388183594, 274.4949035644531, 286.33123779296875, 298.1675720214844, 310.0039367675781, 321.84027099609375, 333.6766357421875, 345.512939453125, 357.3492736816406, 369.1856384277344, 381.02197265625, 392.8583068847656, 404.6946716308594, 416.531005859375, 428.36737060546875, 440.2037048339844, 452.0400390625, 463.87640380859375, 475.7127380371094, 487.549072265625, 499.38543701171875, 511.2217712402344, 523.05810546875, 534.8944702148438]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 13.0, 8.0, 17.0, 4.0, 16.0, 16.0, 21.0, 20.0, 32.0, 28.0, 30.0, 50.0, 41.0, 41.0, 45.0, 44.0, 50.0, 49.0, 34.0, 41.0, 43.0, 47.0, 37.0, 36.0, 30.0, 29.0, 27.0, 29.0, 23.0, 24.0, 16.0, 13.0, 7.0, 4.0, 11.0, 6.0, 2.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.037445068359375, -43.67934036254883, -42.32123565673828, -40.963134765625, -39.60503005981445, -38.246925354003906, -36.888824462890625, -35.53071975708008, -34.17261505126953, -32.814510345458984, -31.45640754699707, -30.098304748535156, -28.74020004272461, -27.382095336914062, -26.02399253845215, -24.665889739990234, -23.307785034179688, -21.94968032836914, -20.591577529907227, -19.233474731445312, -17.875370025634766, -16.51726531982422, -15.159162521362305, -13.801058769226074, -12.442955017089844, -11.084851264953613, -9.726747512817383, -8.368643760681152, -7.010540008544922, -5.652436256408691, -4.294332504272461, -2.9362287521362305, -1.578125, -0.22002124786376953, 1.138082504272461, 2.4961862564086914, 3.854290008544922, 5.212393760681152, 6.570497512817383, 7.928601264953613, 9.286705017089844, 10.644808769226074, 12.002912521362305, 13.361016273498535, 14.719120025634766, 16.077224731445312, 17.435327529907227, 18.79343032836914, 20.151535034179688, 21.509639739990234, 22.86774253845215, 24.225845336914062, 25.58395004272461, 26.942054748535156, 28.30015754699707, 29.658260345458984, 31.01636505126953, 32.37446975708008, 33.732574462890625, 35.090675354003906, 36.44878005981445, 37.806884765625, 39.16498565673828, 40.52309036254883, 41.881195068359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 3.0, 5.0, 4.0, 8.0, 5.0, 6.0, 15.0, 15.0, 19.0, 13.0, 15.0, 20.0, 26.0, 25.0, 21.0, 33.0, 23.0, 39.0, 40.0, 33.0, 33.0, 42.0, 49.0, 39.0, 42.0, 31.0, 35.0, 26.0, 41.0, 36.0, 35.0, 28.0, 21.0, 21.0, 14.0, 16.0, 16.0, 21.0, 13.0, 14.0, 10.0, 6.0, 5.0, 8.0, 5.0, 4.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.58203125, -5.4080810546875, -5.234130859375, -5.0601806640625, -4.88623046875, -4.7122802734375, -4.538330078125, -4.3643798828125, -4.1904296875, -4.0164794921875, -3.842529296875, -3.6685791015625, -3.49462890625, -3.3206787109375, -3.146728515625, -2.9727783203125, -2.798828125, -2.6248779296875, -2.450927734375, -2.2769775390625, -2.10302734375, -1.9290771484375, -1.755126953125, -1.5811767578125, -1.4072265625, -1.2332763671875, -1.059326171875, -0.8853759765625, -0.71142578125, -0.5374755859375, -0.363525390625, -0.1895751953125, -0.015625, 0.1583251953125, 0.332275390625, 0.5062255859375, 0.68017578125, 0.8541259765625, 1.028076171875, 1.2020263671875, 1.3759765625, 1.5499267578125, 1.723876953125, 1.8978271484375, 2.07177734375, 2.2457275390625, 2.419677734375, 2.5936279296875, 2.767578125, 2.9415283203125, 3.115478515625, 3.2894287109375, 3.46337890625, 3.6373291015625, 3.811279296875, 3.9852294921875, 4.1591796875, 4.3331298828125, 4.507080078125, 4.6810302734375, 4.85498046875, 5.0289306640625, 5.202880859375, 5.3768310546875, 5.55078125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 7.0, 7.0, 11.0, 12.0, 20.0, 16.0, 34.0, 59.0, 80.0, 109.0, 118.0, 237.0, 298.0, 463.0, 598.0, 856.0, 1213.0, 1691.0, 2492.0, 3510.0, 5317.0, 7828.0, 11368.0, 18080.0, 27844.0, 44023.0, 69778.0, 108039.0, 153187.0, 174778.0, 142633.0, 97390.0, 62798.0, 39417.0, 24800.0, 16203.0, 10715.0, 7057.0, 4601.0, 3269.0, 2292.0, 1577.0, 1071.0, 842.0, 535.0, 358.0, 270.0, 205.0, 126.0, 113.0, 58.0, 50.0, 38.0, 19.0, 25.0, 11.0, 6.0, 8.0, 6.0, 2.0, 2.0], "bins": [-0.2139892578125, -0.2073802947998047, -0.20077133178710938, -0.19416236877441406, -0.18755340576171875, -0.18094444274902344, -0.17433547973632812, -0.1677265167236328, -0.1611175537109375, -0.1545085906982422, -0.14789962768554688, -0.14129066467285156, -0.13468170166015625, -0.12807273864746094, -0.12146377563476562, -0.11485481262207031, -0.108245849609375, -0.10163688659667969, -0.09502792358398438, -0.08841896057128906, -0.08180999755859375, -0.07520103454589844, -0.06859207153320312, -0.06198310852050781, -0.0553741455078125, -0.04876518249511719, -0.042156219482421875, -0.03554725646972656, -0.02893829345703125, -0.022329330444335938, -0.015720367431640625, -0.009111404418945312, -0.00250244140625, 0.0041065216064453125, 0.010715484619140625, 0.017324447631835938, 0.02393341064453125, 0.030542373657226562, 0.037151336669921875, 0.04376029968261719, 0.0503692626953125, 0.05697822570800781, 0.06358718872070312, 0.07019615173339844, 0.07680511474609375, 0.08341407775878906, 0.09002304077148438, 0.09663200378417969, 0.103240966796875, 0.10984992980957031, 0.11645889282226562, 0.12306785583496094, 0.12967681884765625, 0.13628578186035156, 0.14289474487304688, 0.1495037078857422, 0.1561126708984375, 0.1627216339111328, 0.16933059692382812, 0.17593955993652344, 0.18254852294921875, 0.18915748596191406, 0.19576644897460938, 0.2023754119873047, 0.208984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 7.0, 15.0, 9.0, 13.0, 17.0, 30.0, 22.0, 29.0, 31.0, 29.0, 28.0, 27.0, 31.0, 33.0, 41.0, 34.0, 35.0, 37.0, 1063.0, 36.0, 45.0, 38.0, 35.0, 34.0, 34.0, 28.0, 26.0, 27.0, 21.0, 17.0, 33.0, 17.0, 15.0, 10.0, 20.0, 6.0, 10.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8125, -3.691009521484375, -3.56951904296875, -3.448028564453125, -3.3265380859375, -3.205047607421875, -3.08355712890625, -2.962066650390625, -2.840576171875, -2.719085693359375, -2.59759521484375, -2.476104736328125, -2.3546142578125, -2.233123779296875, -2.11163330078125, -1.990142822265625, -1.86865234375, -1.747161865234375, -1.62567138671875, -1.504180908203125, -1.3826904296875, -1.261199951171875, -1.13970947265625, -1.018218994140625, -0.896728515625, -0.775238037109375, -0.65374755859375, -0.532257080078125, -0.4107666015625, -0.289276123046875, -0.16778564453125, -0.046295166015625, 0.0751953125, 0.196685791015625, 0.31817626953125, 0.439666748046875, 0.5611572265625, 0.682647705078125, 0.80413818359375, 0.925628662109375, 1.047119140625, 1.168609619140625, 1.29010009765625, 1.411590576171875, 1.5330810546875, 1.654571533203125, 1.77606201171875, 1.897552490234375, 2.01904296875, 2.140533447265625, 2.26202392578125, 2.383514404296875, 2.5050048828125, 2.626495361328125, 2.74798583984375, 2.869476318359375, 2.990966796875, 3.112457275390625, 3.23394775390625, 3.355438232421875, 3.4769287109375, 3.598419189453125, 3.71990966796875, 3.841400146484375, 3.962890625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 5.0, 19.0, 18.0, 35.0, 63.0, 79.0, 105.0, 176.0, 236.0, 343.0, 561.0, 806.0, 1167.0, 1710.0, 2484.0, 3823.0, 5869.0, 8654.0, 13451.0, 20344.0, 32031.0, 49634.0, 78189.0, 117792.0, 161272.0, 1209627.0, 132863.0, 90693.0, 58348.0, 37290.0, 23797.0, 15314.0, 10121.0, 6684.0, 4514.0, 2935.0, 1969.0, 1343.0, 851.0, 616.0, 443.0, 261.0, 196.0, 116.0, 97.0, 74.0, 42.0, 33.0, 14.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1981201171875, -0.19176483154296875, -0.1854095458984375, -0.17905426025390625, -0.172698974609375, -0.16634368896484375, -0.1599884033203125, -0.15363311767578125, -0.14727783203125, -0.14092254638671875, -0.1345672607421875, -0.12821197509765625, -0.121856689453125, -0.11550140380859375, -0.1091461181640625, -0.10279083251953125, -0.096435546875, -0.09008026123046875, -0.0837249755859375, -0.07736968994140625, -0.071014404296875, -0.06465911865234375, -0.0583038330078125, -0.05194854736328125, -0.04559326171875, -0.03923797607421875, -0.0328826904296875, -0.02652740478515625, -0.020172119140625, -0.01381683349609375, -0.0074615478515625, -0.00110626220703125, 0.0052490234375, 0.01160430908203125, 0.0179595947265625, 0.02431488037109375, 0.030670166015625, 0.03702545166015625, 0.0433807373046875, 0.04973602294921875, 0.05609130859375, 0.06244659423828125, 0.0688018798828125, 0.07515716552734375, 0.081512451171875, 0.08786773681640625, 0.0942230224609375, 0.10057830810546875, 0.10693359375, 0.11328887939453125, 0.1196441650390625, 0.12599945068359375, 0.132354736328125, 0.13871002197265625, 0.1450653076171875, 0.15142059326171875, 0.15777587890625, 0.16413116455078125, 0.1704864501953125, 0.17684173583984375, 0.183197021484375, 0.18955230712890625, 0.1959075927734375, 0.20226287841796875, 0.2086181640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 7.0, 7.0, 7.0, 20.0, 19.0, 24.0, 22.0, 51.0, 69.0, 68.0, 85.0, 97.0, 125.0, 76.0, 79.0, 50.0, 42.0, 30.0, 24.0, 14.0, 18.0, 18.0, 7.0, 4.0, 4.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0024356842041015625, -0.0023657381534576416, -0.0022957921028137207, -0.0022258460521698, -0.002155900001525879, -0.002085953950881958, -0.002016007900238037, -0.0019460618495941162, -0.0018761157989501953, -0.0018061697483062744, -0.0017362236976623535, -0.0016662776470184326, -0.0015963315963745117, -0.0015263855457305908, -0.00145643949508667, -0.001386493444442749, -0.0013165473937988281, -0.0012466013431549072, -0.0011766552925109863, -0.0011067092418670654, -0.0010367631912231445, -0.0009668171405792236, -0.0008968710899353027, -0.0008269250392913818, -0.0007569789886474609, -0.00068703293800354, -0.0006170868873596191, -0.0005471408367156982, -0.00047719478607177734, -0.00040724873542785645, -0.00033730268478393555, -0.00026735663414001465, -0.00019741058349609375, -0.00012746453285217285, -5.751848220825195e-05, 1.2427568435668945e-05, 8.237361907958984e-05, 0.00015231966972351074, 0.00022226572036743164, 0.00029221177101135254, 0.00036215782165527344, 0.00043210387229919434, 0.0005020499229431152, 0.0005719959735870361, 0.000641942024230957, 0.0007118880748748779, 0.0007818341255187988, 0.0008517801761627197, 0.0009217262268066406, 0.0009916722774505615, 0.0010616183280944824, 0.0011315643787384033, 0.0012015104293823242, 0.0012714564800262451, 0.001341402530670166, 0.001411348581314087, 0.0014812946319580078, 0.0015512406826019287, 0.0016211867332458496, 0.0016911327838897705, 0.0017610788345336914, 0.0018310248851776123, 0.0019009709358215332, 0.001970916986465454, 0.002040863037109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 16.0, 15.0, 15.0, 26.0, 37.0, 64.0, 101.0, 189.0, 378.0, 2656.0, 1032479.0, 11536.0, 499.0, 210.0, 117.0, 54.0, 41.0, 29.0, 18.0, 10.0, 7.0, 7.0, 10.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045989990234375, -0.04443788528442383, -0.042885780334472656, -0.041333675384521484, -0.03978157043457031, -0.03822946548461914, -0.03667736053466797, -0.0351252555847168, -0.033573150634765625, -0.03202104568481445, -0.03046894073486328, -0.02891683578491211, -0.027364730834960938, -0.025812625885009766, -0.024260520935058594, -0.022708415985107422, -0.02115631103515625, -0.019604206085205078, -0.018052101135253906, -0.016499996185302734, -0.014947891235351562, -0.01339578628540039, -0.011843681335449219, -0.010291576385498047, -0.008739471435546875, -0.007187366485595703, -0.005635261535644531, -0.004083156585693359, -0.0025310516357421875, -0.0009789466857910156, 0.0005731582641601562, 0.002125263214111328, 0.0036773681640625, 0.005229473114013672, 0.006781578063964844, 0.008333683013916016, 0.009885787963867188, 0.01143789291381836, 0.012989997863769531, 0.014542102813720703, 0.016094207763671875, 0.017646312713623047, 0.01919841766357422, 0.02075052261352539, 0.022302627563476562, 0.023854732513427734, 0.025406837463378906, 0.026958942413330078, 0.02851104736328125, 0.030063152313232422, 0.031615257263183594, 0.033167362213134766, 0.03471946716308594, 0.03627157211303711, 0.03782367706298828, 0.03937578201293945, 0.040927886962890625, 0.0424799919128418, 0.04403209686279297, 0.04558420181274414, 0.04713630676269531, 0.048688411712646484, 0.050240516662597656, 0.05179262161254883, 0.0533447265625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 18.0, 1001.0], "bins": [-0.05769195035099983, -0.05678222328424454, -0.05587249621748924, -0.05496276915073395, -0.05405304208397865, -0.05314331501722336, -0.05223359167575836, -0.05132386460900307, -0.05041413754224777, -0.04950441047549248, -0.04859468340873718, -0.04768495634198189, -0.04677522927522659, -0.0458655059337616, -0.0449557788670063, -0.04404605180025101, -0.04313632473349571, -0.04222659766674042, -0.04131687059998512, -0.04040714353322983, -0.03949741646647453, -0.03858768939971924, -0.03767796605825424, -0.03676823899149895, -0.03585851192474365, -0.03494878485798836, -0.03403905779123306, -0.03312933072447777, -0.03221960365772247, -0.03130988031625748, -0.030400151386857033, -0.029490426182746887, -0.028580697253346443, -0.02767097018659115, -0.026761243119835854, -0.025851517915725708, -0.024941790848970413, -0.02403206378221512, -0.023122336715459824, -0.02221260964870453, -0.021302884444594383, -0.02039315737783909, -0.019483430311083794, -0.018573705106973648, -0.017663978040218353, -0.01675425097346306, -0.015844523906707764, -0.014934797771275043, -0.014025070704519749, -0.013115343637764454, -0.012205617502331734, -0.011295890435576439, -0.010386164300143719, -0.009476437233388424, -0.008566711097955704, -0.007656984031200409, -0.0067472574301064014, -0.005837530829012394, -0.0049278042279183865, -0.004018077626824379, -0.003108350792899728, -0.0021986239589750767, -0.0012888973578810692, -0.0003791707567870617, 0.0005305556696839631]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 5.0, 14.0, 22.0, 19.0, 23.0, 31.0, 56.0, 72.0, 58.0, 86.0, 78.0, 67.0, 82.0, 73.0, 61.0, 53.0, 61.0, 28.0, 32.0, 33.0, 15.0, 13.0, 14.0, 9.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008837580680847168, -0.0008252281695604324, -0.0007666982710361481, -0.0007081683725118637, -0.0006496384739875793, -0.000591108575463295, -0.0005325786769390106, -0.00047404877841472626, -0.0004155188798904419, -0.00035698898136615753, -0.00029845908284187317, -0.0002399291843175888, -0.00018139928579330444, -0.00012286938726902008, -6.433948874473572e-05, -5.809590220451355e-06, 5.272030830383301e-05, 0.00011125020682811737, 0.00016978010535240173, 0.0002283100038766861, 0.00028683990240097046, 0.0003453698009252548, 0.0004038996994495392, 0.00046242959797382355, 0.0005209594964981079, 0.0005794893950223923, 0.0006380192935466766, 0.000696549192070961, 0.0007550790905952454, 0.0008136089891195297, 0.0008721388876438141, 0.0009306687861680984, 0.0009891986846923828, 0.0010477285832166672, 0.0011062584817409515, 0.001164788380265236, 0.0012233182787895203, 0.0012818481773138046, 0.001340378075838089, 0.0013989079743623734, 0.0014574378728866577, 0.001515967771410942, 0.0015744976699352264, 0.0016330275684595108, 0.0016915574669837952, 0.0017500873655080795, 0.001808617264032364, 0.0018671471625566483, 0.0019256770610809326, 0.001984206959605217, 0.0020427368581295013, 0.0021012667566537857, 0.00215979665517807, 0.0022183265537023544, 0.002276856452226639, 0.002335386350750923, 0.0023939162492752075, 0.002452446147799492, 0.0025109760463237762, 0.0025695059448480606, 0.002628035843372345, 0.0026865657418966293, 0.0027450956404209137, 0.002803625538945198, 0.0028621554374694824]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 3.0, 5.0, 4.0, 8.0, 5.0, 6.0, 15.0, 15.0, 19.0, 13.0, 15.0, 20.0, 26.0, 25.0, 21.0, 33.0, 23.0, 39.0, 40.0, 33.0, 33.0, 42.0, 49.0, 39.0, 42.0, 31.0, 35.0, 26.0, 40.0, 37.0, 35.0, 28.0, 21.0, 21.0, 14.0, 17.0, 15.0, 21.0, 13.0, 14.0, 10.0, 6.0, 5.0, 8.0, 5.0, 4.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.58203125, -5.4080810546875, -5.234130859375, -5.0601806640625, -4.88623046875, -4.7122802734375, -4.538330078125, -4.3643798828125, -4.1904296875, -4.0164794921875, -3.842529296875, -3.6685791015625, -3.49462890625, -3.3206787109375, -3.146728515625, -2.9727783203125, -2.798828125, -2.6248779296875, -2.450927734375, -2.2769775390625, -2.10302734375, -1.9290771484375, -1.755126953125, -1.5811767578125, -1.4072265625, -1.2332763671875, -1.059326171875, -0.8853759765625, -0.71142578125, -0.5374755859375, -0.363525390625, -0.1895751953125, -0.015625, 0.1583251953125, 0.332275390625, 0.5062255859375, 0.68017578125, 0.8541259765625, 1.028076171875, 1.2020263671875, 1.3759765625, 1.5499267578125, 1.723876953125, 1.8978271484375, 2.07177734375, 2.2457275390625, 2.419677734375, 2.5936279296875, 2.767578125, 2.9415283203125, 3.115478515625, 3.2894287109375, 3.46337890625, 3.6373291015625, 3.811279296875, 3.9852294921875, 4.1591796875, 4.3331298828125, 4.507080078125, 4.6810302734375, 4.85498046875, 5.0289306640625, 5.202880859375, 5.3768310546875, 5.55078125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 11.0, 13.0, 23.0, 30.0, 46.0, 87.0, 114.0, 223.0, 375.0, 621.0, 1131.0, 2085.0, 3876.0, 7830.0, 16065.0, 35664.0, 90616.0, 310274.0, 389073.0, 110997.0, 41823.0, 18738.0, 8975.0, 4565.0, 2304.0, 1278.0, 732.0, 398.0, 214.0, 130.0, 87.0, 58.0, 34.0, 20.0, 14.0, 11.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.39495849609375, -5.2156982421875, -5.03643798828125, -4.857177734375, -4.67791748046875, -4.4986572265625, -4.31939697265625, -4.14013671875, -3.96087646484375, -3.7816162109375, -3.60235595703125, -3.423095703125, -3.24383544921875, -3.0645751953125, -2.88531494140625, -2.7060546875, -2.52679443359375, -2.3475341796875, -2.16827392578125, -1.989013671875, -1.80975341796875, -1.6304931640625, -1.45123291015625, -1.27197265625, -1.09271240234375, -0.9134521484375, -0.73419189453125, -0.554931640625, -0.37567138671875, -0.1964111328125, -0.01715087890625, 0.162109375, 0.34136962890625, 0.5206298828125, 0.69989013671875, 0.879150390625, 1.05841064453125, 1.2376708984375, 1.41693115234375, 1.59619140625, 1.77545166015625, 1.9547119140625, 2.13397216796875, 2.313232421875, 2.49249267578125, 2.6717529296875, 2.85101318359375, 3.0302734375, 3.20953369140625, 3.3887939453125, 3.56805419921875, 3.747314453125, 3.92657470703125, 4.1058349609375, 4.28509521484375, 4.46435546875, 4.64361572265625, 4.8228759765625, 5.00213623046875, 5.181396484375, 5.36065673828125, 5.5399169921875, 5.71917724609375, 5.8984375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 14.0, 11.0, 15.0, 12.0, 18.0, 33.0, 21.0, 27.0, 45.0, 35.0, 47.0, 57.0, 67.0, 99.0, 363.0, 1630.0, 110.0, 82.0, 49.0, 38.0, 48.0, 35.0, 41.0, 37.0, 33.0, 23.0, 18.0, 15.0, 12.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -21.7763671875, -20.943359375, -20.1103515625, -19.27734375, -18.4443359375, -17.611328125, -16.7783203125, -15.9453125, -15.1123046875, -14.279296875, -13.4462890625, -12.61328125, -11.7802734375, -10.947265625, -10.1142578125, -9.28125, -8.4482421875, -7.615234375, -6.7822265625, -5.94921875, -5.1162109375, -4.283203125, -3.4501953125, -2.6171875, -1.7841796875, -0.951171875, -0.1181640625, 0.71484375, 1.5478515625, 2.380859375, 3.2138671875, 4.046875, 4.8798828125, 5.712890625, 6.5458984375, 7.37890625, 8.2119140625, 9.044921875, 9.8779296875, 10.7109375, 11.5439453125, 12.376953125, 13.2099609375, 14.04296875, 14.8759765625, 15.708984375, 16.5419921875, 17.375, 18.2080078125, 19.041015625, 19.8740234375, 20.70703125, 21.5400390625, 22.373046875, 23.2060546875, 24.0390625, 24.8720703125, 25.705078125, 26.5380859375, 27.37109375, 28.2041015625, 29.037109375, 29.8701171875, 30.703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 19.0, 22.0, 26.0, 34.0, 65.0, 79.0, 113.0, 164.0, 179.0, 250.0, 515.0, 3803.0, 2560797.0, 575637.0, 2626.0, 442.0, 245.0, 184.0, 115.0, 112.0, 75.0, 45.0, 36.0, 27.0, 17.0, 14.0, 11.0, 15.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.125, -70.17236328125, -68.2197265625, -66.26708984375, -64.314453125, -62.36181640625, -60.4091796875, -58.45654296875, -56.50390625, -54.55126953125, -52.5986328125, -50.64599609375, -48.693359375, -46.74072265625, -44.7880859375, -42.83544921875, -40.8828125, -38.93017578125, -36.9775390625, -35.02490234375, -33.072265625, -31.11962890625, -29.1669921875, -27.21435546875, -25.26171875, -23.30908203125, -21.3564453125, -19.40380859375, -17.451171875, -15.49853515625, -13.5458984375, -11.59326171875, -9.640625, -7.68798828125, -5.7353515625, -3.78271484375, -1.830078125, 0.12255859375, 2.0751953125, 4.02783203125, 5.98046875, 7.93310546875, 9.8857421875, 11.83837890625, 13.791015625, 15.74365234375, 17.6962890625, 19.64892578125, 21.6015625, 23.55419921875, 25.5068359375, 27.45947265625, 29.412109375, 31.36474609375, 33.3173828125, 35.27001953125, 37.22265625, 39.17529296875, 41.1279296875, 43.08056640625, 45.033203125, 46.98583984375, 48.9384765625, 50.89111328125, 52.84375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [40.0, 933.0, 48.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.907072067260742, -6.170079231262207, 4.566913604736328, 15.30390739440918, 26.0408992767334, 36.77789306640625, 47.51488494873047, 58.25187683105469, 68.9888687133789, 79.72586059570312, 90.46285247802734, 101.19984436035156, 111.93684387207031, 122.673828125, 133.41082763671875, 144.1478271484375, 154.8848114013672, 165.62181091308594, 176.35879516601562, 187.09579467773438, 197.83277893066406, 208.5697784423828, 219.3067626953125, 230.04376220703125, 240.78076171875, 251.51776123046875, 262.2547607421875, 272.9917297363281, 283.7287292480469, 294.4657287597656, 305.2027282714844, 315.939697265625, 326.6767272949219, 337.4137268066406, 348.1507263183594, 358.8876953125, 369.62469482421875, 380.3616943359375, 391.09869384765625, 401.835693359375, 412.5726623535156, 423.3096618652344, 434.0466613769531, 444.78363037109375, 455.5206298828125, 466.25762939453125, 476.99462890625, 487.73162841796875, 498.4686279296875, 509.20562744140625, 519.942626953125, 530.6796264648438, 541.4166259765625, 552.153564453125, 562.8905639648438, 573.6275634765625, 584.3645629882812, 595.1015625, 605.8385620117188, 616.5755615234375, 627.3125610351562, 638.0494995117188, 648.7864990234375, 659.5234985351562, 670.260498046875]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 5.0, 9.0, 15.0, 13.0, 12.0, 15.0, 24.0, 22.0, 17.0, 22.0, 36.0, 29.0, 30.0, 39.0, 27.0, 53.0, 37.0, 51.0, 48.0, 30.0, 39.0, 44.0, 59.0, 34.0, 26.0, 36.0, 23.0, 22.0, 16.0, 26.0, 25.0, 22.0, 16.0, 16.0, 11.0, 10.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.36754608154297, -42.76799774169922, -41.16844940185547, -39.56890106201172, -37.96935272216797, -36.36980438232422, -34.77025604248047, -33.17070388793945, -31.571155548095703, -29.971607208251953, -28.372058868408203, -26.772510528564453, -25.17296028137207, -23.57341194152832, -21.97386360168457, -20.374313354492188, -18.77476692199707, -17.17521858215332, -15.575669288635254, -13.976120948791504, -12.376571655273438, -10.777023315429688, -9.177474975585938, -7.577925682067871, -5.978377342224121, -4.378828525543213, -2.779279947280884, -1.1797313690185547, 0.4198174476623535, 2.0193662643432617, 3.6189146041870117, 5.218463897705078, 6.818012237548828, 8.417560577392578, 10.017109870910645, 11.616658210754395, 13.216207504272461, 14.815755844116211, 16.41530418395996, 18.014854431152344, 19.614402770996094, 21.213951110839844, 22.813499450683594, 24.413047790527344, 26.012598037719727, 27.612146377563477, 29.211694717407227, 30.81124496459961, 32.410789489746094, 34.010337829589844, 35.609886169433594, 37.209434509277344, 38.808982849121094, 40.408531188964844, 42.008079528808594, 43.60763168334961, 45.20718002319336, 46.80672836303711, 48.40627670288086, 50.00582504272461, 51.60537338256836, 53.204925537109375, 54.804473876953125, 56.404022216796875, 58.003570556640625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 8.0, 8.0, 11.0, 20.0, 12.0, 22.0, 26.0, 16.0, 19.0, 26.0, 24.0, 34.0, 23.0, 41.0, 35.0, 32.0, 47.0, 44.0, 41.0, 45.0, 37.0, 42.0, 33.0, 36.0, 30.0, 27.0, 29.0, 24.0, 22.0, 18.0, 26.0, 20.0, 20.0, 16.0, 9.0, 12.0, 6.0, 7.0, 6.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.99609375, -5.806884765625, -5.61767578125, -5.428466796875, -5.2392578125, -5.050048828125, -4.86083984375, -4.671630859375, -4.482421875, -4.293212890625, -4.10400390625, -3.914794921875, -3.7255859375, -3.536376953125, -3.34716796875, -3.157958984375, -2.96875, -2.779541015625, -2.59033203125, -2.401123046875, -2.2119140625, -2.022705078125, -1.83349609375, -1.644287109375, -1.455078125, -1.265869140625, -1.07666015625, -0.887451171875, -0.6982421875, -0.509033203125, -0.31982421875, -0.130615234375, 0.05859375, 0.247802734375, 0.43701171875, 0.626220703125, 0.8154296875, 1.004638671875, 1.19384765625, 1.383056640625, 1.572265625, 1.761474609375, 1.95068359375, 2.139892578125, 2.3291015625, 2.518310546875, 2.70751953125, 2.896728515625, 3.0859375, 3.275146484375, 3.46435546875, 3.653564453125, 3.8427734375, 4.031982421875, 4.22119140625, 4.410400390625, 4.599609375, 4.788818359375, 4.97802734375, 5.167236328125, 5.3564453125, 5.545654296875, 5.73486328125, 5.924072265625, 6.11328125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 2.0, 6.0, 9.0, 7.0, 9.0, 10.0, 9.0, 17.0, 20.0, 26.0, 42.0, 46.0, 57.0, 100.0, 193.0, 427.0, 908.0, 2603.0, 7785.0, 30996.0, 213521.0, 2292961.0, 1494165.0, 119831.0, 20980.0, 5756.0, 1986.0, 806.0, 380.0, 204.0, 125.0, 73.0, 44.0, 29.0, 29.0, 13.0, 22.0, 17.0, 11.0, 6.0, 15.0, 7.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.5107421875, -13.990234375, -13.4697265625, -12.94921875, -12.4287109375, -11.908203125, -11.3876953125, -10.8671875, -10.3466796875, -9.826171875, -9.3056640625, -8.78515625, -8.2646484375, -7.744140625, -7.2236328125, -6.703125, -6.1826171875, -5.662109375, -5.1416015625, -4.62109375, -4.1005859375, -3.580078125, -3.0595703125, -2.5390625, -2.0185546875, -1.498046875, -0.9775390625, -0.45703125, 0.0634765625, 0.583984375, 1.1044921875, 1.625, 2.1455078125, 2.666015625, 3.1865234375, 3.70703125, 4.2275390625, 4.748046875, 5.2685546875, 5.7890625, 6.3095703125, 6.830078125, 7.3505859375, 7.87109375, 8.3916015625, 8.912109375, 9.4326171875, 9.953125, 10.4736328125, 10.994140625, 11.5146484375, 12.03515625, 12.5556640625, 13.076171875, 13.5966796875, 14.1171875, 14.6376953125, 15.158203125, 15.6787109375, 16.19921875, 16.7197265625, 17.240234375, 17.7607421875, 18.28125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 13.0, 27.0, 37.0, 70.0, 104.0, 182.0, 269.0, 409.0, 676.0, 782.0, 536.0, 338.0, 184.0, 153.0, 102.0, 49.0, 37.0, 31.0, 18.0, 19.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.71875, -21.150390625, -20.58203125, -20.013671875, -19.4453125, -18.876953125, -18.30859375, -17.740234375, -17.171875, -16.603515625, -16.03515625, -15.466796875, -14.8984375, -14.330078125, -13.76171875, -13.193359375, -12.625, -12.056640625, -11.48828125, -10.919921875, -10.3515625, -9.783203125, -9.21484375, -8.646484375, -8.078125, -7.509765625, -6.94140625, -6.373046875, -5.8046875, -5.236328125, -4.66796875, -4.099609375, -3.53125, -2.962890625, -2.39453125, -1.826171875, -1.2578125, -0.689453125, -0.12109375, 0.447265625, 1.015625, 1.583984375, 2.15234375, 2.720703125, 3.2890625, 3.857421875, 4.42578125, 4.994140625, 5.5625, 6.130859375, 6.69921875, 7.267578125, 7.8359375, 8.404296875, 8.97265625, 9.541015625, 10.109375, 10.677734375, 11.24609375, 11.814453125, 12.3828125, 12.951171875, 13.51953125, 14.087890625, 14.65625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 12.0, 11.0, 23.0, 29.0, 33.0, 66.0, 119.0, 183.0, 288.0, 619.0, 3361.0, 280137.0, 3887482.0, 19777.0, 1200.0, 399.0, 216.0, 139.0, 63.0, 41.0, 32.0, 22.0, 11.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.875, -54.623046875, -52.37109375, -50.119140625, -47.8671875, -45.615234375, -43.36328125, -41.111328125, -38.859375, -36.607421875, -34.35546875, -32.103515625, -29.8515625, -27.599609375, -25.34765625, -23.095703125, -20.84375, -18.591796875, -16.33984375, -14.087890625, -11.8359375, -9.583984375, -7.33203125, -5.080078125, -2.828125, -0.576171875, 1.67578125, 3.927734375, 6.1796875, 8.431640625, 10.68359375, 12.935546875, 15.1875, 17.439453125, 19.69140625, 21.943359375, 24.1953125, 26.447265625, 28.69921875, 30.951171875, 33.203125, 35.455078125, 37.70703125, 39.958984375, 42.2109375, 44.462890625, 46.71484375, 48.966796875, 51.21875, 53.470703125, 55.72265625, 57.974609375, 60.2265625, 62.478515625, 64.73046875, 66.982421875, 69.234375, 71.486328125, 73.73828125, 75.990234375, 78.2421875, 80.494140625, 82.74609375, 84.998046875, 87.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 12.0, 42.0, 187.0, 354.0, 287.0, 105.0, 25.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.70011901855469, -121.52505493164062, -115.34999084472656, -109.17493438720703, -102.99987030029297, -96.8248062133789, -90.64974975585938, -84.47468566894531, -78.29962158203125, -72.12455749511719, -65.94949340820312, -59.774436950683594, -53.59937286376953, -47.42430877685547, -41.24924850463867, -35.074188232421875, -28.899124145507812, -22.724061965942383, -16.548999786376953, -10.373937606811523, -4.198875427246094, 1.976186752319336, 8.151248931884766, 14.326309204101562, 20.501373291015625, 26.676435470581055, 32.851497650146484, 39.02655792236328, 45.201622009277344, 51.376686096191406, 57.5517463684082, 63.726806640625, 69.90188598632812, 76.07695007324219, 82.25201416015625, 88.42707061767578, 94.60213470458984, 100.7771987915039, 106.95225524902344, 113.1273193359375, 119.30238342285156, 125.47744750976562, 131.6525115966797, 137.82757568359375, 144.00262451171875, 150.1776885986328, 156.35275268554688, 162.52781677246094, 168.702880859375, 174.87794494628906, 181.05300903320312, 187.2280731201172, 193.40313720703125, 199.57818603515625, 205.7532501220703, 211.92831420898438, 218.10337829589844, 224.2784423828125, 230.45350646972656, 236.62857055664062, 242.80361938476562, 248.9786834716797, 255.15374755859375, 261.32879638671875, 267.5038757324219]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 9.0, 7.0, 17.0, 7.0, 10.0, 12.0, 16.0, 18.0, 31.0, 26.0, 23.0, 33.0, 36.0, 30.0, 30.0, 31.0, 41.0, 50.0, 47.0, 46.0, 45.0, 35.0, 48.0, 38.0, 33.0, 46.0, 36.0, 23.0, 22.0, 19.0, 19.0, 21.0, 26.0, 8.0, 12.0, 13.0, 8.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.65663146972656, -40.322784423828125, -38.98893737792969, -37.65509033203125, -36.32124710083008, -34.98740005493164, -33.6535530090332, -32.319705963134766, -30.98586082458496, -29.652013778686523, -28.31816864013672, -26.98432159423828, -25.650474548339844, -24.31662940979004, -22.9827823638916, -21.648937225341797, -20.31509017944336, -18.981243133544922, -17.647397994995117, -16.31355094909668, -14.979704856872559, -13.645858764648438, -12.31201171875, -10.978165626525879, -9.644319534301758, -8.310473442077637, -6.976626873016357, -5.642780303955078, -4.308934211730957, -2.975088119506836, -1.6412410736083984, -0.30739498138427734, 1.0264511108398438, 2.360297441482544, 3.694143772125244, 5.027990341186523, 6.3618364334106445, 7.695682525634766, 9.029529571533203, 10.363375663757324, 11.697221755981445, 13.031067848205566, 14.364913940429688, 15.698760986328125, 17.032608032226562, 18.366453170776367, 19.700300216674805, 21.03414535522461, 22.367992401123047, 23.701839447021484, 25.03568458557129, 26.369531631469727, 27.70337677001953, 29.03722381591797, 30.371070861816406, 31.704917907714844, 33.03876495361328, 34.37261199951172, 35.706459045410156, 37.040306091308594, 38.374149322509766, 39.7079963684082, 41.04184341430664, 42.37569046020508, 43.70953369140625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 4.0, 10.0, 12.0, 14.0, 15.0, 19.0, 18.0, 17.0, 22.0, 25.0, 33.0, 28.0, 33.0, 34.0, 35.0, 60.0, 34.0, 42.0, 42.0, 46.0, 46.0, 42.0, 47.0, 36.0, 32.0, 26.0, 29.0, 36.0, 21.0, 21.0, 14.0, 16.0, 18.0, 7.0, 4.0, 13.0, 8.0, 3.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8359375, -6.6302490234375, -6.424560546875, -6.2188720703125, -6.01318359375, -5.8074951171875, -5.601806640625, -5.3961181640625, -5.1904296875, -4.9847412109375, -4.779052734375, -4.5733642578125, -4.36767578125, -4.1619873046875, -3.956298828125, -3.7506103515625, -3.544921875, -3.3392333984375, -3.133544921875, -2.9278564453125, -2.72216796875, -2.5164794921875, -2.310791015625, -2.1051025390625, -1.8994140625, -1.6937255859375, -1.488037109375, -1.2823486328125, -1.07666015625, -0.8709716796875, -0.665283203125, -0.4595947265625, -0.25390625, -0.0482177734375, 0.157470703125, 0.3631591796875, 0.56884765625, 0.7745361328125, 0.980224609375, 1.1859130859375, 1.3916015625, 1.5972900390625, 1.802978515625, 2.0086669921875, 2.21435546875, 2.4200439453125, 2.625732421875, 2.8314208984375, 3.037109375, 3.2427978515625, 3.448486328125, 3.6541748046875, 3.85986328125, 4.0655517578125, 4.271240234375, 4.4769287109375, 4.6826171875, 4.8883056640625, 5.093994140625, 5.2996826171875, 5.50537109375, 5.7110595703125, 5.916748046875, 6.1224365234375, 6.328125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 8.0, 10.0, 13.0, 27.0, 33.0, 46.0, 75.0, 105.0, 194.0, 311.0, 564.0, 839.0, 1413.0, 2197.0, 3523.0, 5768.0, 9717.0, 16453.0, 28849.0, 52375.0, 95410.0, 163024.0, 222039.0, 185876.0, 113968.0, 62833.0, 34248.0, 19601.0, 11311.0, 6747.0, 4149.0, 2630.0, 1644.0, 1004.0, 576.0, 356.0, 246.0, 151.0, 77.0, 51.0, 28.0, 24.0, 23.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28955078125, -0.28040313720703125, -0.2712554931640625, -0.26210784912109375, -0.252960205078125, -0.24381256103515625, -0.2346649169921875, -0.22551727294921875, -0.21636962890625, -0.20722198486328125, -0.1980743408203125, -0.18892669677734375, -0.179779052734375, -0.17063140869140625, -0.1614837646484375, -0.15233612060546875, -0.1431884765625, -0.13404083251953125, -0.1248931884765625, -0.11574554443359375, -0.106597900390625, -0.09745025634765625, -0.0883026123046875, -0.07915496826171875, -0.07000732421875, -0.06085968017578125, -0.0517120361328125, -0.04256439208984375, -0.033416748046875, -0.02426910400390625, -0.0151214599609375, -0.00597381591796875, 0.003173828125, 0.01232147216796875, 0.0214691162109375, 0.03061676025390625, 0.039764404296875, 0.04891204833984375, 0.0580596923828125, 0.06720733642578125, 0.07635498046875, 0.08550262451171875, 0.0946502685546875, 0.10379791259765625, 0.112945556640625, 0.12209320068359375, 0.1312408447265625, 0.14038848876953125, 0.1495361328125, 0.15868377685546875, 0.1678314208984375, 0.17697906494140625, 0.186126708984375, 0.19527435302734375, 0.2044219970703125, 0.21356964111328125, 0.22271728515625, 0.23186492919921875, 0.2410125732421875, 0.25016021728515625, 0.259307861328125, 0.26845550537109375, 0.2776031494140625, 0.28675079345703125, 0.2958984375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 7.0, 8.0, 8.0, 8.0, 19.0, 12.0, 18.0, 14.0, 19.0, 20.0, 37.0, 32.0, 31.0, 37.0, 34.0, 42.0, 42.0, 41.0, 29.0, 1058.0, 41.0, 35.0, 42.0, 38.0, 34.0, 37.0, 38.0, 30.0, 29.0, 26.0, 20.0, 23.0, 15.0, 22.0, 14.0, 11.0, 13.0, 9.0, 3.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53125, -3.40264892578125, -3.2740478515625, -3.14544677734375, -3.016845703125, -2.88824462890625, -2.7596435546875, -2.63104248046875, -2.50244140625, -2.37384033203125, -2.2452392578125, -2.11663818359375, -1.988037109375, -1.85943603515625, -1.7308349609375, -1.60223388671875, -1.4736328125, -1.34503173828125, -1.2164306640625, -1.08782958984375, -0.959228515625, -0.83062744140625, -0.7020263671875, -0.57342529296875, -0.44482421875, -0.31622314453125, -0.1876220703125, -0.05902099609375, 0.069580078125, 0.19818115234375, 0.3267822265625, 0.45538330078125, 0.583984375, 0.71258544921875, 0.8411865234375, 0.96978759765625, 1.098388671875, 1.22698974609375, 1.3555908203125, 1.48419189453125, 1.61279296875, 1.74139404296875, 1.8699951171875, 1.99859619140625, 2.127197265625, 2.25579833984375, 2.3843994140625, 2.51300048828125, 2.6416015625, 2.77020263671875, 2.8988037109375, 3.02740478515625, 3.156005859375, 3.28460693359375, 3.4132080078125, 3.54180908203125, 3.67041015625, 3.79901123046875, 3.9276123046875, 4.05621337890625, 4.184814453125, 4.31341552734375, 4.4420166015625, 4.57061767578125, 4.69921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 5.0, 5.0, 7.0, 12.0, 22.0, 46.0, 72.0, 107.0, 178.0, 281.0, 435.0, 695.0, 1120.0, 1698.0, 2625.0, 3929.0, 6205.0, 9889.0, 15297.0, 25093.0, 41170.0, 68006.0, 106097.0, 153280.0, 1227419.0, 152935.0, 105477.0, 67002.0, 41058.0, 24812.0, 15264.0, 9509.0, 6254.0, 3882.0, 2561.0, 1710.0, 1084.0, 703.0, 461.0, 293.0, 166.0, 98.0, 64.0, 39.0, 22.0, 12.0, 12.0, 13.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1959228515625, -0.1887950897216797, -0.18166732788085938, -0.17453956604003906, -0.16741180419921875, -0.16028404235839844, -0.15315628051757812, -0.1460285186767578, -0.1389007568359375, -0.1317729949951172, -0.12464523315429688, -0.11751747131347656, -0.11038970947265625, -0.10326194763183594, -0.09613418579101562, -0.08900642395019531, -0.081878662109375, -0.07475090026855469, -0.06762313842773438, -0.06049537658691406, -0.05336761474609375, -0.04623985290527344, -0.039112091064453125, -0.03198432922363281, -0.0248565673828125, -0.017728805541992188, -0.010601043701171875, -0.0034732818603515625, 0.00365447998046875, 0.010782241821289062, 0.017910003662109375, 0.025037765502929688, 0.03216552734375, 0.03929328918457031, 0.046421051025390625, 0.05354881286621094, 0.06067657470703125, 0.06780433654785156, 0.07493209838867188, 0.08205986022949219, 0.0891876220703125, 0.09631538391113281, 0.10344314575195312, 0.11057090759277344, 0.11769866943359375, 0.12482643127441406, 0.13195419311523438, 0.1390819549560547, 0.146209716796875, 0.1533374786376953, 0.16046524047851562, 0.16759300231933594, 0.17472076416015625, 0.18184852600097656, 0.18897628784179688, 0.1961040496826172, 0.2032318115234375, 0.2103595733642578, 0.21748733520507812, 0.22461509704589844, 0.23174285888671875, 0.23887062072753906, 0.24599838256835938, 0.2531261444091797, 0.26025390625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 8.0, 14.0, 22.0, 14.0, 26.0, 37.0, 29.0, 46.0, 64.0, 78.0, 68.0, 55.0, 69.0, 56.0, 56.0, 52.0, 49.0, 40.0, 45.0, 46.0, 18.0, 20.0, 13.0, 14.0, 10.0, 5.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012903213500976562, -0.0012526065111160278, -0.0012148916721343994, -0.001177176833152771, -0.0011394619941711426, -0.0011017471551895142, -0.0010640323162078857, -0.0010263174772262573, -0.000988602638244629, -0.0009508877992630005, -0.0009131729602813721, -0.0008754581212997437, -0.0008377432823181152, -0.0008000284433364868, -0.0007623136043548584, -0.00072459876537323, -0.0006868839263916016, -0.0006491690874099731, -0.0006114542484283447, -0.0005737394094467163, -0.0005360245704650879, -0.0004983097314834595, -0.00046059489250183105, -0.00042288005352020264, -0.0003851652145385742, -0.0003474503755569458, -0.0003097355365753174, -0.00027202069759368896, -0.00023430585861206055, -0.00019659101963043213, -0.0001588761806488037, -0.00012116134166717529, -8.344650268554688e-05, -4.573166370391846e-05, -8.016824722290039e-06, 2.969801425933838e-05, 6.74128532409668e-05, 0.00010512769222259521, 0.00014284253120422363, 0.00018055737018585205, 0.00021827220916748047, 0.0002559870481491089, 0.0002937018871307373, 0.0003314167261123657, 0.00036913156509399414, 0.00040684640407562256, 0.000444561243057251, 0.0004822760820388794, 0.0005199909210205078, 0.0005577057600021362, 0.0005954205989837646, 0.0006331354379653931, 0.0006708502769470215, 0.0007085651159286499, 0.0007462799549102783, 0.0007839947938919067, 0.0008217096328735352, 0.0008594244718551636, 0.000897139310836792, 0.0009348541498184204, 0.0009725689888000488, 0.0010102838277816772, 0.0010479986667633057, 0.001085713505744934, 0.0011234283447265625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 7.0, 5.0, 8.0, 10.0, 14.0, 9.0, 16.0, 25.0, 29.0, 34.0, 58.0, 81.0, 77.0, 153.0, 193.0, 416.0, 3361.0, 463024.0, 575665.0, 4175.0, 514.0, 201.0, 143.0, 81.0, 59.0, 46.0, 31.0, 22.0, 18.0, 22.0, 8.0, 10.0, 11.0, 4.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208892822265625, -0.02019357681274414, -0.01949787139892578, -0.018802165985107422, -0.018106460571289062, -0.017410755157470703, -0.016715049743652344, -0.016019344329833984, -0.015323638916015625, -0.014627933502197266, -0.013932228088378906, -0.013236522674560547, -0.012540817260742188, -0.011845111846923828, -0.011149406433105469, -0.01045370101928711, -0.00975799560546875, -0.00906229019165039, -0.008366584777832031, -0.007670879364013672, -0.0069751739501953125, -0.006279468536376953, -0.005583763122558594, -0.004888057708740234, -0.004192352294921875, -0.0034966468811035156, -0.0028009414672851562, -0.002105236053466797, -0.0014095306396484375, -0.0007138252258300781, -1.811981201171875e-05, 0.0006775856018066406, 0.001373291015625, 0.0020689964294433594, 0.0027647018432617188, 0.003460407257080078, 0.0041561126708984375, 0.004851818084716797, 0.005547523498535156, 0.006243228912353516, 0.006938934326171875, 0.007634639739990234, 0.008330345153808594, 0.009026050567626953, 0.009721755981445312, 0.010417461395263672, 0.011113166809082031, 0.01180887222290039, 0.01250457763671875, 0.01320028305053711, 0.013895988464355469, 0.014591693878173828, 0.015287399291992188, 0.015983104705810547, 0.016678810119628906, 0.017374515533447266, 0.018070220947265625, 0.018765926361083984, 0.019461631774902344, 0.020157337188720703, 0.020853042602539062, 0.021548748016357422, 0.02224445343017578, 0.02294015884399414, 0.0236358642578125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 111.0, 787.0, 117.0], "bins": [-0.016888847574591637, -0.01661873236298561, -0.016348615288734436, -0.01607850007712841, -0.015808383002877235, -0.01553826779127121, -0.01526815164834261, -0.014998035505414009, -0.014727920293807983, -0.014457804150879383, -0.014187688007950783, -0.013917572796344757, -0.013647456653416157, -0.013377340510487556, -0.013107224367558956, -0.012837108224630356, -0.01256699301302433, -0.01229687687009573, -0.01202676072716713, -0.011756645515561104, -0.011486529372632504, -0.011216413229703903, -0.010946297086775303, -0.010676180943846703, -0.010406064800918102, -0.010135948657989502, -0.009865832515060902, -0.009595717303454876, -0.009325601160526276, -0.009055485017597675, -0.008785368874669075, -0.00851525366306305, -0.008245136588811874, -0.007975020445883274, -0.007704904768615961, -0.007434788625687361, -0.007164672948420048, -0.0068945568054914474, -0.006624440662562847, -0.006354324985295534, -0.006084209308028221, -0.005814093165099621, -0.005543977487832308, -0.0052738613449037075, -0.0050037456676363945, -0.004733629524707794, -0.004463513381779194, -0.004193397704511881, -0.0039232815615832806, -0.003653165651485324, -0.0033830497413873672, -0.003112933598458767, -0.002842817921191454, -0.0025727017782628536, -0.002302585868164897, -0.0020324699580669403, -0.0017623540479689837, -0.001492238137871027, -0.0012221222277730703, -0.0009520062012597919, -0.0006818902911618352, -0.00041177438106387854, -0.00014165835455060005, 0.0001284575555473566, 0.0003985734365414828]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 10.0, 12.0, 26.0, 12.0, 23.0, 24.0, 45.0, 27.0, 27.0, 37.0, 42.0, 40.0, 42.0, 33.0, 45.0, 58.0, 40.0, 49.0, 39.0, 51.0, 45.0, 46.0, 32.0, 27.0, 21.0, 21.0, 21.0, 13.0, 20.0, 16.0, 8.0, 4.0, 6.0, 8.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005409121513366699, -0.0005204863846302032, -0.0005000606179237366, -0.0004796348512172699, -0.0004592090845108032, -0.00043878331780433655, -0.0004183575510978699, -0.0003979317843914032, -0.0003775060176849365, -0.00035708025097846985, -0.0003366544842720032, -0.0003162287175655365, -0.0002958029508590698, -0.00027537718415260315, -0.0002549514174461365, -0.0002345256507396698, -0.00021409988403320312, -0.00019367411732673645, -0.00017324835062026978, -0.0001528225839138031, -0.00013239681720733643, -0.00011197105050086975, -9.154528379440308e-05, -7.11195170879364e-05, -5.0693750381469727e-05, -3.0267983675003052e-05, -9.842216968536377e-06, 1.0583549737930298e-05, 3.100931644439697e-05, 5.143508315086365e-05, 7.186084985733032e-05, 9.2286616563797e-05, 0.00011271238327026367, 0.00013313814997673035, 0.00015356391668319702, 0.0001739896833896637, 0.00019441545009613037, 0.00021484121680259705, 0.00023526698350906372, 0.0002556927502155304, 0.00027611851692199707, 0.00029654428362846375, 0.0003169700503349304, 0.0003373958170413971, 0.00035782158374786377, 0.00037824735045433044, 0.0003986731171607971, 0.0004190988838672638, 0.00043952465057373047, 0.00045995041728019714, 0.0004803761839866638, 0.0005008019506931305, 0.0005212277173995972, 0.0005416534841060638, 0.0005620792508125305, 0.0005825050175189972, 0.0006029307842254639, 0.0006233565509319305, 0.0006437823176383972, 0.0006642080843448639, 0.0006846338510513306, 0.0007050596177577972, 0.0007254853844642639, 0.0007459111511707306, 0.0007663369178771973]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 4.0, 10.0, 12.0, 14.0, 15.0, 19.0, 18.0, 17.0, 22.0, 25.0, 33.0, 28.0, 33.0, 34.0, 35.0, 60.0, 34.0, 42.0, 42.0, 46.0, 46.0, 42.0, 47.0, 36.0, 32.0, 26.0, 29.0, 36.0, 21.0, 21.0, 14.0, 16.0, 18.0, 7.0, 4.0, 13.0, 8.0, 3.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8359375, -6.6302490234375, -6.424560546875, -6.2188720703125, -6.01318359375, -5.8074951171875, -5.601806640625, -5.3961181640625, -5.1904296875, -4.9847412109375, -4.779052734375, -4.5733642578125, -4.36767578125, -4.1619873046875, -3.956298828125, -3.7506103515625, -3.544921875, -3.3392333984375, -3.133544921875, -2.9278564453125, -2.72216796875, -2.5164794921875, -2.310791015625, -2.1051025390625, -1.8994140625, -1.6937255859375, -1.488037109375, -1.2823486328125, -1.07666015625, -0.8709716796875, -0.665283203125, -0.4595947265625, -0.25390625, -0.0482177734375, 0.157470703125, 0.3631591796875, 0.56884765625, 0.7745361328125, 0.980224609375, 1.1859130859375, 1.3916015625, 1.5972900390625, 1.802978515625, 2.0086669921875, 2.21435546875, 2.4200439453125, 2.625732421875, 2.8314208984375, 3.037109375, 3.2427978515625, 3.448486328125, 3.6541748046875, 3.85986328125, 4.0655517578125, 4.271240234375, 4.4769287109375, 4.6826171875, 4.8883056640625, 5.093994140625, 5.2996826171875, 5.50537109375, 5.7110595703125, 5.916748046875, 6.1224365234375, 6.328125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 2.0, 9.0, 11.0, 18.0, 15.0, 18.0, 24.0, 39.0, 49.0, 55.0, 81.0, 143.0, 200.0, 311.0, 643.0, 1240.0, 2626.0, 5773.0, 13079.0, 30428.0, 79600.0, 289188.0, 438974.0, 113986.0, 40489.0, 17114.0, 7540.0, 3399.0, 1601.0, 795.0, 400.0, 231.0, 128.0, 93.0, 54.0, 40.0, 34.0, 43.0, 27.0, 11.0, 9.0, 7.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.98828125, -6.77752685546875, -6.5667724609375, -6.35601806640625, -6.145263671875, -5.93450927734375, -5.7237548828125, -5.51300048828125, -5.30224609375, -5.09149169921875, -4.8807373046875, -4.66998291015625, -4.459228515625, -4.24847412109375, -4.0377197265625, -3.82696533203125, -3.6162109375, -3.40545654296875, -3.1947021484375, -2.98394775390625, -2.773193359375, -2.56243896484375, -2.3516845703125, -2.14093017578125, -1.93017578125, -1.71942138671875, -1.5086669921875, -1.29791259765625, -1.087158203125, -0.87640380859375, -0.6656494140625, -0.45489501953125, -0.244140625, -0.03338623046875, 0.1773681640625, 0.38812255859375, 0.598876953125, 0.80963134765625, 1.0203857421875, 1.23114013671875, 1.44189453125, 1.65264892578125, 1.8634033203125, 2.07415771484375, 2.284912109375, 2.49566650390625, 2.7064208984375, 2.91717529296875, 3.1279296875, 3.33868408203125, 3.5494384765625, 3.76019287109375, 3.970947265625, 4.18170166015625, 4.3924560546875, 4.60321044921875, 4.81396484375, 5.02471923828125, 5.2354736328125, 5.44622802734375, 5.656982421875, 5.86773681640625, 6.0784912109375, 6.28924560546875, 6.5]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 4.0, 7.0, 13.0, 10.0, 14.0, 19.0, 17.0, 18.0, 30.0, 28.0, 36.0, 39.0, 30.0, 35.0, 49.0, 41.0, 51.0, 82.0, 240.0, 1604.0, 191.0, 48.0, 56.0, 39.0, 34.0, 38.0, 40.0, 22.0, 31.0, 25.0, 24.0, 18.0, 16.0, 16.0, 14.0, 13.0, 8.0, 9.0, 1.0, 9.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.8125, -16.239990234375, -15.66748046875, -15.094970703125, -14.5224609375, -13.949951171875, -13.37744140625, -12.804931640625, -12.232421875, -11.659912109375, -11.08740234375, -10.514892578125, -9.9423828125, -9.369873046875, -8.79736328125, -8.224853515625, -7.65234375, -7.079833984375, -6.50732421875, -5.934814453125, -5.3623046875, -4.789794921875, -4.21728515625, -3.644775390625, -3.072265625, -2.499755859375, -1.92724609375, -1.354736328125, -0.7822265625, -0.209716796875, 0.36279296875, 0.935302734375, 1.5078125, 2.080322265625, 2.65283203125, 3.225341796875, 3.7978515625, 4.370361328125, 4.94287109375, 5.515380859375, 6.087890625, 6.660400390625, 7.23291015625, 7.805419921875, 8.3779296875, 8.950439453125, 9.52294921875, 10.095458984375, 10.66796875, 11.240478515625, 11.81298828125, 12.385498046875, 12.9580078125, 13.530517578125, 14.10302734375, 14.675537109375, 15.248046875, 15.820556640625, 16.39306640625, 16.965576171875, 17.5380859375, 18.110595703125, 18.68310546875, 19.255615234375, 19.828125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 2.0, 5.0, 11.0, 8.0, 11.0, 16.0, 17.0, 23.0, 32.0, 36.0, 38.0, 72.0, 79.0, 104.0, 151.0, 258.0, 444.0, 1274.0, 8152.0, 1674827.0, 1449424.0, 8108.0, 1254.0, 437.0, 234.0, 145.0, 128.0, 88.0, 68.0, 48.0, 42.0, 39.0, 21.0, 29.0, 16.0, 14.0, 12.0, 1.0, 9.0, 5.0, 4.0, 3.0, 1.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-52.9375, -51.4248046875, -49.912109375, -48.3994140625, -46.88671875, -45.3740234375, -43.861328125, -42.3486328125, -40.8359375, -39.3232421875, -37.810546875, -36.2978515625, -34.78515625, -33.2724609375, -31.759765625, -30.2470703125, -28.734375, -27.2216796875, -25.708984375, -24.1962890625, -22.68359375, -21.1708984375, -19.658203125, -18.1455078125, -16.6328125, -15.1201171875, -13.607421875, -12.0947265625, -10.58203125, -9.0693359375, -7.556640625, -6.0439453125, -4.53125, -3.0185546875, -1.505859375, 0.0068359375, 1.51953125, 3.0322265625, 4.544921875, 6.0576171875, 7.5703125, 9.0830078125, 10.595703125, 12.1083984375, 13.62109375, 15.1337890625, 16.646484375, 18.1591796875, 19.671875, 21.1845703125, 22.697265625, 24.2099609375, 25.72265625, 27.2353515625, 28.748046875, 30.2607421875, 31.7734375, 33.2861328125, 34.798828125, 36.3115234375, 37.82421875, 39.3369140625, 40.849609375, 42.3623046875, 43.875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [3.0, 219.0, 786.0, 11.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.13313865661621, -12.336052894592285, -2.5389671325683594, 7.258119583129883, 17.055204391479492, 26.8522891998291, 36.649375915527344, 46.44645690917969, 56.24354553222656, 66.04063415527344, 75.83771514892578, 85.63480377197266, 95.431884765625, 105.22897338867188, 115.02606201171875, 124.8231430053711, 134.6202392578125, 144.41732788085938, 154.21441650390625, 164.01150512695312, 173.80857849121094, 183.6056671142578, 193.4027557373047, 203.1998291015625, 212.99691772460938, 222.79400634765625, 232.59109497070312, 242.38818359375, 252.1852569580078, 261.98236083984375, 271.7794189453125, 281.5765075683594, 291.3736267089844, 301.17071533203125, 310.9678039550781, 320.764892578125, 330.5619812011719, 340.35906982421875, 350.1561279296875, 359.9532165527344, 369.75030517578125, 379.5473937988281, 389.344482421875, 399.1415710449219, 408.93865966796875, 418.7357177734375, 428.5328369140625, 438.32989501953125, 448.12701416015625, 457.9241027832031, 467.72119140625, 477.5182800292969, 487.31536865234375, 497.1124267578125, 506.9095458984375, 516.7066040039062, 526.503662109375, 536.3007202148438, 546.0978393554688, 555.8948974609375, 565.6920166015625, 575.4890747070312, 585.2861938476562, 595.083251953125, 604.88037109375]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 8.0, 7.0, 18.0, 11.0, 11.0, 20.0, 21.0, 13.0, 18.0, 29.0, 30.0, 28.0, 31.0, 37.0, 34.0, 55.0, 33.0, 42.0, 35.0, 31.0, 46.0, 46.0, 43.0, 42.0, 41.0, 33.0, 30.0, 26.0, 24.0, 21.0, 17.0, 22.0, 20.0, 16.0, 13.0, 9.0, 4.0, 8.0, 6.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.55403137207031, -44.99959182739258, -43.445152282714844, -41.890708923339844, -40.33626937866211, -38.781829833984375, -37.22739028930664, -35.672950744628906, -34.118507385253906, -32.56406784057617, -31.009626388549805, -29.45518684387207, -27.900745391845703, -26.34630584716797, -24.791866302490234, -23.2374267578125, -21.682987213134766, -20.12854766845703, -18.574106216430664, -17.01966667175293, -15.465226173400879, -13.910785675048828, -12.356346130371094, -10.801905632019043, -9.247465133666992, -7.693024635314941, -6.138584613800049, -4.584144592285156, -3.0297040939331055, -1.4752635955810547, 0.07917594909667969, 1.6336164474487305, 3.1880569458007812, 4.742497444152832, 6.296937465667725, 7.851377487182617, 9.405817985534668, 10.960258483886719, 12.514698028564453, 14.069138526916504, 15.623579025268555, 17.17801856994629, 18.732460021972656, 20.28689956665039, 21.841339111328125, 23.395780563354492, 24.950220108032227, 26.504661560058594, 28.059101104736328, 29.613540649414062, 31.16798210144043, 32.72241973876953, 34.27686309814453, 35.831302642822266, 37.3857421875, 38.940181732177734, 40.49462127685547, 42.0490608215332, 43.60350036621094, 45.15794372558594, 46.71238327026367, 48.266822814941406, 49.82126235961914, 51.375701904296875, 52.930145263671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 8.0, 8.0, 11.0, 16.0, 14.0, 24.0, 17.0, 19.0, 23.0, 22.0, 34.0, 33.0, 26.0, 31.0, 34.0, 47.0, 44.0, 44.0, 48.0, 53.0, 46.0, 47.0, 30.0, 24.0, 39.0, 43.0, 29.0, 29.0, 21.0, 21.0, 23.0, 8.0, 8.0, 14.0, 8.0, 7.0, 12.0, 11.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.37109375, -7.15032958984375, -6.9295654296875, -6.70880126953125, -6.488037109375, -6.26727294921875, -6.0465087890625, -5.82574462890625, -5.60498046875, -5.38421630859375, -5.1634521484375, -4.94268798828125, -4.721923828125, -4.50115966796875, -4.2803955078125, -4.05963134765625, -3.8388671875, -3.61810302734375, -3.3973388671875, -3.17657470703125, -2.955810546875, -2.73504638671875, -2.5142822265625, -2.29351806640625, -2.07275390625, -1.85198974609375, -1.6312255859375, -1.41046142578125, -1.189697265625, -0.96893310546875, -0.7481689453125, -0.52740478515625, -0.306640625, -0.08587646484375, 0.1348876953125, 0.35565185546875, 0.576416015625, 0.79718017578125, 1.0179443359375, 1.23870849609375, 1.45947265625, 1.68023681640625, 1.9010009765625, 2.12176513671875, 2.342529296875, 2.56329345703125, 2.7840576171875, 3.00482177734375, 3.2255859375, 3.44635009765625, 3.6671142578125, 3.88787841796875, 4.108642578125, 4.32940673828125, 4.5501708984375, 4.77093505859375, 4.99169921875, 5.21246337890625, 5.4332275390625, 5.65399169921875, 5.874755859375, 6.09552001953125, 6.3162841796875, 6.53704833984375, 6.7578125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 13.0, 13.0, 21.0, 12.0, 24.0, 40.0, 50.0, 94.0, 115.0, 223.0, 479.0, 962.0, 2576.0, 7575.0, 29735.0, 203845.0, 2343875.0, 1461936.0, 112385.0, 20366.0, 5913.0, 2056.0, 841.0, 420.0, 222.0, 142.0, 86.0, 58.0, 33.0, 24.0, 27.0, 12.0, 12.0, 8.0, 12.0, 5.0, 10.0, 6.0, 7.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-18.921875, -18.36328125, -17.8046875, -17.24609375, -16.6875, -16.12890625, -15.5703125, -15.01171875, -14.453125, -13.89453125, -13.3359375, -12.77734375, -12.21875, -11.66015625, -11.1015625, -10.54296875, -9.984375, -9.42578125, -8.8671875, -8.30859375, -7.75, -7.19140625, -6.6328125, -6.07421875, -5.515625, -4.95703125, -4.3984375, -3.83984375, -3.28125, -2.72265625, -2.1640625, -1.60546875, -1.046875, -0.48828125, 0.0703125, 0.62890625, 1.1875, 1.74609375, 2.3046875, 2.86328125, 3.421875, 3.98046875, 4.5390625, 5.09765625, 5.65625, 6.21484375, 6.7734375, 7.33203125, 7.890625, 8.44921875, 9.0078125, 9.56640625, 10.125, 10.68359375, 11.2421875, 11.80078125, 12.359375, 12.91796875, 13.4765625, 14.03515625, 14.59375, 15.15234375, 15.7109375, 16.26953125, 16.828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 10.0, 10.0, 17.0, 31.0, 45.0, 59.0, 112.0, 186.0, 322.0, 568.0, 818.0, 752.0, 437.0, 258.0, 180.0, 94.0, 62.0, 45.0, 30.0, 13.0, 11.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.46875, -23.8377685546875, -23.206787109375, -22.5758056640625, -21.94482421875, -21.3138427734375, -20.682861328125, -20.0518798828125, -19.4208984375, -18.7899169921875, -18.158935546875, -17.5279541015625, -16.89697265625, -16.2659912109375, -15.635009765625, -15.0040283203125, -14.373046875, -13.7420654296875, -13.111083984375, -12.4801025390625, -11.84912109375, -11.2181396484375, -10.587158203125, -9.9561767578125, -9.3251953125, -8.6942138671875, -8.063232421875, -7.4322509765625, -6.80126953125, -6.1702880859375, -5.539306640625, -4.9083251953125, -4.27734375, -3.6463623046875, -3.015380859375, -2.3843994140625, -1.75341796875, -1.1224365234375, -0.491455078125, 0.1395263671875, 0.7705078125, 1.4014892578125, 2.032470703125, 2.6634521484375, 3.29443359375, 3.9254150390625, 4.556396484375, 5.1873779296875, 5.818359375, 6.4493408203125, 7.080322265625, 7.7113037109375, 8.34228515625, 8.9732666015625, 9.604248046875, 10.2352294921875, 10.8662109375, 11.4971923828125, 12.128173828125, 12.7591552734375, 13.39013671875, 14.0211181640625, 14.652099609375, 15.2830810546875, 15.9140625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 10.0, 17.0, 26.0, 61.0, 64.0, 102.0, 205.0, 395.0, 936.0, 14244.0, 4030065.0, 145167.0, 1920.0, 497.0, 260.0, 119.0, 68.0, 48.0, 25.0, 19.0, 11.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.1875, -71.30078125, -68.4140625, -65.52734375, -62.640625, -59.75390625, -56.8671875, -53.98046875, -51.09375, -48.20703125, -45.3203125, -42.43359375, -39.546875, -36.66015625, -33.7734375, -30.88671875, -28.0, -25.11328125, -22.2265625, -19.33984375, -16.453125, -13.56640625, -10.6796875, -7.79296875, -4.90625, -2.01953125, 0.8671875, 3.75390625, 6.640625, 9.52734375, 12.4140625, 15.30078125, 18.1875, 21.07421875, 23.9609375, 26.84765625, 29.734375, 32.62109375, 35.5078125, 38.39453125, 41.28125, 44.16796875, 47.0546875, 49.94140625, 52.828125, 55.71484375, 58.6015625, 61.48828125, 64.375, 67.26171875, 70.1484375, 73.03515625, 75.921875, 78.80859375, 81.6953125, 84.58203125, 87.46875, 90.35546875, 93.2421875, 96.12890625, 99.015625, 101.90234375, 104.7890625, 107.67578125, 110.5625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 13.0, 73.0, 260.0, 391.0, 208.0, 60.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-344.0726623535156, -337.2384033203125, -330.40411376953125, -323.56982421875, -316.7355651855469, -309.90130615234375, -303.0670166015625, -296.23272705078125, -289.3984680175781, -282.564208984375, -275.72991943359375, -268.8956298828125, -262.0613708496094, -255.2270965576172, -248.392822265625, -241.5585479736328, -234.72427368164062, -227.88999938964844, -221.05572509765625, -214.22145080566406, -207.38717651367188, -200.5529022216797, -193.7186279296875, -186.8843536376953, -180.05007934570312, -173.21580505371094, -166.38153076171875, -159.54725646972656, -152.71298217773438, -145.8787078857422, -139.04443359375, -132.2101593017578, -125.37590026855469, -118.5416259765625, -111.70735168457031, -104.87307739257812, -98.03880310058594, -91.20452880859375, -84.37025451660156, -77.53598022460938, -70.70170593261719, -63.867431640625, -57.03315734863281, -50.198883056640625, -43.36460876464844, -36.53033447265625, -29.696060180664062, -22.861785888671875, -16.027511596679688, -9.1932373046875, -2.3589630126953125, 4.475311279296875, 11.309585571289062, 18.14385986328125, 24.978134155273438, 31.812408447265625, 38.64668273925781, 45.48095703125, 52.31523132324219, 59.149505615234375, 65.98377990722656, 72.81805419921875, 79.65232849121094, 86.48660278320312, 93.32087707519531]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 8.0, 16.0, 10.0, 7.0, 14.0, 16.0, 12.0, 19.0, 24.0, 23.0, 21.0, 23.0, 38.0, 26.0, 32.0, 29.0, 30.0, 35.0, 31.0, 41.0, 46.0, 34.0, 42.0, 40.0, 36.0, 35.0, 38.0, 30.0, 26.0, 24.0, 29.0, 21.0, 17.0, 28.0, 24.0, 15.0, 15.0, 7.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-38.93145751953125, -37.70090866088867, -36.470359802246094, -35.23981475830078, -34.0092658996582, -32.778717041015625, -31.54817008972168, -30.317623138427734, -29.087074279785156, -27.856525421142578, -26.625978469848633, -25.395431518554688, -24.16488265991211, -22.93433380126953, -21.703786849975586, -20.47323989868164, -19.242691040039062, -18.012142181396484, -16.78159523010254, -15.551047325134277, -14.320499420166016, -13.089951515197754, -11.859403610229492, -10.62885570526123, -9.398307800292969, -8.167759895324707, -6.937211990356445, -5.706664085388184, -4.476116180419922, -3.24556827545166, -2.0150203704833984, -0.7844724655151367, 0.446075439453125, 1.6766233444213867, 2.9071712493896484, 4.13771915435791, 5.368267059326172, 6.598814964294434, 7.829362869262695, 9.059910774230957, 10.290458679199219, 11.52100658416748, 12.751554489135742, 13.982102394104004, 15.212650299072266, 16.443199157714844, 17.67374610900879, 18.904293060302734, 20.134841918945312, 21.36539077758789, 22.595937728881836, 23.82648468017578, 25.05703353881836, 26.287582397460938, 27.518129348754883, 28.748676300048828, 29.979225158691406, 31.209774017333984, 32.44032287597656, 33.670867919921875, 34.90141677856445, 36.13196563720703, 37.362510681152344, 38.59305953979492, 39.8236083984375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 7.0, 12.0, 6.0, 9.0, 19.0, 8.0, 18.0, 21.0, 27.0, 22.0, 40.0, 42.0, 36.0, 45.0, 38.0, 59.0, 47.0, 48.0, 60.0, 53.0, 59.0, 41.0, 36.0, 42.0, 37.0, 31.0, 23.0, 28.0, 20.0, 10.0, 11.0, 12.0, 8.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.34320068359375, -6.0731201171875, -5.80303955078125, -5.532958984375, -5.26287841796875, -4.9927978515625, -4.72271728515625, -4.45263671875, -4.18255615234375, -3.9124755859375, -3.64239501953125, -3.372314453125, -3.10223388671875, -2.8321533203125, -2.56207275390625, -2.2919921875, -2.02191162109375, -1.7518310546875, -1.48175048828125, -1.211669921875, -0.94158935546875, -0.6715087890625, -0.40142822265625, -0.13134765625, 0.13873291015625, 0.4088134765625, 0.67889404296875, 0.948974609375, 1.21905517578125, 1.4891357421875, 1.75921630859375, 2.029296875, 2.29937744140625, 2.5694580078125, 2.83953857421875, 3.109619140625, 3.37969970703125, 3.6497802734375, 3.91986083984375, 4.18994140625, 4.46002197265625, 4.7301025390625, 5.00018310546875, 5.270263671875, 5.54034423828125, 5.8104248046875, 6.08050537109375, 6.3505859375, 6.62066650390625, 6.8907470703125, 7.16082763671875, 7.430908203125, 7.70098876953125, 7.9710693359375, 8.24114990234375, 8.51123046875, 8.78131103515625, 9.0513916015625, 9.32147216796875, 9.591552734375, 9.86163330078125, 10.1317138671875, 10.40179443359375, 10.671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 19.0, 27.0, 34.0, 41.0, 102.0, 163.0, 270.0, 486.0, 778.0, 1337.0, 2234.0, 3850.0, 6536.0, 11564.0, 21165.0, 39941.0, 77894.0, 148132.0, 239583.0, 221042.0, 128362.0, 67212.0, 34928.0, 18441.0, 10263.0, 5904.0, 3433.0, 2015.0, 1139.0, 667.0, 397.0, 230.0, 130.0, 83.0, 43.0, 30.0, 21.0, 10.0, 9.0, 8.0, 6.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.339111328125, -0.32813262939453125, -0.3171539306640625, -0.30617523193359375, -0.295196533203125, -0.28421783447265625, -0.2732391357421875, -0.26226043701171875, -0.25128173828125, -0.24030303955078125, -0.2293243408203125, -0.21834564208984375, -0.207366943359375, -0.19638824462890625, -0.1854095458984375, -0.17443084716796875, -0.1634521484375, -0.15247344970703125, -0.1414947509765625, -0.13051605224609375, -0.119537353515625, -0.10855865478515625, -0.0975799560546875, -0.08660125732421875, -0.07562255859375, -0.06464385986328125, -0.0536651611328125, -0.04268646240234375, -0.031707763671875, -0.02072906494140625, -0.0097503662109375, 0.00122833251953125, 0.01220703125, 0.02318572998046875, 0.0341644287109375, 0.04514312744140625, 0.056121826171875, 0.06710052490234375, 0.0780792236328125, 0.08905792236328125, 0.10003662109375, 0.11101531982421875, 0.1219940185546875, 0.13297271728515625, 0.143951416015625, 0.15493011474609375, 0.1659088134765625, 0.17688751220703125, 0.1878662109375, 0.19884490966796875, 0.2098236083984375, 0.22080230712890625, 0.231781005859375, 0.24275970458984375, 0.2537384033203125, 0.26471710205078125, 0.27569580078125, 0.28667449951171875, 0.2976531982421875, 0.30863189697265625, 0.319610595703125, 0.33058929443359375, 0.3415679931640625, 0.35254669189453125, 0.363525390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 6.0, 2.0, 6.0, 6.0, 11.0, 11.0, 8.0, 12.0, 26.0, 22.0, 22.0, 25.0, 23.0, 37.0, 31.0, 39.0, 35.0, 40.0, 46.0, 66.0, 1050.0, 40.0, 42.0, 48.0, 29.0, 41.0, 34.0, 34.0, 39.0, 26.0, 24.0, 22.0, 18.0, 20.0, 14.0, 14.0, 13.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.1484375, -4.99810791015625, -4.8477783203125, -4.69744873046875, -4.547119140625, -4.39678955078125, -4.2464599609375, -4.09613037109375, -3.94580078125, -3.79547119140625, -3.6451416015625, -3.49481201171875, -3.344482421875, -3.19415283203125, -3.0438232421875, -2.89349365234375, -2.7431640625, -2.59283447265625, -2.4425048828125, -2.29217529296875, -2.141845703125, -1.99151611328125, -1.8411865234375, -1.69085693359375, -1.54052734375, -1.39019775390625, -1.2398681640625, -1.08953857421875, -0.939208984375, -0.78887939453125, -0.6385498046875, -0.48822021484375, -0.337890625, -0.18756103515625, -0.0372314453125, 0.11309814453125, 0.263427734375, 0.41375732421875, 0.5640869140625, 0.71441650390625, 0.86474609375, 1.01507568359375, 1.1654052734375, 1.31573486328125, 1.466064453125, 1.61639404296875, 1.7667236328125, 1.91705322265625, 2.0673828125, 2.21771240234375, 2.3680419921875, 2.51837158203125, 2.668701171875, 2.81903076171875, 2.9693603515625, 3.11968994140625, 3.27001953125, 3.42034912109375, 3.5706787109375, 3.72100830078125, 3.871337890625, 4.02166748046875, 4.1719970703125, 4.32232666015625, 4.47265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 11.0, 17.0, 22.0, 40.0, 47.0, 101.0, 127.0, 221.0, 338.0, 459.0, 718.0, 1143.0, 1798.0, 2664.0, 4230.0, 6395.0, 10133.0, 16481.0, 26617.0, 44181.0, 74683.0, 120662.0, 173340.0, 1234756.0, 143229.0, 91772.0, 55392.0, 33105.0, 19901.0, 12477.0, 7821.0, 5054.0, 3256.0, 1990.0, 1322.0, 927.0, 607.0, 413.0, 248.0, 143.0, 104.0, 64.0, 49.0, 28.0, 21.0, 7.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.28076171875, -0.2725543975830078, -0.2643470764160156, -0.25613975524902344, -0.24793243408203125, -0.23972511291503906, -0.23151779174804688, -0.2233104705810547, -0.2151031494140625, -0.2068958282470703, -0.19868850708007812, -0.19048118591308594, -0.18227386474609375, -0.17406654357910156, -0.16585922241210938, -0.1576519012451172, -0.149444580078125, -0.1412372589111328, -0.13302993774414062, -0.12482261657714844, -0.11661529541015625, -0.10840797424316406, -0.10020065307617188, -0.09199333190917969, -0.0837860107421875, -0.07557868957519531, -0.06737136840820312, -0.05916404724121094, -0.05095672607421875, -0.04274940490722656, -0.034542083740234375, -0.026334762573242188, -0.01812744140625, -0.009920120239257812, -0.001712799072265625, 0.0064945220947265625, 0.01470184326171875, 0.022909164428710938, 0.031116485595703125, 0.03932380676269531, 0.0475311279296875, 0.05573844909667969, 0.06394577026367188, 0.07215309143066406, 0.08036041259765625, 0.08856773376464844, 0.09677505493164062, 0.10498237609863281, 0.113189697265625, 0.12139701843261719, 0.12960433959960938, 0.13781166076660156, 0.14601898193359375, 0.15422630310058594, 0.16243362426757812, 0.1706409454345703, 0.1788482666015625, 0.1870555877685547, 0.19526290893554688, 0.20347023010253906, 0.21167755126953125, 0.21988487243652344, 0.22809219360351562, 0.2362995147705078, 0.2445068359375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 8.0, 6.0, 5.0, 13.0, 8.0, 10.0, 14.0, 19.0, 25.0, 26.0, 38.0, 44.0, 37.0, 70.0, 61.0, 67.0, 79.0, 54.0, 60.0, 57.0, 53.0, 51.0, 32.0, 26.0, 27.0, 25.0, 18.0, 8.0, 14.0, 10.0, 4.0, 8.0, 6.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.001613616943359375, -0.0015697330236434937, -0.0015258491039276123, -0.001481965184211731, -0.0014380812644958496, -0.0013941973447799683, -0.001350313425064087, -0.0013064295053482056, -0.0012625455856323242, -0.0012186616659164429, -0.0011747777462005615, -0.0011308938264846802, -0.0010870099067687988, -0.0010431259870529175, -0.0009992420673370361, -0.0009553581476211548, -0.0009114742279052734, -0.0008675903081893921, -0.0008237063884735107, -0.0007798224687576294, -0.000735938549041748, -0.0006920546293258667, -0.0006481707096099854, -0.000604286789894104, -0.0005604028701782227, -0.0005165189504623413, -0.00047263503074645996, -0.0004287511110305786, -0.00038486719131469727, -0.0003409832715988159, -0.00029709935188293457, -0.0002532154321670532, -0.00020933151245117188, -0.00016544759273529053, -0.00012156367301940918, -7.767975330352783e-05, -3.3795833587646484e-05, 1.0088086128234863e-05, 5.397200584411621e-05, 9.785592555999756e-05, 0.0001417398452758789, 0.00018562376499176025, 0.0002295076847076416, 0.00027339160442352295, 0.0003172755241394043, 0.00036115944385528564, 0.000405043363571167, 0.00044892728328704834, 0.0004928112030029297, 0.000536695122718811, 0.0005805790424346924, 0.0006244629621505737, 0.0006683468818664551, 0.0007122308015823364, 0.0007561147212982178, 0.0007999986410140991, 0.0008438825607299805, 0.0008877664804458618, 0.0009316504001617432, 0.0009755343198776245, 0.0010194182395935059, 0.0010633021593093872, 0.0011071860790252686, 0.00115106999874115, 0.0011949539184570312]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 9.0, 12.0, 26.0, 31.0, 38.0, 49.0, 62.0, 98.0, 148.0, 289.0, 662.0, 22591.0, 1012694.0, 10462.0, 547.0, 264.0, 146.0, 113.0, 62.0, 51.0, 41.0, 22.0, 21.0, 21.0, 10.0, 15.0, 8.0, 7.0, 8.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0247650146484375, -0.02382826805114746, -0.022891521453857422, -0.021954774856567383, -0.021018028259277344, -0.020081281661987305, -0.019144535064697266, -0.018207788467407227, -0.017271041870117188, -0.01633429527282715, -0.01539754867553711, -0.01446080207824707, -0.013524055480957031, -0.012587308883666992, -0.011650562286376953, -0.010713815689086914, -0.009777069091796875, -0.008840322494506836, -0.007903575897216797, -0.006966829299926758, -0.006030082702636719, -0.00509333610534668, -0.004156589508056641, -0.0032198429107666016, -0.0022830963134765625, -0.0013463497161865234, -0.0004096031188964844, 0.0005271434783935547, 0.0014638900756835938, 0.002400636672973633, 0.003337383270263672, 0.004274129867553711, 0.00521087646484375, 0.006147623062133789, 0.007084369659423828, 0.008021116256713867, 0.008957862854003906, 0.009894609451293945, 0.010831356048583984, 0.011768102645874023, 0.012704849243164062, 0.013641595840454102, 0.01457834243774414, 0.01551508903503418, 0.01645183563232422, 0.017388582229614258, 0.018325328826904297, 0.019262075424194336, 0.020198822021484375, 0.021135568618774414, 0.022072315216064453, 0.023009061813354492, 0.02394580841064453, 0.02488255500793457, 0.02581930160522461, 0.02675604820251465, 0.027692794799804688, 0.028629541397094727, 0.029566287994384766, 0.030503034591674805, 0.031439781188964844, 0.03237652778625488, 0.03331327438354492, 0.03425002098083496, 0.035186767578125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 638.0, 378.0], "bins": [-0.03230256959795952, -0.03178941458463669, -0.031276263296604156, -0.030763108283281326, -0.030249955132603645, -0.029736801981925964, -0.029223646968603134, -0.028710493817925453, -0.028197340667247772, -0.02768418751657009, -0.02717103250324726, -0.02665787935256958, -0.0261447262018919, -0.025631573051214218, -0.025118418037891388, -0.024605264887213707, -0.024092111736536026, -0.023578958585858345, -0.023065803572535515, -0.022552650421857834, -0.022039497271180153, -0.021526344120502472, -0.02101318910717964, -0.02050003595650196, -0.01998688094317913, -0.01947372779250145, -0.01896057277917862, -0.01844741962850094, -0.017934266477823257, -0.017421113327145576, -0.016907958313822746, -0.016394805163145065, -0.015881650149822235, -0.01536849606782198, -0.014855342917144299, -0.014342188835144043, -0.013829035684466362, -0.013315881602466106, -0.01280272752046585, -0.01228957436978817, -0.011776421219110489, -0.011263267137110233, -0.010750113986432552, -0.010236959904432297, -0.009723806753754616, -0.00921065267175436, -0.008697498589754105, -0.008184345439076424, -0.007671191357076168, -0.0071580377407372, -0.0066448841243982315, -0.006131730042397976, -0.005618576891720295, -0.005105422809720039, -0.004592269193381071, -0.004079115577042103, -0.003565962193533778, -0.00305280857719481, -0.002539654728025198, -0.0020265011116862297, -0.0015133474953472614, -0.0010001938790082932, -0.0004870400298386812, 2.6113586500287056e-05, 0.0005392672610469162]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 3.0, 9.0, 11.0, 15.0, 17.0, 30.0, 39.0, 40.0, 47.0, 29.0, 55.0, 57.0, 70.0, 71.0, 69.0, 62.0, 46.0, 55.0, 46.0, 54.0, 49.0, 25.0, 21.0, 21.0, 16.0, 14.0, 9.0, 10.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007166266441345215, -0.0006812242791056633, -0.0006458219140768051, -0.0006104195490479469, -0.0005750171840190887, -0.0005396148189902306, -0.0005042124539613724, -0.0004688100889325142, -0.000433407723903656, -0.0003980053588747978, -0.00036260299384593964, -0.00032720062881708145, -0.00029179826378822327, -0.0002563958987593651, -0.0002209935337305069, -0.0001855911687016487, -0.00015018880367279053, -0.00011478643864393234, -7.938407361507416e-05, -4.398170858621597e-05, -8.579343557357788e-06, 2.6823021471500397e-05, 6.222538650035858e-05, 9.762775152921677e-05, 0.00013303011655807495, 0.00016843248158693314, 0.00020383484661579132, 0.0002392372116446495, 0.0002746395766735077, 0.0003100419417023659, 0.00034544430673122406, 0.00038084667176008224, 0.00041624903678894043, 0.0004516514018177986, 0.0004870537668466568, 0.000522456131875515, 0.0005578584969043732, 0.0005932608619332314, 0.0006286632269620895, 0.0006640655919909477, 0.0006994679570198059, 0.0007348703220486641, 0.0007702726870775223, 0.0008056750521063805, 0.0008410774171352386, 0.0008764797821640968, 0.000911882147192955, 0.0009472845122218132, 0.0009826868772506714, 0.0010180892422795296, 0.0010534916073083878, 0.001088893972337246, 0.0011242963373661041, 0.0011596987023949623, 0.0011951010674238205, 0.0012305034324526787, 0.0012659057974815369, 0.001301308162510395, 0.0013367105275392532, 0.0013721128925681114, 0.0014075152575969696, 0.0014429176226258278, 0.001478319987654686, 0.0015137223526835442, 0.0015491247177124023]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 7.0, 12.0, 6.0, 9.0, 19.0, 8.0, 18.0, 21.0, 27.0, 22.0, 40.0, 42.0, 36.0, 45.0, 38.0, 59.0, 47.0, 48.0, 60.0, 53.0, 59.0, 41.0, 36.0, 42.0, 37.0, 31.0, 23.0, 28.0, 20.0, 10.0, 11.0, 12.0, 8.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.34320068359375, -6.0731201171875, -5.80303955078125, -5.532958984375, -5.26287841796875, -4.9927978515625, -4.72271728515625, -4.45263671875, -4.18255615234375, -3.9124755859375, -3.64239501953125, -3.372314453125, -3.10223388671875, -2.8321533203125, -2.56207275390625, -2.2919921875, -2.02191162109375, -1.7518310546875, -1.48175048828125, -1.211669921875, -0.94158935546875, -0.6715087890625, -0.40142822265625, -0.13134765625, 0.13873291015625, 0.4088134765625, 0.67889404296875, 0.948974609375, 1.21905517578125, 1.4891357421875, 1.75921630859375, 2.029296875, 2.29937744140625, 2.5694580078125, 2.83953857421875, 3.109619140625, 3.37969970703125, 3.6497802734375, 3.91986083984375, 4.18994140625, 4.46002197265625, 4.7301025390625, 5.00018310546875, 5.270263671875, 5.54034423828125, 5.8104248046875, 6.08050537109375, 6.3505859375, 6.62066650390625, 6.8907470703125, 7.16082763671875, 7.430908203125, 7.70098876953125, 7.9710693359375, 8.24114990234375, 8.51123046875, 8.78131103515625, 9.0513916015625, 9.32147216796875, 9.591552734375, 9.86163330078125, 10.1317138671875, 10.40179443359375, 10.671875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 15.0, 10.0, 21.0, 34.0, 33.0, 57.0, 75.0, 137.0, 231.0, 448.0, 847.0, 1830.0, 3768.0, 9652.0, 30505.0, 197025.0, 699141.0, 75323.0, 17697.0, 6240.0, 2652.0, 1316.0, 633.0, 335.0, 167.0, 110.0, 88.0, 46.0, 25.0, 23.0, 17.0, 11.0, 9.0, 4.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.046875, -11.5703125, -11.09375, -10.6171875, -10.140625, -9.6640625, -9.1875, -8.7109375, -8.234375, -7.7578125, -7.28125, -6.8046875, -6.328125, -5.8515625, -5.375, -4.8984375, -4.421875, -3.9453125, -3.46875, -2.9921875, -2.515625, -2.0390625, -1.5625, -1.0859375, -0.609375, -0.1328125, 0.34375, 0.8203125, 1.296875, 1.7734375, 2.25, 2.7265625, 3.203125, 3.6796875, 4.15625, 4.6328125, 5.109375, 5.5859375, 6.0625, 6.5390625, 7.015625, 7.4921875, 7.96875, 8.4453125, 8.921875, 9.3984375, 9.875, 10.3515625, 10.828125, 11.3046875, 11.78125, 12.2578125, 12.734375, 13.2109375, 13.6875, 14.1640625, 14.640625, 15.1171875, 15.59375, 16.0703125, 16.546875, 17.0234375, 17.5, 17.9765625, 18.453125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 1.0, 7.0, 7.0, 9.0, 9.0, 12.0, 12.0, 12.0, 19.0, 25.0, 20.0, 32.0, 19.0, 28.0, 27.0, 45.0, 56.0, 67.0, 95.0, 163.0, 1658.0, 195.0, 92.0, 53.0, 48.0, 40.0, 31.0, 42.0, 30.0, 34.0, 30.0, 23.0, 19.0, 15.0, 15.0, 10.0, 3.0, 13.0, 8.0, 3.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.296875, -20.60107421875, -19.9052734375, -19.20947265625, -18.513671875, -17.81787109375, -17.1220703125, -16.42626953125, -15.73046875, -15.03466796875, -14.3388671875, -13.64306640625, -12.947265625, -12.25146484375, -11.5556640625, -10.85986328125, -10.1640625, -9.46826171875, -8.7724609375, -8.07666015625, -7.380859375, -6.68505859375, -5.9892578125, -5.29345703125, -4.59765625, -3.90185546875, -3.2060546875, -2.51025390625, -1.814453125, -1.11865234375, -0.4228515625, 0.27294921875, 0.96875, 1.66455078125, 2.3603515625, 3.05615234375, 3.751953125, 4.44775390625, 5.1435546875, 5.83935546875, 6.53515625, 7.23095703125, 7.9267578125, 8.62255859375, 9.318359375, 10.01416015625, 10.7099609375, 11.40576171875, 12.1015625, 12.79736328125, 13.4931640625, 14.18896484375, 14.884765625, 15.58056640625, 16.2763671875, 16.97216796875, 17.66796875, 18.36376953125, 19.0595703125, 19.75537109375, 20.451171875, 21.14697265625, 21.8427734375, 22.53857421875, 23.234375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 10.0, 6.0, 9.0, 12.0, 8.0, 22.0, 23.0, 22.0, 35.0, 44.0, 52.0, 70.0, 103.0, 155.0, 278.0, 879.0, 10442.0, 3053192.0, 77289.0, 1941.0, 421.0, 205.0, 148.0, 76.0, 54.0, 42.0, 33.0, 27.0, 25.0, 15.0, 14.0, 14.0, 7.0, 11.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-89.4375, -87.06640625, -84.6953125, -82.32421875, -79.953125, -77.58203125, -75.2109375, -72.83984375, -70.46875, -68.09765625, -65.7265625, -63.35546875, -60.984375, -58.61328125, -56.2421875, -53.87109375, -51.5, -49.12890625, -46.7578125, -44.38671875, -42.015625, -39.64453125, -37.2734375, -34.90234375, -32.53125, -30.16015625, -27.7890625, -25.41796875, -23.046875, -20.67578125, -18.3046875, -15.93359375, -13.5625, -11.19140625, -8.8203125, -6.44921875, -4.078125, -1.70703125, 0.6640625, 3.03515625, 5.40625, 7.77734375, 10.1484375, 12.51953125, 14.890625, 17.26171875, 19.6328125, 22.00390625, 24.375, 26.74609375, 29.1171875, 31.48828125, 33.859375, 36.23046875, 38.6015625, 40.97265625, 43.34375, 45.71484375, 48.0859375, 50.45703125, 52.828125, 55.19921875, 57.5703125, 59.94140625, 62.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 14.0, 43.0, 90.0, 139.0, 212.0, 209.0, 150.0, 83.0, 39.0, 17.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.482486724853516, -36.93428039550781, -35.386077880859375, -33.83787155151367, -32.28966522216797, -30.7414608001709, -29.193256378173828, -27.645050048828125, -26.096845626831055, -24.548641204833984, -23.00043487548828, -21.45223045349121, -19.90402603149414, -18.355819702148438, -16.807615280151367, -15.25940990447998, -13.711204528808594, -12.162999153137207, -10.61479377746582, -9.06658935546875, -7.518383979797363, -5.970178604125977, -4.421974182128906, -2.8737688064575195, -1.3255634307861328, 0.2226417064666748, 1.7708468437194824, 3.319051742553711, 4.867257118225098, 6.415462493896484, 7.963666915893555, 9.511872291564941, 11.060073852539062, 12.60827922821045, 14.156484603881836, 15.704689025878906, 17.25289535522461, 18.80109977722168, 20.34930419921875, 21.897510528564453, 23.445714950561523, 24.993919372558594, 26.542125701904297, 28.090330123901367, 29.638534545898438, 31.18674087524414, 32.734947204589844, 34.28314971923828, 35.831356048583984, 37.37956237792969, 38.927764892578125, 40.47597122192383, 42.02417755126953, 43.57238006591797, 45.12058639526367, 46.668792724609375, 48.21699523925781, 49.765201568603516, 51.31340408325195, 52.861610412597656, 54.40981674194336, 55.95802307128906, 57.5062255859375, 59.0544319152832, 60.602638244628906]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 5.0, 8.0, 11.0, 15.0, 12.0, 6.0, 15.0, 23.0, 22.0, 22.0, 29.0, 24.0, 30.0, 32.0, 35.0, 27.0, 38.0, 37.0, 41.0, 34.0, 41.0, 42.0, 55.0, 42.0, 38.0, 35.0, 30.0, 17.0, 25.0, 37.0, 28.0, 20.0, 20.0, 11.0, 15.0, 13.0, 13.0, 7.0, 8.0, 6.0, 1.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-60.09169387817383, -58.18912124633789, -56.28654861450195, -54.38397216796875, -52.48139953613281, -50.578826904296875, -48.67625427246094, -46.773681640625, -44.87110900878906, -42.968536376953125, -41.06596374511719, -39.16339111328125, -37.26081466674805, -35.35824203491211, -33.45566940307617, -31.553096771240234, -29.65052032470703, -27.747947692871094, -25.845373153686523, -23.942800521850586, -22.040225982666016, -20.137653350830078, -18.23508071899414, -16.332508087158203, -14.429933547973633, -12.527359962463379, -10.624786376953125, -8.722213745117188, -6.819640159606934, -4.91706657409668, -3.014493942260742, -1.1119203567504883, 0.7906494140625, 2.693222761154175, 4.59579610824585, 6.498369216918945, 8.4009428024292, 10.303516387939453, 12.20608901977539, 14.108662605285645, 16.0112361907959, 17.913808822631836, 19.816383361816406, 21.718955993652344, 23.62152862548828, 25.52410316467285, 27.42667579650879, 29.32925033569336, 31.231822967529297, 33.134395599365234, 35.03696823120117, 36.939544677734375, 38.84211730957031, 40.74468994140625, 42.64726257324219, 44.549835205078125, 46.45240783691406, 48.35498046875, 50.25755310058594, 52.160125732421875, 54.06270217895508, 55.965274810791016, 57.86784744262695, 59.77042007446289, 61.672996520996094]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 8.0, 13.0, 8.0, 9.0, 18.0, 25.0, 19.0, 16.0, 26.0, 33.0, 34.0, 45.0, 42.0, 54.0, 48.0, 47.0, 58.0, 60.0, 42.0, 47.0, 46.0, 41.0, 42.0, 40.0, 23.0, 29.0, 22.0, 18.0, 19.0, 17.0, 13.0, 9.0, 3.0, 6.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.671875, -7.3841552734375, -7.096435546875, -6.8087158203125, -6.52099609375, -6.2332763671875, -5.945556640625, -5.6578369140625, -5.3701171875, -5.0823974609375, -4.794677734375, -4.5069580078125, -4.21923828125, -3.9315185546875, -3.643798828125, -3.3560791015625, -3.068359375, -2.7806396484375, -2.492919921875, -2.2052001953125, -1.91748046875, -1.6297607421875, -1.342041015625, -1.0543212890625, -0.7666015625, -0.4788818359375, -0.191162109375, 0.0965576171875, 0.38427734375, 0.6719970703125, 0.959716796875, 1.2474365234375, 1.53515625, 1.8228759765625, 2.110595703125, 2.3983154296875, 2.68603515625, 2.9737548828125, 3.261474609375, 3.5491943359375, 3.8369140625, 4.1246337890625, 4.412353515625, 4.7000732421875, 4.98779296875, 5.2755126953125, 5.563232421875, 5.8509521484375, 6.138671875, 6.4263916015625, 6.714111328125, 7.0018310546875, 7.28955078125, 7.5772705078125, 7.864990234375, 8.1527099609375, 8.4404296875, 8.7281494140625, 9.015869140625, 9.3035888671875, 9.59130859375, 9.8790283203125, 10.166748046875, 10.4544677734375, 10.7421875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 7.0, 14.0, 7.0, 24.0, 32.0, 57.0, 74.0, 162.0, 272.0, 533.0, 934.0, 1743.0, 3455.0, 6815.0, 14429.0, 33966.0, 94577.0, 356020.0, 1238235.0, 1619793.0, 585649.0, 151768.0, 47917.0, 19258.0, 8784.0, 4550.0, 2296.0, 1280.0, 685.0, 400.0, 212.0, 108.0, 74.0, 40.0, 25.0, 23.0, 18.0, 11.0, 12.0, 6.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4296875, -9.1065673828125, -8.783447265625, -8.4603271484375, -8.13720703125, -7.8140869140625, -7.490966796875, -7.1678466796875, -6.8447265625, -6.5216064453125, -6.198486328125, -5.8753662109375, -5.55224609375, -5.2291259765625, -4.906005859375, -4.5828857421875, -4.259765625, -3.9366455078125, -3.613525390625, -3.2904052734375, -2.96728515625, -2.6441650390625, -2.321044921875, -1.9979248046875, -1.6748046875, -1.3516845703125, -1.028564453125, -0.7054443359375, -0.38232421875, -0.0592041015625, 0.263916015625, 0.5870361328125, 0.91015625, 1.2332763671875, 1.556396484375, 1.8795166015625, 2.20263671875, 2.5257568359375, 2.848876953125, 3.1719970703125, 3.4951171875, 3.8182373046875, 4.141357421875, 4.4644775390625, 4.78759765625, 5.1107177734375, 5.433837890625, 5.7569580078125, 6.080078125, 6.4031982421875, 6.726318359375, 7.0494384765625, 7.37255859375, 7.6956787109375, 8.018798828125, 8.3419189453125, 8.6650390625, 8.9881591796875, 9.311279296875, 9.6343994140625, 9.95751953125, 10.2806396484375, 10.603759765625, 10.9268798828125, 11.25]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 10.0, 6.0, 10.0, 11.0, 9.0, 15.0, 17.0, 26.0, 45.0, 54.0, 56.0, 78.0, 110.0, 126.0, 179.0, 204.0, 287.0, 362.0, 438.0, 409.0, 372.0, 283.0, 223.0, 162.0, 128.0, 89.0, 76.0, 66.0, 44.0, 43.0, 30.0, 25.0, 13.0, 19.0, 18.0, 4.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3203125, -10.943115234375, -10.56591796875, -10.188720703125, -9.8115234375, -9.434326171875, -9.05712890625, -8.679931640625, -8.302734375, -7.925537109375, -7.54833984375, -7.171142578125, -6.7939453125, -6.416748046875, -6.03955078125, -5.662353515625, -5.28515625, -4.907958984375, -4.53076171875, -4.153564453125, -3.7763671875, -3.399169921875, -3.02197265625, -2.644775390625, -2.267578125, -1.890380859375, -1.51318359375, -1.135986328125, -0.7587890625, -0.381591796875, -0.00439453125, 0.372802734375, 0.75, 1.127197265625, 1.50439453125, 1.881591796875, 2.2587890625, 2.635986328125, 3.01318359375, 3.390380859375, 3.767578125, 4.144775390625, 4.52197265625, 4.899169921875, 5.2763671875, 5.653564453125, 6.03076171875, 6.407958984375, 6.78515625, 7.162353515625, 7.53955078125, 7.916748046875, 8.2939453125, 8.671142578125, 9.04833984375, 9.425537109375, 9.802734375, 10.179931640625, 10.55712890625, 10.934326171875, 11.3115234375, 11.688720703125, 12.06591796875, 12.443115234375, 12.8203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 10.0, 7.0, 14.0, 15.0, 23.0, 34.0, 36.0, 61.0, 83.0, 125.0, 164.0, 275.0, 446.0, 948.0, 5323.0, 74960.0, 3273676.0, 809970.0, 23774.0, 2550.0, 695.0, 377.0, 195.0, 156.0, 106.0, 77.0, 42.0, 44.0, 24.0, 23.0, 15.0, 9.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.21875, -53.75830078125, -52.2978515625, -50.83740234375, -49.376953125, -47.91650390625, -46.4560546875, -44.99560546875, -43.53515625, -42.07470703125, -40.6142578125, -39.15380859375, -37.693359375, -36.23291015625, -34.7724609375, -33.31201171875, -31.8515625, -30.39111328125, -28.9306640625, -27.47021484375, -26.009765625, -24.54931640625, -23.0888671875, -21.62841796875, -20.16796875, -18.70751953125, -17.2470703125, -15.78662109375, -14.326171875, -12.86572265625, -11.4052734375, -9.94482421875, -8.484375, -7.02392578125, -5.5634765625, -4.10302734375, -2.642578125, -1.18212890625, 0.2783203125, 1.73876953125, 3.19921875, 4.65966796875, 6.1201171875, 7.58056640625, 9.041015625, 10.50146484375, 11.9619140625, 13.42236328125, 14.8828125, 16.34326171875, 17.8037109375, 19.26416015625, 20.724609375, 22.18505859375, 23.6455078125, 25.10595703125, 26.56640625, 28.02685546875, 29.4873046875, 30.94775390625, 32.408203125, 33.86865234375, 35.3291015625, 36.78955078125, 38.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 228.0, 737.0, 47.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-240.26731872558594, -223.49526977539062, -206.72323608398438, -189.95118713378906, -173.17913818359375, -156.40708923339844, -139.63504028320312, -122.86300659179688, -106.09095764160156, -89.31890869140625, -72.54686737060547, -55.77482223510742, -39.002777099609375, -22.230728149414062, -5.458686828613281, 11.3133544921875, 28.085403442382812, 44.85744857788086, 61.629493713378906, 78.40153503417969, 95.173583984375, 111.94563293457031, 128.71768188476562, 145.48971557617188, 162.2617645263672, 179.0338134765625, 195.80584716796875, 212.57789611816406, 229.34994506835938, 246.1219940185547, 262.89404296875, 279.66607666015625, 296.43817138671875, 313.210205078125, 329.9822692871094, 346.7543029785156, 363.5263671875, 380.29840087890625, 397.0704345703125, 413.84246826171875, 430.6145324707031, 447.3865661621094, 464.15863037109375, 480.9306640625, 497.70269775390625, 514.4747314453125, 531.246826171875, 548.0188598632812, 564.7908935546875, 581.5629272460938, 598.3349609375, 615.1070556640625, 631.8790893554688, 648.651123046875, 665.4231567382812, 682.1951904296875, 698.96728515625, 715.7393188476562, 732.5113525390625, 749.283447265625, 766.0554809570312, 782.8275146484375, 799.5995483398438, 816.37158203125, 833.1436157226562]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 15.0, 15.0, 11.0, 28.0, 13.0, 23.0, 18.0, 27.0, 37.0, 48.0, 39.0, 51.0, 48.0, 46.0, 52.0, 70.0, 49.0, 44.0, 46.0, 49.0, 49.0, 36.0, 38.0, 26.0, 16.0, 12.0, 29.0, 18.0, 18.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.327392578125, -66.49560546875, -64.663818359375, -62.83202362060547, -61.00023651123047, -59.16844940185547, -57.3366584777832, -55.50486755371094, -53.67308044433594, -51.84129333496094, -50.00950241088867, -48.177711486816406, -46.345924377441406, -44.514137268066406, -42.68234634399414, -40.850555419921875, -39.018768310546875, -37.186981201171875, -35.35519027709961, -33.523399353027344, -31.691612243652344, -29.85982322692871, -28.028034210205078, -26.196245193481445, -24.364456176757812, -22.53266716003418, -20.700878143310547, -18.869089126586914, -17.03730010986328, -15.205511093139648, -13.373722076416016, -11.541933059692383, -9.71014404296875, -7.878355026245117, -6.046566009521484, -4.214776992797852, -2.3829879760742188, -0.5511989593505859, 1.2805900573730469, 3.1123790740966797, 4.9441680908203125, 6.775957107543945, 8.607746124267578, 10.439535140991211, 12.271324157714844, 14.103113174438477, 15.93490219116211, 17.766691207885742, 19.598480224609375, 21.430269241333008, 23.26205825805664, 25.093847274780273, 26.925636291503906, 28.75742530822754, 30.589214324951172, 32.42100524902344, 34.25279235839844, 36.08457946777344, 37.9163703918457, 39.74816131591797, 41.57994842529297, 43.41173553466797, 45.243526458740234, 47.0753173828125, 48.9071044921875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 6.0, 4.0, 7.0, 11.0, 8.0, 13.0, 13.0, 9.0, 10.0, 13.0, 21.0, 26.0, 26.0, 30.0, 27.0, 34.0, 26.0, 26.0, 49.0, 37.0, 41.0, 38.0, 39.0, 43.0, 50.0, 43.0, 37.0, 32.0, 30.0, 31.0, 22.0, 21.0, 20.0, 17.0, 20.0, 22.0, 23.0, 12.0, 17.0, 8.0, 10.0, 11.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9921875, -6.77020263671875, -6.5482177734375, -6.32623291015625, -6.104248046875, -5.88226318359375, -5.6602783203125, -5.43829345703125, -5.21630859375, -4.99432373046875, -4.7723388671875, -4.55035400390625, -4.328369140625, -4.10638427734375, -3.8843994140625, -3.66241455078125, -3.4404296875, -3.21844482421875, -2.9964599609375, -2.77447509765625, -2.552490234375, -2.33050537109375, -2.1085205078125, -1.88653564453125, -1.66455078125, -1.44256591796875, -1.2205810546875, -0.99859619140625, -0.776611328125, -0.55462646484375, -0.3326416015625, -0.11065673828125, 0.111328125, 0.33331298828125, 0.5552978515625, 0.77728271484375, 0.999267578125, 1.22125244140625, 1.4432373046875, 1.66522216796875, 1.88720703125, 2.10919189453125, 2.3311767578125, 2.55316162109375, 2.775146484375, 2.99713134765625, 3.2191162109375, 3.44110107421875, 3.6630859375, 3.88507080078125, 4.1070556640625, 4.32904052734375, 4.551025390625, 4.77301025390625, 4.9949951171875, 5.21697998046875, 5.43896484375, 5.66094970703125, 5.8829345703125, 6.10491943359375, 6.326904296875, 6.54888916015625, 6.7708740234375, 6.99285888671875, 7.21484375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 8.0, 13.0, 25.0, 54.0, 62.0, 95.0, 136.0, 217.0, 334.0, 506.0, 693.0, 1108.0, 1639.0, 2564.0, 3890.0, 5975.0, 9247.0, 14783.0, 23958.0, 39715.0, 66253.0, 108466.0, 164166.0, 194211.0, 153761.0, 99664.0, 60564.0, 36498.0, 21892.0, 13480.0, 8599.0, 5506.0, 3531.0, 2334.0, 1511.0, 1022.0, 693.0, 466.0, 296.0, 215.0, 129.0, 82.0, 61.0, 48.0, 27.0, 21.0, 9.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.289794921875, -0.280853271484375, -0.27191162109375, -0.262969970703125, -0.2540283203125, -0.245086669921875, -0.23614501953125, -0.227203369140625, -0.21826171875, -0.209320068359375, -0.20037841796875, -0.191436767578125, -0.1824951171875, -0.173553466796875, -0.16461181640625, -0.155670166015625, -0.146728515625, -0.137786865234375, -0.12884521484375, -0.119903564453125, -0.1109619140625, -0.102020263671875, -0.09307861328125, -0.084136962890625, -0.0751953125, -0.066253662109375, -0.05731201171875, -0.048370361328125, -0.0394287109375, -0.030487060546875, -0.02154541015625, -0.012603759765625, -0.003662109375, 0.005279541015625, 0.01422119140625, 0.023162841796875, 0.0321044921875, 0.041046142578125, 0.04998779296875, 0.058929443359375, 0.06787109375, 0.076812744140625, 0.08575439453125, 0.094696044921875, 0.1036376953125, 0.112579345703125, 0.12152099609375, 0.130462646484375, 0.139404296875, 0.148345947265625, 0.15728759765625, 0.166229248046875, 0.1751708984375, 0.184112548828125, 0.19305419921875, 0.201995849609375, 0.2109375, 0.219879150390625, 0.22882080078125, 0.237762451171875, 0.2467041015625, 0.255645751953125, 0.26458740234375, 0.273529052734375, 0.282470703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 8.0, 17.0, 15.0, 15.0, 29.0, 21.0, 27.0, 34.0, 30.0, 31.0, 37.0, 44.0, 52.0, 51.0, 41.0, 1074.0, 49.0, 46.0, 35.0, 41.0, 32.0, 27.0, 25.0, 35.0, 28.0, 28.0, 18.0, 33.0, 22.0, 12.0, 11.0, 7.0, 5.0, 8.0, 2.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.503662109375, -4.33935546875, -4.175048828125, -4.0107421875, -3.846435546875, -3.68212890625, -3.517822265625, -3.353515625, -3.189208984375, -3.02490234375, -2.860595703125, -2.6962890625, -2.531982421875, -2.36767578125, -2.203369140625, -2.0390625, -1.874755859375, -1.71044921875, -1.546142578125, -1.3818359375, -1.217529296875, -1.05322265625, -0.888916015625, -0.724609375, -0.560302734375, -0.39599609375, -0.231689453125, -0.0673828125, 0.096923828125, 0.26123046875, 0.425537109375, 0.58984375, 0.754150390625, 0.91845703125, 1.082763671875, 1.2470703125, 1.411376953125, 1.57568359375, 1.739990234375, 1.904296875, 2.068603515625, 2.23291015625, 2.397216796875, 2.5615234375, 2.725830078125, 2.89013671875, 3.054443359375, 3.21875, 3.383056640625, 3.54736328125, 3.711669921875, 3.8759765625, 4.040283203125, 4.20458984375, 4.368896484375, 4.533203125, 4.697509765625, 4.86181640625, 5.026123046875, 5.1904296875, 5.354736328125, 5.51904296875, 5.683349609375, 5.84765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 10.0, 11.0, 16.0, 31.0, 43.0, 71.0, 144.0, 182.0, 285.0, 473.0, 696.0, 1058.0, 1735.0, 2816.0, 4195.0, 6880.0, 11361.0, 18452.0, 30536.0, 51300.0, 85534.0, 136521.0, 1202217.0, 212986.0, 128613.0, 79412.0, 47814.0, 28488.0, 17201.0, 10562.0, 6487.0, 3964.0, 2535.0, 1655.0, 991.0, 679.0, 408.0, 272.0, 176.0, 110.0, 67.0, 53.0, 31.0, 33.0, 7.0, 5.0, 3.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24866485595703125, -0.2397613525390625, -0.23085784912109375, -0.221954345703125, -0.21305084228515625, -0.2041473388671875, -0.19524383544921875, -0.18634033203125, -0.17743682861328125, -0.1685333251953125, -0.15962982177734375, -0.150726318359375, -0.14182281494140625, -0.1329193115234375, -0.12401580810546875, -0.1151123046875, -0.10620880126953125, -0.0973052978515625, -0.08840179443359375, -0.079498291015625, -0.07059478759765625, -0.0616912841796875, -0.05278778076171875, -0.04388427734375, -0.03498077392578125, -0.0260772705078125, -0.01717376708984375, -0.008270263671875, 0.00063323974609375, 0.0095367431640625, 0.01844024658203125, 0.02734375, 0.03624725341796875, 0.0451507568359375, 0.05405426025390625, 0.062957763671875, 0.07186126708984375, 0.0807647705078125, 0.08966827392578125, 0.09857177734375, 0.10747528076171875, 0.1163787841796875, 0.12528228759765625, 0.134185791015625, 0.14308929443359375, 0.1519927978515625, 0.16089630126953125, 0.1697998046875, 0.17870330810546875, 0.1876068115234375, 0.19651031494140625, 0.205413818359375, 0.21431732177734375, 0.2232208251953125, 0.23212432861328125, 0.24102783203125, 0.24993133544921875, 0.2588348388671875, 0.26773834228515625, 0.276641845703125, 0.28554534912109375, 0.2944488525390625, 0.30335235595703125, 0.312255859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 8.0, 6.0, 11.0, 19.0, 16.0, 26.0, 32.0, 31.0, 40.0, 48.0, 47.0, 49.0, 74.0, 66.0, 69.0, 58.0, 60.0, 55.0, 49.0, 38.0, 28.0, 25.0, 20.0, 8.0, 26.0, 17.0, 14.0, 11.0, 7.0, 6.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016031265258789062, -0.0015493333339691162, -0.0014955401420593262, -0.0014417469501495361, -0.001387953758239746, -0.001334160566329956, -0.001280367374420166, -0.001226574182510376, -0.001172780990600586, -0.001118987798690796, -0.0010651946067810059, -0.0010114014148712158, -0.0009576082229614258, -0.0009038150310516357, -0.0008500218391418457, -0.0007962286472320557, -0.0007424354553222656, -0.0006886422634124756, -0.0006348490715026855, -0.0005810558795928955, -0.0005272626876831055, -0.00047346949577331543, -0.0004196763038635254, -0.00036588311195373535, -0.0003120899200439453, -0.0002582967281341553, -0.00020450353622436523, -0.0001507103443145752, -9.691715240478516e-05, -4.312396049499512e-05, 1.0669231414794922e-05, 6.446242332458496e-05, 0.000118255615234375, 0.00017204880714416504, 0.00022584199905395508, 0.0002796351909637451, 0.00033342838287353516, 0.0003872215747833252, 0.00044101476669311523, 0.0004948079586029053, 0.0005486011505126953, 0.0006023943424224854, 0.0006561875343322754, 0.0007099807262420654, 0.0007637739181518555, 0.0008175671100616455, 0.0008713603019714355, 0.0009251534938812256, 0.0009789466857910156, 0.0010327398777008057, 0.0010865330696105957, 0.0011403262615203857, 0.0011941194534301758, 0.0012479126453399658, 0.0013017058372497559, 0.001355499029159546, 0.001409292221069336, 0.001463085412979126, 0.001516878604888916, 0.001570671796798706, 0.001624464988708496, 0.0016782581806182861, 0.0017320513725280762, 0.0017858445644378662, 0.0018396377563476562]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 4.0, 10.0, 6.0, 9.0, 20.0, 19.0, 25.0, 31.0, 30.0, 52.0, 74.0, 71.0, 102.0, 167.0, 295.0, 812.0, 23714.0, 1007473.0, 14158.0, 617.0, 293.0, 139.0, 114.0, 64.0, 71.0, 36.0, 29.0, 25.0, 15.0, 16.0, 9.0, 11.0, 3.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.037109375, -0.03603219985961914, -0.03495502471923828, -0.03387784957885742, -0.03280067443847656, -0.0317234992980957, -0.030646324157714844, -0.029569149017333984, -0.028491973876953125, -0.027414798736572266, -0.026337623596191406, -0.025260448455810547, -0.024183273315429688, -0.023106098175048828, -0.02202892303466797, -0.02095174789428711, -0.01987457275390625, -0.01879739761352539, -0.01772022247314453, -0.016643047332763672, -0.015565872192382812, -0.014488697052001953, -0.013411521911621094, -0.012334346771240234, -0.011257171630859375, -0.010179996490478516, -0.009102821350097656, -0.008025646209716797, -0.0069484710693359375, -0.005871295928955078, -0.004794120788574219, -0.0037169456481933594, -0.0026397705078125, -0.0015625953674316406, -0.00048542022705078125, 0.0005917549133300781, 0.0016689300537109375, 0.002746105194091797, 0.0038232803344726562, 0.004900455474853516, 0.005977630615234375, 0.007054805755615234, 0.008131980895996094, 0.009209156036376953, 0.010286331176757812, 0.011363506317138672, 0.012440681457519531, 0.01351785659790039, 0.01459503173828125, 0.01567220687866211, 0.01674938201904297, 0.017826557159423828, 0.018903732299804688, 0.019980907440185547, 0.021058082580566406, 0.022135257720947266, 0.023212432861328125, 0.024289608001708984, 0.025366783142089844, 0.026443958282470703, 0.027521133422851562, 0.028598308563232422, 0.02967548370361328, 0.03075265884399414, 0.031829833984375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 574.0, 441.0], "bins": [-0.03360971808433533, -0.03307604789733887, -0.03254237771034241, -0.032008711248636246, -0.031475041061639786, -0.030941370874643326, -0.030407702550292015, -0.029874032363295555, -0.029340364038944244, -0.028806693851947784, -0.028273025527596474, -0.027739355340600014, -0.027205687016248703, -0.026672016829252243, -0.026138348504900932, -0.025604678317904472, -0.025071008130908012, -0.024537337943911552, -0.02400366961956024, -0.023469999432563782, -0.02293633110821247, -0.02240266092121601, -0.0218689925968647, -0.02133532240986824, -0.02080165222287178, -0.02026798203587532, -0.01973431371152401, -0.01920064352452755, -0.01866697520017624, -0.01813330501317978, -0.01759963668882847, -0.01706596650183201, -0.016532298177480698, -0.015998627990484238, -0.015464959666132927, -0.014931290410459042, -0.014397621154785156, -0.013863950967788696, -0.013330281712114811, -0.012796612456440926, -0.012262944132089615, -0.01172927487641573, -0.011195605620741844, -0.010661936365067959, -0.010128267109394073, -0.009594596922397614, -0.009060927666723728, -0.008527258411049843, -0.007993589155375957, -0.007459919899702072, -0.006926250644028187, -0.006392580922693014, -0.005858911667019129, -0.0053252424113452435, -0.004791572690010071, -0.0042579034343361855, -0.0037242341786623, -0.0031905649229884148, -0.0026568954344838858, -0.0021232259459793568, -0.0015895566903054714, -0.001055887434631586, -0.0005222179461270571, 1.1451542377471924e-05, 0.0005451207980513573]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 8.0, 15.0, 17.0, 17.0, 22.0, 25.0, 30.0, 34.0, 46.0, 35.0, 48.0, 50.0, 54.0, 40.0, 61.0, 52.0, 63.0, 58.0, 49.0, 46.0, 46.0, 38.0, 27.0, 21.0, 18.0, 13.0, 23.0, 9.0, 6.0, 9.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008813142776489258, -0.0008425358682870865, -0.0008037574589252472, -0.0007649790495634079, -0.0007262006402015686, -0.0006874222308397293, -0.00064864382147789, -0.0006098654121160507, -0.0005710870027542114, -0.0005323085933923721, -0.0004935301840305328, -0.00045475177466869354, -0.00041597336530685425, -0.00037719495594501495, -0.00033841654658317566, -0.00029963813722133636, -0.00026085972785949707, -0.00022208131849765778, -0.00018330290913581848, -0.0001445244997739792, -0.00010574609041213989, -6.69676810503006e-05, -2.8189271688461304e-05, 1.058913767337799e-05, 4.9367547035217285e-05, 8.814595639705658e-05, 0.00012692436575889587, 0.00016570277512073517, 0.00020448118448257446, 0.00024325959384441376, 0.00028203800320625305, 0.00032081641256809235, 0.00035959482192993164, 0.00039837323129177094, 0.00043715164065361023, 0.0004759300500154495, 0.0005147084593772888, 0.0005534868687391281, 0.0005922652781009674, 0.0006310436874628067, 0.000669822096824646, 0.0007086005061864853, 0.0007473789155483246, 0.0007861573249101639, 0.0008249357342720032, 0.0008637141436338425, 0.0009024925529956818, 0.0009412709623575211, 0.0009800493717193604, 0.0010188277810811996, 0.001057606190443039, 0.0010963845998048782, 0.0011351630091667175, 0.0011739414185285568, 0.0012127198278903961, 0.0012514982372522354, 0.0012902766466140747, 0.001329055055975914, 0.0013678334653377533, 0.0014066118746995926, 0.0014453902840614319, 0.0014841686934232712, 0.0015229471027851105, 0.0015617255121469498, 0.001600503921508789]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 6.0, 4.0, 7.0, 11.0, 8.0, 13.0, 13.0, 9.0, 10.0, 13.0, 21.0, 26.0, 26.0, 30.0, 26.0, 35.0, 26.0, 26.0, 49.0, 37.0, 41.0, 38.0, 39.0, 43.0, 50.0, 43.0, 37.0, 32.0, 30.0, 31.0, 22.0, 21.0, 20.0, 17.0, 20.0, 22.0, 23.0, 12.0, 17.0, 8.0, 10.0, 11.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9921875, -6.77020263671875, -6.5482177734375, -6.32623291015625, -6.104248046875, -5.88226318359375, -5.6602783203125, -5.43829345703125, -5.21630859375, -4.99432373046875, -4.7723388671875, -4.55035400390625, -4.328369140625, -4.10638427734375, -3.8843994140625, -3.66241455078125, -3.4404296875, -3.21844482421875, -2.9964599609375, -2.77447509765625, -2.552490234375, -2.33050537109375, -2.1085205078125, -1.88653564453125, -1.66455078125, -1.44256591796875, -1.2205810546875, -0.99859619140625, -0.776611328125, -0.55462646484375, -0.3326416015625, -0.11065673828125, 0.111328125, 0.33331298828125, 0.5552978515625, 0.77728271484375, 0.999267578125, 1.22125244140625, 1.4432373046875, 1.66522216796875, 1.88720703125, 2.10919189453125, 2.3311767578125, 2.55316162109375, 2.775146484375, 2.99713134765625, 3.2191162109375, 3.44110107421875, 3.6630859375, 3.88507080078125, 4.1070556640625, 4.32904052734375, 4.551025390625, 4.77301025390625, 4.9949951171875, 5.21697998046875, 5.43896484375, 5.66094970703125, 5.8829345703125, 6.10491943359375, 6.326904296875, 6.54888916015625, 6.7708740234375, 6.99285888671875, 7.21484375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 10.0, 15.0, 13.0, 16.0, 40.0, 44.0, 68.0, 85.0, 125.0, 178.0, 288.0, 368.0, 562.0, 896.0, 1457.0, 2210.0, 3659.0, 5969.0, 10338.0, 17468.0, 32782.0, 64371.0, 150615.0, 361402.0, 215254.0, 85828.0, 40881.0, 22086.0, 12353.0, 7172.0, 4377.0, 2758.0, 1667.0, 1044.0, 673.0, 449.0, 338.0, 203.0, 135.0, 94.0, 76.0, 49.0, 44.0, 28.0, 18.0, 13.0, 9.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.203125, -6.00732421875, -5.8115234375, -5.61572265625, -5.419921875, -5.22412109375, -5.0283203125, -4.83251953125, -4.63671875, -4.44091796875, -4.2451171875, -4.04931640625, -3.853515625, -3.65771484375, -3.4619140625, -3.26611328125, -3.0703125, -2.87451171875, -2.6787109375, -2.48291015625, -2.287109375, -2.09130859375, -1.8955078125, -1.69970703125, -1.50390625, -1.30810546875, -1.1123046875, -0.91650390625, -0.720703125, -0.52490234375, -0.3291015625, -0.13330078125, 0.0625, 0.25830078125, 0.4541015625, 0.64990234375, 0.845703125, 1.04150390625, 1.2373046875, 1.43310546875, 1.62890625, 1.82470703125, 2.0205078125, 2.21630859375, 2.412109375, 2.60791015625, 2.8037109375, 2.99951171875, 3.1953125, 3.39111328125, 3.5869140625, 3.78271484375, 3.978515625, 4.17431640625, 4.3701171875, 4.56591796875, 4.76171875, 4.95751953125, 5.1533203125, 5.34912109375, 5.544921875, 5.74072265625, 5.9365234375, 6.13232421875, 6.328125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 9.0, 8.0, 10.0, 22.0, 9.0, 10.0, 11.0, 27.0, 20.0, 29.0, 23.0, 43.0, 44.0, 48.0, 38.0, 52.0, 79.0, 162.0, 1504.0, 325.0, 121.0, 57.0, 52.0, 49.0, 38.0, 38.0, 31.0, 24.0, 25.0, 24.0, 17.0, 18.0, 15.0, 7.0, 12.0, 10.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.5, -20.779052734375, -20.05810546875, -19.337158203125, -18.6162109375, -17.895263671875, -17.17431640625, -16.453369140625, -15.732421875, -15.011474609375, -14.29052734375, -13.569580078125, -12.8486328125, -12.127685546875, -11.40673828125, -10.685791015625, -9.96484375, -9.243896484375, -8.52294921875, -7.802001953125, -7.0810546875, -6.360107421875, -5.63916015625, -4.918212890625, -4.197265625, -3.476318359375, -2.75537109375, -2.034423828125, -1.3134765625, -0.592529296875, 0.12841796875, 0.849365234375, 1.5703125, 2.291259765625, 3.01220703125, 3.733154296875, 4.4541015625, 5.175048828125, 5.89599609375, 6.616943359375, 7.337890625, 8.058837890625, 8.77978515625, 9.500732421875, 10.2216796875, 10.942626953125, 11.66357421875, 12.384521484375, 13.10546875, 13.826416015625, 14.54736328125, 15.268310546875, 15.9892578125, 16.710205078125, 17.43115234375, 18.152099609375, 18.873046875, 19.593994140625, 20.31494140625, 21.035888671875, 21.7568359375, 22.477783203125, 23.19873046875, 23.919677734375, 24.640625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 8.0, 9.0, 17.0, 14.0, 13.0, 24.0, 29.0, 44.0, 50.0, 50.0, 86.0, 105.0, 158.0, 257.0, 438.0, 1370.0, 13128.0, 960979.0, 2148501.0, 17431.0, 1522.0, 466.0, 249.0, 172.0, 138.0, 121.0, 63.0, 53.0, 35.0, 31.0, 23.0, 20.0, 26.0, 17.0, 12.0, 9.0, 6.0, 11.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.90625, -39.6298828125, -38.353515625, -37.0771484375, -35.80078125, -34.5244140625, -33.248046875, -31.9716796875, -30.6953125, -29.4189453125, -28.142578125, -26.8662109375, -25.58984375, -24.3134765625, -23.037109375, -21.7607421875, -20.484375, -19.2080078125, -17.931640625, -16.6552734375, -15.37890625, -14.1025390625, -12.826171875, -11.5498046875, -10.2734375, -8.9970703125, -7.720703125, -6.4443359375, -5.16796875, -3.8916015625, -2.615234375, -1.3388671875, -0.0625, 1.2138671875, 2.490234375, 3.7666015625, 5.04296875, 6.3193359375, 7.595703125, 8.8720703125, 10.1484375, 11.4248046875, 12.701171875, 13.9775390625, 15.25390625, 16.5302734375, 17.806640625, 19.0830078125, 20.359375, 21.6357421875, 22.912109375, 24.1884765625, 25.46484375, 26.7412109375, 28.017578125, 29.2939453125, 30.5703125, 31.8466796875, 33.123046875, 34.3994140625, 35.67578125, 36.9521484375, 38.228515625, 39.5048828125, 40.78125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 24.0, 877.0, 119.0], "bins": [-616.415283203125, -606.567626953125, -596.719970703125, -586.8722534179688, -577.0245971679688, -567.1769409179688, -557.3292846679688, -547.4815673828125, -537.6339111328125, -527.7862548828125, -517.9385986328125, -508.0909118652344, -498.24322509765625, -488.39556884765625, -478.5478820800781, -468.7002258300781, -458.8525390625, -449.0048828125, -439.1571960449219, -429.3095397949219, -419.46185302734375, -409.61419677734375, -399.7665100097656, -389.9188537597656, -380.0711975097656, -370.2235412597656, -360.3758544921875, -350.5281982421875, -340.6805114746094, -330.8328552246094, -320.98516845703125, -311.13751220703125, -301.289794921875, -291.442138671875, -281.5944519042969, -271.7467956542969, -261.89910888671875, -252.0514373779297, -242.20376586914062, -232.35610961914062, -222.50843811035156, -212.6607666015625, -202.81309509277344, -192.96542358398438, -183.1177520751953, -173.27008056640625, -163.42242431640625, -153.57473754882812, -143.72706604003906, -133.87939453125, -124.03172302246094, -114.18405151367188, -104.33638000488281, -94.48870849609375, -84.64104461669922, -74.79337310791016, -64.94570922851562, -55.09803771972656, -45.2503662109375, -35.4026985168457, -25.55502700805664, -15.707355499267578, -5.859687805175781, 3.9879837036132812, 13.83565902709961]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 8.0, 1.0, 5.0, 6.0, 3.0, 9.0, 3.0, 12.0, 13.0, 26.0, 18.0, 24.0, 18.0, 24.0, 30.0, 31.0, 28.0, 33.0, 29.0, 38.0, 37.0, 27.0, 42.0, 44.0, 37.0, 40.0, 36.0, 40.0, 30.0, 33.0, 28.0, 35.0, 29.0, 23.0, 16.0, 23.0, 24.0, 17.0, 17.0, 10.0, 9.0, 8.0, 7.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-50.04601287841797, -48.5070686340332, -46.96812438964844, -45.42918395996094, -43.89023971557617, -42.351295471191406, -40.812355041503906, -39.27341079711914, -37.734466552734375, -36.19552230834961, -34.656578063964844, -33.117637634277344, -31.578693389892578, -30.039749145507812, -28.50080680847168, -26.961864471435547, -25.42292022705078, -23.883975982666016, -22.345033645629883, -20.80609130859375, -19.267147064208984, -17.72820281982422, -16.189260482788086, -14.650317192077637, -13.111373901367188, -11.572430610656738, -10.033487319946289, -8.49454402923584, -6.955600738525391, -5.416657447814941, -3.877714157104492, -2.338770866394043, -0.7998275756835938, 0.7391157150268555, 2.2780590057373047, 3.817002296447754, 5.355945587158203, 6.894888877868652, 8.433832168579102, 9.97277545928955, 11.51171875, 13.05066204071045, 14.589605331420898, 16.12854766845703, 17.667491912841797, 19.206436157226562, 20.745378494262695, 22.284320831298828, 23.823265075683594, 25.36220932006836, 26.901151657104492, 28.440093994140625, 29.97903823852539, 31.517982482910156, 33.056922912597656, 34.59586715698242, 36.13481140136719, 37.67375564575195, 39.21269989013672, 40.75164031982422, 42.290584564208984, 43.82952880859375, 45.36846923828125, 46.907413482666016, 48.44635772705078]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 7.0, 8.0, 15.0, 11.0, 10.0, 11.0, 23.0, 22.0, 16.0, 37.0, 19.0, 30.0, 37.0, 33.0, 33.0, 35.0, 33.0, 36.0, 36.0, 49.0, 45.0, 47.0, 36.0, 34.0, 26.0, 38.0, 27.0, 23.0, 19.0, 18.0, 25.0, 24.0, 20.0, 12.0, 13.0, 17.0, 9.0, 8.0, 8.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.890625, -6.670166015625, -6.44970703125, -6.229248046875, -6.0087890625, -5.788330078125, -5.56787109375, -5.347412109375, -5.126953125, -4.906494140625, -4.68603515625, -4.465576171875, -4.2451171875, -4.024658203125, -3.80419921875, -3.583740234375, -3.36328125, -3.142822265625, -2.92236328125, -2.701904296875, -2.4814453125, -2.260986328125, -2.04052734375, -1.820068359375, -1.599609375, -1.379150390625, -1.15869140625, -0.938232421875, -0.7177734375, -0.497314453125, -0.27685546875, -0.056396484375, 0.1640625, 0.384521484375, 0.60498046875, 0.825439453125, 1.0458984375, 1.266357421875, 1.48681640625, 1.707275390625, 1.927734375, 2.148193359375, 2.36865234375, 2.589111328125, 2.8095703125, 3.030029296875, 3.25048828125, 3.470947265625, 3.69140625, 3.911865234375, 4.13232421875, 4.352783203125, 4.5732421875, 4.793701171875, 5.01416015625, 5.234619140625, 5.455078125, 5.675537109375, 5.89599609375, 6.116455078125, 6.3369140625, 6.557373046875, 6.77783203125, 6.998291015625, 7.21875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 1.0, 8.0, 7.0, 9.0, 11.0, 17.0, 14.0, 25.0, 26.0, 40.0, 62.0, 63.0, 167.0, 337.0, 809.0, 1943.0, 5019.0, 15375.0, 54462.0, 309866.0, 2272461.0, 1324261.0, 157233.0, 34898.0, 10594.0, 3752.0, 1479.0, 614.0, 298.0, 139.0, 79.0, 55.0, 29.0, 26.0, 14.0, 23.0, 16.0, 9.0, 11.0, 8.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.46875, -14.9501953125, -14.431640625, -13.9130859375, -13.39453125, -12.8759765625, -12.357421875, -11.8388671875, -11.3203125, -10.8017578125, -10.283203125, -9.7646484375, -9.24609375, -8.7275390625, -8.208984375, -7.6904296875, -7.171875, -6.6533203125, -6.134765625, -5.6162109375, -5.09765625, -4.5791015625, -4.060546875, -3.5419921875, -3.0234375, -2.5048828125, -1.986328125, -1.4677734375, -0.94921875, -0.4306640625, 0.087890625, 0.6064453125, 1.125, 1.6435546875, 2.162109375, 2.6806640625, 3.19921875, 3.7177734375, 4.236328125, 4.7548828125, 5.2734375, 5.7919921875, 6.310546875, 6.8291015625, 7.34765625, 7.8662109375, 8.384765625, 8.9033203125, 9.421875, 9.9404296875, 10.458984375, 10.9775390625, 11.49609375, 12.0146484375, 12.533203125, 13.0517578125, 13.5703125, 14.0888671875, 14.607421875, 15.1259765625, 15.64453125, 16.1630859375, 16.681640625, 17.2001953125, 17.71875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 8.0, 18.0, 28.0, 42.0, 102.0, 162.0, 324.0, 590.0, 1022.0, 832.0, 441.0, 236.0, 118.0, 61.0, 50.0, 12.0, 15.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-41.4375, -40.5701904296875, -39.702880859375, -38.8355712890625, -37.96826171875, -37.1009521484375, -36.233642578125, -35.3663330078125, -34.4990234375, -33.6317138671875, -32.764404296875, -31.8970947265625, -31.02978515625, -30.1624755859375, -29.295166015625, -28.4278564453125, -27.560546875, -26.6932373046875, -25.825927734375, -24.9586181640625, -24.09130859375, -23.2239990234375, -22.356689453125, -21.4893798828125, -20.6220703125, -19.7547607421875, -18.887451171875, -18.0201416015625, -17.15283203125, -16.2855224609375, -15.418212890625, -14.5509033203125, -13.68359375, -12.8162841796875, -11.948974609375, -11.0816650390625, -10.21435546875, -9.3470458984375, -8.479736328125, -7.6124267578125, -6.7451171875, -5.8778076171875, -5.010498046875, -4.1431884765625, -3.27587890625, -2.4085693359375, -1.541259765625, -0.6739501953125, 0.193359375, 1.0606689453125, 1.927978515625, 2.7952880859375, 3.66259765625, 4.5299072265625, 5.397216796875, 6.2645263671875, 7.1318359375, 7.9991455078125, 8.866455078125, 9.7337646484375, 10.60107421875, 11.4683837890625, 12.335693359375, 13.2030029296875, 14.0703125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 18.0, 20.0, 31.0, 70.0, 145.0, 224.0, 507.0, 1547.0, 33185.0, 3982904.0, 171214.0, 3106.0, 655.0, 319.0, 154.0, 86.0, 46.0, 24.0, 15.0, 12.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.875, -48.1484375, -45.421875, -42.6953125, -39.96875, -37.2421875, -34.515625, -31.7890625, -29.0625, -26.3359375, -23.609375, -20.8828125, -18.15625, -15.4296875, -12.703125, -9.9765625, -7.25, -4.5234375, -1.796875, 0.9296875, 3.65625, 6.3828125, 9.109375, 11.8359375, 14.5625, 17.2890625, 20.015625, 22.7421875, 25.46875, 28.1953125, 30.921875, 33.6484375, 36.375, 39.1015625, 41.828125, 44.5546875, 47.28125, 50.0078125, 52.734375, 55.4609375, 58.1875, 60.9140625, 63.640625, 66.3671875, 69.09375, 71.8203125, 74.546875, 77.2734375, 80.0, 82.7265625, 85.453125, 88.1796875, 90.90625, 93.6328125, 96.359375, 99.0859375, 101.8125, 104.5390625, 107.265625, 109.9921875, 112.71875, 115.4453125, 118.171875, 120.8984375, 123.625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 9.0, 11.0, 20.0, 20.0, 32.0, 54.0, 54.0, 71.0, 56.0, 69.0, 65.0, 102.0, 76.0, 76.0, 71.0, 46.0, 38.0, 41.0, 19.0, 20.0, 10.0, 17.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.636550903320312, -27.158437728881836, -25.68032455444336, -24.202213287353516, -22.72410011291504, -21.245986938476562, -19.767873764038086, -18.28976058959961, -16.811649322509766, -15.333536148071289, -13.855423927307129, -12.377310752868652, -10.899198532104492, -9.421085357666016, -7.942972183227539, -6.464859962463379, -4.986745834350586, -3.5086331367492676, -2.03052020072937, -0.5524072647094727, 0.9257054328918457, 2.403818130493164, 3.8819313049316406, 5.360043525695801, 6.838156700134277, 8.316269874572754, 9.794382095336914, 11.27249526977539, 12.750608444213867, 14.228720664978027, 15.706833839416504, 17.184946060180664, 18.66305923461914, 20.141172409057617, 21.619285583496094, 23.097396850585938, 24.575510025024414, 26.05362319946289, 27.531736373901367, 29.009849548339844, 30.487960815429688, 31.966073989868164, 33.44418716430664, 34.922298431396484, 36.400413513183594, 37.87852478027344, 39.35663604736328, 40.83475112915039, 42.3128662109375, 43.790977478027344, 45.26909255981445, 46.7472038269043, 48.225318908691406, 49.70343017578125, 51.181541442871094, 52.6596565246582, 54.13776779174805, 55.61587905883789, 57.093994140625, 58.572105407714844, 60.05022048950195, 61.5283317565918, 63.006446838378906, 64.48455810546875, 65.9626693725586]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 7.0, 12.0, 9.0, 14.0, 14.0, 13.0, 19.0, 23.0, 21.0, 25.0, 31.0, 31.0, 37.0, 29.0, 41.0, 44.0, 40.0, 42.0, 47.0, 50.0, 36.0, 48.0, 30.0, 35.0, 28.0, 34.0, 31.0, 28.0, 16.0, 33.0, 18.0, 21.0, 12.0, 13.0, 8.0, 10.0, 5.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.999542236328125, -42.56181716918945, -41.124088287353516, -39.686363220214844, -38.24863815307617, -36.8109130859375, -35.37318420410156, -33.93545913696289, -32.49773406982422, -31.060007095336914, -29.622282028198242, -28.184555053710938, -26.746829986572266, -25.30910301208496, -23.871376037597656, -22.433650970458984, -20.995922088623047, -19.558195114135742, -18.12047004699707, -16.682743072509766, -15.245017051696777, -13.807291030883789, -12.369564056396484, -10.931838035583496, -9.494112014770508, -8.05638599395752, -6.618659496307373, -5.180932998657227, -3.7432069778442383, -2.30548095703125, -0.8677539825439453, 0.569972038269043, 2.0076980590820312, 3.4454243183135986, 4.883150577545166, 6.3208770751953125, 7.758603096008301, 9.196329116821289, 10.634056091308594, 12.071782112121582, 13.50950813293457, 14.947234153747559, 16.384960174560547, 17.82268714904785, 19.260414123535156, 20.698139190673828, 22.135866165161133, 23.573593139648438, 25.01131820678711, 26.449045181274414, 27.886770248413086, 29.32449722290039, 30.762222290039062, 32.199951171875, 33.63767623901367, 35.075401306152344, 36.51313018798828, 37.95085525512695, 39.38858413696289, 40.82630920410156, 42.264034271240234, 43.701759338378906, 45.139488220214844, 46.577213287353516, 48.01493835449219]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 3.0, 5.0, 7.0, 11.0, 15.0, 15.0, 14.0, 17.0, 29.0, 25.0, 31.0, 27.0, 33.0, 32.0, 37.0, 43.0, 23.0, 38.0, 49.0, 35.0, 44.0, 24.0, 40.0, 47.0, 31.0, 41.0, 24.0, 28.0, 27.0, 24.0, 25.0, 21.0, 19.0, 22.0, 15.0, 5.0, 9.0, 6.0, 7.0, 12.0, 7.0, 8.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.94140625, -7.6932373046875, -7.445068359375, -7.1968994140625, -6.94873046875, -6.7005615234375, -6.452392578125, -6.2042236328125, -5.9560546875, -5.7078857421875, -5.459716796875, -5.2115478515625, -4.96337890625, -4.7152099609375, -4.467041015625, -4.2188720703125, -3.970703125, -3.7225341796875, -3.474365234375, -3.2261962890625, -2.97802734375, -2.7298583984375, -2.481689453125, -2.2335205078125, -1.9853515625, -1.7371826171875, -1.489013671875, -1.2408447265625, -0.99267578125, -0.7445068359375, -0.496337890625, -0.2481689453125, 0.0, 0.2481689453125, 0.496337890625, 0.7445068359375, 0.99267578125, 1.2408447265625, 1.489013671875, 1.7371826171875, 1.9853515625, 2.2335205078125, 2.481689453125, 2.7298583984375, 2.97802734375, 3.2261962890625, 3.474365234375, 3.7225341796875, 3.970703125, 4.2188720703125, 4.467041015625, 4.7152099609375, 4.96337890625, 5.2115478515625, 5.459716796875, 5.7078857421875, 5.9560546875, 6.2042236328125, 6.452392578125, 6.7005615234375, 6.94873046875, 7.1968994140625, 7.445068359375, 7.6932373046875, 7.94140625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 10.0, 26.0, 27.0, 44.0, 57.0, 57.0, 109.0, 149.0, 263.0, 300.0, 471.0, 601.0, 952.0, 1314.0, 1917.0, 2918.0, 4280.0, 6177.0, 9342.0, 13922.0, 21199.0, 32337.0, 49142.0, 74669.0, 110261.0, 148973.0, 163891.0, 131669.0, 92064.0, 61803.0, 40200.0, 26562.0, 17334.0, 11635.0, 7569.0, 5134.0, 3477.0, 2354.0, 1665.0, 1113.0, 785.0, 512.0, 380.0, 267.0, 222.0, 120.0, 84.0, 62.0, 55.0, 27.0, 25.0, 17.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.28466796875, -0.2758445739746094, -0.26702117919921875, -0.2581977844238281, -0.2493743896484375, -0.24055099487304688, -0.23172760009765625, -0.22290420532226562, -0.214080810546875, -0.20525741577148438, -0.19643402099609375, -0.18761062622070312, -0.1787872314453125, -0.16996383666992188, -0.16114044189453125, -0.15231704711914062, -0.14349365234375, -0.13467025756835938, -0.12584686279296875, -0.11702346801757812, -0.1082000732421875, -0.09937667846679688, -0.09055328369140625, -0.08172988891601562, -0.072906494140625, -0.06408309936523438, -0.05525970458984375, -0.046436309814453125, -0.0376129150390625, -0.028789520263671875, -0.01996612548828125, -0.011142730712890625, -0.0023193359375, 0.006504058837890625, 0.01532745361328125, 0.024150848388671875, 0.0329742431640625, 0.041797637939453125, 0.05062103271484375, 0.059444427490234375, 0.068267822265625, 0.07709121704101562, 0.08591461181640625, 0.09473800659179688, 0.1035614013671875, 0.11238479614257812, 0.12120819091796875, 0.13003158569335938, 0.13885498046875, 0.14767837524414062, 0.15650177001953125, 0.16532516479492188, 0.1741485595703125, 0.18297195434570312, 0.19179534912109375, 0.20061874389648438, 0.209442138671875, 0.21826553344726562, 0.22708892822265625, 0.23591232299804688, 0.2447357177734375, 0.2535591125488281, 0.26238250732421875, 0.2712059020996094, 0.280029296875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 9.0, 7.0, 7.0, 8.0, 17.0, 10.0, 20.0, 15.0, 13.0, 18.0, 32.0, 29.0, 33.0, 44.0, 37.0, 28.0, 44.0, 38.0, 47.0, 43.0, 1063.0, 40.0, 37.0, 28.0, 33.0, 42.0, 31.0, 31.0, 26.0, 27.0, 20.0, 14.0, 22.0, 18.0, 12.0, 8.0, 18.0, 16.0, 11.0, 3.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -5.015625, -4.8515625, -4.6875, -4.5234375, -4.359375, -4.1953125, -4.03125, -3.8671875, -3.703125, -3.5390625, -3.375, -3.2109375, -3.046875, -2.8828125, -2.71875, -2.5546875, -2.390625, -2.2265625, -2.0625, -1.8984375, -1.734375, -1.5703125, -1.40625, -1.2421875, -1.078125, -0.9140625, -0.75, -0.5859375, -0.421875, -0.2578125, -0.09375, 0.0703125, 0.234375, 0.3984375, 0.5625, 0.7265625, 0.890625, 1.0546875, 1.21875, 1.3828125, 1.546875, 1.7109375, 1.875, 2.0390625, 2.203125, 2.3671875, 2.53125, 2.6953125, 2.859375, 3.0234375, 3.1875, 3.3515625, 3.515625, 3.6796875, 3.84375, 4.0078125, 4.171875, 4.3359375, 4.5, 4.6640625, 4.828125, 4.9921875, 5.15625, 5.3203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 19.0, 24.0, 46.0, 65.0, 117.0, 163.0, 235.0, 383.0, 588.0, 830.0, 1329.0, 2002.0, 3038.0, 4543.0, 6982.0, 10966.0, 17054.0, 27330.0, 43833.0, 71136.0, 112164.0, 161253.0, 1229631.0, 144915.0, 96226.0, 60222.0, 37312.0, 22877.0, 14689.0, 9472.0, 6098.0, 3950.0, 2660.0, 1616.0, 1145.0, 792.0, 497.0, 319.0, 229.0, 142.0, 89.0, 58.0, 35.0, 16.0, 15.0, 8.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2753448486328125, -0.266265869140625, -0.2571868896484375, -0.24810791015625, -0.2390289306640625, -0.229949951171875, -0.2208709716796875, -0.2117919921875, -0.2027130126953125, -0.193634033203125, -0.1845550537109375, -0.17547607421875, -0.1663970947265625, -0.157318115234375, -0.1482391357421875, -0.13916015625, -0.1300811767578125, -0.121002197265625, -0.1119232177734375, -0.10284423828125, -0.0937652587890625, -0.084686279296875, -0.0756072998046875, -0.0665283203125, -0.0574493408203125, -0.048370361328125, -0.0392913818359375, -0.03021240234375, -0.0211334228515625, -0.012054443359375, -0.0029754638671875, 0.006103515625, 0.0151824951171875, 0.024261474609375, 0.0333404541015625, 0.04241943359375, 0.0514984130859375, 0.060577392578125, 0.0696563720703125, 0.0787353515625, 0.0878143310546875, 0.096893310546875, 0.1059722900390625, 0.11505126953125, 0.1241302490234375, 0.133209228515625, 0.1422882080078125, 0.1513671875, 0.1604461669921875, 0.169525146484375, 0.1786041259765625, 0.18768310546875, 0.1967620849609375, 0.205841064453125, 0.2149200439453125, 0.2239990234375, 0.2330780029296875, 0.242156982421875, 0.2512359619140625, 0.26031494140625, 0.2693939208984375, 0.278472900390625, 0.2875518798828125, 0.296630859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 11.0, 12.0, 14.0, 26.0, 24.0, 29.0, 37.0, 32.0, 53.0, 58.0, 54.0, 64.0, 52.0, 71.0, 61.0, 50.0, 48.0, 48.0, 38.0, 37.0, 32.0, 31.0, 23.0, 12.0, 9.0, 7.0, 7.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013418197631835938, -0.0012940019369125366, -0.0012461841106414795, -0.0011983662843704224, -0.0011505484580993652, -0.001102730631828308, -0.001054912805557251, -0.0010070949792861938, -0.0009592771530151367, -0.0009114593267440796, -0.0008636415004730225, -0.0008158236742019653, -0.0007680058479309082, -0.0007201880216598511, -0.0006723701953887939, -0.0006245523691177368, -0.0005767345428466797, -0.0005289167165756226, -0.00048109889030456543, -0.0004332810640335083, -0.00038546323776245117, -0.00033764541149139404, -0.0002898275852203369, -0.00024200975894927979, -0.00019419193267822266, -0.00014637410640716553, -9.85562801361084e-05, -5.073845386505127e-05, -2.9206275939941406e-06, 4.489719867706299e-05, 9.271502494812012e-05, 0.00014053285121917725, 0.00018835067749023438, 0.0002361685037612915, 0.00028398633003234863, 0.00033180415630340576, 0.0003796219825744629, 0.00042743980884552, 0.00047525763511657715, 0.0005230754613876343, 0.0005708932876586914, 0.0006187111139297485, 0.0006665289402008057, 0.0007143467664718628, 0.0007621645927429199, 0.000809982419013977, 0.0008578002452850342, 0.0009056180715560913, 0.0009534358978271484, 0.0010012537240982056, 0.0010490715503692627, 0.0010968893766403198, 0.001144707202911377, 0.001192525029182434, 0.0012403428554534912, 0.0012881606817245483, 0.0013359785079956055, 0.0013837963342666626, 0.0014316141605377197, 0.0014794319868087769, 0.001527249813079834, 0.0015750676393508911, 0.0016228854656219482, 0.0016707032918930054, 0.0017185211181640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 1.0, 4.0, 3.0, 12.0, 6.0, 10.0, 13.0, 10.0, 13.0, 30.0, 33.0, 52.0, 59.0, 99.0, 115.0, 157.0, 256.0, 597.0, 10387.0, 992586.0, 42316.0, 834.0, 287.0, 189.0, 137.0, 76.0, 71.0, 53.0, 30.0, 23.0, 20.0, 20.0, 8.0, 9.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.033576011657714844, -0.03260612487792969, -0.03163623809814453, -0.030666351318359375, -0.02969646453857422, -0.028726577758789062, -0.027756690979003906, -0.02678680419921875, -0.025816917419433594, -0.024847030639648438, -0.02387714385986328, -0.022907257080078125, -0.02193737030029297, -0.020967483520507812, -0.019997596740722656, -0.0190277099609375, -0.018057823181152344, -0.017087936401367188, -0.01611804962158203, -0.015148162841796875, -0.014178276062011719, -0.013208389282226562, -0.012238502502441406, -0.01126861572265625, -0.010298728942871094, -0.009328842163085938, -0.008358955383300781, -0.007389068603515625, -0.006419181823730469, -0.0054492950439453125, -0.004479408264160156, -0.003509521484375, -0.0025396347045898438, -0.0015697479248046875, -0.0005998611450195312, 0.000370025634765625, 0.0013399124145507812, 0.0023097991943359375, 0.0032796859741210938, 0.00424957275390625, 0.005219459533691406, 0.0061893463134765625, 0.007159233093261719, 0.008129119873046875, 0.009099006652832031, 0.010068893432617188, 0.011038780212402344, 0.0120086669921875, 0.012978553771972656, 0.013948440551757812, 0.014918327331542969, 0.015888214111328125, 0.01685810089111328, 0.017827987670898438, 0.018797874450683594, 0.01976776123046875, 0.020737648010253906, 0.021707534790039062, 0.02267742156982422, 0.023647308349609375, 0.02461719512939453, 0.025587081909179688, 0.026556968688964844, 0.02752685546875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 12.0, 295.0, 642.0, 64.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.014963106252253056, -0.01470190566033125, -0.014440705068409443, -0.014179504476487637, -0.01391830388456583, -0.013657104223966599, -0.013395903632044792, -0.013134703040122986, -0.01287350244820118, -0.012612301856279373, -0.012351101264357567, -0.01208990067243576, -0.011828700080513954, -0.011567499488592148, -0.011306298896670341, -0.01104509923607111, -0.010783897712826729, -0.010522697120904922, -0.010261496528983116, -0.01000029593706131, -0.009739095345139503, -0.009477894753217697, -0.00921669416129589, -0.008955494500696659, -0.008694293908774853, -0.008433093316853046, -0.00817189272493124, -0.007910692133009434, -0.007649492006748915, -0.007388291414827108, -0.007127090822905302, -0.006865890230983496, -0.006604690104722977, -0.00634348951280117, -0.006082288920879364, -0.005821088328957558, -0.005559888202697039, -0.005298687610775232, -0.005037487018853426, -0.00477628642693162, -0.004515086300671101, -0.004253885708749294, -0.003992685116827488, -0.0037314847577363253, -0.0034702843986451626, -0.0032090838067233562, -0.00294788321480155, -0.0026866826228797436, -0.0024254820309579372, -0.002164281439036131, -0.0019030810799449682, -0.0016418804880231619, -0.0013806800125166774, -0.0011194795370101929, -0.0008582789450883865, -0.000597078469581902, -0.0003358779940754175, -7.467748946510255e-05, 0.0001865230151452124, 0.00044772354885935783, 0.0007089240243658423, 0.0009701244998723269, 0.0012313250917941332, 0.0014925255673006177, 0.0017537260428071022]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 6.0, 6.0, 9.0, 11.0, 13.0, 20.0, 17.0, 24.0, 27.0, 34.0, 43.0, 42.0, 31.0, 56.0, 48.0, 38.0, 41.0, 34.0, 38.0, 46.0, 49.0, 36.0, 38.0, 39.0, 43.0, 28.0, 19.0, 23.0, 24.0, 21.0, 18.0, 11.0, 7.0, 5.0, 7.0, 11.0, 9.0, 8.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0009286999702453613, -0.0009017419070005417, -0.000874783843755722, -0.0008478257805109024, -0.0008208677172660828, -0.0007939096540212631, -0.0007669515907764435, -0.0007399935275316238, -0.0007130354642868042, -0.0006860774010419846, -0.0006591193377971649, -0.0006321612745523453, -0.0006052032113075256, -0.000578245148062706, -0.0005512870848178864, -0.0005243290215730667, -0.0004973709583282471, -0.00047041289508342743, -0.0004434548318386078, -0.00041649676859378815, -0.0003895387053489685, -0.00036258064210414886, -0.0003356225788593292, -0.0003086645156145096, -0.00028170645236968994, -0.0002547483891248703, -0.00022779032588005066, -0.00020083226263523102, -0.00017387419939041138, -0.00014691613614559174, -0.0001199580729007721, -9.300000965595245e-05, -6.604194641113281e-05, -3.908388316631317e-05, -1.212581992149353e-05, 1.483224332332611e-05, 4.179030656814575e-05, 6.874836981296539e-05, 9.570643305778503e-05, 0.00012266449630260468, 0.00014962255954742432, 0.00017658062279224396, 0.0002035386860370636, 0.00023049674928188324, 0.0002574548125267029, 0.0002844128757715225, 0.00031137093901634216, 0.0003383290022611618, 0.00036528706550598145, 0.0003922451287508011, 0.00041920319199562073, 0.00044616125524044037, 0.00047311931848526, 0.0005000773817300797, 0.0005270354449748993, 0.0005539935082197189, 0.0005809515714645386, 0.0006079096347093582, 0.0006348676979541779, 0.0006618257611989975, 0.0006887838244438171, 0.0007157418876886368, 0.0007426999509334564, 0.0007696580141782761, 0.0007966160774230957]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 3.0, 5.0, 7.0, 11.0, 15.0, 15.0, 14.0, 17.0, 29.0, 25.0, 31.0, 27.0, 33.0, 32.0, 37.0, 43.0, 23.0, 38.0, 49.0, 35.0, 44.0, 24.0, 40.0, 47.0, 31.0, 41.0, 24.0, 27.0, 28.0, 24.0, 25.0, 21.0, 19.0, 22.0, 15.0, 5.0, 9.0, 6.0, 7.0, 12.0, 7.0, 8.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.94140625, -7.6932373046875, -7.445068359375, -7.1968994140625, -6.94873046875, -6.7005615234375, -6.452392578125, -6.2042236328125, -5.9560546875, -5.7078857421875, -5.459716796875, -5.2115478515625, -4.96337890625, -4.7152099609375, -4.467041015625, -4.2188720703125, -3.970703125, -3.7225341796875, -3.474365234375, -3.2261962890625, -2.97802734375, -2.7298583984375, -2.481689453125, -2.2335205078125, -1.9853515625, -1.7371826171875, -1.489013671875, -1.2408447265625, -0.99267578125, -0.7445068359375, -0.496337890625, -0.2481689453125, 0.0, 0.2481689453125, 0.496337890625, 0.7445068359375, 0.99267578125, 1.2408447265625, 1.489013671875, 1.7371826171875, 1.9853515625, 2.2335205078125, 2.481689453125, 2.7298583984375, 2.97802734375, 3.2261962890625, 3.474365234375, 3.7225341796875, 3.970703125, 4.2188720703125, 4.467041015625, 4.7152099609375, 4.96337890625, 5.2115478515625, 5.459716796875, 5.7078857421875, 5.9560546875, 6.2042236328125, 6.452392578125, 6.7005615234375, 6.94873046875, 7.1968994140625, 7.445068359375, 7.6932373046875, 7.94140625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 10.0, 6.0, 3.0, 6.0, 12.0, 18.0, 16.0, 30.0, 30.0, 39.0, 60.0, 66.0, 95.0, 145.0, 215.0, 381.0, 809.0, 1790.0, 4685.0, 13617.0, 54015.0, 575231.0, 340828.0, 38817.0, 10637.0, 3804.0, 1457.0, 685.0, 342.0, 194.0, 130.0, 91.0, 72.0, 53.0, 32.0, 31.0, 24.0, 6.0, 13.0, 8.0, 12.0, 9.0, 8.0, 11.0, 1.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.890625, -15.3924560546875, -14.894287109375, -14.3961181640625, -13.89794921875, -13.3997802734375, -12.901611328125, -12.4034423828125, -11.9052734375, -11.4071044921875, -10.908935546875, -10.4107666015625, -9.91259765625, -9.4144287109375, -8.916259765625, -8.4180908203125, -7.919921875, -7.4217529296875, -6.923583984375, -6.4254150390625, -5.92724609375, -5.4290771484375, -4.930908203125, -4.4327392578125, -3.9345703125, -3.4364013671875, -2.938232421875, -2.4400634765625, -1.94189453125, -1.4437255859375, -0.945556640625, -0.4473876953125, 0.05078125, 0.5489501953125, 1.047119140625, 1.5452880859375, 2.04345703125, 2.5416259765625, 3.039794921875, 3.5379638671875, 4.0361328125, 4.5343017578125, 5.032470703125, 5.5306396484375, 6.02880859375, 6.5269775390625, 7.025146484375, 7.5233154296875, 8.021484375, 8.5196533203125, 9.017822265625, 9.5159912109375, 10.01416015625, 10.5123291015625, 11.010498046875, 11.5086669921875, 12.0068359375, 12.5050048828125, 13.003173828125, 13.5013427734375, 13.99951171875, 14.4976806640625, 14.995849609375, 15.4940185546875, 15.9921875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 11.0, 10.0, 9.0, 12.0, 11.0, 17.0, 22.0, 22.0, 28.0, 31.0, 21.0, 34.0, 39.0, 40.0, 44.0, 89.0, 318.0, 1637.0, 150.0, 61.0, 41.0, 48.0, 50.0, 35.0, 39.0, 38.0, 28.0, 25.0, 30.0, 18.0, 20.0, 11.0, 2.0, 6.0, 7.0, 14.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-30.53125, -29.6875, -28.84375, -28.0, -27.15625, -26.3125, -25.46875, -24.625, -23.78125, -22.9375, -22.09375, -21.25, -20.40625, -19.5625, -18.71875, -17.875, -17.03125, -16.1875, -15.34375, -14.5, -13.65625, -12.8125, -11.96875, -11.125, -10.28125, -9.4375, -8.59375, -7.75, -6.90625, -6.0625, -5.21875, -4.375, -3.53125, -2.6875, -1.84375, -1.0, -0.15625, 0.6875, 1.53125, 2.375, 3.21875, 4.0625, 4.90625, 5.75, 6.59375, 7.4375, 8.28125, 9.125, 9.96875, 10.8125, 11.65625, 12.5, 13.34375, 14.1875, 15.03125, 15.875, 16.71875, 17.5625, 18.40625, 19.25, 20.09375, 20.9375, 21.78125, 22.625, 23.46875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 5.0, 9.0, 10.0, 20.0, 24.0, 31.0, 40.0, 47.0, 42.0, 62.0, 85.0, 139.0, 206.0, 423.0, 1547.0, 34928.0, 3082981.0, 22927.0, 1171.0, 355.0, 175.0, 108.0, 65.0, 68.0, 33.0, 38.0, 22.0, 25.0, 12.0, 16.0, 12.0, 9.0, 9.0, 10.0, 5.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.0, -51.0693359375, -49.138671875, -47.2080078125, -45.27734375, -43.3466796875, -41.416015625, -39.4853515625, -37.5546875, -35.6240234375, -33.693359375, -31.7626953125, -29.83203125, -27.9013671875, -25.970703125, -24.0400390625, -22.109375, -20.1787109375, -18.248046875, -16.3173828125, -14.38671875, -12.4560546875, -10.525390625, -8.5947265625, -6.6640625, -4.7333984375, -2.802734375, -0.8720703125, 1.05859375, 2.9892578125, 4.919921875, 6.8505859375, 8.78125, 10.7119140625, 12.642578125, 14.5732421875, 16.50390625, 18.4345703125, 20.365234375, 22.2958984375, 24.2265625, 26.1572265625, 28.087890625, 30.0185546875, 31.94921875, 33.8798828125, 35.810546875, 37.7412109375, 39.671875, 41.6025390625, 43.533203125, 45.4638671875, 47.39453125, 49.3251953125, 51.255859375, 53.1865234375, 55.1171875, 57.0478515625, 58.978515625, 60.9091796875, 62.83984375, 64.7705078125, 66.701171875, 68.6318359375, 70.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 91.0, 349.0, 414.0, 123.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.79124450683594, -151.87733459472656, -148.96343994140625, -146.04953002929688, -143.13563537597656, -140.2217254638672, -137.3078155517578, -134.3939208984375, -131.48001098632812, -128.56610107421875, -125.65220642089844, -122.73829650878906, -119.82439422607422, -116.91049194335938, -113.99658966064453, -111.08268737792969, -108.16877746582031, -105.25487518310547, -102.34097290039062, -99.42706298828125, -96.5131607055664, -93.59925842285156, -90.68535614013672, -87.77145385742188, -84.85755157470703, -81.94364929199219, -79.02974700927734, -76.11583709716797, -73.20193481445312, -70.28803253173828, -67.37413024902344, -64.46022033691406, -61.54631805419922, -58.632415771484375, -55.718509674072266, -52.80460739135742, -49.89070129394531, -46.97679901123047, -44.062896728515625, -41.148990631103516, -38.235084533691406, -35.32118225097656, -32.40727615356445, -29.49337387084961, -26.5794677734375, -23.665565490722656, -20.75166130065918, -17.837757110595703, -14.92385482788086, -12.009950637817383, -9.096046447753906, -6.182143211364746, -3.2682390213012695, -0.35433483123779297, 2.559568405151367, 5.473472595214844, 8.38737678527832, 11.301280975341797, 14.215185165405273, 17.12908935546875, 20.042991638183594, 22.956897735595703, 25.870800018310547, 28.784704208374023, 31.6986083984375]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 9.0, 11.0, 18.0, 16.0, 21.0, 25.0, 19.0, 26.0, 32.0, 32.0, 41.0, 42.0, 55.0, 41.0, 43.0, 56.0, 47.0, 46.0, 48.0, 43.0, 39.0, 42.0, 36.0, 34.0, 26.0, 17.0, 23.0, 22.0, 20.0, 12.0, 9.0, 7.0, 9.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.4991683959961, -71.23080444335938, -68.96244049072266, -66.69407653808594, -64.42571258544922, -62.1573486328125, -59.88898468017578, -57.62062072753906, -55.352256774902344, -53.083892822265625, -50.815528869628906, -48.54716491699219, -46.27880096435547, -44.01043701171875, -41.74207305908203, -39.47370910644531, -37.20534133911133, -34.93697738647461, -32.66861343383789, -30.400249481201172, -28.131885528564453, -25.863521575927734, -23.595155715942383, -21.326791763305664, -19.058427810668945, -16.790063858032227, -14.521699905395508, -12.253334999084473, -9.984971046447754, -7.716607093811035, -5.4482421875, -3.1798782348632812, -0.9115142822265625, 1.3568499088287354, 3.625214099884033, 5.89357852935791, 8.161942481994629, 10.430306434631348, 12.698671340942383, 14.967035293579102, 17.23539924621582, 19.50376319885254, 21.772127151489258, 24.04049301147461, 26.308856964111328, 28.577220916748047, 30.845584869384766, 33.113948822021484, 35.3823127746582, 37.65067672729492, 39.91904067993164, 42.18740463256836, 44.45576858520508, 46.7241325378418, 48.99250030517578, 51.2608642578125, 53.52922821044922, 55.79759216308594, 58.065956115722656, 60.334320068359375, 62.602684020996094, 64.87104797363281, 67.13941192626953, 69.40777587890625, 71.67613983154297]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 7.0, 6.0, 6.0, 12.0, 12.0, 22.0, 22.0, 30.0, 28.0, 36.0, 20.0, 47.0, 38.0, 35.0, 40.0, 29.0, 37.0, 37.0, 45.0, 47.0, 37.0, 43.0, 42.0, 30.0, 32.0, 26.0, 33.0, 24.0, 26.0, 26.0, 20.0, 13.0, 17.0, 6.0, 7.0, 12.0, 10.0, 3.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.78125, -8.509765625, -8.23828125, -7.966796875, -7.6953125, -7.423828125, -7.15234375, -6.880859375, -6.609375, -6.337890625, -6.06640625, -5.794921875, -5.5234375, -5.251953125, -4.98046875, -4.708984375, -4.4375, -4.166015625, -3.89453125, -3.623046875, -3.3515625, -3.080078125, -2.80859375, -2.537109375, -2.265625, -1.994140625, -1.72265625, -1.451171875, -1.1796875, -0.908203125, -0.63671875, -0.365234375, -0.09375, 0.177734375, 0.44921875, 0.720703125, 0.9921875, 1.263671875, 1.53515625, 1.806640625, 2.078125, 2.349609375, 2.62109375, 2.892578125, 3.1640625, 3.435546875, 3.70703125, 3.978515625, 4.25, 4.521484375, 4.79296875, 5.064453125, 5.3359375, 5.607421875, 5.87890625, 6.150390625, 6.421875, 6.693359375, 6.96484375, 7.236328125, 7.5078125, 7.779296875, 8.05078125, 8.322265625, 8.59375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 9.0, 8.0, 9.0, 12.0, 17.0, 29.0, 36.0, 54.0, 81.0, 133.0, 187.0, 386.0, 788.0, 1565.0, 3765.0, 9340.0, 26395.0, 96564.0, 604459.0, 2476818.0, 802293.0, 120610.0, 31630.0, 11043.0, 4272.0, 1893.0, 840.0, 403.0, 219.0, 132.0, 74.0, 57.0, 27.0, 37.0, 20.0, 17.0, 18.0, 11.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.375, -16.841552734375, -16.30810546875, -15.774658203125, -15.2412109375, -14.707763671875, -14.17431640625, -13.640869140625, -13.107421875, -12.573974609375, -12.04052734375, -11.507080078125, -10.9736328125, -10.440185546875, -9.90673828125, -9.373291015625, -8.83984375, -8.306396484375, -7.77294921875, -7.239501953125, -6.7060546875, -6.172607421875, -5.63916015625, -5.105712890625, -4.572265625, -4.038818359375, -3.50537109375, -2.971923828125, -2.4384765625, -1.905029296875, -1.37158203125, -0.838134765625, -0.3046875, 0.228759765625, 0.76220703125, 1.295654296875, 1.8291015625, 2.362548828125, 2.89599609375, 3.429443359375, 3.962890625, 4.496337890625, 5.02978515625, 5.563232421875, 6.0966796875, 6.630126953125, 7.16357421875, 7.697021484375, 8.23046875, 8.763916015625, 9.29736328125, 9.830810546875, 10.3642578125, 10.897705078125, 11.43115234375, 11.964599609375, 12.498046875, 13.031494140625, 13.56494140625, 14.098388671875, 14.6318359375, 15.165283203125, 15.69873046875, 16.232177734375, 16.765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 9.0, 17.0, 14.0, 22.0, 33.0, 37.0, 41.0, 62.0, 69.0, 116.0, 168.0, 231.0, 314.0, 348.0, 464.0, 481.0, 377.0, 318.0, 255.0, 165.0, 130.0, 81.0, 76.0, 56.0, 30.0, 34.0, 28.0, 19.0, 16.0, 5.0, 8.0, 4.0, 5.0, 2.0, 4.0, 7.0, 5.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.4609375, -14.03662109375, -13.6123046875, -13.18798828125, -12.763671875, -12.33935546875, -11.9150390625, -11.49072265625, -11.06640625, -10.64208984375, -10.2177734375, -9.79345703125, -9.369140625, -8.94482421875, -8.5205078125, -8.09619140625, -7.671875, -7.24755859375, -6.8232421875, -6.39892578125, -5.974609375, -5.55029296875, -5.1259765625, -4.70166015625, -4.27734375, -3.85302734375, -3.4287109375, -3.00439453125, -2.580078125, -2.15576171875, -1.7314453125, -1.30712890625, -0.8828125, -0.45849609375, -0.0341796875, 0.39013671875, 0.814453125, 1.23876953125, 1.6630859375, 2.08740234375, 2.51171875, 2.93603515625, 3.3603515625, 3.78466796875, 4.208984375, 4.63330078125, 5.0576171875, 5.48193359375, 5.90625, 6.33056640625, 6.7548828125, 7.17919921875, 7.603515625, 8.02783203125, 8.4521484375, 8.87646484375, 9.30078125, 9.72509765625, 10.1494140625, 10.57373046875, 10.998046875, 11.42236328125, 11.8466796875, 12.27099609375, 12.6953125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 5.0, 9.0, 11.0, 7.0, 15.0, 20.0, 20.0, 35.0, 68.0, 66.0, 92.0, 138.0, 223.0, 359.0, 661.0, 1481.0, 3970.0, 12927.0, 54265.0, 382199.0, 3058667.0, 581876.0, 72605.0, 15888.0, 4933.0, 1765.0, 768.0, 400.0, 231.0, 151.0, 107.0, 73.0, 54.0, 46.0, 31.0, 34.0, 25.0, 9.0, 9.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.1875, -27.265869140625, -26.34423828125, -25.422607421875, -24.5009765625, -23.579345703125, -22.65771484375, -21.736083984375, -20.814453125, -19.892822265625, -18.97119140625, -18.049560546875, -17.1279296875, -16.206298828125, -15.28466796875, -14.363037109375, -13.44140625, -12.519775390625, -11.59814453125, -10.676513671875, -9.7548828125, -8.833251953125, -7.91162109375, -6.989990234375, -6.068359375, -5.146728515625, -4.22509765625, -3.303466796875, -2.3818359375, -1.460205078125, -0.53857421875, 0.383056640625, 1.3046875, 2.226318359375, 3.14794921875, 4.069580078125, 4.9912109375, 5.912841796875, 6.83447265625, 7.756103515625, 8.677734375, 9.599365234375, 10.52099609375, 11.442626953125, 12.3642578125, 13.285888671875, 14.20751953125, 15.129150390625, 16.05078125, 16.972412109375, 17.89404296875, 18.815673828125, 19.7373046875, 20.658935546875, 21.58056640625, 22.502197265625, 23.423828125, 24.345458984375, 25.26708984375, 26.188720703125, 27.1103515625, 28.031982421875, 28.95361328125, 29.875244140625, 30.796875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 10.0, 21.0, 21.0, 33.0, 61.0, 84.0, 87.0, 112.0, 114.0, 116.0, 92.0, 79.0, 54.0, 41.0, 26.0, 16.0, 16.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.2737922668457, -31.25328254699707, -29.232770919799805, -27.212261199951172, -25.191749572753906, -23.171239852905273, -21.15073013305664, -19.130218505859375, -17.109708786010742, -15.089198112487793, -13.068687438964844, -11.048177719116211, -9.027667045593262, -7.0071563720703125, -4.98664665222168, -2.9661359786987305, -0.9456253051757812, 1.0748851299285889, 3.095395565032959, 5.11590576171875, 7.136416435241699, 9.156927108764648, 11.177436828613281, 13.19794750213623, 15.21845817565918, 17.238967895507812, 19.259479522705078, 21.27998924255371, 23.300498962402344, 25.32101058959961, 27.341520309448242, 29.362030029296875, 31.382545471191406, 33.40305709838867, 35.42356491088867, 37.44407653808594, 39.4645881652832, 41.48509979248047, 43.50560760498047, 45.526119232177734, 47.546630859375, 49.567142486572266, 51.587650299072266, 53.60816192626953, 55.6286735534668, 57.64918518066406, 59.66969299316406, 61.69020462036133, 63.71071243286133, 65.7312240600586, 67.7517318725586, 69.77224731445312, 71.79275512695312, 73.81326293945312, 75.83377075195312, 77.85428619384766, 79.87479400634766, 81.89530181884766, 83.91581726074219, 85.93632507324219, 87.95683288574219, 89.97734832763672, 91.99785614013672, 94.01836395263672, 96.03887939453125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 9.0, 11.0, 8.0, 11.0, 17.0, 19.0, 16.0, 20.0, 31.0, 21.0, 29.0, 18.0, 28.0, 37.0, 34.0, 35.0, 34.0, 46.0, 45.0, 45.0, 44.0, 45.0, 38.0, 37.0, 39.0, 29.0, 29.0, 34.0, 27.0, 25.0, 14.0, 22.0, 22.0, 14.0, 11.0, 14.0, 7.0, 8.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-45.069252014160156, -43.62033462524414, -42.17141342163086, -40.722496032714844, -39.27357864379883, -37.82465744018555, -36.37574005126953, -34.92681884765625, -33.477901458740234, -32.02898406982422, -30.58006477355957, -29.131145477294922, -27.682226181030273, -26.233306884765625, -24.78438949584961, -23.33547019958496, -21.886552810668945, -20.437633514404297, -18.98871612548828, -17.539796829223633, -16.090877532958984, -14.641959190368652, -13.19304084777832, -11.744121551513672, -10.29520320892334, -8.846284866333008, -7.397365570068359, -5.948447227478027, -4.499528408050537, -3.050609588623047, -1.6016912460327148, -0.1527719497680664, 1.2961463928222656, 2.745065212249756, 4.193984031677246, 5.642902374267578, 7.091821193695068, 8.540740013122559, 9.98965835571289, 11.438577651977539, 12.887495994567871, 14.336414337158203, 15.785333633422852, 17.2342529296875, 18.683170318603516, 20.132089614868164, 21.581008911132812, 23.029926300048828, 24.478845596313477, 25.927764892578125, 27.37668228149414, 28.82560157775879, 30.274520874023438, 31.723438262939453, 33.17235565185547, 34.62127685546875, 36.070194244384766, 37.51911163330078, 38.96803283691406, 40.41695022583008, 41.865867614746094, 43.314788818359375, 44.76370620727539, 46.212623596191406, 47.66154479980469]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 5.0, 5.0, 14.0, 13.0, 14.0, 16.0, 16.0, 14.0, 33.0, 21.0, 32.0, 42.0, 39.0, 44.0, 31.0, 42.0, 33.0, 45.0, 43.0, 51.0, 41.0, 37.0, 40.0, 40.0, 38.0, 17.0, 32.0, 21.0, 29.0, 27.0, 10.0, 16.0, 15.0, 8.0, 10.0, 18.0, 11.0, 4.0, 5.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.515625, -9.232177734375, -8.94873046875, -8.665283203125, -8.3818359375, -8.098388671875, -7.81494140625, -7.531494140625, -7.248046875, -6.964599609375, -6.68115234375, -6.397705078125, -6.1142578125, -5.830810546875, -5.54736328125, -5.263916015625, -4.98046875, -4.697021484375, -4.41357421875, -4.130126953125, -3.8466796875, -3.563232421875, -3.27978515625, -2.996337890625, -2.712890625, -2.429443359375, -2.14599609375, -1.862548828125, -1.5791015625, -1.295654296875, -1.01220703125, -0.728759765625, -0.4453125, -0.161865234375, 0.12158203125, 0.405029296875, 0.6884765625, 0.971923828125, 1.25537109375, 1.538818359375, 1.822265625, 2.105712890625, 2.38916015625, 2.672607421875, 2.9560546875, 3.239501953125, 3.52294921875, 3.806396484375, 4.08984375, 4.373291015625, 4.65673828125, 4.940185546875, 5.2236328125, 5.507080078125, 5.79052734375, 6.073974609375, 6.357421875, 6.640869140625, 6.92431640625, 7.207763671875, 7.4912109375, 7.774658203125, 8.05810546875, 8.341552734375, 8.625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 22.0, 21.0, 34.0, 38.0, 75.0, 101.0, 145.0, 182.0, 317.0, 449.0, 646.0, 1000.0, 1444.0, 2155.0, 3243.0, 4787.0, 7575.0, 11364.0, 18185.0, 29552.0, 47937.0, 78211.0, 121322.0, 169236.0, 179620.0, 134887.0, 88951.0, 55026.0, 33551.0, 20748.0, 12938.0, 8257.0, 5441.0, 3608.0, 2396.0, 1620.0, 1066.0, 767.0, 519.0, 366.0, 245.0, 170.0, 108.0, 76.0, 49.0, 36.0, 17.0, 15.0, 8.0, 10.0, 3.0, 4.0, 0.0, 4.0], "bins": [-0.35498046875, -0.34458160400390625, -0.3341827392578125, -0.32378387451171875, -0.313385009765625, -0.30298614501953125, -0.2925872802734375, -0.28218841552734375, -0.27178955078125, -0.26139068603515625, -0.2509918212890625, -0.24059295654296875, -0.230194091796875, -0.21979522705078125, -0.2093963623046875, -0.19899749755859375, -0.1885986328125, -0.17819976806640625, -0.1678009033203125, -0.15740203857421875, -0.147003173828125, -0.13660430908203125, -0.1262054443359375, -0.11580657958984375, -0.10540771484375, -0.09500885009765625, -0.0846099853515625, -0.07421112060546875, -0.063812255859375, -0.05341339111328125, -0.0430145263671875, -0.03261566162109375, -0.022216796875, -0.01181793212890625, -0.0014190673828125, 0.00897979736328125, 0.019378662109375, 0.02977752685546875, 0.0401763916015625, 0.05057525634765625, 0.06097412109375, 0.07137298583984375, 0.0817718505859375, 0.09217071533203125, 0.102569580078125, 0.11296844482421875, 0.1233673095703125, 0.13376617431640625, 0.1441650390625, 0.15456390380859375, 0.1649627685546875, 0.17536163330078125, 0.185760498046875, 0.19615936279296875, 0.2065582275390625, 0.21695709228515625, 0.22735595703125, 0.23775482177734375, 0.2481536865234375, 0.25855255126953125, 0.268951416015625, 0.27935028076171875, 0.2897491455078125, 0.30014801025390625, 0.310546875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 3.0, 7.0, 8.0, 18.0, 10.0, 14.0, 25.0, 18.0, 17.0, 29.0, 23.0, 38.0, 31.0, 44.0, 43.0, 52.0, 54.0, 40.0, 1076.0, 40.0, 57.0, 35.0, 41.0, 46.0, 37.0, 29.0, 27.0, 24.0, 28.0, 26.0, 15.0, 18.0, 9.0, 13.0, 7.0, 6.0, 9.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.33984375, -7.13720703125, -6.9345703125, -6.73193359375, -6.529296875, -6.32666015625, -6.1240234375, -5.92138671875, -5.71875, -5.51611328125, -5.3134765625, -5.11083984375, -4.908203125, -4.70556640625, -4.5029296875, -4.30029296875, -4.09765625, -3.89501953125, -3.6923828125, -3.48974609375, -3.287109375, -3.08447265625, -2.8818359375, -2.67919921875, -2.4765625, -2.27392578125, -2.0712890625, -1.86865234375, -1.666015625, -1.46337890625, -1.2607421875, -1.05810546875, -0.85546875, -0.65283203125, -0.4501953125, -0.24755859375, -0.044921875, 0.15771484375, 0.3603515625, 0.56298828125, 0.765625, 0.96826171875, 1.1708984375, 1.37353515625, 1.576171875, 1.77880859375, 1.9814453125, 2.18408203125, 2.38671875, 2.58935546875, 2.7919921875, 2.99462890625, 3.197265625, 3.39990234375, 3.6025390625, 3.80517578125, 4.0078125, 4.21044921875, 4.4130859375, 4.61572265625, 4.818359375, 5.02099609375, 5.2236328125, 5.42626953125, 5.62890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 15.0, 16.0, 36.0, 56.0, 81.0, 125.0, 193.0, 318.0, 567.0, 899.0, 1472.0, 2373.0, 4094.0, 6602.0, 11217.0, 18951.0, 32894.0, 57432.0, 100971.0, 165616.0, 1261762.0, 174949.0, 108873.0, 61696.0, 35370.0, 20241.0, 11984.0, 7217.0, 4438.0, 2618.0, 1563.0, 990.0, 592.0, 344.0, 216.0, 111.0, 81.0, 47.0, 32.0, 25.0, 21.0, 14.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.391357421875, -0.380035400390625, -0.36871337890625, -0.357391357421875, -0.3460693359375, -0.334747314453125, -0.32342529296875, -0.312103271484375, -0.30078125, -0.289459228515625, -0.27813720703125, -0.266815185546875, -0.2554931640625, -0.244171142578125, -0.23284912109375, -0.221527099609375, -0.210205078125, -0.198883056640625, -0.18756103515625, -0.176239013671875, -0.1649169921875, -0.153594970703125, -0.14227294921875, -0.130950927734375, -0.11962890625, -0.108306884765625, -0.09698486328125, -0.085662841796875, -0.0743408203125, -0.063018798828125, -0.05169677734375, -0.040374755859375, -0.029052734375, -0.017730712890625, -0.00640869140625, 0.004913330078125, 0.0162353515625, 0.027557373046875, 0.03887939453125, 0.050201416015625, 0.0615234375, 0.072845458984375, 0.08416748046875, 0.095489501953125, 0.1068115234375, 0.118133544921875, 0.12945556640625, 0.140777587890625, 0.152099609375, 0.163421630859375, 0.17474365234375, 0.186065673828125, 0.1973876953125, 0.208709716796875, 0.22003173828125, 0.231353759765625, 0.24267578125, 0.253997802734375, 0.26531982421875, 0.276641845703125, 0.2879638671875, 0.299285888671875, 0.31060791015625, 0.321929931640625, 0.333251953125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 2.0, 11.0, 19.0, 13.0, 18.0, 22.0, 26.0, 34.0, 35.0, 32.0, 54.0, 50.0, 58.0, 64.0, 45.0, 58.0, 35.0, 48.0, 39.0, 55.0, 39.0, 36.0, 35.0, 25.0, 24.0, 24.0, 15.0, 11.0, 16.0, 7.0, 10.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0015134811401367188, -0.0014705806970596313, -0.001427680253982544, -0.0013847798109054565, -0.0013418793678283691, -0.0012989789247512817, -0.0012560784816741943, -0.001213178038597107, -0.0011702775955200195, -0.0011273771524429321, -0.0010844767093658447, -0.0010415762662887573, -0.00099867582321167, -0.0009557753801345825, -0.0009128749370574951, -0.0008699744939804077, -0.0008270740509033203, -0.0007841736078262329, -0.0007412731647491455, -0.0006983727216720581, -0.0006554722785949707, -0.0006125718355178833, -0.0005696713924407959, -0.0005267709493637085, -0.0004838705062866211, -0.0004409700632095337, -0.0003980696201324463, -0.0003551691770553589, -0.0003122687339782715, -0.0002693682909011841, -0.00022646784782409668, -0.00018356740474700928, -0.00014066696166992188, -9.776651859283447e-05, -5.486607551574707e-05, -1.1965632438659668e-05, 3.0934810638427734e-05, 7.383525371551514e-05, 0.00011673569679260254, 0.00015963613986968994, 0.00020253658294677734, 0.00024543702602386475, 0.00028833746910095215, 0.00033123791217803955, 0.00037413835525512695, 0.00041703879833221436, 0.00045993924140930176, 0.0005028396844863892, 0.0005457401275634766, 0.000588640570640564, 0.0006315410137176514, 0.0006744414567947388, 0.0007173418998718262, 0.0007602423429489136, 0.000803142786026001, 0.0008460432291030884, 0.0008889436721801758, 0.0009318441152572632, 0.0009747445583343506, 0.001017645001411438, 0.0010605454444885254, 0.0011034458875656128, 0.0011463463306427002, 0.0011892467737197876, 0.001232147216796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 11.0, 6.0, 10.0, 18.0, 15.0, 23.0, 22.0, 34.0, 45.0, 57.0, 67.0, 93.0, 139.0, 212.0, 445.0, 1912.0, 98081.0, 934739.0, 10808.0, 834.0, 309.0, 166.0, 133.0, 79.0, 69.0, 62.0, 33.0, 26.0, 22.0, 22.0, 21.0, 14.0, 5.0, 7.0, 3.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251312255859375, -0.024242639541625977, -0.023354053497314453, -0.02246546745300293, -0.021576881408691406, -0.020688295364379883, -0.01979970932006836, -0.018911123275756836, -0.018022537231445312, -0.01713395118713379, -0.016245365142822266, -0.015356779098510742, -0.014468193054199219, -0.013579607009887695, -0.012691020965576172, -0.011802434921264648, -0.010913848876953125, -0.010025262832641602, -0.009136676788330078, -0.008248090744018555, -0.007359504699707031, -0.006470918655395508, -0.005582332611083984, -0.004693746566772461, -0.0038051605224609375, -0.002916574478149414, -0.0020279884338378906, -0.0011394023895263672, -0.00025081634521484375, 0.0006377696990966797, 0.0015263557434082031, 0.0024149417877197266, 0.00330352783203125, 0.0041921138763427734, 0.005080699920654297, 0.00596928596496582, 0.006857872009277344, 0.007746458053588867, 0.00863504409790039, 0.009523630142211914, 0.010412216186523438, 0.011300802230834961, 0.012189388275146484, 0.013077974319458008, 0.013966560363769531, 0.014855146408081055, 0.015743732452392578, 0.0166323184967041, 0.017520904541015625, 0.01840949058532715, 0.019298076629638672, 0.020186662673950195, 0.02107524871826172, 0.021963834762573242, 0.022852420806884766, 0.02374100685119629, 0.024629592895507812, 0.025518178939819336, 0.02640676498413086, 0.027295351028442383, 0.028183937072753906, 0.02907252311706543, 0.029961109161376953, 0.030849695205688477, 0.03173828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 66.0, 320.0, 461.0, 138.0, 24.0], "bins": [-0.010835172608494759, -0.010658183135092258, -0.010481193661689758, -0.010304203256964684, -0.010127213783562183, -0.009950224310159683, -0.009773234836757183, -0.009596245363354683, -0.009419254958629608, -0.009242265485227108, -0.009065276011824608, -0.008888285607099533, -0.008711296133697033, -0.008534306660294533, -0.008357317186892033, -0.008180327713489532, -0.008003338240087032, -0.007826348766684532, -0.007649358827620745, -0.0074723693542182446, -0.007295379415154457, -0.007118389941751957, -0.006941400468349457, -0.006764410994946957, -0.006587421055883169, -0.006410431582480669, -0.0062334416434168816, -0.006056452170014381, -0.005879462696611881, -0.005702472757548094, -0.005525483284145594, -0.005348493345081806, -0.005171503406018019, -0.004994513932615519, -0.004817523993551731, -0.004640534520149231, -0.004463545046746731, -0.004286555107682943, -0.004109565634280443, -0.003932575695216656, -0.0037555862218141556, -0.0035785965155810118, -0.003401606809347868, -0.003224617335945368, -0.003047627629712224, -0.00287063792347908, -0.00269364845007658, -0.0025166587438434362, -0.0023396690376102924, -0.0021626793313771486, -0.001985689625144005, -0.0018087001517415047, -0.0016317104455083609, -0.001454720739275217, -0.001277731149457395, -0.001100741559639573, -0.0009237519698217511, -0.0007467623217962682, -0.0005697726737707853, -0.00039278302574530244, -0.00021579337771981955, -3.880372969433665e-05, 0.00013818591833114624, 0.0003151755081489682, 0.000492165214382112]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 9.0, 7.0, 8.0, 15.0, 24.0, 27.0, 13.0, 32.0, 37.0, 30.0, 28.0, 35.0, 46.0, 36.0, 24.0, 44.0, 35.0, 49.0, 64.0, 42.0, 38.0, 50.0, 38.0, 28.0, 36.0, 32.0, 27.0, 25.0, 18.0, 28.0, 17.0, 15.0, 12.0, 11.0, 6.0, 1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009185075759887695, -0.0008911099284887314, -0.0008637122809886932, -0.0008363146334886551, -0.0008089169859886169, -0.0007815193384885788, -0.0007541216909885406, -0.0007267240434885025, -0.0006993263959884644, -0.0006719287484884262, -0.0006445311009883881, -0.0006171334534883499, -0.0005897358059883118, -0.0005623381584882736, -0.0005349405109882355, -0.0005075428634881973, -0.0004801452159881592, -0.00045274756848812103, -0.0004253499209880829, -0.00039795227348804474, -0.0003705546259880066, -0.00034315697848796844, -0.0003157593309879303, -0.00028836168348789215, -0.000260964035987854, -0.00023356638848781586, -0.0002061687409877777, -0.00017877109348773956, -0.00015137344598770142, -0.00012397579848766327, -9.657815098762512e-05, -6.918050348758698e-05, -4.178285598754883e-05, -1.4385208487510681e-05, 1.3012439012527466e-05, 4.041008651256561e-05, 6.780773401260376e-05, 9.52053815126419e-05, 0.00012260302901268005, 0.0001500006765127182, 0.00017739832401275635, 0.0002047959715127945, 0.00023219361901283264, 0.0002595912665128708, 0.00028698891401290894, 0.0003143865615129471, 0.00034178420901298523, 0.0003691818565130234, 0.0003965795040130615, 0.00042397715151309967, 0.0004513747990131378, 0.00047877244651317596, 0.0005061700940132141, 0.0005335677415132523, 0.0005609653890132904, 0.0005883630365133286, 0.0006157606840133667, 0.0006431583315134048, 0.000670555979013443, 0.0006979536265134811, 0.0007253512740135193, 0.0007527489215135574, 0.0007801465690135956, 0.0008075442165136337, 0.0008349418640136719]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 5.0, 5.0, 14.0, 13.0, 14.0, 16.0, 16.0, 14.0, 33.0, 21.0, 32.0, 42.0, 39.0, 44.0, 31.0, 42.0, 33.0, 45.0, 43.0, 51.0, 41.0, 37.0, 40.0, 40.0, 38.0, 17.0, 32.0, 21.0, 29.0, 27.0, 10.0, 16.0, 15.0, 8.0, 10.0, 18.0, 11.0, 4.0, 5.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.515625, -9.232177734375, -8.94873046875, -8.665283203125, -8.3818359375, -8.098388671875, -7.81494140625, -7.531494140625, -7.248046875, -6.964599609375, -6.68115234375, -6.397705078125, -6.1142578125, -5.830810546875, -5.54736328125, -5.263916015625, -4.98046875, -4.697021484375, -4.41357421875, -4.130126953125, -3.8466796875, -3.563232421875, -3.27978515625, -2.996337890625, -2.712890625, -2.429443359375, -2.14599609375, -1.862548828125, -1.5791015625, -1.295654296875, -1.01220703125, -0.728759765625, -0.4453125, -0.161865234375, 0.12158203125, 0.405029296875, 0.6884765625, 0.971923828125, 1.25537109375, 1.538818359375, 1.822265625, 2.105712890625, 2.38916015625, 2.672607421875, 2.9560546875, 3.239501953125, 3.52294921875, 3.806396484375, 4.08984375, 4.373291015625, 4.65673828125, 4.940185546875, 5.2236328125, 5.507080078125, 5.79052734375, 6.073974609375, 6.357421875, 6.640869140625, 6.92431640625, 7.207763671875, 7.4912109375, 7.774658203125, 8.05810546875, 8.341552734375, 8.625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 16.0, 12.0, 15.0, 23.0, 36.0, 40.0, 38.0, 66.0, 86.0, 116.0, 188.0, 230.0, 320.0, 474.0, 821.0, 1695.0, 4418.0, 15232.0, 78417.0, 801719.0, 115446.0, 18970.0, 5519.0, 1944.0, 941.0, 505.0, 334.0, 245.0, 158.0, 130.0, 89.0, 51.0, 55.0, 30.0, 29.0, 26.0, 34.0, 15.0, 9.0, 11.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.859375, -23.14892578125, -22.4384765625, -21.72802734375, -21.017578125, -20.30712890625, -19.5966796875, -18.88623046875, -18.17578125, -17.46533203125, -16.7548828125, -16.04443359375, -15.333984375, -14.62353515625, -13.9130859375, -13.20263671875, -12.4921875, -11.78173828125, -11.0712890625, -10.36083984375, -9.650390625, -8.93994140625, -8.2294921875, -7.51904296875, -6.80859375, -6.09814453125, -5.3876953125, -4.67724609375, -3.966796875, -3.25634765625, -2.5458984375, -1.83544921875, -1.125, -0.41455078125, 0.2958984375, 1.00634765625, 1.716796875, 2.42724609375, 3.1376953125, 3.84814453125, 4.55859375, 5.26904296875, 5.9794921875, 6.68994140625, 7.400390625, 8.11083984375, 8.8212890625, 9.53173828125, 10.2421875, 10.95263671875, 11.6630859375, 12.37353515625, 13.083984375, 13.79443359375, 14.5048828125, 15.21533203125, 15.92578125, 16.63623046875, 17.3466796875, 18.05712890625, 18.767578125, 19.47802734375, 20.1884765625, 20.89892578125, 21.609375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 7.0, 3.0, 10.0, 9.0, 14.0, 23.0, 14.0, 25.0, 22.0, 18.0, 33.0, 34.0, 39.0, 40.0, 38.0, 56.0, 70.0, 101.0, 287.0, 1552.0, 150.0, 80.0, 45.0, 45.0, 40.0, 41.0, 37.0, 31.0, 33.0, 26.0, 20.0, 20.0, 18.0, 13.0, 8.0, 8.0, 6.0, 7.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -22.95263671875, -22.1396484375, -21.32666015625, -20.513671875, -19.70068359375, -18.8876953125, -18.07470703125, -17.26171875, -16.44873046875, -15.6357421875, -14.82275390625, -14.009765625, -13.19677734375, -12.3837890625, -11.57080078125, -10.7578125, -9.94482421875, -9.1318359375, -8.31884765625, -7.505859375, -6.69287109375, -5.8798828125, -5.06689453125, -4.25390625, -3.44091796875, -2.6279296875, -1.81494140625, -1.001953125, -0.18896484375, 0.6240234375, 1.43701171875, 2.25, 3.06298828125, 3.8759765625, 4.68896484375, 5.501953125, 6.31494140625, 7.1279296875, 7.94091796875, 8.75390625, 9.56689453125, 10.3798828125, 11.19287109375, 12.005859375, 12.81884765625, 13.6318359375, 14.44482421875, 15.2578125, 16.07080078125, 16.8837890625, 17.69677734375, 18.509765625, 19.32275390625, 20.1357421875, 20.94873046875, 21.76171875, 22.57470703125, 23.3876953125, 24.20068359375, 25.013671875, 25.82666015625, 26.6396484375, 27.45263671875, 28.265625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 11.0, 8.0, 11.0, 13.0, 21.0, 31.0, 24.0, 36.0, 44.0, 51.0, 63.0, 109.0, 163.0, 353.0, 1119.0, 9880.0, 2771013.0, 355451.0, 5583.0, 828.0, 292.0, 154.0, 90.0, 62.0, 65.0, 42.0, 27.0, 25.0, 29.0, 17.0, 17.0, 10.0, 5.0, 14.0, 6.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-77.9375, -75.568359375, -73.19921875, -70.830078125, -68.4609375, -66.091796875, -63.72265625, -61.353515625, -58.984375, -56.615234375, -54.24609375, -51.876953125, -49.5078125, -47.138671875, -44.76953125, -42.400390625, -40.03125, -37.662109375, -35.29296875, -32.923828125, -30.5546875, -28.185546875, -25.81640625, -23.447265625, -21.078125, -18.708984375, -16.33984375, -13.970703125, -11.6015625, -9.232421875, -6.86328125, -4.494140625, -2.125, 0.244140625, 2.61328125, 4.982421875, 7.3515625, 9.720703125, 12.08984375, 14.458984375, 16.828125, 19.197265625, 21.56640625, 23.935546875, 26.3046875, 28.673828125, 31.04296875, 33.412109375, 35.78125, 38.150390625, 40.51953125, 42.888671875, 45.2578125, 47.626953125, 49.99609375, 52.365234375, 54.734375, 57.103515625, 59.47265625, 61.841796875, 64.2109375, 66.580078125, 68.94921875, 71.318359375, 73.6875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 20.0, 37.0, 83.0, 128.0, 171.0, 203.0, 153.0, 100.0, 53.0, 24.0, 17.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-86.56210327148438, -84.93534851074219, -83.30858612060547, -81.68183135986328, -80.05506896972656, -78.42831420898438, -76.80155944824219, -75.17479705810547, -73.54804229736328, -71.9212875366211, -70.29452514648438, -68.66777038574219, -67.041015625, -65.41425323486328, -63.787498474121094, -62.16073989868164, -60.53398132324219, -58.907222747802734, -57.28046417236328, -55.653709411621094, -54.02695083618164, -52.40019226074219, -50.7734375, -49.14667892456055, -47.519920349121094, -45.89316177368164, -44.26640319824219, -42.6396484375, -41.01288986206055, -39.386131286621094, -37.759376525878906, -36.13261795043945, -34.505863189697266, -32.87910461425781, -31.252347946166992, -29.625591278076172, -27.99883270263672, -26.372074127197266, -24.745317459106445, -23.118560791015625, -21.491802215576172, -19.86504364013672, -18.2382869720459, -16.611530303955078, -14.984771728515625, -13.358014106750488, -11.731256484985352, -10.104498863220215, -8.477741241455078, -6.850983619689941, -5.224225997924805, -3.597468376159668, -1.9707107543945312, -0.34395313262939453, 1.2828044891357422, 2.909562110900879, 4.536319732666016, 6.163077354431152, 7.789834976196289, 9.416592597961426, 11.043350219726562, 12.6701078414917, 14.296865463256836, 15.923623085021973, 17.55038070678711]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 10.0, 16.0, 11.0, 14.0, 14.0, 16.0, 29.0, 22.0, 19.0, 26.0, 42.0, 39.0, 34.0, 35.0, 22.0, 47.0, 37.0, 43.0, 50.0, 39.0, 38.0, 42.0, 29.0, 41.0, 42.0, 29.0, 29.0, 25.0, 22.0, 20.0, 18.0, 13.0, 12.0, 19.0, 11.0, 8.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.55349731445312, -65.46846008300781, -63.383426666259766, -61.29838943481445, -59.213356018066406, -57.128318786621094, -55.04328155517578, -52.95824432373047, -50.87321090698242, -48.78817367553711, -46.70314025878906, -44.61810302734375, -42.53306579589844, -40.44803237915039, -38.36299514770508, -36.27796173095703, -34.19292449951172, -32.107887268066406, -30.02285385131836, -27.937816619873047, -25.852781295776367, -23.767745971679688, -21.682708740234375, -19.597673416137695, -17.512638092041016, -15.427602767944336, -13.34256649017334, -11.257530212402344, -9.172494888305664, -7.087459564208984, -5.002423286437988, -2.917387008666992, -0.8323516845703125, 1.2526841163635254, 3.3377199172973633, 5.422755718231201, 7.507791519165039, 9.592826843261719, 11.677863121032715, 13.762899398803711, 15.84793472290039, 17.93297004699707, 20.01800537109375, 22.103042602539062, 24.188077926635742, 26.273113250732422, 28.358150482177734, 30.443185806274414, 32.528221130371094, 34.613258361816406, 36.69829177856445, 38.783329010009766, 40.86836242675781, 42.953399658203125, 45.03843688964844, 47.12347412109375, 49.2085075378418, 51.29354476928711, 53.378578186035156, 55.46361541748047, 57.54865264892578, 59.63368606567383, 61.71872329711914, 63.80375671386719, 65.8887939453125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 3.0, 8.0, 12.0, 15.0, 13.0, 15.0, 14.0, 18.0, 27.0, 28.0, 32.0, 29.0, 34.0, 39.0, 22.0, 47.0, 42.0, 40.0, 50.0, 47.0, 47.0, 37.0, 33.0, 34.0, 32.0, 27.0, 33.0, 24.0, 23.0, 27.0, 20.0, 17.0, 19.0, 11.0, 13.0, 10.0, 7.0, 8.0, 8.0, 9.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0], "bins": [-9.8359375, -9.5491943359375, -9.262451171875, -8.9757080078125, -8.68896484375, -8.4022216796875, -8.115478515625, -7.8287353515625, -7.5419921875, -7.2552490234375, -6.968505859375, -6.6817626953125, -6.39501953125, -6.1082763671875, -5.821533203125, -5.5347900390625, -5.248046875, -4.9613037109375, -4.674560546875, -4.3878173828125, -4.10107421875, -3.8143310546875, -3.527587890625, -3.2408447265625, -2.9541015625, -2.6673583984375, -2.380615234375, -2.0938720703125, -1.80712890625, -1.5203857421875, -1.233642578125, -0.9468994140625, -0.66015625, -0.3734130859375, -0.086669921875, 0.2000732421875, 0.48681640625, 0.7735595703125, 1.060302734375, 1.3470458984375, 1.6337890625, 1.9205322265625, 2.207275390625, 2.4940185546875, 2.78076171875, 3.0675048828125, 3.354248046875, 3.6409912109375, 3.927734375, 4.2144775390625, 4.501220703125, 4.7879638671875, 5.07470703125, 5.3614501953125, 5.648193359375, 5.9349365234375, 6.2216796875, 6.5084228515625, 6.795166015625, 7.0819091796875, 7.36865234375, 7.6553955078125, 7.942138671875, 8.2288818359375, 8.515625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 12.0, 6.0, 7.0, 12.0, 21.0, 25.0, 30.0, 70.0, 110.0, 153.0, 261.0, 466.0, 923.0, 1957.0, 4417.0, 11372.0, 33402.0, 138623.0, 1026046.0, 2449390.0, 419245.0, 72303.0, 21245.0, 7836.0, 3227.0, 1449.0, 675.0, 373.0, 228.0, 151.0, 64.0, 39.0, 32.0, 31.0, 16.0, 16.0, 11.0, 5.0, 8.0, 5.0, 6.0, 5.0, 8.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.111328125, -18.51953125, -17.927734375, -17.3359375, -16.744140625, -16.15234375, -15.560546875, -14.96875, -14.376953125, -13.78515625, -13.193359375, -12.6015625, -12.009765625, -11.41796875, -10.826171875, -10.234375, -9.642578125, -9.05078125, -8.458984375, -7.8671875, -7.275390625, -6.68359375, -6.091796875, -5.5, -4.908203125, -4.31640625, -3.724609375, -3.1328125, -2.541015625, -1.94921875, -1.357421875, -0.765625, -0.173828125, 0.41796875, 1.009765625, 1.6015625, 2.193359375, 2.78515625, 3.376953125, 3.96875, 4.560546875, 5.15234375, 5.744140625, 6.3359375, 6.927734375, 7.51953125, 8.111328125, 8.703125, 9.294921875, 9.88671875, 10.478515625, 11.0703125, 11.662109375, 12.25390625, 12.845703125, 13.4375, 14.029296875, 14.62109375, 15.212890625, 15.8046875, 16.396484375, 16.98828125, 17.580078125, 18.171875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 10.0, 14.0, 22.0, 18.0, 47.0, 56.0, 92.0, 165.0, 293.0, 474.0, 785.0, 783.0, 514.0, 293.0, 204.0, 123.0, 54.0, 47.0, 28.0, 15.0, 9.0, 6.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0], "bins": [-35.25, -34.4847412109375, -33.719482421875, -32.9542236328125, -32.18896484375, -31.4237060546875, -30.658447265625, -29.8931884765625, -29.1279296875, -28.3626708984375, -27.597412109375, -26.8321533203125, -26.06689453125, -25.3016357421875, -24.536376953125, -23.7711181640625, -23.005859375, -22.2406005859375, -21.475341796875, -20.7100830078125, -19.94482421875, -19.1795654296875, -18.414306640625, -17.6490478515625, -16.8837890625, -16.1185302734375, -15.353271484375, -14.5880126953125, -13.82275390625, -13.0574951171875, -12.292236328125, -11.5269775390625, -10.76171875, -9.9964599609375, -9.231201171875, -8.4659423828125, -7.70068359375, -6.9354248046875, -6.170166015625, -5.4049072265625, -4.6396484375, -3.8743896484375, -3.109130859375, -2.3438720703125, -1.57861328125, -0.8133544921875, -0.048095703125, 0.7171630859375, 1.482421875, 2.2476806640625, 3.012939453125, 3.7781982421875, 4.54345703125, 5.3087158203125, 6.073974609375, 6.8392333984375, 7.6044921875, 8.3697509765625, 9.135009765625, 9.9002685546875, 10.66552734375, 11.4307861328125, 12.196044921875, 12.9613037109375, 13.7265625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 15.0, 16.0, 17.0, 40.0, 41.0, 78.0, 152.0, 236.0, 434.0, 1112.0, 4738.0, 51021.0, 2884004.0, 1217103.0, 29986.0, 3429.0, 942.0, 372.0, 201.0, 124.0, 76.0, 46.0, 35.0, 18.0, 15.0, 10.0, 10.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -45.02294921875, -43.1396484375, -41.25634765625, -39.373046875, -37.48974609375, -35.6064453125, -33.72314453125, -31.83984375, -29.95654296875, -28.0732421875, -26.18994140625, -24.306640625, -22.42333984375, -20.5400390625, -18.65673828125, -16.7734375, -14.89013671875, -13.0068359375, -11.12353515625, -9.240234375, -7.35693359375, -5.4736328125, -3.59033203125, -1.70703125, 0.17626953125, 2.0595703125, 3.94287109375, 5.826171875, 7.70947265625, 9.5927734375, 11.47607421875, 13.359375, 15.24267578125, 17.1259765625, 19.00927734375, 20.892578125, 22.77587890625, 24.6591796875, 26.54248046875, 28.42578125, 30.30908203125, 32.1923828125, 34.07568359375, 35.958984375, 37.84228515625, 39.7255859375, 41.60888671875, 43.4921875, 45.37548828125, 47.2587890625, 49.14208984375, 51.025390625, 52.90869140625, 54.7919921875, 56.67529296875, 58.55859375, 60.44189453125, 62.3251953125, 64.20849609375, 66.091796875, 67.97509765625, 69.8583984375, 71.74169921875, 73.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 11.0, 28.0, 47.0, 105.0, 168.0, 221.0, 190.0, 128.0, 74.0, 23.0, 11.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.39513397216797, -97.68354034423828, -92.9719467163086, -88.2603530883789, -83.54875946044922, -78.83716583251953, -74.12557220458984, -69.41397857666016, -64.70238494873047, -59.99079132080078, -55.279197692871094, -50.567604064941406, -45.85601043701172, -41.14441680908203, -36.432823181152344, -31.721229553222656, -27.00963592529297, -22.29804229736328, -17.586448669433594, -12.874855041503906, -8.163261413574219, -3.4516677856445312, 1.2599258422851562, 5.971519470214844, 10.683113098144531, 15.394706726074219, 20.106300354003906, 24.817893981933594, 29.52948760986328, 34.24108123779297, 38.952674865722656, 43.664268493652344, 48.3758544921875, 53.08744812011719, 57.799041748046875, 62.51063537597656, 67.22222900390625, 71.93382263183594, 76.64541625976562, 81.35700988769531, 86.068603515625, 90.78019714355469, 95.49179077148438, 100.20338439941406, 104.91497802734375, 109.62657165527344, 114.33816528320312, 119.04975891113281, 123.7613525390625, 128.4729461669922, 133.18453979492188, 137.89613342285156, 142.60772705078125, 147.31932067871094, 152.03091430664062, 156.7425079345703, 161.4541015625, 166.1656951904297, 170.87728881835938, 175.58888244628906, 180.30047607421875, 185.01206970214844, 189.72366333007812, 194.4352569580078, 199.1468505859375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 9.0, 9.0, 9.0, 11.0, 15.0, 14.0, 11.0, 18.0, 16.0, 22.0, 30.0, 26.0, 31.0, 35.0, 31.0, 24.0, 31.0, 41.0, 36.0, 46.0, 36.0, 40.0, 40.0, 41.0, 29.0, 37.0, 26.0, 30.0, 24.0, 32.0, 31.0, 26.0, 18.0, 21.0, 11.0, 13.0, 17.0, 14.0, 14.0, 9.0, 5.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-54.53190612792969, -52.936702728271484, -51.34150314331055, -49.746299743652344, -48.15109634399414, -46.5558967590332, -44.960693359375, -43.36549377441406, -41.77029037475586, -40.175086975097656, -38.57988739013672, -36.984683990478516, -35.38948059082031, -33.794281005859375, -32.19907760620117, -30.6038761138916, -29.0086727142334, -27.413471221923828, -25.818267822265625, -24.223066329956055, -22.627864837646484, -21.03266143798828, -19.43745994567871, -17.84225845336914, -16.247055053710938, -14.65185260772705, -13.05665111541748, -11.461448669433594, -9.866247177124023, -8.271044731140137, -6.67584228515625, -5.08064079284668, -3.4854393005371094, -1.8902372121810913, -0.29503512382507324, 1.3001670837402344, 2.895369052886963, 4.490571022033691, 6.085773468017578, 7.680974960327148, 9.276177406311035, 10.871379852294922, 12.466581344604492, 14.061783790588379, 15.656986236572266, 17.252187728881836, 18.847389221191406, 20.44259262084961, 22.03779411315918, 23.63299560546875, 25.228199005126953, 26.823400497436523, 28.418601989746094, 30.013805389404297, 31.609006881713867, 33.20420837402344, 34.79941177368164, 36.394615173339844, 37.98981475830078, 39.585018157958984, 41.18022155761719, 42.775421142578125, 44.37062454223633, 45.96582794189453, 47.56102752685547]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 14.0, 5.0, 6.0, 12.0, 15.0, 16.0, 28.0, 26.0, 28.0, 29.0, 30.0, 20.0, 41.0, 38.0, 41.0, 50.0, 39.0, 43.0, 43.0, 43.0, 46.0, 36.0, 37.0, 31.0, 29.0, 34.0, 30.0, 22.0, 14.0, 28.0, 19.0, 20.0, 9.0, 10.0, 18.0, 8.0, 7.0, 5.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-10.1640625, -9.849853515625, -9.53564453125, -9.221435546875, -8.9072265625, -8.593017578125, -8.27880859375, -7.964599609375, -7.650390625, -7.336181640625, -7.02197265625, -6.707763671875, -6.3935546875, -6.079345703125, -5.76513671875, -5.450927734375, -5.13671875, -4.822509765625, -4.50830078125, -4.194091796875, -3.8798828125, -3.565673828125, -3.25146484375, -2.937255859375, -2.623046875, -2.308837890625, -1.99462890625, -1.680419921875, -1.3662109375, -1.052001953125, -0.73779296875, -0.423583984375, -0.109375, 0.204833984375, 0.51904296875, 0.833251953125, 1.1474609375, 1.461669921875, 1.77587890625, 2.090087890625, 2.404296875, 2.718505859375, 3.03271484375, 3.346923828125, 3.6611328125, 3.975341796875, 4.28955078125, 4.603759765625, 4.91796875, 5.232177734375, 5.54638671875, 5.860595703125, 6.1748046875, 6.489013671875, 6.80322265625, 7.117431640625, 7.431640625, 7.745849609375, 8.06005859375, 8.374267578125, 8.6884765625, 9.002685546875, 9.31689453125, 9.631103515625, 9.9453125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 2.0, 11.0, 18.0, 19.0, 48.0, 56.0, 70.0, 139.0, 205.0, 375.0, 489.0, 912.0, 1341.0, 2207.0, 3517.0, 5841.0, 9504.0, 15959.0, 27271.0, 47074.0, 82074.0, 139998.0, 209329.0, 197217.0, 127283.0, 73947.0, 42135.0, 24702.0, 14310.0, 8512.0, 5263.0, 3251.0, 1973.0, 1247.0, 804.0, 507.0, 311.0, 206.0, 150.0, 97.0, 66.0, 35.0, 21.0, 15.0, 21.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.40771484375, -0.39493560791015625, -0.3821563720703125, -0.36937713623046875, -0.356597900390625, -0.34381866455078125, -0.3310394287109375, -0.31826019287109375, -0.30548095703125, -0.29270172119140625, -0.2799224853515625, -0.26714324951171875, -0.254364013671875, -0.24158477783203125, -0.2288055419921875, -0.21602630615234375, -0.2032470703125, -0.19046783447265625, -0.1776885986328125, -0.16490936279296875, -0.152130126953125, -0.13935089111328125, -0.1265716552734375, -0.11379241943359375, -0.10101318359375, -0.08823394775390625, -0.0754547119140625, -0.06267547607421875, -0.049896240234375, -0.03711700439453125, -0.0243377685546875, -0.01155853271484375, 0.001220703125, 0.01399993896484375, 0.0267791748046875, 0.03955841064453125, 0.052337646484375, 0.06511688232421875, 0.0778961181640625, 0.09067535400390625, 0.10345458984375, 0.11623382568359375, 0.1290130615234375, 0.14179229736328125, 0.154571533203125, 0.16735076904296875, 0.1801300048828125, 0.19290924072265625, 0.2056884765625, 0.21846771240234375, 0.2312469482421875, 0.24402618408203125, 0.256805419921875, 0.26958465576171875, 0.2823638916015625, 0.29514312744140625, 0.30792236328125, 0.32070159912109375, 0.3334808349609375, 0.34626007080078125, 0.359039306640625, 0.37181854248046875, 0.3845977783203125, 0.39737701416015625, 0.41015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 11.0, 5.0, 8.0, 8.0, 9.0, 17.0, 17.0, 25.0, 24.0, 18.0, 24.0, 24.0, 26.0, 31.0, 18.0, 44.0, 32.0, 33.0, 31.0, 41.0, 1065.0, 44.0, 33.0, 43.0, 37.0, 29.0, 29.0, 40.0, 30.0, 20.0, 31.0, 23.0, 21.0, 20.0, 14.0, 18.0, 20.0, 12.0, 11.0, 7.0, 7.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.0078125, -5.8184814453125, -5.629150390625, -5.4398193359375, -5.25048828125, -5.0611572265625, -4.871826171875, -4.6824951171875, -4.4931640625, -4.3038330078125, -4.114501953125, -3.9251708984375, -3.73583984375, -3.5465087890625, -3.357177734375, -3.1678466796875, -2.978515625, -2.7891845703125, -2.599853515625, -2.4105224609375, -2.22119140625, -2.0318603515625, -1.842529296875, -1.6531982421875, -1.4638671875, -1.2745361328125, -1.085205078125, -0.8958740234375, -0.70654296875, -0.5172119140625, -0.327880859375, -0.1385498046875, 0.05078125, 0.2401123046875, 0.429443359375, 0.6187744140625, 0.80810546875, 0.9974365234375, 1.186767578125, 1.3760986328125, 1.5654296875, 1.7547607421875, 1.944091796875, 2.1334228515625, 2.32275390625, 2.5120849609375, 2.701416015625, 2.8907470703125, 3.080078125, 3.2694091796875, 3.458740234375, 3.6480712890625, 3.83740234375, 4.0267333984375, 4.216064453125, 4.4053955078125, 4.5947265625, 4.7840576171875, 4.973388671875, 5.1627197265625, 5.35205078125, 5.5413818359375, 5.730712890625, 5.9200439453125, 6.109375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 5.0, 12.0, 15.0, 22.0, 22.0, 37.0, 61.0, 107.0, 133.0, 203.0, 324.0, 448.0, 665.0, 978.0, 1456.0, 2181.0, 3110.0, 4700.0, 6957.0, 10335.0, 15437.0, 23555.0, 35036.0, 54050.0, 81958.0, 121081.0, 430437.0, 935073.0, 122827.0, 83732.0, 54666.0, 35916.0, 23564.0, 15626.0, 10606.0, 7153.0, 4753.0, 3170.0, 2167.0, 1486.0, 1015.0, 681.0, 465.0, 287.0, 190.0, 147.0, 94.0, 70.0, 44.0, 28.0, 23.0, 16.0, 8.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.3046875, -0.2948646545410156, -0.28504180908203125, -0.2752189636230469, -0.2653961181640625, -0.2555732727050781, -0.24575042724609375, -0.23592758178710938, -0.226104736328125, -0.21628189086914062, -0.20645904541015625, -0.19663619995117188, -0.1868133544921875, -0.17699050903320312, -0.16716766357421875, -0.15734481811523438, -0.14752197265625, -0.13769912719726562, -0.12787628173828125, -0.11805343627929688, -0.1082305908203125, -0.09840774536132812, -0.08858489990234375, -0.07876205444335938, -0.068939208984375, -0.059116363525390625, -0.04929351806640625, -0.039470672607421875, -0.0296478271484375, -0.019824981689453125, -0.01000213623046875, -0.000179290771484375, 0.0096435546875, 0.019466400146484375, 0.02928924560546875, 0.039112091064453125, 0.0489349365234375, 0.058757781982421875, 0.06858062744140625, 0.07840347290039062, 0.088226318359375, 0.09804916381835938, 0.10787200927734375, 0.11769485473632812, 0.1275177001953125, 0.13734054565429688, 0.14716339111328125, 0.15698623657226562, 0.16680908203125, 0.17663192749023438, 0.18645477294921875, 0.19627761840820312, 0.2061004638671875, 0.21592330932617188, 0.22574615478515625, 0.23556900024414062, 0.245391845703125, 0.2552146911621094, 0.26503753662109375, 0.2748603820800781, 0.2846832275390625, 0.2945060729980469, 0.30432891845703125, 0.3141517639160156, 0.323974609375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 3.0, 12.0, 9.0, 14.0, 11.0, 16.0, 28.0, 24.0, 34.0, 27.0, 33.0, 43.0, 45.0, 86.0, 66.0, 59.0, 69.0, 57.0, 52.0, 46.0, 51.0, 32.0, 31.0, 30.0, 19.0, 21.0, 14.0, 9.0, 7.0, 10.0, 6.0, 7.0, 6.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0020046234130859375, -0.0019328296184539795, -0.0018610358238220215, -0.0017892420291900635, -0.0017174482345581055, -0.0016456544399261475, -0.0015738606452941895, -0.0015020668506622314, -0.0014302730560302734, -0.0013584792613983154, -0.0012866854667663574, -0.0012148916721343994, -0.0011430978775024414, -0.0010713040828704834, -0.0009995102882385254, -0.0009277164936065674, -0.0008559226989746094, -0.0007841289043426514, -0.0007123351097106934, -0.0006405413150787354, -0.0005687475204467773, -0.0004969537258148193, -0.00042515993118286133, -0.0003533661365509033, -0.0002815723419189453, -0.0002097785472869873, -0.0001379847526550293, -6.619095802307129e-05, 5.602836608886719e-06, 7.739663124084473e-05, 0.00014919042587280273, 0.00022098422050476074, 0.00029277801513671875, 0.00036457180976867676, 0.00043636560440063477, 0.0005081593990325928, 0.0005799531936645508, 0.0006517469882965088, 0.0007235407829284668, 0.0007953345775604248, 0.0008671283721923828, 0.0009389221668243408, 0.0010107159614562988, 0.0010825097560882568, 0.0011543035507202148, 0.0012260973453521729, 0.0012978911399841309, 0.0013696849346160889, 0.0014414787292480469, 0.0015132725238800049, 0.0015850663185119629, 0.001656860113143921, 0.001728653907775879, 0.001800447702407837, 0.001872241497039795, 0.001944035291671753, 0.002015829086303711, 0.002087622880935669, 0.002159416675567627, 0.002231210470199585, 0.002303004264831543, 0.002374798059463501, 0.002446591854095459, 0.002518385648727417, 0.002590179443359375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 11.0, 9.0, 16.0, 11.0, 22.0, 27.0, 25.0, 31.0, 47.0, 67.0, 92.0, 144.0, 197.0, 323.0, 729.0, 14636.0, 1020709.0, 9642.0, 790.0, 306.0, 183.0, 111.0, 94.0, 69.0, 57.0, 42.0, 33.0, 32.0, 18.0, 14.0, 8.0, 12.0, 10.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.05340576171875, -0.0520172119140625, -0.050628662109375, -0.0492401123046875, -0.0478515625, -0.0464630126953125, -0.045074462890625, -0.0436859130859375, -0.04229736328125, -0.0409088134765625, -0.039520263671875, -0.0381317138671875, -0.0367431640625, -0.0353546142578125, -0.033966064453125, -0.0325775146484375, -0.03118896484375, -0.0298004150390625, -0.028411865234375, -0.0270233154296875, -0.025634765625, -0.0242462158203125, -0.022857666015625, -0.0214691162109375, -0.02008056640625, -0.0186920166015625, -0.017303466796875, -0.0159149169921875, -0.0145263671875, -0.0131378173828125, -0.011749267578125, -0.0103607177734375, -0.00897216796875, -0.0075836181640625, -0.006195068359375, -0.0048065185546875, -0.00341796875, -0.0020294189453125, -0.000640869140625, 0.0007476806640625, 0.00213623046875, 0.0035247802734375, 0.004913330078125, 0.0063018798828125, 0.0076904296875, 0.0090789794921875, 0.010467529296875, 0.0118560791015625, 0.01324462890625, 0.0146331787109375, 0.016021728515625, 0.0174102783203125, 0.018798828125, 0.0201873779296875, 0.021575927734375, 0.0229644775390625, 0.02435302734375, 0.0257415771484375, 0.027130126953125, 0.0285186767578125, 0.0299072265625, 0.0312957763671875, 0.032684326171875, 0.0340728759765625, 0.03546142578125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 6.0, 10.0, 43.0, 150.0, 360.0, 320.0, 94.0, 27.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008469923050142825, -0.0007027665851637721, -0.0005585408071056008, -0.0004143150872550905, -0.0002700893674045801, -0.00012586364755406976, 1.8362130504101515e-05, 0.00016258779214695096, 0.00030681357020512223, 0.0004510392900556326, 0.0005952650681138039, 0.0007394907879643142, 0.0008837165078148246, 0.001027942169457674, 0.0011721679475158453, 0.0013163937255740166, 0.0014606195036321878, 0.0016048452816903591, 0.0017490709433332086, 0.0018932967213913798, 0.0020375223830342293, 0.0021817481610924006, 0.002325973939150572, 0.0024701994843780994, 0.0026144252624362707, 0.002758651040494442, 0.0029028768185526133, 0.0030471025966107845, 0.003191328141838312, 0.0033355539198964834, 0.0034797796979546547, 0.0036240052431821823, 0.0037682312540709972, 0.003912456799298525, 0.00405668281018734, 0.004200908355414867, 0.004345134366303682, 0.00448935991153121, 0.004633585922420025, 0.0047778114676475525, 0.00492203701287508, 0.005066262558102608, 0.005210488568991423, 0.00535471411421895, 0.005498940125107765, 0.005643165670335293, 0.0057873912155628204, 0.005931617226451635, 0.00607584323734045, 0.006220068782567978, 0.006364294793456793, 0.0065085203386843204, 0.006652746349573135, 0.006796971894800663, 0.006941197440028191, 0.0070854234509170055, 0.007229648996144533, 0.007373874541372061, 0.007518100552260876, 0.007662326097488403, 0.007806552108377218, 0.007950777187943459, 0.00809500366449356, 0.008239229209721088, 0.008383454754948616]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 5.0, 7.0, 5.0, 12.0, 10.0, 15.0, 11.0, 16.0, 19.0, 25.0, 19.0, 25.0, 20.0, 16.0, 30.0, 31.0, 41.0, 24.0, 31.0, 35.0, 34.0, 31.0, 48.0, 36.0, 31.0, 35.0, 32.0, 25.0, 35.0, 20.0, 21.0, 21.0, 29.0, 26.0, 27.0, 22.0, 15.0, 18.0, 9.0, 9.0, 12.0, 16.0, 5.0, 7.0, 7.0, 3.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.001078784465789795, -0.0010468754917383194, -0.0010149665176868439, -0.0009830575436353683, -0.0009511485695838928, -0.0009192395955324173, -0.0008873306214809418, -0.0008554216474294662, -0.0008235126733779907, -0.0007916036993265152, -0.0007596947252750397, -0.0007277857512235641, -0.0006958767771720886, -0.0006639678031206131, -0.0006320588290691376, -0.000600149855017662, -0.0005682408809661865, -0.000536331906914711, -0.0005044229328632355, -0.00047251395881175995, -0.0004406049847602844, -0.0004086960107088089, -0.0003767870366573334, -0.00034487806260585785, -0.0003129690885543823, -0.0002810601145029068, -0.0002491511404514313, -0.00021724216639995575, -0.00018533319234848022, -0.0001534242182970047, -0.00012151524424552917, -8.960627019405365e-05, -5.7697296142578125e-05, -2.57883220911026e-05, 6.120651960372925e-06, 3.802962601184845e-05, 6.993860006332397e-05, 0.0001018475741147995, 0.00013375654816627502, 0.00016566552221775055, 0.00019757449626922607, 0.0002294834703207016, 0.0002613924443721771, 0.00029330141842365265, 0.0003252103924751282, 0.0003571193665266037, 0.0003890283405780792, 0.00042093731462955475, 0.0004528462886810303, 0.0004847552627325058, 0.0005166642367839813, 0.0005485732108354568, 0.0005804821848869324, 0.0006123911589384079, 0.0006443001329898834, 0.000676209107041359, 0.0007081180810928345, 0.00074002705514431, 0.0007719360291957855, 0.000803845003247261, 0.0008357539772987366, 0.0008676629513502121, 0.0008995719254016876, 0.0009314808994531631, 0.0009633898735046387]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 14.0, 5.0, 6.0, 12.0, 15.0, 16.0, 28.0, 26.0, 28.0, 29.0, 30.0, 20.0, 41.0, 38.0, 41.0, 50.0, 39.0, 43.0, 43.0, 43.0, 46.0, 36.0, 37.0, 31.0, 29.0, 34.0, 30.0, 22.0, 14.0, 28.0, 19.0, 20.0, 9.0, 10.0, 18.0, 8.0, 7.0, 5.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-10.1640625, -9.849853515625, -9.53564453125, -9.221435546875, -8.9072265625, -8.593017578125, -8.27880859375, -7.964599609375, -7.650390625, -7.336181640625, -7.02197265625, -6.707763671875, -6.3935546875, -6.079345703125, -5.76513671875, -5.450927734375, -5.13671875, -4.822509765625, -4.50830078125, -4.194091796875, -3.8798828125, -3.565673828125, -3.25146484375, -2.937255859375, -2.623046875, -2.308837890625, -1.99462890625, -1.680419921875, -1.3662109375, -1.052001953125, -0.73779296875, -0.423583984375, -0.109375, 0.204833984375, 0.51904296875, 0.833251953125, 1.1474609375, 1.461669921875, 1.77587890625, 2.090087890625, 2.404296875, 2.718505859375, 3.03271484375, 3.346923828125, 3.6611328125, 3.975341796875, 4.28955078125, 4.603759765625, 4.91796875, 5.232177734375, 5.54638671875, 5.860595703125, 6.1748046875, 6.489013671875, 6.80322265625, 7.117431640625, 7.431640625, 7.745849609375, 8.06005859375, 8.374267578125, 8.6884765625, 9.002685546875, 9.31689453125, 9.631103515625, 9.9453125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 2.0, 18.0, 14.0, 25.0, 28.0, 39.0, 57.0, 100.0, 120.0, 193.0, 280.0, 472.0, 798.0, 1608.0, 3136.0, 6637.0, 15120.0, 36299.0, 104109.0, 432357.0, 310808.0, 81903.0, 29745.0, 12784.0, 5775.0, 2735.0, 1388.0, 728.0, 439.0, 245.0, 169.0, 107.0, 76.0, 62.0, 46.0, 26.0, 22.0, 23.0, 10.0, 9.0, 7.0, 8.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.6796875, -14.20458984375, -13.7294921875, -13.25439453125, -12.779296875, -12.30419921875, -11.8291015625, -11.35400390625, -10.87890625, -10.40380859375, -9.9287109375, -9.45361328125, -8.978515625, -8.50341796875, -8.0283203125, -7.55322265625, -7.078125, -6.60302734375, -6.1279296875, -5.65283203125, -5.177734375, -4.70263671875, -4.2275390625, -3.75244140625, -3.27734375, -2.80224609375, -2.3271484375, -1.85205078125, -1.376953125, -0.90185546875, -0.4267578125, 0.04833984375, 0.5234375, 0.99853515625, 1.4736328125, 1.94873046875, 2.423828125, 2.89892578125, 3.3740234375, 3.84912109375, 4.32421875, 4.79931640625, 5.2744140625, 5.74951171875, 6.224609375, 6.69970703125, 7.1748046875, 7.64990234375, 8.125, 8.60009765625, 9.0751953125, 9.55029296875, 10.025390625, 10.50048828125, 10.9755859375, 11.45068359375, 11.92578125, 12.40087890625, 12.8759765625, 13.35107421875, 13.826171875, 14.30126953125, 14.7763671875, 15.25146484375, 15.7265625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 2.0, 2.0, 10.0, 10.0, 13.0, 14.0, 14.0, 22.0, 20.0, 18.0, 32.0, 25.0, 35.0, 39.0, 48.0, 50.0, 62.0, 87.0, 144.0, 1581.0, 238.0, 94.0, 66.0, 65.0, 41.0, 34.0, 37.0, 27.0, 22.0, 18.0, 21.0, 20.0, 27.0, 17.0, 13.0, 9.0, 15.0, 9.0, 7.0, 4.0, 3.0, 7.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.125, -26.270751953125, -25.41650390625, -24.562255859375, -23.7080078125, -22.853759765625, -21.99951171875, -21.145263671875, -20.291015625, -19.436767578125, -18.58251953125, -17.728271484375, -16.8740234375, -16.019775390625, -15.16552734375, -14.311279296875, -13.45703125, -12.602783203125, -11.74853515625, -10.894287109375, -10.0400390625, -9.185791015625, -8.33154296875, -7.477294921875, -6.623046875, -5.768798828125, -4.91455078125, -4.060302734375, -3.2060546875, -2.351806640625, -1.49755859375, -0.643310546875, 0.2109375, 1.065185546875, 1.91943359375, 2.773681640625, 3.6279296875, 4.482177734375, 5.33642578125, 6.190673828125, 7.044921875, 7.899169921875, 8.75341796875, 9.607666015625, 10.4619140625, 11.316162109375, 12.17041015625, 13.024658203125, 13.87890625, 14.733154296875, 15.58740234375, 16.441650390625, 17.2958984375, 18.150146484375, 19.00439453125, 19.858642578125, 20.712890625, 21.567138671875, 22.42138671875, 23.275634765625, 24.1298828125, 24.984130859375, 25.83837890625, 26.692626953125, 27.546875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 12.0, 14.0, 22.0, 30.0, 42.0, 55.0, 90.0, 126.0, 167.0, 336.0, 1138.0, 8958.0, 208727.0, 2880445.0, 40989.0, 3187.0, 639.0, 268.0, 129.0, 104.0, 58.0, 36.0, 47.0, 27.0, 16.0, 18.0, 7.0, 8.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-67.1875, -65.33544921875, -63.4833984375, -61.63134765625, -59.779296875, -57.92724609375, -56.0751953125, -54.22314453125, -52.37109375, -50.51904296875, -48.6669921875, -46.81494140625, -44.962890625, -43.11083984375, -41.2587890625, -39.40673828125, -37.5546875, -35.70263671875, -33.8505859375, -31.99853515625, -30.146484375, -28.29443359375, -26.4423828125, -24.59033203125, -22.73828125, -20.88623046875, -19.0341796875, -17.18212890625, -15.330078125, -13.47802734375, -11.6259765625, -9.77392578125, -7.921875, -6.06982421875, -4.2177734375, -2.36572265625, -0.513671875, 1.33837890625, 3.1904296875, 5.04248046875, 6.89453125, 8.74658203125, 10.5986328125, 12.45068359375, 14.302734375, 16.15478515625, 18.0068359375, 19.85888671875, 21.7109375, 23.56298828125, 25.4150390625, 27.26708984375, 29.119140625, 30.97119140625, 32.8232421875, 34.67529296875, 36.52734375, 38.37939453125, 40.2314453125, 42.08349609375, 43.935546875, 45.78759765625, 47.6396484375, 49.49169921875, 51.34375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 91.0, 596.0, 315.0, 15.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-373.1446228027344, -365.646728515625, -358.1488037109375, -350.65087890625, -343.1529846191406, -335.65509033203125, -328.15716552734375, -320.65924072265625, -313.1613464355469, -305.6634521484375, -298.16552734375, -290.6676025390625, -283.1697082519531, -275.67181396484375, -268.17388916015625, -260.67596435546875, -253.17807006835938, -245.68016052246094, -238.1822509765625, -230.68434143066406, -223.18643188476562, -215.6885223388672, -208.19061279296875, -200.6927032470703, -193.19479370117188, -185.69688415527344, -178.198974609375, -170.70106506347656, -163.20315551757812, -155.7052459716797, -148.20733642578125, -140.7094268798828, -133.2115020751953, -125.71359252929688, -118.21568298339844, -110.7177734375, -103.21986389160156, -95.72195434570312, -88.22404479980469, -80.72613525390625, -73.22822570800781, -65.73031616210938, -58.23240661621094, -50.7344970703125, -43.23658752441406, -35.738677978515625, -28.240768432617188, -20.74285888671875, -13.244949340820312, -5.747039794921875, 1.7508697509765625, 9.248779296875, 16.746688842773438, 24.244598388671875, 31.742507934570312, 39.24041748046875, 46.73832702636719, 54.236236572265625, 61.73414611816406, 69.2320556640625, 76.72996520996094, 84.22787475585938, 91.72578430175781, 99.22369384765625, 106.72160339355469]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 8.0, 17.0, 12.0, 14.0, 19.0, 21.0, 11.0, 29.0, 33.0, 26.0, 39.0, 25.0, 37.0, 28.0, 53.0, 34.0, 31.0, 44.0, 40.0, 39.0, 44.0, 41.0, 31.0, 36.0, 34.0, 26.0, 36.0, 23.0, 17.0, 22.0, 17.0, 25.0, 16.0, 9.0, 8.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-61.3516845703125, -59.632625579833984, -57.9135627746582, -56.19450378417969, -54.475440979003906, -52.75638198852539, -51.037322998046875, -49.318260192871094, -47.59919738769531, -45.8801383972168, -44.161075592041016, -42.4420166015625, -40.72295379638672, -39.0038948059082, -37.28483581542969, -35.565773010253906, -33.84671401977539, -32.127655029296875, -30.408592224121094, -28.689533233642578, -26.970470428466797, -25.25141143798828, -23.532350540161133, -21.813289642333984, -20.094228744506836, -18.375167846679688, -16.65610694885254, -14.937047004699707, -13.217986106872559, -11.49892520904541, -9.779865264892578, -8.06080436706543, -6.341743469238281, -4.622682571411133, -2.9036221504211426, -1.1845617294311523, 0.5344991683959961, 2.2535600662231445, 3.9726200103759766, 5.691680908203125, 7.410741806030273, 9.129802703857422, 10.84886360168457, 12.567923545837402, 14.28698444366455, 16.006046295166016, 17.72510528564453, 19.44416618347168, 21.163227081298828, 22.882287979125977, 24.601348876953125, 26.32040786743164, 28.039470672607422, 29.758529663085938, 31.477590560913086, 33.196651458740234, 34.91571044921875, 36.634769439697266, 38.35383224487305, 40.07289123535156, 41.791954040527344, 43.51101303100586, 45.230072021484375, 46.949134826660156, 48.66819763183594]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 10.0, 10.0, 8.0, 14.0, 18.0, 21.0, 21.0, 30.0, 24.0, 23.0, 25.0, 29.0, 31.0, 35.0, 41.0, 46.0, 42.0, 43.0, 39.0, 40.0, 42.0, 45.0, 38.0, 27.0, 30.0, 30.0, 32.0, 20.0, 21.0, 29.0, 17.0, 18.0, 24.0, 18.0, 9.0, 6.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.9453125, -9.6317138671875, -9.318115234375, -9.0045166015625, -8.69091796875, -8.3773193359375, -8.063720703125, -7.7501220703125, -7.4365234375, -7.1229248046875, -6.809326171875, -6.4957275390625, -6.18212890625, -5.8685302734375, -5.554931640625, -5.2413330078125, -4.927734375, -4.6141357421875, -4.300537109375, -3.9869384765625, -3.67333984375, -3.3597412109375, -3.046142578125, -2.7325439453125, -2.4189453125, -2.1053466796875, -1.791748046875, -1.4781494140625, -1.16455078125, -0.8509521484375, -0.537353515625, -0.2237548828125, 0.08984375, 0.4034423828125, 0.717041015625, 1.0306396484375, 1.34423828125, 1.6578369140625, 1.971435546875, 2.2850341796875, 2.5986328125, 2.9122314453125, 3.225830078125, 3.5394287109375, 3.85302734375, 4.1666259765625, 4.480224609375, 4.7938232421875, 5.107421875, 5.4210205078125, 5.734619140625, 6.0482177734375, 6.36181640625, 6.6754150390625, 6.989013671875, 7.3026123046875, 7.6162109375, 7.9298095703125, 8.243408203125, 8.5570068359375, 8.87060546875, 9.1842041015625, 9.497802734375, 9.8114013671875, 10.125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 7.0, 8.0, 7.0, 8.0, 8.0, 19.0, 21.0, 40.0, 41.0, 60.0, 86.0, 129.0, 194.0, 271.0, 412.0, 514.0, 819.0, 1175.0, 1846.0, 2887.0, 5019.0, 8859.0, 17027.0, 38924.0, 106682.0, 383165.0, 1447699.0, 1554449.0, 427592.0, 114488.0, 40741.0, 18020.0, 9054.0, 5078.0, 3060.0, 1793.0, 1229.0, 821.0, 579.0, 403.0, 266.0, 204.0, 159.0, 110.0, 95.0, 56.0, 36.0, 37.0, 22.0, 17.0, 13.0, 16.0, 9.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.6080322265625, -11.208251953125, -10.8084716796875, -10.40869140625, -10.0089111328125, -9.609130859375, -9.2093505859375, -8.8095703125, -8.4097900390625, -8.010009765625, -7.6102294921875, -7.21044921875, -6.8106689453125, -6.410888671875, -6.0111083984375, -5.611328125, -5.2115478515625, -4.811767578125, -4.4119873046875, -4.01220703125, -3.6124267578125, -3.212646484375, -2.8128662109375, -2.4130859375, -2.0133056640625, -1.613525390625, -1.2137451171875, -0.81396484375, -0.4141845703125, -0.014404296875, 0.3853759765625, 0.78515625, 1.1849365234375, 1.584716796875, 1.9844970703125, 2.38427734375, 2.7840576171875, 3.183837890625, 3.5836181640625, 3.9833984375, 4.3831787109375, 4.782958984375, 5.1827392578125, 5.58251953125, 5.9822998046875, 6.382080078125, 6.7818603515625, 7.181640625, 7.5814208984375, 7.981201171875, 8.3809814453125, 8.78076171875, 9.1805419921875, 9.580322265625, 9.9801025390625, 10.3798828125, 10.7796630859375, 11.179443359375, 11.5792236328125, 11.97900390625, 12.3787841796875, 12.778564453125, 13.1783447265625, 13.578125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 8.0, 10.0, 9.0, 22.0, 26.0, 31.0, 38.0, 63.0, 77.0, 107.0, 175.0, 269.0, 421.0, 602.0, 633.0, 518.0, 326.0, 177.0, 155.0, 97.0, 71.0, 53.0, 45.0, 26.0, 21.0, 15.0, 14.0, 10.0, 9.0, 4.0, 10.0, 3.0, 5.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-19.53125, -18.9920654296875, -18.452880859375, -17.9136962890625, -17.37451171875, -16.8353271484375, -16.296142578125, -15.7569580078125, -15.2177734375, -14.6785888671875, -14.139404296875, -13.6002197265625, -13.06103515625, -12.5218505859375, -11.982666015625, -11.4434814453125, -10.904296875, -10.3651123046875, -9.825927734375, -9.2867431640625, -8.74755859375, -8.2083740234375, -7.669189453125, -7.1300048828125, -6.5908203125, -6.0516357421875, -5.512451171875, -4.9732666015625, -4.43408203125, -3.8948974609375, -3.355712890625, -2.8165283203125, -2.27734375, -1.7381591796875, -1.198974609375, -0.6597900390625, -0.12060546875, 0.4185791015625, 0.957763671875, 1.4969482421875, 2.0361328125, 2.5753173828125, 3.114501953125, 3.6536865234375, 4.19287109375, 4.7320556640625, 5.271240234375, 5.8104248046875, 6.349609375, 6.8887939453125, 7.427978515625, 7.9671630859375, 8.50634765625, 9.0455322265625, 9.584716796875, 10.1239013671875, 10.6630859375, 11.2022705078125, 11.741455078125, 12.2806396484375, 12.81982421875, 13.3590087890625, 13.898193359375, 14.4373779296875, 14.9765625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 9.0, 17.0, 18.0, 26.0, 42.0, 51.0, 58.0, 94.0, 125.0, 181.0, 286.0, 482.0, 801.0, 1224.0, 2220.0, 4224.0, 8618.0, 19698.0, 54821.0, 193128.0, 1213518.0, 2241323.0, 322024.0, 80257.0, 27250.0, 11282.0, 5409.0, 2825.0, 1602.0, 976.0, 582.0, 348.0, 219.0, 173.0, 108.0, 73.0, 50.0, 39.0, 26.0, 16.0, 13.0, 11.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-24.484375, -23.7880859375, -23.091796875, -22.3955078125, -21.69921875, -21.0029296875, -20.306640625, -19.6103515625, -18.9140625, -18.2177734375, -17.521484375, -16.8251953125, -16.12890625, -15.4326171875, -14.736328125, -14.0400390625, -13.34375, -12.6474609375, -11.951171875, -11.2548828125, -10.55859375, -9.8623046875, -9.166015625, -8.4697265625, -7.7734375, -7.0771484375, -6.380859375, -5.6845703125, -4.98828125, -4.2919921875, -3.595703125, -2.8994140625, -2.203125, -1.5068359375, -0.810546875, -0.1142578125, 0.58203125, 1.2783203125, 1.974609375, 2.6708984375, 3.3671875, 4.0634765625, 4.759765625, 5.4560546875, 6.15234375, 6.8486328125, 7.544921875, 8.2412109375, 8.9375, 9.6337890625, 10.330078125, 11.0263671875, 11.72265625, 12.4189453125, 13.115234375, 13.8115234375, 14.5078125, 15.2041015625, 15.900390625, 16.5966796875, 17.29296875, 17.9892578125, 18.685546875, 19.3818359375, 20.078125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 10.0, 21.0, 47.0, 67.0, 115.0, 149.0, 148.0, 168.0, 112.0, 68.0, 43.0, 26.0, 8.0, 12.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.44285583496094, -72.06749725341797, -68.69213104248047, -65.3167724609375, -61.94141387939453, -58.5660514831543, -55.19068908691406, -51.815330505371094, -48.43996810913086, -45.064605712890625, -41.689247131347656, -38.31388473510742, -34.93852233886719, -31.56316375732422, -28.187801361083984, -24.812440872192383, -21.43708038330078, -18.06171989440918, -14.686358451843262, -11.310997009277344, -7.935636520385742, -4.560276031494141, -1.1849136352539062, 2.1904468536376953, 5.565807342529297, 8.941167831420898, 12.316529273986816, 15.691890716552734, 19.067251205444336, 22.442611694335938, 25.817974090576172, 29.193334579467773, 32.568695068359375, 35.94405746459961, 39.31941604614258, 42.69477844238281, 46.07013702392578, 49.445499420166016, 52.82086181640625, 56.19622039794922, 59.57158279418945, 62.94694519042969, 66.32230377197266, 69.69766235351562, 73.07302856445312, 76.4483871459961, 79.82374572753906, 83.19911193847656, 86.57447052001953, 89.9498291015625, 93.3251953125, 96.70055389404297, 100.07591247558594, 103.45127868652344, 106.8266372680664, 110.20199584960938, 113.57736206054688, 116.95272064208984, 120.32808685302734, 123.70344543457031, 127.07880401611328, 130.45416259765625, 133.82952880859375, 137.20489501953125, 140.5802459716797]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 12.0, 4.0, 5.0, 10.0, 20.0, 14.0, 19.0, 24.0, 24.0, 23.0, 27.0, 29.0, 36.0, 41.0, 43.0, 48.0, 45.0, 43.0, 58.0, 52.0, 58.0, 42.0, 43.0, 41.0, 27.0, 33.0, 27.0, 18.0, 16.0, 21.0, 25.0, 15.0, 7.0, 11.0, 6.0, 13.0, 9.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.126739501953125, -58.20262145996094, -56.278499603271484, -54.3543815612793, -52.43026351928711, -50.506141662597656, -48.58202362060547, -46.65790557861328, -44.733787536621094, -42.809669494628906, -40.88554763793945, -38.961429595947266, -37.03731155395508, -35.113189697265625, -33.18907165527344, -31.26495361328125, -29.34083366394043, -27.41671371459961, -25.492595672607422, -23.5684757232666, -21.644357681274414, -19.720237731933594, -17.796119689941406, -15.871999740600586, -13.947880744934082, -12.023761749267578, -10.099642753601074, -8.17552375793457, -6.251404285430908, -4.327284812927246, -2.403165817260742, -0.4790468215942383, 1.4450721740722656, 3.3691911697387695, 5.293310165405273, 7.2174296379089355, 9.141548156738281, 11.065668106079102, 12.989787101745605, 14.91390609741211, 16.838024139404297, 18.762144088745117, 20.686262130737305, 22.610382080078125, 24.534500122070312, 26.458620071411133, 28.382740020751953, 30.30685806274414, 32.230979919433594, 34.15509796142578, 36.079219818115234, 38.00333786010742, 39.92745590209961, 41.85157775878906, 43.77569580078125, 45.69981384277344, 47.623931884765625, 49.54804992675781, 51.472171783447266, 53.39628982543945, 55.32040786743164, 57.244529724121094, 59.16864776611328, 61.09276580810547, 63.016883850097656]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 0.0, 5.0, 10.0, 12.0, 9.0, 14.0, 10.0, 16.0, 25.0, 25.0, 29.0, 35.0, 30.0, 37.0, 36.0, 54.0, 47.0, 34.0, 51.0, 40.0, 52.0, 46.0, 50.0, 45.0, 36.0, 42.0, 38.0, 26.0, 24.0, 19.0, 19.0, 18.0, 11.0, 12.0, 9.0, 7.0, 5.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.65625, -11.27294921875, -10.8896484375, -10.50634765625, -10.123046875, -9.73974609375, -9.3564453125, -8.97314453125, -8.58984375, -8.20654296875, -7.8232421875, -7.43994140625, -7.056640625, -6.67333984375, -6.2900390625, -5.90673828125, -5.5234375, -5.14013671875, -4.7568359375, -4.37353515625, -3.990234375, -3.60693359375, -3.2236328125, -2.84033203125, -2.45703125, -2.07373046875, -1.6904296875, -1.30712890625, -0.923828125, -0.54052734375, -0.1572265625, 0.22607421875, 0.609375, 0.99267578125, 1.3759765625, 1.75927734375, 2.142578125, 2.52587890625, 2.9091796875, 3.29248046875, 3.67578125, 4.05908203125, 4.4423828125, 4.82568359375, 5.208984375, 5.59228515625, 5.9755859375, 6.35888671875, 6.7421875, 7.12548828125, 7.5087890625, 7.89208984375, 8.275390625, 8.65869140625, 9.0419921875, 9.42529296875, 9.80859375, 10.19189453125, 10.5751953125, 10.95849609375, 11.341796875, 11.72509765625, 12.1083984375, 12.49169921875, 12.875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 14.0, 17.0, 23.0, 26.0, 42.0, 70.0, 123.0, 148.0, 251.0, 336.0, 547.0, 888.0, 1476.0, 2500.0, 4113.0, 7011.0, 11851.0, 20604.0, 36151.0, 64893.0, 115908.0, 192127.0, 224245.0, 157339.0, 90192.0, 49886.0, 28294.0, 16049.0, 9363.0, 5445.0, 3308.0, 1937.0, 1214.0, 749.0, 501.0, 314.0, 213.0, 123.0, 82.0, 59.0, 32.0, 28.0, 18.0, 13.0, 9.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.52490234375, -0.5095901489257812, -0.4942779541015625, -0.47896575927734375, -0.463653564453125, -0.44834136962890625, -0.4330291748046875, -0.41771697998046875, -0.40240478515625, -0.38709259033203125, -0.3717803955078125, -0.35646820068359375, -0.341156005859375, -0.32584381103515625, -0.3105316162109375, -0.29521942138671875, -0.2799072265625, -0.26459503173828125, -0.2492828369140625, -0.23397064208984375, -0.218658447265625, -0.20334625244140625, -0.1880340576171875, -0.17272186279296875, -0.15740966796875, -0.14209747314453125, -0.1267852783203125, -0.11147308349609375, -0.096160888671875, -0.08084869384765625, -0.0655364990234375, -0.05022430419921875, -0.034912109375, -0.01959991455078125, -0.0042877197265625, 0.01102447509765625, 0.026336669921875, 0.04164886474609375, 0.0569610595703125, 0.07227325439453125, 0.08758544921875, 0.10289764404296875, 0.1182098388671875, 0.13352203369140625, 0.148834228515625, 0.16414642333984375, 0.1794586181640625, 0.19477081298828125, 0.2100830078125, 0.22539520263671875, 0.2407073974609375, 0.25601959228515625, 0.271331787109375, 0.28664398193359375, 0.3019561767578125, 0.31726837158203125, 0.33258056640625, 0.34789276123046875, 0.3632049560546875, 0.37851715087890625, 0.393829345703125, 0.40914154052734375, 0.4244537353515625, 0.43976593017578125, 0.455078125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 10.0, 8.0, 12.0, 17.0, 22.0, 21.0, 29.0, 24.0, 26.0, 43.0, 42.0, 51.0, 54.0, 49.0, 50.0, 1079.0, 58.0, 67.0, 53.0, 45.0, 31.0, 44.0, 38.0, 29.0, 19.0, 19.0, 25.0, 13.0, 10.0, 13.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.2305908203125, -6.945556640625, -6.6605224609375, -6.37548828125, -6.0904541015625, -5.805419921875, -5.5203857421875, -5.2353515625, -4.9503173828125, -4.665283203125, -4.3802490234375, -4.09521484375, -3.8101806640625, -3.525146484375, -3.2401123046875, -2.955078125, -2.6700439453125, -2.385009765625, -2.0999755859375, -1.81494140625, -1.5299072265625, -1.244873046875, -0.9598388671875, -0.6748046875, -0.3897705078125, -0.104736328125, 0.1802978515625, 0.46533203125, 0.7503662109375, 1.035400390625, 1.3204345703125, 1.60546875, 1.8905029296875, 2.175537109375, 2.4605712890625, 2.74560546875, 3.0306396484375, 3.315673828125, 3.6007080078125, 3.8857421875, 4.1707763671875, 4.455810546875, 4.7408447265625, 5.02587890625, 5.3109130859375, 5.595947265625, 5.8809814453125, 6.166015625, 6.4510498046875, 6.736083984375, 7.0211181640625, 7.30615234375, 7.5911865234375, 7.876220703125, 8.1612548828125, 8.4462890625, 8.7313232421875, 9.016357421875, 9.3013916015625, 9.58642578125, 9.8714599609375, 10.156494140625, 10.4415283203125, 10.7265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 19.0, 16.0, 21.0, 29.0, 55.0, 128.0, 212.0, 337.0, 619.0, 1124.0, 2134.0, 3700.0, 6569.0, 12426.0, 23731.0, 46465.0, 93797.0, 185570.0, 1314709.0, 197895.0, 102162.0, 50486.0, 25362.0, 13364.0, 7302.0, 3952.0, 2103.0, 1222.0, 698.0, 387.0, 193.0, 115.0, 85.0, 45.0, 25.0, 17.0, 14.0, 12.0, 10.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.48827362060546875, -0.4711761474609375, -0.45407867431640625, -0.436981201171875, -0.41988372802734375, -0.4027862548828125, -0.38568878173828125, -0.36859130859375, -0.35149383544921875, -0.3343963623046875, -0.31729888916015625, -0.300201416015625, -0.28310394287109375, -0.2660064697265625, -0.24890899658203125, -0.2318115234375, -0.21471405029296875, -0.1976165771484375, -0.18051910400390625, -0.163421630859375, -0.14632415771484375, -0.1292266845703125, -0.11212921142578125, -0.09503173828125, -0.07793426513671875, -0.0608367919921875, -0.04373931884765625, -0.026641845703125, -0.00954437255859375, 0.0075531005859375, 0.02465057373046875, 0.041748046875, 0.05884552001953125, 0.0759429931640625, 0.09304046630859375, 0.110137939453125, 0.12723541259765625, 0.1443328857421875, 0.16143035888671875, 0.17852783203125, 0.19562530517578125, 0.2127227783203125, 0.22982025146484375, 0.246917724609375, 0.26401519775390625, 0.2811126708984375, 0.29821014404296875, 0.3153076171875, 0.33240509033203125, 0.3495025634765625, 0.36660003662109375, 0.383697509765625, 0.40079498291015625, 0.4178924560546875, 0.43498992919921875, 0.45208740234375, 0.46918487548828125, 0.4862823486328125, 0.5033798217773438, 0.520477294921875, 0.5375747680664062, 0.5546722412109375, 0.5717697143554688, 0.5888671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 5.0, 6.0, 10.0, 5.0, 12.0, 18.0, 24.0, 38.0, 37.0, 36.0, 63.0, 54.0, 69.0, 55.0, 72.0, 51.0, 74.0, 60.0, 54.0, 51.0, 43.0, 30.0, 27.0, 16.0, 15.0, 12.0, 9.0, 10.0, 9.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022106170654296875, -0.002143561840057373, -0.0020765066146850586, -0.002009451389312744, -0.0019423961639404297, -0.0018753409385681152, -0.0018082857131958008, -0.0017412304878234863, -0.0016741752624511719, -0.0016071200370788574, -0.001540064811706543, -0.0014730095863342285, -0.001405954360961914, -0.0013388991355895996, -0.0012718439102172852, -0.0012047886848449707, -0.0011377334594726562, -0.0010706782341003418, -0.0010036230087280273, -0.0009365677833557129, -0.0008695125579833984, -0.000802457332611084, -0.0007354021072387695, -0.0006683468818664551, -0.0006012916564941406, -0.0005342364311218262, -0.0004671812057495117, -0.00040012598037719727, -0.0003330707550048828, -0.00026601552963256836, -0.0001989603042602539, -0.00013190507888793945, -6.4849853515625e-05, 2.205371856689453e-06, 6.92605972290039e-05, 0.00013631582260131836, 0.0002033710479736328, 0.00027042627334594727, 0.0003374814987182617, 0.00040453672409057617, 0.0004715919494628906, 0.0005386471748352051, 0.0006057024002075195, 0.000672757625579834, 0.0007398128509521484, 0.0008068680763244629, 0.0008739233016967773, 0.0009409785270690918, 0.0010080337524414062, 0.0010750889778137207, 0.0011421442031860352, 0.0012091994285583496, 0.001276254653930664, 0.0013433098793029785, 0.001410365104675293, 0.0014774203300476074, 0.0015444755554199219, 0.0016115307807922363, 0.0016785860061645508, 0.0017456412315368652, 0.0018126964569091797, 0.0018797516822814941, 0.0019468069076538086, 0.002013862133026123, 0.0020809173583984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 6.0, 14.0, 11.0, 10.0, 22.0, 29.0, 22.0, 39.0, 47.0, 76.0, 106.0, 143.0, 209.0, 410.0, 1790.0, 50257.0, 973945.0, 19208.0, 1099.0, 336.0, 218.0, 136.0, 95.0, 80.0, 56.0, 44.0, 25.0, 15.0, 21.0, 15.0, 6.0, 10.0, 10.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.037078857421875, -0.03589773178100586, -0.03471660614013672, -0.03353548049926758, -0.03235435485839844, -0.031173229217529297, -0.029992103576660156, -0.028810977935791016, -0.027629852294921875, -0.026448726654052734, -0.025267601013183594, -0.024086475372314453, -0.022905349731445312, -0.021724224090576172, -0.02054309844970703, -0.01936197280883789, -0.01818084716796875, -0.01699972152709961, -0.01581859588623047, -0.014637470245361328, -0.013456344604492188, -0.012275218963623047, -0.011094093322753906, -0.009912967681884766, -0.008731842041015625, -0.007550716400146484, -0.006369590759277344, -0.005188465118408203, -0.0040073394775390625, -0.002826213836669922, -0.0016450881958007812, -0.0004639625549316406, 0.0007171630859375, 0.0018982887268066406, 0.0030794143676757812, 0.004260540008544922, 0.0054416656494140625, 0.006622791290283203, 0.007803916931152344, 0.008985042572021484, 0.010166168212890625, 0.011347293853759766, 0.012528419494628906, 0.013709545135498047, 0.014890670776367188, 0.016071796417236328, 0.01725292205810547, 0.01843404769897461, 0.01961517333984375, 0.02079629898071289, 0.02197742462158203, 0.023158550262451172, 0.024339675903320312, 0.025520801544189453, 0.026701927185058594, 0.027883052825927734, 0.029064178466796875, 0.030245304107666016, 0.031426429748535156, 0.0326075553894043, 0.03378868103027344, 0.03496980667114258, 0.03615093231201172, 0.03733205795288086, 0.03851318359375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 11.0, 19.0, 53.0, 155.0, 270.0, 269.0, 153.0, 40.0, 18.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.005818270146846771, -0.005699192173779011, -0.00558011420071125, -0.0054610357619822025, -0.005341957788914442, -0.005222879815846682, -0.005103801377117634, -0.004984723404049873, -0.004865645430982113, -0.004746567457914352, -0.004627489484846592, -0.004508411046117544, -0.004389333073049784, -0.004270255099982023, -0.0041511766612529755, -0.004032098688185215, -0.0039130207151174545, -0.003793942742049694, -0.00367486453615129, -0.003555786330252886, -0.0034367083571851254, -0.003317630384117365, -0.0031985521782189608, -0.0030794739723205566, -0.002960395999252796, -0.0028413180261850357, -0.0027222398202866316, -0.0026031616143882275, -0.002484083641320467, -0.0023650056682527065, -0.0022459274623543024, -0.0021268492564558983, -0.0020077715162187815, -0.0018886934267356992, -0.0017696153372526169, -0.0016505372477695346, -0.0015314591582864523, -0.00141238106880337, -0.0012933029793202877, -0.0011742248898372054, -0.0010551468003541231, -0.0009360687108710408, -0.0008169906213879585, -0.0006979125319048762, -0.0005788344424217939, -0.00045975635293871164, -0.00034067826345562935, -0.00022160017397254705, -0.00010252208448946476, 1.6556004993617535e-05, 0.00013563409447669983, 0.0002547121839597821, 0.0003737902734428644, 0.0004928683629259467, 0.000611946452409029, 0.0007310245418921113, 0.0008501026313751936, 0.0009691807208582759, 0.0010882588103413582, 0.0012073368998244405, 0.0013264149893075228, 0.001445493078790605, 0.0015645711682736874, 0.0016836492577567697, 0.001802727347239852]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 9.0, 5.0, 14.0, 9.0, 9.0, 13.0, 19.0, 31.0, 22.0, 38.0, 35.0, 41.0, 37.0, 49.0, 46.0, 42.0, 46.0, 50.0, 52.0, 51.0, 53.0, 27.0, 43.0, 33.0, 30.0, 32.0, 31.0, 25.0, 16.0, 30.0, 13.0, 8.0, 11.0, 6.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011407136917114258, -0.0011027995496988297, -0.0010648854076862335, -0.0010269712656736374, -0.0009890571236610413, -0.0009511429816484451, -0.000913228839635849, -0.0008753146976232529, -0.0008374005556106567, -0.0007994864135980606, -0.0007615722715854645, -0.0007236581295728683, -0.0006857439875602722, -0.0006478298455476761, -0.00060991570353508, -0.0005720015615224838, -0.0005340874195098877, -0.0004961732774972916, -0.00045825913548469543, -0.0004203449934720993, -0.0003824308514595032, -0.00034451670944690704, -0.0003066025674343109, -0.0002686884254217148, -0.00023077428340911865, -0.00019286014139652252, -0.0001549459993839264, -0.00011703185737133026, -7.911771535873413e-05, -4.1203573346138e-05, -3.28943133354187e-06, 3.462471067905426e-05, 7.253885269165039e-05, 0.00011045299470424652, 0.00014836713671684265, 0.00018628127872943878, 0.0002241954207420349, 0.00026210956275463104, 0.00030002370476722717, 0.0003379378467798233, 0.00037585198879241943, 0.00041376613080501556, 0.0004516802728176117, 0.0004895944148302078, 0.000527508556842804, 0.0005654226988554001, 0.0006033368408679962, 0.0006412509828805923, 0.0006791651248931885, 0.0007170792669057846, 0.0007549934089183807, 0.0007929075509309769, 0.000830821692943573, 0.0008687358349561691, 0.0009066499769687653, 0.0009445641189813614, 0.0009824782609939575, 0.0010203924030065536, 0.0010583065450191498, 0.001096220687031746, 0.001134134829044342, 0.0011720489710569382, 0.0012099631130695343, 0.0012478772550821304, 0.0012857913970947266]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 0.0, 5.0, 10.0, 12.0, 9.0, 14.0, 10.0, 16.0, 25.0, 25.0, 29.0, 35.0, 30.0, 37.0, 36.0, 54.0, 47.0, 34.0, 51.0, 40.0, 52.0, 46.0, 50.0, 45.0, 36.0, 42.0, 38.0, 26.0, 24.0, 19.0, 19.0, 19.0, 10.0, 12.0, 9.0, 7.0, 5.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.65625, -11.27294921875, -10.8896484375, -10.50634765625, -10.123046875, -9.73974609375, -9.3564453125, -8.97314453125, -8.58984375, -8.20654296875, -7.8232421875, -7.43994140625, -7.056640625, -6.67333984375, -6.2900390625, -5.90673828125, -5.5234375, -5.14013671875, -4.7568359375, -4.37353515625, -3.990234375, -3.60693359375, -3.2236328125, -2.84033203125, -2.45703125, -2.07373046875, -1.6904296875, -1.30712890625, -0.923828125, -0.54052734375, -0.1572265625, 0.22607421875, 0.609375, 0.99267578125, 1.3759765625, 1.75927734375, 2.142578125, 2.52587890625, 2.9091796875, 3.29248046875, 3.67578125, 4.05908203125, 4.4423828125, 4.82568359375, 5.208984375, 5.59228515625, 5.9755859375, 6.35888671875, 6.7421875, 7.12548828125, 7.5087890625, 7.89208984375, 8.275390625, 8.65869140625, 9.0419921875, 9.42529296875, 9.80859375, 10.19189453125, 10.5751953125, 10.95849609375, 11.341796875, 11.72509765625, 12.1083984375, 12.49169921875, 12.875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 13.0, 11.0, 15.0, 16.0, 27.0, 34.0, 45.0, 85.0, 98.0, 143.0, 234.0, 304.0, 522.0, 793.0, 1357.0, 2219.0, 4069.0, 7606.0, 14895.0, 31676.0, 80237.0, 302079.0, 419163.0, 105674.0, 39062.0, 17963.0, 8954.0, 4643.0, 2527.0, 1436.0, 896.0, 561.0, 388.0, 253.0, 162.0, 123.0, 71.0, 39.0, 43.0, 29.0, 28.0, 22.0, 13.0, 8.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.46875, -14.9871826171875, -14.505615234375, -14.0240478515625, -13.54248046875, -13.0609130859375, -12.579345703125, -12.0977783203125, -11.6162109375, -11.1346435546875, -10.653076171875, -10.1715087890625, -9.68994140625, -9.2083740234375, -8.726806640625, -8.2452392578125, -7.763671875, -7.2821044921875, -6.800537109375, -6.3189697265625, -5.83740234375, -5.3558349609375, -4.874267578125, -4.3927001953125, -3.9111328125, -3.4295654296875, -2.947998046875, -2.4664306640625, -1.98486328125, -1.5032958984375, -1.021728515625, -0.5401611328125, -0.05859375, 0.4229736328125, 0.904541015625, 1.3861083984375, 1.86767578125, 2.3492431640625, 2.830810546875, 3.3123779296875, 3.7939453125, 4.2755126953125, 4.757080078125, 5.2386474609375, 5.72021484375, 6.2017822265625, 6.683349609375, 7.1649169921875, 7.646484375, 8.1280517578125, 8.609619140625, 9.0911865234375, 9.57275390625, 10.0543212890625, 10.535888671875, 11.0174560546875, 11.4990234375, 11.9805908203125, 12.462158203125, 12.9437255859375, 13.42529296875, 13.9068603515625, 14.388427734375, 14.8699951171875, 15.3515625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 9.0, 13.0, 17.0, 15.0, 15.0, 22.0, 24.0, 29.0, 25.0, 28.0, 53.0, 45.0, 55.0, 55.0, 74.0, 144.0, 343.0, 1394.0, 156.0, 82.0, 57.0, 55.0, 44.0, 37.0, 39.0, 30.0, 25.0, 26.0, 24.0, 18.0, 13.0, 12.0, 12.0, 15.0, 6.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.5625, -25.70703125, -24.8515625, -23.99609375, -23.140625, -22.28515625, -21.4296875, -20.57421875, -19.71875, -18.86328125, -18.0078125, -17.15234375, -16.296875, -15.44140625, -14.5859375, -13.73046875, -12.875, -12.01953125, -11.1640625, -10.30859375, -9.453125, -8.59765625, -7.7421875, -6.88671875, -6.03125, -5.17578125, -4.3203125, -3.46484375, -2.609375, -1.75390625, -0.8984375, -0.04296875, 0.8125, 1.66796875, 2.5234375, 3.37890625, 4.234375, 5.08984375, 5.9453125, 6.80078125, 7.65625, 8.51171875, 9.3671875, 10.22265625, 11.078125, 11.93359375, 12.7890625, 13.64453125, 14.5, 15.35546875, 16.2109375, 17.06640625, 17.921875, 18.77734375, 19.6328125, 20.48828125, 21.34375, 22.19921875, 23.0546875, 23.91015625, 24.765625, 25.62109375, 26.4765625, 27.33203125, 28.1875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 15.0, 16.0, 15.0, 23.0, 38.0, 57.0, 56.0, 99.0, 105.0, 144.0, 244.0, 513.0, 1690.0, 9382.0, 84989.0, 2827378.0, 200974.0, 15906.0, 2420.0, 643.0, 311.0, 192.0, 108.0, 75.0, 62.0, 56.0, 33.0, 42.0, 19.0, 13.0, 15.0, 13.0, 9.0, 11.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-48.1875, -46.7109375, -45.234375, -43.7578125, -42.28125, -40.8046875, -39.328125, -37.8515625, -36.375, -34.8984375, -33.421875, -31.9453125, -30.46875, -28.9921875, -27.515625, -26.0390625, -24.5625, -23.0859375, -21.609375, -20.1328125, -18.65625, -17.1796875, -15.703125, -14.2265625, -12.75, -11.2734375, -9.796875, -8.3203125, -6.84375, -5.3671875, -3.890625, -2.4140625, -0.9375, 0.5390625, 2.015625, 3.4921875, 4.96875, 6.4453125, 7.921875, 9.3984375, 10.875, 12.3515625, 13.828125, 15.3046875, 16.78125, 18.2578125, 19.734375, 21.2109375, 22.6875, 24.1640625, 25.640625, 27.1171875, 28.59375, 30.0703125, 31.546875, 33.0234375, 34.5, 35.9765625, 37.453125, 38.9296875, 40.40625, 41.8828125, 43.359375, 44.8359375, 46.3125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 216.0, 781.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-840.1602172851562, -823.4254150390625, -806.690673828125, -789.9558715820312, -773.2210693359375, -756.4862670898438, -739.75146484375, -723.0167236328125, -706.2819213867188, -689.547119140625, -672.8123779296875, -656.0775756835938, -639.3427734375, -622.6079711914062, -605.8731689453125, -589.138427734375, -572.4036254882812, -555.6688232421875, -538.93408203125, -522.1992797851562, -505.4644775390625, -488.72967529296875, -471.9949035644531, -455.2601318359375, -438.52532958984375, -421.79052734375, -405.0557556152344, -388.32098388671875, -371.586181640625, -354.85137939453125, -338.1166076660156, -321.3818359375, -304.64697265625, -287.91217041015625, -271.1773986816406, -254.44261169433594, -237.70782470703125, -220.97303771972656, -204.23825073242188, -187.5034637451172, -170.76869201660156, -154.03390502929688, -137.2991180419922, -120.5643310546875, -103.82954406738281, -87.09475708007812, -70.35997009277344, -53.62518310546875, -36.89039611816406, -20.155609130859375, -3.4208221435546875, 13.31396484375, 30.048751831054688, 46.783538818359375, 63.51832580566406, 80.25311279296875, 96.98789978027344, 113.72268676757812, 130.4574737548828, 147.1922607421875, 163.9270477294922, 180.66183471679688, 197.39662170410156, 214.13140869140625, 230.86619567871094]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 3.0, 7.0, 14.0, 16.0, 14.0, 23.0, 21.0, 24.0, 26.0, 31.0, 30.0, 18.0, 36.0, 33.0, 42.0, 37.0, 42.0, 46.0, 43.0, 47.0, 44.0, 38.0, 38.0, 25.0, 40.0, 34.0, 22.0, 17.0, 27.0, 22.0, 25.0, 16.0, 15.0, 11.0, 11.0, 6.0, 5.0, 14.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-60.2677001953125, -58.33207702636719, -56.396453857421875, -54.46083450317383, -52.525211334228516, -50.5895881652832, -48.653968811035156, -46.718345642089844, -44.78272247314453, -42.84709930419922, -40.911476135253906, -38.97585678100586, -37.04023361206055, -35.104610443115234, -33.16899108886719, -31.233367919921875, -29.297744750976562, -27.36212158203125, -25.42650032043457, -23.49087905883789, -21.555255889892578, -19.619632720947266, -17.684011459350586, -15.74838924407959, -13.812767028808594, -11.877144813537598, -9.941522598266602, -8.005900382995605, -6.070278167724609, -4.134655952453613, -2.199033737182617, -0.2634115219116211, 1.672210693359375, 3.607832908630371, 5.543455123901367, 7.479077339172363, 9.41469955444336, 11.350321769714355, 13.285943984985352, 15.221566200256348, 17.157188415527344, 19.092811584472656, 21.028432846069336, 22.964054107666016, 24.899677276611328, 26.83530044555664, 28.77092170715332, 30.70654296875, 32.64216613769531, 34.577789306640625, 36.51341247558594, 38.449031829833984, 40.3846549987793, 42.32027816772461, 44.255897521972656, 46.19152069091797, 48.12714385986328, 50.062767028808594, 51.998390197753906, 53.93400955200195, 55.869632720947266, 57.80525588989258, 59.740875244140625, 61.67649841308594, 63.61212158203125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 10.0, 8.0, 12.0, 14.0, 27.0, 22.0, 20.0, 31.0, 26.0, 35.0, 48.0, 40.0, 37.0, 38.0, 53.0, 57.0, 39.0, 43.0, 40.0, 40.0, 45.0, 48.0, 45.0, 38.0, 28.0, 18.0, 23.0, 10.0, 15.0, 19.0, 15.0, 12.0, 9.0, 9.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4609375, -11.072998046875, -10.68505859375, -10.297119140625, -9.9091796875, -9.521240234375, -9.13330078125, -8.745361328125, -8.357421875, -7.969482421875, -7.58154296875, -7.193603515625, -6.8056640625, -6.417724609375, -6.02978515625, -5.641845703125, -5.25390625, -4.865966796875, -4.47802734375, -4.090087890625, -3.7021484375, -3.314208984375, -2.92626953125, -2.538330078125, -2.150390625, -1.762451171875, -1.37451171875, -0.986572265625, -0.5986328125, -0.210693359375, 0.17724609375, 0.565185546875, 0.953125, 1.341064453125, 1.72900390625, 2.116943359375, 2.5048828125, 2.892822265625, 3.28076171875, 3.668701171875, 4.056640625, 4.444580078125, 4.83251953125, 5.220458984375, 5.6083984375, 5.996337890625, 6.38427734375, 6.772216796875, 7.16015625, 7.548095703125, 7.93603515625, 8.323974609375, 8.7119140625, 9.099853515625, 9.48779296875, 9.875732421875, 10.263671875, 10.651611328125, 11.03955078125, 11.427490234375, 11.8154296875, 12.203369140625, 12.59130859375, 12.979248046875, 13.3671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 12.0, 13.0, 13.0, 23.0, 20.0, 28.0, 39.0, 53.0, 69.0, 83.0, 127.0, 175.0, 292.0, 498.0, 1369.0, 10595.0, 3326774.0, 844917.0, 6573.0, 1147.0, 520.0, 255.0, 193.0, 115.0, 74.0, 57.0, 53.0, 47.0, 30.0, 26.0, 14.0, 11.0, 11.0, 11.0, 15.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.1875, -96.837890625, -93.48828125, -90.138671875, -86.7890625, -83.439453125, -80.08984375, -76.740234375, -73.390625, -70.041015625, -66.69140625, -63.341796875, -59.9921875, -56.642578125, -53.29296875, -49.943359375, -46.59375, -43.244140625, -39.89453125, -36.544921875, -33.1953125, -29.845703125, -26.49609375, -23.146484375, -19.796875, -16.447265625, -13.09765625, -9.748046875, -6.3984375, -3.048828125, 0.30078125, 3.650390625, 7.0, 10.349609375, 13.69921875, 17.048828125, 20.3984375, 23.748046875, 27.09765625, 30.447265625, 33.796875, 37.146484375, 40.49609375, 43.845703125, 47.1953125, 50.544921875, 53.89453125, 57.244140625, 60.59375, 63.943359375, 67.29296875, 70.642578125, 73.9921875, 77.341796875, 80.69140625, 84.041015625, 87.390625, 90.740234375, 94.08984375, 97.439453125, 100.7890625, 104.138671875, 107.48828125, 110.837890625, 114.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 10.0, 7.0, 9.0, 12.0, 11.0, 13.0, 19.0, 24.0, 32.0, 46.0, 42.0, 72.0, 62.0, 91.0, 111.0, 194.0, 322.0, 437.0, 614.0, 565.0, 429.0, 302.0, 183.0, 117.0, 88.0, 74.0, 47.0, 36.0, 23.0, 14.0, 16.0, 10.0, 11.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-18.75, -18.22802734375, -17.7060546875, -17.18408203125, -16.662109375, -16.14013671875, -15.6181640625, -15.09619140625, -14.57421875, -14.05224609375, -13.5302734375, -13.00830078125, -12.486328125, -11.96435546875, -11.4423828125, -10.92041015625, -10.3984375, -9.87646484375, -9.3544921875, -8.83251953125, -8.310546875, -7.78857421875, -7.2666015625, -6.74462890625, -6.22265625, -5.70068359375, -5.1787109375, -4.65673828125, -4.134765625, -3.61279296875, -3.0908203125, -2.56884765625, -2.046875, -1.52490234375, -1.0029296875, -0.48095703125, 0.041015625, 0.56298828125, 1.0849609375, 1.60693359375, 2.12890625, 2.65087890625, 3.1728515625, 3.69482421875, 4.216796875, 4.73876953125, 5.2607421875, 5.78271484375, 6.3046875, 6.82666015625, 7.3486328125, 7.87060546875, 8.392578125, 8.91455078125, 9.4365234375, 9.95849609375, 10.48046875, 11.00244140625, 11.5244140625, 12.04638671875, 12.568359375, 13.09033203125, 13.6123046875, 14.13427734375, 14.65625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 9.0, 13.0, 29.0, 33.0, 37.0, 50.0, 124.0, 404.0, 2490.0, 37900.0, 3790526.0, 352544.0, 8672.0, 1004.0, 197.0, 84.0, 53.0, 28.0, 19.0, 16.0, 24.0, 7.0, 8.0, 8.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-95.875, -93.1171875, -90.359375, -87.6015625, -84.84375, -82.0859375, -79.328125, -76.5703125, -73.8125, -71.0546875, -68.296875, -65.5390625, -62.78125, -60.0234375, -57.265625, -54.5078125, -51.75, -48.9921875, -46.234375, -43.4765625, -40.71875, -37.9609375, -35.203125, -32.4453125, -29.6875, -26.9296875, -24.171875, -21.4140625, -18.65625, -15.8984375, -13.140625, -10.3828125, -7.625, -4.8671875, -2.109375, 0.6484375, 3.40625, 6.1640625, 8.921875, 11.6796875, 14.4375, 17.1953125, 19.953125, 22.7109375, 25.46875, 28.2265625, 30.984375, 33.7421875, 36.5, 39.2578125, 42.015625, 44.7734375, 47.53125, 50.2890625, 53.046875, 55.8046875, 58.5625, 61.3203125, 64.078125, 66.8359375, 69.59375, 72.3515625, 75.109375, 77.8671875, 80.625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 28.0, 80.0, 204.0, 326.0, 236.0, 94.0, 27.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.9612579345703, -161.66505432128906, -155.3688507080078, -149.0726318359375, -142.77642822265625, -136.480224609375, -130.18402099609375, -123.8878173828125, -117.59160614013672, -111.29540252685547, -104.99919128417969, -98.70298767089844, -92.40678405761719, -86.1105728149414, -79.81436920166016, -73.51815795898438, -67.22195434570312, -60.92574691772461, -54.629539489746094, -48.333335876464844, -42.03712844848633, -35.74092102050781, -29.444717407226562, -23.148509979248047, -16.85230255126953, -10.556096076965332, -4.259889602661133, 2.03631591796875, 8.332523345947266, 14.628730773925781, 20.92493438720703, 27.221141815185547, 33.517364501953125, 39.81357192993164, 46.109779357910156, 52.405982971191406, 58.70219039916992, 64.99839782714844, 71.29460144042969, 77.59080505371094, 83.88701629638672, 90.18321990966797, 96.47943115234375, 102.775634765625, 109.07183837890625, 115.36804962158203, 121.66425323486328, 127.96046447753906, 134.2566680908203, 140.55287170410156, 146.8490753173828, 153.14529418945312, 159.44149780273438, 165.73770141601562, 172.03390502929688, 178.33010864257812, 184.62631225585938, 190.92251586914062, 197.21871948242188, 203.51492309570312, 209.81114196777344, 216.1073455810547, 222.40354919433594, 228.6997528076172, 234.9959716796875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 4.0, 9.0, 11.0, 12.0, 14.0, 13.0, 25.0, 21.0, 21.0, 22.0, 32.0, 38.0, 38.0, 33.0, 31.0, 44.0, 34.0, 38.0, 48.0, 31.0, 32.0, 50.0, 42.0, 37.0, 36.0, 25.0, 32.0, 32.0, 19.0, 25.0, 16.0, 14.0, 21.0, 17.0, 17.0, 11.0, 10.0, 8.0, 8.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.93061828613281, -46.3745002746582, -44.81837844848633, -43.26226043701172, -41.70614242553711, -40.1500244140625, -38.593902587890625, -37.037784576416016, -35.481666564941406, -33.9255485534668, -32.36942672729492, -30.813308715820312, -29.257190704345703, -27.70107078552246, -26.14495086669922, -24.58883285522461, -23.032711029052734, -21.476591110229492, -19.920473098754883, -18.36435317993164, -16.80823516845703, -15.252115249633789, -13.695995330810547, -12.139876365661621, -10.583757400512695, -9.02763843536377, -7.4715189933776855, -5.915399551391602, -4.359280586242676, -2.80316162109375, -1.2470417022705078, 0.30907726287841797, 1.8651962280273438, 3.4213154315948486, 4.9774346351623535, 6.5335540771484375, 8.089673042297363, 9.645792007446289, 11.201911926269531, 12.758030891418457, 14.314149856567383, 15.870268821716309, 17.426387786865234, 18.982507705688477, 20.53862762451172, 22.094745635986328, 23.65086555480957, 25.206985473632812, 26.763103485107422, 28.319223403930664, 29.875341415405273, 31.431461334228516, 32.987579345703125, 34.543701171875, 36.09981918334961, 37.65593719482422, 39.212059020996094, 40.7681770324707, 42.32429885864258, 43.88041687011719, 45.4365348815918, 46.992652893066406, 48.54877471923828, 50.10489273071289, 51.6610107421875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 7.0, 10.0, 16.0, 9.0, 11.0, 19.0, 27.0, 30.0, 29.0, 37.0, 38.0, 40.0, 36.0, 42.0, 41.0, 42.0, 50.0, 52.0, 38.0, 49.0, 37.0, 35.0, 25.0, 37.0, 32.0, 37.0, 24.0, 20.0, 24.0, 23.0, 20.0, 7.0, 5.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.144287109375, -10.75732421875, -10.370361328125, -9.9833984375, -9.596435546875, -9.20947265625, -8.822509765625, -8.435546875, -8.048583984375, -7.66162109375, -7.274658203125, -6.8876953125, -6.500732421875, -6.11376953125, -5.726806640625, -5.33984375, -4.952880859375, -4.56591796875, -4.178955078125, -3.7919921875, -3.405029296875, -3.01806640625, -2.631103515625, -2.244140625, -1.857177734375, -1.47021484375, -1.083251953125, -0.6962890625, -0.309326171875, 0.07763671875, 0.464599609375, 0.8515625, 1.238525390625, 1.62548828125, 2.012451171875, 2.3994140625, 2.786376953125, 3.17333984375, 3.560302734375, 3.947265625, 4.334228515625, 4.72119140625, 5.108154296875, 5.4951171875, 5.882080078125, 6.26904296875, 6.656005859375, 7.04296875, 7.429931640625, 7.81689453125, 8.203857421875, 8.5908203125, 8.977783203125, 9.36474609375, 9.751708984375, 10.138671875, 10.525634765625, 10.91259765625, 11.299560546875, 11.6865234375, 12.073486328125, 12.46044921875, 12.847412109375, 13.234375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 11.0, 10.0, 20.0, 31.0, 44.0, 52.0, 90.0, 128.0, 190.0, 265.0, 418.0, 514.0, 791.0, 1199.0, 1695.0, 2543.0, 3848.0, 5768.0, 8760.0, 13898.0, 21751.0, 34628.0, 56254.0, 89754.0, 137348.0, 185427.0, 167428.0, 116116.0, 73753.0, 45807.0, 28351.0, 17832.0, 11614.0, 7473.0, 4877.0, 3180.0, 2066.0, 1442.0, 1011.0, 690.0, 476.0, 276.0, 241.0, 157.0, 98.0, 67.0, 56.0, 43.0, 20.0, 17.0, 15.0, 7.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.4208984375, -0.4076576232910156, -0.39441680908203125, -0.3811759948730469, -0.3679351806640625, -0.3546943664550781, -0.34145355224609375, -0.3282127380371094, -0.314971923828125, -0.3017311096191406, -0.28849029541015625, -0.2752494812011719, -0.2620086669921875, -0.24876785278320312, -0.23552703857421875, -0.22228622436523438, -0.20904541015625, -0.19580459594726562, -0.18256378173828125, -0.16932296752929688, -0.1560821533203125, -0.14284133911132812, -0.12960052490234375, -0.11635971069335938, -0.103118896484375, -0.08987808227539062, -0.07663726806640625, -0.06339645385742188, -0.0501556396484375, -0.036914825439453125, -0.02367401123046875, -0.010433197021484375, 0.0028076171875, 0.016048431396484375, 0.02928924560546875, 0.042530059814453125, 0.0557708740234375, 0.06901168823242188, 0.08225250244140625, 0.09549331665039062, 0.108734130859375, 0.12197494506835938, 0.13521575927734375, 0.14845657348632812, 0.1616973876953125, 0.17493820190429688, 0.18817901611328125, 0.20141983032226562, 0.21466064453125, 0.22790145874023438, 0.24114227294921875, 0.2543830871582031, 0.2676239013671875, 0.2808647155761719, 0.29410552978515625, 0.3073463439941406, 0.320587158203125, 0.3338279724121094, 0.34706878662109375, 0.3603096008300781, 0.3735504150390625, 0.3867912292480469, 0.40003204345703125, 0.4132728576660156, 0.426513671875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 1.0, 3.0, 10.0, 8.0, 9.0, 16.0, 15.0, 11.0, 19.0, 19.0, 23.0, 8.0, 23.0, 28.0, 28.0, 39.0, 28.0, 32.0, 35.0, 30.0, 36.0, 40.0, 47.0, 1052.0, 33.0, 32.0, 29.0, 25.0, 25.0, 35.0, 33.0, 29.0, 23.0, 25.0, 25.0, 15.0, 24.0, 14.0, 21.0, 7.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0], "bins": [-6.54296875, -6.34033203125, -6.1376953125, -5.93505859375, -5.732421875, -5.52978515625, -5.3271484375, -5.12451171875, -4.921875, -4.71923828125, -4.5166015625, -4.31396484375, -4.111328125, -3.90869140625, -3.7060546875, -3.50341796875, -3.30078125, -3.09814453125, -2.8955078125, -2.69287109375, -2.490234375, -2.28759765625, -2.0849609375, -1.88232421875, -1.6796875, -1.47705078125, -1.2744140625, -1.07177734375, -0.869140625, -0.66650390625, -0.4638671875, -0.26123046875, -0.05859375, 0.14404296875, 0.3466796875, 0.54931640625, 0.751953125, 0.95458984375, 1.1572265625, 1.35986328125, 1.5625, 1.76513671875, 1.9677734375, 2.17041015625, 2.373046875, 2.57568359375, 2.7783203125, 2.98095703125, 3.18359375, 3.38623046875, 3.5888671875, 3.79150390625, 3.994140625, 4.19677734375, 4.3994140625, 4.60205078125, 4.8046875, 5.00732421875, 5.2099609375, 5.41259765625, 5.615234375, 5.81787109375, 6.0205078125, 6.22314453125, 6.42578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 13.0, 14.0, 16.0, 35.0, 48.0, 60.0, 85.0, 138.0, 202.0, 287.0, 366.0, 569.0, 869.0, 1161.0, 1636.0, 2406.0, 3538.0, 5009.0, 7392.0, 10501.0, 15545.0, 23274.0, 34514.0, 52144.0, 77590.0, 112775.0, 151023.0, 1201848.0, 124303.0, 88377.0, 58828.0, 39370.0, 26557.0, 17852.0, 11962.0, 8250.0, 5703.0, 3835.0, 2734.0, 1899.0, 1299.0, 982.0, 649.0, 464.0, 336.0, 220.0, 157.0, 102.0, 74.0, 41.0, 40.0, 15.0, 8.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0], "bins": [-0.335693359375, -0.324920654296875, -0.31414794921875, -0.303375244140625, -0.2926025390625, -0.281829833984375, -0.27105712890625, -0.260284423828125, -0.24951171875, -0.238739013671875, -0.22796630859375, -0.217193603515625, -0.2064208984375, -0.195648193359375, -0.18487548828125, -0.174102783203125, -0.163330078125, -0.152557373046875, -0.14178466796875, -0.131011962890625, -0.1202392578125, -0.109466552734375, -0.09869384765625, -0.087921142578125, -0.0771484375, -0.066375732421875, -0.05560302734375, -0.044830322265625, -0.0340576171875, -0.023284912109375, -0.01251220703125, -0.001739501953125, 0.009033203125, 0.019805908203125, 0.03057861328125, 0.041351318359375, 0.0521240234375, 0.062896728515625, 0.07366943359375, 0.084442138671875, 0.09521484375, 0.105987548828125, 0.11676025390625, 0.127532958984375, 0.1383056640625, 0.149078369140625, 0.15985107421875, 0.170623779296875, 0.181396484375, 0.192169189453125, 0.20294189453125, 0.213714599609375, 0.2244873046875, 0.235260009765625, 0.24603271484375, 0.256805419921875, 0.267578125, 0.278350830078125, 0.28912353515625, 0.299896240234375, 0.3106689453125, 0.321441650390625, 0.33221435546875, 0.342987060546875, 0.353759765625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 6.0, 8.0, 5.0, 14.0, 10.0, 15.0, 15.0, 13.0, 22.0, 25.0, 34.0, 33.0, 43.0, 38.0, 49.0, 48.0, 35.0, 44.0, 52.0, 50.0, 46.0, 57.0, 38.0, 48.0, 34.0, 34.0, 26.0, 18.0, 31.0, 14.0, 15.0, 20.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 6.0, 1.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0015354156494140625, -0.0014867186546325684, -0.0014380216598510742, -0.00138932466506958, -0.001340627670288086, -0.0012919306755065918, -0.0012432336807250977, -0.0011945366859436035, -0.0011458396911621094, -0.0010971426963806152, -0.001048445701599121, -0.000999748706817627, -0.0009510517120361328, -0.0009023547172546387, -0.0008536577224731445, -0.0008049607276916504, -0.0007562637329101562, -0.0007075667381286621, -0.000658869743347168, -0.0006101727485656738, -0.0005614757537841797, -0.0005127787590026855, -0.0004640817642211914, -0.00041538476943969727, -0.0003666877746582031, -0.000317990779876709, -0.00026929378509521484, -0.0002205967903137207, -0.00017189979553222656, -0.00012320280075073242, -7.450580596923828e-05, -2.580881118774414e-05, 2.288818359375e-05, 7.158517837524414e-05, 0.00012028217315673828, 0.00016897916793823242, 0.00021767616271972656, 0.0002663731575012207, 0.00031507015228271484, 0.000363767147064209, 0.0004124641418457031, 0.00046116113662719727, 0.0005098581314086914, 0.0005585551261901855, 0.0006072521209716797, 0.0006559491157531738, 0.000704646110534668, 0.0007533431053161621, 0.0008020401000976562, 0.0008507370948791504, 0.0008994340896606445, 0.0009481310844421387, 0.0009968280792236328, 0.001045525074005127, 0.001094222068786621, 0.0011429190635681152, 0.0011916160583496094, 0.0012403130531311035, 0.0012890100479125977, 0.0013377070426940918, 0.001386404037475586, 0.00143510103225708, 0.0014837980270385742, 0.0015324950218200684, 0.0015811920166015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 9.0, 9.0, 4.0, 6.0, 8.0, 7.0, 6.0, 14.0, 7.0, 12.0, 19.0, 23.0, 33.0, 30.0, 57.0, 55.0, 77.0, 89.0, 111.0, 182.0, 246.0, 389.0, 802.0, 5393.0, 647429.0, 388139.0, 3393.0, 652.0, 371.0, 223.0, 164.0, 118.0, 91.0, 82.0, 57.0, 36.0, 33.0, 27.0, 24.0, 23.0, 24.0, 16.0, 11.0, 13.0, 10.0, 7.0, 5.0, 7.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.02752685546875, -0.026690959930419922, -0.025855064392089844, -0.025019168853759766, -0.024183273315429688, -0.02334737777709961, -0.02251148223876953, -0.021675586700439453, -0.020839691162109375, -0.020003795623779297, -0.01916790008544922, -0.01833200454711914, -0.017496109008789062, -0.016660213470458984, -0.015824317932128906, -0.014988422393798828, -0.01415252685546875, -0.013316631317138672, -0.012480735778808594, -0.011644840240478516, -0.010808944702148438, -0.00997304916381836, -0.009137153625488281, -0.008301258087158203, -0.007465362548828125, -0.006629467010498047, -0.005793571472167969, -0.004957675933837891, -0.0041217803955078125, -0.0032858848571777344, -0.0024499893188476562, -0.0016140937805175781, -0.0007781982421875, 5.7697296142578125e-05, 0.0008935928344726562, 0.0017294883728027344, 0.0025653839111328125, 0.0034012794494628906, 0.004237174987792969, 0.005073070526123047, 0.005908966064453125, 0.006744861602783203, 0.007580757141113281, 0.00841665267944336, 0.009252548217773438, 0.010088443756103516, 0.010924339294433594, 0.011760234832763672, 0.01259613037109375, 0.013432025909423828, 0.014267921447753906, 0.015103816986083984, 0.015939712524414062, 0.01677560806274414, 0.01761150360107422, 0.018447399139404297, 0.019283294677734375, 0.020119190216064453, 0.02095508575439453, 0.02179098129272461, 0.022626876831054688, 0.023462772369384766, 0.024298667907714844, 0.025134563446044922, 0.025970458984375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 96.0, 339.0, 415.0, 126.0, 24.0, 2.0, 4.0], "bins": [-0.009120381437242031, -0.008966132998466492, -0.008811883628368378, -0.008657635189592838, -0.008503386750817299, -0.008349137380719185, -0.008194888941943645, -0.008040639571845531, -0.007886391133069992, -0.007732142228633165, -0.007577893324196339, -0.007423644885420799, -0.0072693959809839725, -0.007115147076547146, -0.0069608986377716064, -0.00680664973333478, -0.006652400828897953, -0.006498151924461126, -0.0063439030200243, -0.00618965458124876, -0.0060354056768119335, -0.005881156772375107, -0.005726908333599567, -0.005572659429162741, -0.005418410524725914, -0.005264161620289087, -0.005109912715852261, -0.004955664277076721, -0.0048014153726398945, -0.004647166468203068, -0.004492918029427528, -0.004338669124990702, -0.004184420220553875, -0.004030171316117048, -0.003875922644510865, -0.003721673972904682, -0.0035674250684678555, -0.0034131761640310287, -0.0032589274924248457, -0.0031046788208186626, -0.002950429916381836, -0.0027961810119450092, -0.002641932340338826, -0.002487683668732643, -0.0023334347642958164, -0.0021791858598589897, -0.0020249371882528067, -0.0018706884002313018, -0.001716439612209797, -0.001562190824188292, -0.0014079420361667871, -0.0012536932481452823, -0.0010994444601237774, -0.0009451956721022725, -0.0007909468840807676, -0.0006366980960592628, -0.00048244924983009696, -0.0003282004618085921, -0.0001739516737870872, -1.9702885765582323e-05, 0.00013454590225592256, 0.00028879469027742743, 0.0004430434782989323, 0.0005972922663204372, 0.0007515410543419421]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 8.0, 9.0, 5.0, 12.0, 7.0, 11.0, 23.0, 18.0, 18.0, 27.0, 22.0, 37.0, 46.0, 39.0, 51.0, 38.0, 66.0, 52.0, 44.0, 63.0, 36.0, 43.0, 26.0, 48.0, 40.0, 49.0, 25.0, 23.0, 29.0, 23.0, 10.0, 11.0, 9.0, 9.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011335015296936035, -0.0010979622602462769, -0.0010624229907989502, -0.0010268837213516235, -0.0009913444519042969, -0.0009558051824569702, -0.0009202659130096436, -0.0008847266435623169, -0.0008491873741149902, -0.0008136481046676636, -0.0007781088352203369, -0.0007425695657730103, -0.0007070302963256836, -0.0006714910268783569, -0.0006359517574310303, -0.0006004124879837036, -0.000564873218536377, -0.0005293339490890503, -0.0004937946796417236, -0.00045825541019439697, -0.0004227161407470703, -0.00038717687129974365, -0.000351637601852417, -0.00031609833240509033, -0.00028055906295776367, -0.000245019793510437, -0.00020948052406311035, -0.0001739412546157837, -0.00013840198516845703, -0.00010286271572113037, -6.732344627380371e-05, -3.178417682647705e-05, 3.7550926208496094e-06, 3.929436206817627e-05, 7.483363151550293e-05, 0.00011037290096282959, 0.00014591217041015625, 0.0001814514398574829, 0.00021699070930480957, 0.00025252997875213623, 0.0002880692481994629, 0.00032360851764678955, 0.0003591477870941162, 0.00039468705654144287, 0.00043022632598876953, 0.0004657655954360962, 0.0005013048648834229, 0.0005368441343307495, 0.0005723834037780762, 0.0006079226732254028, 0.0006434619426727295, 0.0006790012121200562, 0.0007145404815673828, 0.0007500797510147095, 0.0007856190204620361, 0.0008211582899093628, 0.0008566975593566895, 0.0008922368288040161, 0.0009277760982513428, 0.0009633153676986694, 0.000998854637145996, 0.0010343939065933228, 0.0010699331760406494, 0.001105472445487976, 0.0011410117149353027]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 7.0, 10.0, 16.0, 9.0, 11.0, 19.0, 27.0, 30.0, 29.0, 37.0, 38.0, 40.0, 36.0, 42.0, 41.0, 42.0, 50.0, 52.0, 38.0, 48.0, 38.0, 35.0, 25.0, 37.0, 32.0, 37.0, 24.0, 20.0, 24.0, 23.0, 20.0, 7.0, 5.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.144287109375, -10.75732421875, -10.370361328125, -9.9833984375, -9.596435546875, -9.20947265625, -8.822509765625, -8.435546875, -8.048583984375, -7.66162109375, -7.274658203125, -6.8876953125, -6.500732421875, -6.11376953125, -5.726806640625, -5.33984375, -4.952880859375, -4.56591796875, -4.178955078125, -3.7919921875, -3.405029296875, -3.01806640625, -2.631103515625, -2.244140625, -1.857177734375, -1.47021484375, -1.083251953125, -0.6962890625, -0.309326171875, 0.07763671875, 0.464599609375, 0.8515625, 1.238525390625, 1.62548828125, 2.012451171875, 2.3994140625, 2.786376953125, 3.17333984375, 3.560302734375, 3.947265625, 4.334228515625, 4.72119140625, 5.108154296875, 5.4951171875, 5.882080078125, 6.26904296875, 6.656005859375, 7.04296875, 7.429931640625, 7.81689453125, 8.203857421875, 8.5908203125, 8.977783203125, 9.36474609375, 9.751708984375, 10.138671875, 10.525634765625, 10.91259765625, 11.299560546875, 11.6865234375, 12.073486328125, 12.46044921875, 12.847412109375, 13.234375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 4.0, 10.0, 18.0, 18.0, 26.0, 40.0, 65.0, 66.0, 94.0, 124.0, 155.0, 243.0, 308.0, 444.0, 659.0, 939.0, 1277.0, 1877.0, 3029.0, 4977.0, 9649.0, 23159.0, 68610.0, 230334.0, 443502.0, 169136.0, 50946.0, 18151.0, 7936.0, 4325.0, 2576.0, 1731.0, 1155.0, 846.0, 585.0, 406.0, 319.0, 236.0, 154.0, 101.0, 83.0, 62.0, 51.0, 37.0, 21.0, 19.0, 13.0, 12.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0], "bins": [-19.09375, -18.50390625, -17.9140625, -17.32421875, -16.734375, -16.14453125, -15.5546875, -14.96484375, -14.375, -13.78515625, -13.1953125, -12.60546875, -12.015625, -11.42578125, -10.8359375, -10.24609375, -9.65625, -9.06640625, -8.4765625, -7.88671875, -7.296875, -6.70703125, -6.1171875, -5.52734375, -4.9375, -4.34765625, -3.7578125, -3.16796875, -2.578125, -1.98828125, -1.3984375, -0.80859375, -0.21875, 0.37109375, 0.9609375, 1.55078125, 2.140625, 2.73046875, 3.3203125, 3.91015625, 4.5, 5.08984375, 5.6796875, 6.26953125, 6.859375, 7.44921875, 8.0390625, 8.62890625, 9.21875, 9.80859375, 10.3984375, 10.98828125, 11.578125, 12.16796875, 12.7578125, 13.34765625, 13.9375, 14.52734375, 15.1171875, 15.70703125, 16.296875, 16.88671875, 17.4765625, 18.06640625, 18.65625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 9.0, 11.0, 22.0, 13.0, 20.0, 33.0, 26.0, 26.0, 44.0, 42.0, 63.0, 68.0, 78.0, 112.0, 277.0, 1458.0, 208.0, 109.0, 69.0, 66.0, 39.0, 43.0, 33.0, 22.0, 16.0, 25.0, 14.0, 20.0, 11.0, 9.0, 5.0, 8.0, 4.0, 4.0, 5.0, 0.0, 3.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.1875, -27.25537109375, -26.3232421875, -25.39111328125, -24.458984375, -23.52685546875, -22.5947265625, -21.66259765625, -20.73046875, -19.79833984375, -18.8662109375, -17.93408203125, -17.001953125, -16.06982421875, -15.1376953125, -14.20556640625, -13.2734375, -12.34130859375, -11.4091796875, -10.47705078125, -9.544921875, -8.61279296875, -7.6806640625, -6.74853515625, -5.81640625, -4.88427734375, -3.9521484375, -3.02001953125, -2.087890625, -1.15576171875, -0.2236328125, 0.70849609375, 1.640625, 2.57275390625, 3.5048828125, 4.43701171875, 5.369140625, 6.30126953125, 7.2333984375, 8.16552734375, 9.09765625, 10.02978515625, 10.9619140625, 11.89404296875, 12.826171875, 13.75830078125, 14.6904296875, 15.62255859375, 16.5546875, 17.48681640625, 18.4189453125, 19.35107421875, 20.283203125, 21.21533203125, 22.1474609375, 23.07958984375, 24.01171875, 24.94384765625, 25.8759765625, 26.80810546875, 27.740234375, 28.67236328125, 29.6044921875, 30.53662109375, 31.46875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 9.0, 7.0, 11.0, 6.0, 15.0, 9.0, 16.0, 20.0, 38.0, 68.0, 75.0, 95.0, 132.0, 227.0, 574.0, 1519.0, 29957.0, 3093643.0, 16697.0, 1289.0, 495.0, 264.0, 151.0, 93.0, 66.0, 48.0, 38.0, 28.0, 23.0, 22.0, 17.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-96.5, -93.107421875, -89.71484375, -86.322265625, -82.9296875, -79.537109375, -76.14453125, -72.751953125, -69.359375, -65.966796875, -62.57421875, -59.181640625, -55.7890625, -52.396484375, -49.00390625, -45.611328125, -42.21875, -38.826171875, -35.43359375, -32.041015625, -28.6484375, -25.255859375, -21.86328125, -18.470703125, -15.078125, -11.685546875, -8.29296875, -4.900390625, -1.5078125, 1.884765625, 5.27734375, 8.669921875, 12.0625, 15.455078125, 18.84765625, 22.240234375, 25.6328125, 29.025390625, 32.41796875, 35.810546875, 39.203125, 42.595703125, 45.98828125, 49.380859375, 52.7734375, 56.166015625, 59.55859375, 62.951171875, 66.34375, 69.736328125, 73.12890625, 76.521484375, 79.9140625, 83.306640625, 86.69921875, 90.091796875, 93.484375, 96.876953125, 100.26953125, 103.662109375, 107.0546875, 110.447265625, 113.83984375, 117.232421875, 120.625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 43.0, 122.0, 281.0, 313.0, 160.0, 53.0, 24.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.3277130126953, -157.1274871826172, -151.92726135253906, -146.72702026367188, -141.52679443359375, -136.32656860351562, -131.1263427734375, -125.92610931396484, -120.72587585449219, -115.52565002441406, -110.3254165649414, -105.12519073486328, -99.92495727539062, -94.7247314453125, -89.52450561523438, -84.32427215576172, -79.1240463256836, -73.92382049560547, -68.72358703613281, -63.52336120605469, -58.32312774658203, -53.122901916503906, -47.922672271728516, -42.722442626953125, -37.522212982177734, -32.321983337402344, -27.121753692626953, -21.921525955200195, -16.721296310424805, -11.521066665649414, -6.320838928222656, -1.1206092834472656, 4.079620361328125, 9.279850006103516, 14.48007869720459, 19.680307388305664, 24.880537033081055, 30.080766677856445, 35.2809944152832, 40.481224060058594, 45.681453704833984, 50.881683349609375, 56.081912994384766, 61.282142639160156, 66.48236846923828, 71.68260192871094, 76.88282775878906, 82.08305358886719, 87.28328704833984, 92.48351287841797, 97.68374633789062, 102.88397216796875, 108.0842056274414, 113.28443145751953, 118.48466491699219, 123.68489074707031, 128.88511657714844, 134.08534240722656, 139.2855682373047, 144.48580932617188, 149.68603515625, 154.88626098632812, 160.08648681640625, 165.28671264648438, 170.48695373535156]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 8.0, 10.0, 5.0, 9.0, 8.0, 4.0, 11.0, 14.0, 22.0, 15.0, 23.0, 16.0, 28.0, 24.0, 30.0, 33.0, 35.0, 44.0, 38.0, 37.0, 38.0, 53.0, 45.0, 43.0, 40.0, 58.0, 32.0, 38.0, 18.0, 27.0, 27.0, 26.0, 18.0, 21.0, 18.0, 18.0, 12.0, 16.0, 14.0, 6.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.48014831542969, -81.83209991455078, -79.18404388427734, -76.53599548339844, -73.887939453125, -71.2398910522461, -68.59183502197266, -65.94378662109375, -63.29573440551758, -60.647682189941406, -57.999629974365234, -55.35157775878906, -52.703529357910156, -50.05547332763672, -47.40742492675781, -44.75937271118164, -42.11132049560547, -39.4632682800293, -36.815216064453125, -34.16716384887695, -31.519113540649414, -28.871061325073242, -26.223011016845703, -23.57495880126953, -20.92690658569336, -18.278854370117188, -15.630803108215332, -12.982751846313477, -10.334699630737305, -7.686647415161133, -5.038596153259277, -2.390544891357422, 0.25751495361328125, 2.905566692352295, 5.553618431091309, 8.201669692993164, 10.849721908569336, 13.497774124145508, 16.145824432373047, 18.79387664794922, 21.44192886352539, 24.089981079101562, 26.738033294677734, 29.386083602905273, 32.03413391113281, 34.68218994140625, 37.330238342285156, 39.97829055786133, 42.6263427734375, 45.27439498901367, 47.922447204589844, 50.570499420166016, 53.21855163574219, 55.866600036621094, 58.514652252197266, 61.16270446777344, 63.81075668334961, 66.45880889892578, 69.10685729980469, 71.75491333007812, 74.40296173095703, 77.05101776123047, 79.69906616210938, 82.34712219238281, 84.99517059326172]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 1.0, 4.0, 2.0, 8.0, 6.0, 5.0, 12.0, 11.0, 18.0, 18.0, 23.0, 22.0, 27.0, 26.0, 22.0, 34.0, 43.0, 50.0, 34.0, 47.0, 46.0, 46.0, 40.0, 32.0, 46.0, 39.0, 35.0, 34.0, 28.0, 35.0, 31.0, 33.0, 20.0, 14.0, 13.0, 28.0, 11.0, 15.0, 7.0, 6.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.84375, -10.4718017578125, -10.099853515625, -9.7279052734375, -9.35595703125, -8.9840087890625, -8.612060546875, -8.2401123046875, -7.8681640625, -7.4962158203125, -7.124267578125, -6.7523193359375, -6.38037109375, -6.0084228515625, -5.636474609375, -5.2645263671875, -4.892578125, -4.5206298828125, -4.148681640625, -3.7767333984375, -3.40478515625, -3.0328369140625, -2.660888671875, -2.2889404296875, -1.9169921875, -1.5450439453125, -1.173095703125, -0.8011474609375, -0.42919921875, -0.0572509765625, 0.314697265625, 0.6866455078125, 1.05859375, 1.4305419921875, 1.802490234375, 2.1744384765625, 2.54638671875, 2.9183349609375, 3.290283203125, 3.6622314453125, 4.0341796875, 4.4061279296875, 4.778076171875, 5.1500244140625, 5.52197265625, 5.8939208984375, 6.265869140625, 6.6378173828125, 7.009765625, 7.3817138671875, 7.753662109375, 8.1256103515625, 8.49755859375, 8.8695068359375, 9.241455078125, 9.6134033203125, 9.9853515625, 10.3572998046875, 10.729248046875, 11.1011962890625, 11.47314453125, 11.8450927734375, 12.217041015625, 12.5889892578125, 12.9609375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 7.0, 10.0, 14.0, 12.0, 32.0, 36.0, 60.0, 76.0, 87.0, 153.0, 246.0, 348.0, 527.0, 775.0, 1316.0, 2217.0, 3762.0, 6970.0, 14105.0, 39474.0, 181706.0, 911216.0, 2056547.0, 763036.0, 149544.0, 33746.0, 12874.0, 6353.0, 3460.0, 2085.0, 1261.0, 749.0, 452.0, 315.0, 230.0, 142.0, 113.0, 65.0, 49.0, 37.0, 16.0, 18.0, 8.0, 12.0, 4.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.412353515625, -16.84033203125, -16.268310546875, -15.6962890625, -15.124267578125, -14.55224609375, -13.980224609375, -13.408203125, -12.836181640625, -12.26416015625, -11.692138671875, -11.1201171875, -10.548095703125, -9.97607421875, -9.404052734375, -8.83203125, -8.260009765625, -7.68798828125, -7.115966796875, -6.5439453125, -5.971923828125, -5.39990234375, -4.827880859375, -4.255859375, -3.683837890625, -3.11181640625, -2.539794921875, -1.9677734375, -1.395751953125, -0.82373046875, -0.251708984375, 0.3203125, 0.892333984375, 1.46435546875, 2.036376953125, 2.6083984375, 3.180419921875, 3.75244140625, 4.324462890625, 4.896484375, 5.468505859375, 6.04052734375, 6.612548828125, 7.1845703125, 7.756591796875, 8.32861328125, 8.900634765625, 9.47265625, 10.044677734375, 10.61669921875, 11.188720703125, 11.7607421875, 12.332763671875, 12.90478515625, 13.476806640625, 14.048828125, 14.620849609375, 15.19287109375, 15.764892578125, 16.3369140625, 16.908935546875, 17.48095703125, 18.052978515625, 18.625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 7.0, 7.0, 4.0, 16.0, 12.0, 24.0, 36.0, 47.0, 87.0, 141.0, 236.0, 348.0, 566.0, 815.0, 699.0, 388.0, 251.0, 147.0, 92.0, 49.0, 40.0, 30.0, 7.0, 6.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.421875, -26.49462890625, -25.5673828125, -24.64013671875, -23.712890625, -22.78564453125, -21.8583984375, -20.93115234375, -20.00390625, -19.07666015625, -18.1494140625, -17.22216796875, -16.294921875, -15.36767578125, -14.4404296875, -13.51318359375, -12.5859375, -11.65869140625, -10.7314453125, -9.80419921875, -8.876953125, -7.94970703125, -7.0224609375, -6.09521484375, -5.16796875, -4.24072265625, -3.3134765625, -2.38623046875, -1.458984375, -0.53173828125, 0.3955078125, 1.32275390625, 2.25, 3.17724609375, 4.1044921875, 5.03173828125, 5.958984375, 6.88623046875, 7.8134765625, 8.74072265625, 9.66796875, 10.59521484375, 11.5224609375, 12.44970703125, 13.376953125, 14.30419921875, 15.2314453125, 16.15869140625, 17.0859375, 18.01318359375, 18.9404296875, 19.86767578125, 20.794921875, 21.72216796875, 22.6494140625, 23.57666015625, 24.50390625, 25.43115234375, 26.3583984375, 27.28564453125, 28.212890625, 29.14013671875, 30.0673828125, 30.99462890625, 31.921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 5.0, 18.0, 34.0, 46.0, 60.0, 115.0, 191.0, 352.0, 752.0, 2152.0, 8330.0, 68948.0, 2980805.0, 1088026.0, 35759.0, 5664.0, 1638.0, 618.0, 293.0, 182.0, 102.0, 85.0, 40.0, 15.0, 13.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.03125, -52.3876953125, -50.744140625, -49.1005859375, -47.45703125, -45.8134765625, -44.169921875, -42.5263671875, -40.8828125, -39.2392578125, -37.595703125, -35.9521484375, -34.30859375, -32.6650390625, -31.021484375, -29.3779296875, -27.734375, -26.0908203125, -24.447265625, -22.8037109375, -21.16015625, -19.5166015625, -17.873046875, -16.2294921875, -14.5859375, -12.9423828125, -11.298828125, -9.6552734375, -8.01171875, -6.3681640625, -4.724609375, -3.0810546875, -1.4375, 0.2060546875, 1.849609375, 3.4931640625, 5.13671875, 6.7802734375, 8.423828125, 10.0673828125, 11.7109375, 13.3544921875, 14.998046875, 16.6416015625, 18.28515625, 19.9287109375, 21.572265625, 23.2158203125, 24.859375, 26.5029296875, 28.146484375, 29.7900390625, 31.43359375, 33.0771484375, 34.720703125, 36.3642578125, 38.0078125, 39.6513671875, 41.294921875, 42.9384765625, 44.58203125, 46.2255859375, 47.869140625, 49.5126953125, 51.15625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 39.0, 181.0, 519.0, 230.0, 39.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-495.4661560058594, -483.83349609375, -472.2008361816406, -460.56817626953125, -448.93548583984375, -437.3028259277344, -425.670166015625, -414.0375061035156, -402.40484619140625, -390.7721862792969, -379.1395263671875, -367.5068359375, -355.8741760253906, -344.24151611328125, -332.6088562011719, -320.9761962890625, -309.343505859375, -297.7108459472656, -286.07818603515625, -274.44549560546875, -262.8128356933594, -251.18017578125, -239.54751586914062, -227.91485595703125, -216.28219604492188, -204.6495361328125, -193.01686096191406, -181.3842010498047, -169.7515411376953, -158.11886596679688, -146.4862060546875, -134.85354614257812, -123.22088623046875, -111.58821868896484, -99.95555877685547, -88.32289123535156, -76.69023132324219, -65.05756378173828, -53.424896240234375, -41.792236328125, -30.159568786621094, -18.526905059814453, -6.89423942565918, 4.738426208496094, 16.371089935302734, 28.003753662109375, 39.63642120361328, 51.269081115722656, 62.90174865722656, 74.53441619873047, 86.16707611083984, 97.79974365234375, 109.43240356445312, 121.06507110595703, 132.69773864746094, 144.3303985595703, 155.96307373046875, 167.59573364257812, 179.22840881347656, 190.86106872558594, 202.4937286376953, 214.12640380859375, 225.75906372070312, 237.3917236328125, 249.02438354492188]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 12.0, 6.0, 5.0, 8.0, 6.0, 12.0, 7.0, 14.0, 15.0, 11.0, 28.0, 27.0, 24.0, 24.0, 24.0, 34.0, 28.0, 29.0, 35.0, 29.0, 43.0, 35.0, 42.0, 42.0, 41.0, 28.0, 43.0, 40.0, 30.0, 29.0, 25.0, 30.0, 34.0, 22.0, 23.0, 12.0, 18.0, 18.0, 10.0, 15.0, 12.0, 8.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.16448974609375, -59.19541931152344, -57.226348876953125, -55.25727844238281, -53.288204193115234, -51.31913375854492, -49.35006332397461, -47.3809928894043, -45.41191864013672, -43.442848205566406, -41.473777770996094, -39.50470733642578, -37.5356330871582, -35.56656265258789, -33.59749221801758, -31.628421783447266, -29.659351348876953, -27.69028091430664, -25.721208572387695, -23.752138137817383, -21.783065795898438, -19.813995361328125, -17.844924926757812, -15.875853538513184, -13.906782150268555, -11.937710762023926, -9.968639373779297, -7.999568939208984, -6.0304975509643555, -4.061426162719727, -2.092355728149414, -0.12328433990478516, 1.8457870483398438, 3.8148581981658936, 5.783929347991943, 7.753000259399414, 9.722071647644043, 11.691143035888672, 13.660213470458984, 15.629284858703613, 17.598356246948242, 19.567426681518555, 21.5364990234375, 23.505569458007812, 25.474639892578125, 27.44371223449707, 29.412782669067383, 31.381855010986328, 33.35092544555664, 35.31999588012695, 37.289066314697266, 39.258140563964844, 41.227210998535156, 43.19628143310547, 45.16535186767578, 47.134422302246094, 49.103492736816406, 51.07256317138672, 53.04163360595703, 55.010704040527344, 56.97977828979492, 58.948848724365234, 60.91791915893555, 62.88698959350586, 64.85606384277344]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 1.0, 7.0, 6.0, 10.0, 7.0, 13.0, 11.0, 15.0, 20.0, 17.0, 25.0, 19.0, 23.0, 30.0, 33.0, 45.0, 31.0, 26.0, 34.0, 37.0, 31.0, 41.0, 45.0, 36.0, 48.0, 39.0, 33.0, 33.0, 29.0, 39.0, 27.0, 24.0, 26.0, 16.0, 12.0, 17.0, 15.0, 22.0, 11.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-11.140625, -10.8184814453125, -10.496337890625, -10.1741943359375, -9.85205078125, -9.5299072265625, -9.207763671875, -8.8856201171875, -8.5634765625, -8.2413330078125, -7.919189453125, -7.5970458984375, -7.27490234375, -6.9527587890625, -6.630615234375, -6.3084716796875, -5.986328125, -5.6641845703125, -5.342041015625, -5.0198974609375, -4.69775390625, -4.3756103515625, -4.053466796875, -3.7313232421875, -3.4091796875, -3.0870361328125, -2.764892578125, -2.4427490234375, -2.12060546875, -1.7984619140625, -1.476318359375, -1.1541748046875, -0.83203125, -0.5098876953125, -0.187744140625, 0.1343994140625, 0.45654296875, 0.7786865234375, 1.100830078125, 1.4229736328125, 1.7451171875, 2.0672607421875, 2.389404296875, 2.7115478515625, 3.03369140625, 3.3558349609375, 3.677978515625, 4.0001220703125, 4.322265625, 4.6444091796875, 4.966552734375, 5.2886962890625, 5.61083984375, 5.9329833984375, 6.255126953125, 6.5772705078125, 6.8994140625, 7.2215576171875, 7.543701171875, 7.8658447265625, 8.18798828125, 8.5101318359375, 8.832275390625, 9.1544189453125, 9.4765625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 12.0, 22.0, 27.0, 46.0, 81.0, 110.0, 145.0, 252.0, 307.0, 476.0, 701.0, 1079.0, 1582.0, 2375.0, 3482.0, 5451.0, 8309.0, 13107.0, 20077.0, 31841.0, 51489.0, 81467.0, 128845.0, 184182.0, 178578.0, 122943.0, 77307.0, 48605.0, 30629.0, 19410.0, 12350.0, 7829.0, 5094.0, 3411.0, 2285.0, 1514.0, 1027.0, 676.0, 481.0, 290.0, 218.0, 155.0, 108.0, 65.0, 42.0, 29.0, 15.0, 13.0, 9.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.377197265625, -0.36460113525390625, -0.3520050048828125, -0.33940887451171875, -0.326812744140625, -0.31421661376953125, -0.3016204833984375, -0.28902435302734375, -0.27642822265625, -0.26383209228515625, -0.2512359619140625, -0.23863983154296875, -0.226043701171875, -0.21344757080078125, -0.2008514404296875, -0.18825531005859375, -0.1756591796875, -0.16306304931640625, -0.1504669189453125, -0.13787078857421875, -0.125274658203125, -0.11267852783203125, -0.1000823974609375, -0.08748626708984375, -0.07489013671875, -0.06229400634765625, -0.0496978759765625, -0.03710174560546875, -0.024505615234375, -0.01190948486328125, 0.0006866455078125, 0.01328277587890625, 0.02587890625, 0.03847503662109375, 0.0510711669921875, 0.06366729736328125, 0.076263427734375, 0.08885955810546875, 0.1014556884765625, 0.11405181884765625, 0.12664794921875, 0.13924407958984375, 0.1518402099609375, 0.16443634033203125, 0.177032470703125, 0.18962860107421875, 0.2022247314453125, 0.21482086181640625, 0.2274169921875, 0.24001312255859375, 0.2526092529296875, 0.26520538330078125, 0.277801513671875, 0.29039764404296875, 0.3029937744140625, 0.31558990478515625, 0.32818603515625, 0.34078216552734375, 0.3533782958984375, 0.36597442626953125, 0.378570556640625, 0.39116668701171875, 0.4037628173828125, 0.41635894775390625, 0.428955078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 8.0, 9.0, 14.0, 6.0, 18.0, 15.0, 16.0, 19.0, 31.0, 23.0, 20.0, 30.0, 33.0, 32.0, 37.0, 30.0, 32.0, 45.0, 35.0, 42.0, 1069.0, 40.0, 35.0, 47.0, 44.0, 38.0, 26.0, 36.0, 26.0, 25.0, 26.0, 18.0, 11.0, 10.0, 20.0, 16.0, 5.0, 12.0, 4.0, 3.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.796875, -6.5791015625, -6.361328125, -6.1435546875, -5.92578125, -5.7080078125, -5.490234375, -5.2724609375, -5.0546875, -4.8369140625, -4.619140625, -4.4013671875, -4.18359375, -3.9658203125, -3.748046875, -3.5302734375, -3.3125, -3.0947265625, -2.876953125, -2.6591796875, -2.44140625, -2.2236328125, -2.005859375, -1.7880859375, -1.5703125, -1.3525390625, -1.134765625, -0.9169921875, -0.69921875, -0.4814453125, -0.263671875, -0.0458984375, 0.171875, 0.3896484375, 0.607421875, 0.8251953125, 1.04296875, 1.2607421875, 1.478515625, 1.6962890625, 1.9140625, 2.1318359375, 2.349609375, 2.5673828125, 2.78515625, 3.0029296875, 3.220703125, 3.4384765625, 3.65625, 3.8740234375, 4.091796875, 4.3095703125, 4.52734375, 4.7451171875, 4.962890625, 5.1806640625, 5.3984375, 5.6162109375, 5.833984375, 6.0517578125, 6.26953125, 6.4873046875, 6.705078125, 6.9228515625, 7.140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 13.0, 20.0, 19.0, 38.0, 68.0, 110.0, 147.0, 249.0, 370.0, 552.0, 865.0, 1361.0, 2023.0, 3121.0, 4705.0, 7309.0, 10968.0, 17385.0, 26934.0, 42988.0, 68996.0, 109524.0, 164244.0, 1235795.0, 145262.0, 93326.0, 58475.0, 36572.0, 23340.0, 14866.0, 9481.0, 6156.0, 4104.0, 2660.0, 1757.0, 1151.0, 811.0, 489.0, 284.0, 224.0, 142.0, 68.0, 63.0, 41.0, 26.0, 13.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.369873046875, -0.3580665588378906, -0.34626007080078125, -0.3344535827636719, -0.3226470947265625, -0.3108406066894531, -0.29903411865234375, -0.2872276306152344, -0.275421142578125, -0.2636146545410156, -0.25180816650390625, -0.24000167846679688, -0.2281951904296875, -0.21638870239257812, -0.20458221435546875, -0.19277572631835938, -0.18096923828125, -0.16916275024414062, -0.15735626220703125, -0.14554977416992188, -0.1337432861328125, -0.12193679809570312, -0.11013031005859375, -0.09832382202148438, -0.086517333984375, -0.07471084594726562, -0.06290435791015625, -0.051097869873046875, -0.0392913818359375, -0.027484893798828125, -0.01567840576171875, -0.003871917724609375, 0.0079345703125, 0.019741058349609375, 0.03154754638671875, 0.043354034423828125, 0.0551605224609375, 0.06696701049804688, 0.07877349853515625, 0.09057998657226562, 0.102386474609375, 0.11419296264648438, 0.12599945068359375, 0.13780593872070312, 0.1496124267578125, 0.16141891479492188, 0.17322540283203125, 0.18503189086914062, 0.19683837890625, 0.20864486694335938, 0.22045135498046875, 0.23225784301757812, 0.2440643310546875, 0.2558708190917969, 0.26767730712890625, 0.2794837951660156, 0.291290283203125, 0.3030967712402344, 0.31490325927734375, 0.3267097473144531, 0.3385162353515625, 0.3503227233886719, 0.36212921142578125, 0.3739356994628906, 0.3857421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 9.0, 6.0, 16.0, 8.0, 21.0, 15.0, 20.0, 33.0, 37.0, 34.0, 35.0, 52.0, 45.0, 45.0, 50.0, 52.0, 52.0, 45.0, 50.0, 44.0, 43.0, 36.0, 25.0, 24.0, 35.0, 17.0, 26.0, 18.0, 10.0, 9.0, 7.0, 14.0, 7.0, 4.0, 5.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.0019378662109375, -0.0018841028213500977, -0.0018303394317626953, -0.001776576042175293, -0.0017228126525878906, -0.0016690492630004883, -0.001615285873413086, -0.0015615224838256836, -0.0015077590942382812, -0.001453995704650879, -0.0014002323150634766, -0.0013464689254760742, -0.0012927055358886719, -0.0012389421463012695, -0.0011851787567138672, -0.0011314153671264648, -0.0010776519775390625, -0.0010238885879516602, -0.0009701251983642578, -0.0009163618087768555, -0.0008625984191894531, -0.0008088350296020508, -0.0007550716400146484, -0.0007013082504272461, -0.0006475448608398438, -0.0005937814712524414, -0.0005400180816650391, -0.0004862546920776367, -0.0004324913024902344, -0.00037872791290283203, -0.0003249645233154297, -0.00027120113372802734, -0.000217437744140625, -0.00016367435455322266, -0.00010991096496582031, -5.614757537841797e-05, -2.384185791015625e-06, 5.137920379638672e-05, 0.00010514259338378906, 0.0001589059829711914, 0.00021266937255859375, 0.0002664327621459961, 0.00032019615173339844, 0.0003739595413208008, 0.0004277229309082031, 0.00048148632049560547, 0.0005352497100830078, 0.0005890130996704102, 0.0006427764892578125, 0.0006965398788452148, 0.0007503032684326172, 0.0008040666580200195, 0.0008578300476074219, 0.0009115934371948242, 0.0009653568267822266, 0.001019120216369629, 0.0010728836059570312, 0.0011266469955444336, 0.001180410385131836, 0.0012341737747192383, 0.0012879371643066406, 0.001341700553894043, 0.0013954639434814453, 0.0014492273330688477, 0.00150299072265625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 1.0, 9.0, 9.0, 9.0, 7.0, 19.0, 11.0, 12.0, 20.0, 24.0, 30.0, 41.0, 46.0, 78.0, 82.0, 120.0, 147.0, 193.0, 370.0, 685.0, 4534.0, 658754.0, 378217.0, 3264.0, 635.0, 365.0, 224.0, 143.0, 119.0, 81.0, 77.0, 40.0, 43.0, 26.0, 19.0, 16.0, 8.0, 16.0, 17.0, 11.0, 6.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.03057861328125, -0.029484272003173828, -0.028389930725097656, -0.027295589447021484, -0.026201248168945312, -0.02510690689086914, -0.02401256561279297, -0.022918224334716797, -0.021823883056640625, -0.020729541778564453, -0.01963520050048828, -0.01854085922241211, -0.017446517944335938, -0.016352176666259766, -0.015257835388183594, -0.014163494110107422, -0.01306915283203125, -0.011974811553955078, -0.010880470275878906, -0.009786128997802734, -0.008691787719726562, -0.007597446441650391, -0.006503105163574219, -0.005408763885498047, -0.004314422607421875, -0.003220081329345703, -0.0021257400512695312, -0.0010313987731933594, 6.29425048828125e-05, 0.0011572837829589844, 0.0022516250610351562, 0.003345966339111328, 0.0044403076171875, 0.005534648895263672, 0.006628990173339844, 0.007723331451416016, 0.008817672729492188, 0.00991201400756836, 0.011006355285644531, 0.012100696563720703, 0.013195037841796875, 0.014289379119873047, 0.015383720397949219, 0.01647806167602539, 0.017572402954101562, 0.018666744232177734, 0.019761085510253906, 0.020855426788330078, 0.02194976806640625, 0.023044109344482422, 0.024138450622558594, 0.025232791900634766, 0.026327133178710938, 0.02742147445678711, 0.02851581573486328, 0.029610157012939453, 0.030704498291015625, 0.0317988395690918, 0.03289318084716797, 0.03398752212524414, 0.03508186340332031, 0.036176204681396484, 0.037270545959472656, 0.03836488723754883, 0.039459228515625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 18.0, 130.0, 489.0, 316.0, 57.0, 7.0], "bins": [-0.013277190737426281, -0.013058687560260296, -0.012840183451771736, -0.012621680274605751, -0.012403177097439766, -0.01218467392027378, -0.011966169811785221, -0.011747666634619236, -0.011529162526130676, -0.011310659348964691, -0.011092155240476131, -0.010873652063310146, -0.010655148886144161, -0.010436644777655602, -0.010218141600489616, -0.009999638423323631, -0.009781135246157646, -0.009562632068991661, -0.009344127960503101, -0.009125624783337116, -0.008907121606171131, -0.008688617497682571, -0.008470114320516586, -0.008251611143350601, -0.008033107966184616, -0.007814604789018631, -0.0075961011461913586, -0.007377597503364086, -0.007159094326198101, -0.006940590683370829, -0.006722087040543556, -0.006503583863377571, -0.006285079754889011, -0.006066576112061739, -0.005848072934895754, -0.0056295692920684814, -0.005411066114902496, -0.005192562472075224, -0.0049740588292479515, -0.004755555652081966, -0.004537052009254694, -0.004318548366427422, -0.0041000451892614365, -0.003881541546434164, -0.0036630381364375353, -0.0034445347264409065, -0.003226031083613634, -0.0030075276736170053, -0.0027890244964510202, -0.0025705210864543915, -0.002352017443627119, -0.0021335140336304903, -0.0019150106236338615, -0.0016965072136372328, -0.0014780036872252822, -0.0012595001608133316, -0.0010409967508167028, -0.0008224932826124132, -0.0006039898144081235, -0.0003854863462038338, -0.00016698287799954414, 5.152053199708462e-05, 0.0002700240584090352, 0.0004885275848209858, 0.0007070310530252755]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 9.0, 12.0, 9.0, 17.0, 13.0, 14.0, 15.0, 11.0, 31.0, 16.0, 34.0, 26.0, 24.0, 26.0, 39.0, 33.0, 41.0, 44.0, 45.0, 33.0, 47.0, 46.0, 38.0, 42.0, 44.0, 32.0, 27.0, 40.0, 33.0, 26.0, 20.0, 15.0, 15.0, 17.0, 7.0, 8.0, 9.0, 10.0, 7.0, 8.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0010848641395568848, -0.0010503875091671944, -0.001015910878777504, -0.0009814342483878136, -0.0009469576179981232, -0.0009124809876084328, -0.0008780043572187424, -0.000843527726829052, -0.0008090510964393616, -0.0007745744660496712, -0.0007400978356599808, -0.0007056212052702904, -0.0006711445748806, -0.0006366679444909096, -0.0006021913141012192, -0.0005677146837115288, -0.0005332380533218384, -0.000498761422932148, -0.0004642847925424576, -0.0004298081621527672, -0.0003953315317630768, -0.0003608549013733864, -0.000326378270983696, -0.0002919016405940056, -0.0002574250102043152, -0.00022294837981462479, -0.0001884717494249344, -0.000153995119035244, -0.00011951848864555359, -8.504185825586319e-05, -5.056522786617279e-05, -1.608859747648239e-05, 1.8388032913208008e-05, 5.286466330289841e-05, 8.73412936925888e-05, 0.0001218179240822792, 0.0001562945544719696, 0.00019077118486166, 0.0002252478152513504, 0.0002597244456410408, 0.0002942010760307312, 0.0003286777064204216, 0.000363154336810112, 0.0003976309671998024, 0.0004321075975894928, 0.0004665842279791832, 0.0005010608583688736, 0.000535537488758564, 0.0005700141191482544, 0.0006044907495379448, 0.0006389673799276352, 0.0006734440103173256, 0.000707920640707016, 0.0007423972710967064, 0.0007768739014863968, 0.0008113505318760872, 0.0008458271622657776, 0.000880303792655468, 0.0009147804230451584, 0.0009492570534348488, 0.0009837336838245392, 0.0010182103142142296, 0.00105268694460392, 0.0010871635749936104, 0.0011216402053833008]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 1.0, 7.0, 6.0, 10.0, 7.0, 13.0, 11.0, 15.0, 20.0, 17.0, 25.0, 19.0, 23.0, 30.0, 33.0, 45.0, 31.0, 26.0, 34.0, 37.0, 31.0, 41.0, 45.0, 36.0, 48.0, 39.0, 33.0, 33.0, 29.0, 39.0, 27.0, 24.0, 26.0, 16.0, 12.0, 17.0, 15.0, 22.0, 11.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-11.140625, -10.8184814453125, -10.496337890625, -10.1741943359375, -9.85205078125, -9.5299072265625, -9.207763671875, -8.8856201171875, -8.5634765625, -8.2413330078125, -7.919189453125, -7.5970458984375, -7.27490234375, -6.9527587890625, -6.630615234375, -6.3084716796875, -5.986328125, -5.6641845703125, -5.342041015625, -5.0198974609375, -4.69775390625, -4.3756103515625, -4.053466796875, -3.7313232421875, -3.4091796875, -3.0870361328125, -2.764892578125, -2.4427490234375, -2.12060546875, -1.7984619140625, -1.476318359375, -1.1541748046875, -0.83203125, -0.5098876953125, -0.187744140625, 0.1343994140625, 0.45654296875, 0.7786865234375, 1.100830078125, 1.4229736328125, 1.7451171875, 2.0672607421875, 2.389404296875, 2.7115478515625, 3.03369140625, 3.3558349609375, 3.677978515625, 4.0001220703125, 4.322265625, 4.6444091796875, 4.966552734375, 5.2886962890625, 5.61083984375, 5.9329833984375, 6.255126953125, 6.5772705078125, 6.8994140625, 7.2215576171875, 7.543701171875, 7.8658447265625, 8.18798828125, 8.5101318359375, 8.832275390625, 9.1544189453125, 9.4765625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 9.0, 9.0, 9.0, 15.0, 19.0, 26.0, 42.0, 58.0, 81.0, 103.0, 147.0, 224.0, 305.0, 454.0, 639.0, 874.0, 1321.0, 1900.0, 3230.0, 5766.0, 12608.0, 44610.0, 261933.0, 561242.0, 110119.0, 22468.0, 8416.0, 4220.0, 2508.0, 1582.0, 1108.0, 732.0, 545.0, 343.0, 252.0, 171.0, 129.0, 94.0, 69.0, 52.0, 36.0, 24.0, 21.0, 15.0, 8.0, 9.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.984375, -23.240966796875, -22.49755859375, -21.754150390625, -21.0107421875, -20.267333984375, -19.52392578125, -18.780517578125, -18.037109375, -17.293701171875, -16.55029296875, -15.806884765625, -15.0634765625, -14.320068359375, -13.57666015625, -12.833251953125, -12.08984375, -11.346435546875, -10.60302734375, -9.859619140625, -9.1162109375, -8.372802734375, -7.62939453125, -6.885986328125, -6.142578125, -5.399169921875, -4.65576171875, -3.912353515625, -3.1689453125, -2.425537109375, -1.68212890625, -0.938720703125, -0.1953125, 0.548095703125, 1.29150390625, 2.034912109375, 2.7783203125, 3.521728515625, 4.26513671875, 5.008544921875, 5.751953125, 6.495361328125, 7.23876953125, 7.982177734375, 8.7255859375, 9.468994140625, 10.21240234375, 10.955810546875, 11.69921875, 12.442626953125, 13.18603515625, 13.929443359375, 14.6728515625, 15.416259765625, 16.15966796875, 16.903076171875, 17.646484375, 18.389892578125, 19.13330078125, 19.876708984375, 20.6201171875, 21.363525390625, 22.10693359375, 22.850341796875, 23.59375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 3.0, 5.0, 14.0, 10.0, 4.0, 17.0, 16.0, 25.0, 23.0, 34.0, 31.0, 41.0, 62.0, 76.0, 120.0, 308.0, 1610.0, 175.0, 101.0, 58.0, 58.0, 49.0, 27.0, 33.0, 22.0, 17.0, 19.0, 21.0, 13.0, 9.0, 15.0, 9.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.15966796875, -27.1630859375, -26.16650390625, -25.169921875, -24.17333984375, -23.1767578125, -22.18017578125, -21.18359375, -20.18701171875, -19.1904296875, -18.19384765625, -17.197265625, -16.20068359375, -15.2041015625, -14.20751953125, -13.2109375, -12.21435546875, -11.2177734375, -10.22119140625, -9.224609375, -8.22802734375, -7.2314453125, -6.23486328125, -5.23828125, -4.24169921875, -3.2451171875, -2.24853515625, -1.251953125, -0.25537109375, 0.7412109375, 1.73779296875, 2.734375, 3.73095703125, 4.7275390625, 5.72412109375, 6.720703125, 7.71728515625, 8.7138671875, 9.71044921875, 10.70703125, 11.70361328125, 12.7001953125, 13.69677734375, 14.693359375, 15.68994140625, 16.6865234375, 17.68310546875, 18.6796875, 19.67626953125, 20.6728515625, 21.66943359375, 22.666015625, 23.66259765625, 24.6591796875, 25.65576171875, 26.65234375, 27.64892578125, 28.6455078125, 29.64208984375, 30.638671875, 31.63525390625, 32.6318359375, 33.62841796875, 34.625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 7.0, 13.0, 11.0, 27.0, 29.0, 38.0, 61.0, 89.0, 109.0, 185.0, 350.0, 737.0, 2799.0, 3000110.0, 138260.0, 1570.0, 553.0, 267.0, 148.0, 111.0, 66.0, 42.0, 34.0, 18.0, 13.0, 13.0, 7.0, 6.0, 12.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.0625, -110.5908203125, -107.119140625, -103.6474609375, -100.17578125, -96.7041015625, -93.232421875, -89.7607421875, -86.2890625, -82.8173828125, -79.345703125, -75.8740234375, -72.40234375, -68.9306640625, -65.458984375, -61.9873046875, -58.515625, -55.0439453125, -51.572265625, -48.1005859375, -44.62890625, -41.1572265625, -37.685546875, -34.2138671875, -30.7421875, -27.2705078125, -23.798828125, -20.3271484375, -16.85546875, -13.3837890625, -9.912109375, -6.4404296875, -2.96875, 0.5029296875, 3.974609375, 7.4462890625, 10.91796875, 14.3896484375, 17.861328125, 21.3330078125, 24.8046875, 28.2763671875, 31.748046875, 35.2197265625, 38.69140625, 42.1630859375, 45.634765625, 49.1064453125, 52.578125, 56.0498046875, 59.521484375, 62.9931640625, 66.46484375, 69.9365234375, 73.408203125, 76.8798828125, 80.3515625, 83.8232421875, 87.294921875, 90.7666015625, 94.23828125, 97.7099609375, 101.181640625, 104.6533203125, 108.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 8.0, 40.0, 118.0, 297.0, 303.0, 165.0, 48.0, 15.0, 10.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.0885009765625, -270.4713134765625, -264.8540954589844, -259.2369079589844, -253.61972045898438, -248.0025177001953, -242.3853302001953, -236.76812744140625, -231.15093994140625, -225.5337371826172, -219.9165496826172, -214.29934692382812, -208.68215942382812, -203.06495666503906, -197.44776916503906, -191.83056640625, -186.21337890625, -180.59617614746094, -174.97898864746094, -169.36178588867188, -163.74459838867188, -158.1273956298828, -152.5102081298828, -146.89300537109375, -141.2758026123047, -135.65859985351562, -130.04141235351562, -124.4242172241211, -118.80702209472656, -113.18982696533203, -107.5726318359375, -101.95542907714844, -96.3382339477539, -90.72103881835938, -85.10384368896484, -79.48664855957031, -73.86945343017578, -68.25225830078125, -62.63505935668945, -57.01786422729492, -51.40066909790039, -45.78347396850586, -40.16627883911133, -34.54907989501953, -28.931886672973633, -23.3146915435791, -17.697494506835938, -12.080299377441406, -6.463104248046875, -0.8459086418151855, 4.771286964416504, 10.388483047485352, 16.005678176879883, 21.622873306274414, 27.240070343017578, 32.85726547241211, 38.47446060180664, 44.09165573120117, 49.7088508605957, 55.3260498046875, 60.94324493408203, 66.56044006347656, 72.1776351928711, 77.79483032226562, 83.41202545166016]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 6.0, 3.0, 3.0, 8.0, 8.0, 16.0, 20.0, 10.0, 16.0, 21.0, 29.0, 24.0, 27.0, 37.0, 36.0, 42.0, 39.0, 43.0, 48.0, 38.0, 42.0, 36.0, 42.0, 45.0, 40.0, 33.0, 45.0, 28.0, 19.0, 22.0, 29.0, 15.0, 23.0, 14.0, 17.0, 10.0, 9.0, 8.0, 12.0, 10.0, 7.0, 5.0, 6.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-73.05841064453125, -70.78607940673828, -68.51374816894531, -66.24142456054688, -63.96908950805664, -61.69676208496094, -59.42443084716797, -57.152099609375, -54.87976837158203, -52.60743713378906, -50.33510971069336, -48.06277847290039, -45.79044723510742, -43.51811981201172, -41.24578857421875, -38.97345733642578, -36.70112991333008, -34.42879867553711, -32.156471252441406, -29.884140014648438, -27.61180877685547, -25.339479446411133, -23.067150115966797, -20.794818878173828, -18.522489547729492, -16.250160217285156, -13.977828979492188, -11.705499649047852, -9.4331693649292, -7.160839080810547, -4.888509750366211, -2.6161794662475586, -0.34384918212890625, 1.928480863571167, 4.20081090927124, 6.473140716552734, 8.745471000671387, 11.017801284790039, 13.290130615234375, 15.562460899353027, 17.83479118347168, 20.107120513916016, 22.379451751708984, 24.65178108215332, 26.924110412597656, 29.196441650390625, 31.46877098083496, 33.7411003112793, 36.013431549072266, 38.285762786865234, 40.55809020996094, 42.830421447753906, 45.102752685546875, 47.375083923339844, 49.64741134643555, 51.919742584228516, 54.19207000732422, 56.46440124511719, 58.73672866821289, 61.00905990600586, 63.28139114379883, 65.55371856689453, 67.8260498046875, 70.09838104248047, 72.37071228027344]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 6.0, 6.0, 9.0, 10.0, 8.0, 12.0, 16.0, 15.0, 23.0, 17.0, 27.0, 28.0, 28.0, 33.0, 33.0, 36.0, 28.0, 34.0, 37.0, 33.0, 52.0, 48.0, 38.0, 30.0, 29.0, 41.0, 38.0, 37.0, 32.0, 29.0, 26.0, 15.0, 18.0, 19.0, 17.0, 13.0, 10.0, 14.0, 10.0, 7.0, 8.0, 3.0, 5.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-11.890625, -11.5469970703125, -11.203369140625, -10.8597412109375, -10.51611328125, -10.1724853515625, -9.828857421875, -9.4852294921875, -9.1416015625, -8.7979736328125, -8.454345703125, -8.1107177734375, -7.76708984375, -7.4234619140625, -7.079833984375, -6.7362060546875, -6.392578125, -6.0489501953125, -5.705322265625, -5.3616943359375, -5.01806640625, -4.6744384765625, -4.330810546875, -3.9871826171875, -3.6435546875, -3.2999267578125, -2.956298828125, -2.6126708984375, -2.26904296875, -1.9254150390625, -1.581787109375, -1.2381591796875, -0.89453125, -0.5509033203125, -0.207275390625, 0.1363525390625, 0.47998046875, 0.8236083984375, 1.167236328125, 1.5108642578125, 1.8544921875, 2.1981201171875, 2.541748046875, 2.8853759765625, 3.22900390625, 3.5726318359375, 3.916259765625, 4.2598876953125, 4.603515625, 4.9471435546875, 5.290771484375, 5.6343994140625, 5.97802734375, 6.3216552734375, 6.665283203125, 7.0089111328125, 7.3525390625, 7.6961669921875, 8.039794921875, 8.3834228515625, 8.72705078125, 9.0706787109375, 9.414306640625, 9.7579345703125, 10.1015625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 8.0, 12.0, 9.0, 17.0, 23.0, 29.0, 43.0, 64.0, 91.0, 143.0, 181.0, 255.0, 367.0, 574.0, 773.0, 1093.0, 1703.0, 2551.0, 4130.0, 7360.0, 14681.0, 42923.0, 184329.0, 746996.0, 1780364.0, 1013921.0, 282103.0, 67982.0, 19393.0, 8643.0, 4846.0, 2902.0, 1869.0, 1193.0, 841.0, 562.0, 366.0, 275.0, 198.0, 137.0, 91.0, 65.0, 51.0, 35.0, 28.0, 22.0, 13.0, 11.0, 5.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.703125, -14.252685546875, -13.80224609375, -13.351806640625, -12.9013671875, -12.450927734375, -12.00048828125, -11.550048828125, -11.099609375, -10.649169921875, -10.19873046875, -9.748291015625, -9.2978515625, -8.847412109375, -8.39697265625, -7.946533203125, -7.49609375, -7.045654296875, -6.59521484375, -6.144775390625, -5.6943359375, -5.243896484375, -4.79345703125, -4.343017578125, -3.892578125, -3.442138671875, -2.99169921875, -2.541259765625, -2.0908203125, -1.640380859375, -1.18994140625, -0.739501953125, -0.2890625, 0.161376953125, 0.61181640625, 1.062255859375, 1.5126953125, 1.963134765625, 2.41357421875, 2.864013671875, 3.314453125, 3.764892578125, 4.21533203125, 4.665771484375, 5.1162109375, 5.566650390625, 6.01708984375, 6.467529296875, 6.91796875, 7.368408203125, 7.81884765625, 8.269287109375, 8.7197265625, 9.170166015625, 9.62060546875, 10.071044921875, 10.521484375, 10.971923828125, 11.42236328125, 11.872802734375, 12.3232421875, 12.773681640625, 13.22412109375, 13.674560546875, 14.125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 10.0, 13.0, 36.0, 65.0, 102.0, 200.0, 340.0, 679.0, 999.0, 731.0, 402.0, 213.0, 135.0, 65.0, 43.0, 15.0, 13.0, 7.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.125, -38.026123046875, -36.92724609375, -35.828369140625, -34.7294921875, -33.630615234375, -32.53173828125, -31.432861328125, -30.333984375, -29.235107421875, -28.13623046875, -27.037353515625, -25.9384765625, -24.839599609375, -23.74072265625, -22.641845703125, -21.54296875, -20.444091796875, -19.34521484375, -18.246337890625, -17.1474609375, -16.048583984375, -14.94970703125, -13.850830078125, -12.751953125, -11.653076171875, -10.55419921875, -9.455322265625, -8.3564453125, -7.257568359375, -6.15869140625, -5.059814453125, -3.9609375, -2.862060546875, -1.76318359375, -0.664306640625, 0.4345703125, 1.533447265625, 2.63232421875, 3.731201171875, 4.830078125, 5.928955078125, 7.02783203125, 8.126708984375, 9.2255859375, 10.324462890625, 11.42333984375, 12.522216796875, 13.62109375, 14.719970703125, 15.81884765625, 16.917724609375, 18.0166015625, 19.115478515625, 20.21435546875, 21.313232421875, 22.412109375, 23.510986328125, 24.60986328125, 25.708740234375, 26.8076171875, 27.906494140625, 29.00537109375, 30.104248046875, 31.203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 17.0, 26.0, 53.0, 110.0, 217.0, 492.0, 1669.0, 12674.0, 3747731.0, 424492.0, 5015.0, 1055.0, 404.0, 140.0, 81.0, 53.0, 25.0, 8.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.4375, -70.798828125, -68.16015625, -65.521484375, -62.8828125, -60.244140625, -57.60546875, -54.966796875, -52.328125, -49.689453125, -47.05078125, -44.412109375, -41.7734375, -39.134765625, -36.49609375, -33.857421875, -31.21875, -28.580078125, -25.94140625, -23.302734375, -20.6640625, -18.025390625, -15.38671875, -12.748046875, -10.109375, -7.470703125, -4.83203125, -2.193359375, 0.4453125, 3.083984375, 5.72265625, 8.361328125, 11.0, 13.638671875, 16.27734375, 18.916015625, 21.5546875, 24.193359375, 26.83203125, 29.470703125, 32.109375, 34.748046875, 37.38671875, 40.025390625, 42.6640625, 45.302734375, 47.94140625, 50.580078125, 53.21875, 55.857421875, 58.49609375, 61.134765625, 63.7734375, 66.412109375, 69.05078125, 71.689453125, 74.328125, 76.966796875, 79.60546875, 82.244140625, 84.8828125, 87.521484375, 90.16015625, 92.798828125, 95.4375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 17.0, 26.0, 133.0, 226.0, 253.0, 193.0, 98.0, 40.0, 11.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.01589965820312, -238.7572784423828, -233.49864196777344, -228.24002075195312, -222.98138427734375, -217.72276306152344, -212.46414184570312, -207.20550537109375, -201.94688415527344, -196.68826293945312, -191.42962646484375, -186.17100524902344, -180.91238403320312, -175.65374755859375, -170.39512634277344, -165.13650512695312, -159.87786865234375, -154.61924743652344, -149.36061096191406, -144.10198974609375, -138.84335327148438, -133.58473205566406, -128.32611083984375, -123.0674819946289, -117.80885314941406, -112.55022430419922, -107.29159545898438, -102.03297424316406, -96.77434539794922, -91.51571655273438, -86.25709533691406, -80.99846649169922, -75.73983001708984, -70.481201171875, -65.22257995605469, -59.963951110839844, -54.705322265625, -49.446693420410156, -44.18806838989258, -38.929443359375, -33.670814514160156, -28.412187576293945, -23.153560638427734, -17.894933700561523, -12.636306762695312, -7.377679824829102, -2.1190528869628906, 3.1395721435546875, 8.398200988769531, 13.656827926635742, 18.915454864501953, 24.174081802368164, 29.432708740234375, 34.69133758544922, 39.9499626159668, 45.208587646484375, 50.46721649169922, 55.72584533691406, 60.98447036743164, 66.24309539794922, 71.50172424316406, 76.7603530883789, 82.01898193359375, 87.27760314941406, 92.5362319946289]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 5.0, 7.0, 8.0, 10.0, 11.0, 11.0, 22.0, 19.0, 18.0, 20.0, 27.0, 20.0, 37.0, 33.0, 46.0, 50.0, 42.0, 56.0, 36.0, 49.0, 43.0, 50.0, 40.0, 27.0, 37.0, 25.0, 26.0, 42.0, 30.0, 22.0, 26.0, 18.0, 15.0, 12.0, 17.0, 9.0, 12.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.6953125, -60.63544464111328, -58.57557678222656, -56.51570510864258, -54.45583724975586, -52.39596939086914, -50.336097717285156, -48.27622985839844, -46.21636199951172, -44.156494140625, -42.09662628173828, -40.0367546081543, -37.97688674926758, -35.91701889038086, -33.857147216796875, -31.797279357910156, -29.737411499023438, -27.67754364013672, -25.617673873901367, -23.557804107666016, -21.497936248779297, -19.438068389892578, -17.378198623657227, -15.318329811096191, -13.258460998535156, -11.198592185974121, -9.138723373413086, -7.078854560852051, -5.018985748291016, -2.9591169357299805, -0.8992481231689453, 1.1606206893920898, 3.220489501953125, 5.28035831451416, 7.340227127075195, 9.40009593963623, 11.459964752197266, 13.5198335647583, 15.579702377319336, 17.639572143554688, 19.699440002441406, 21.759307861328125, 23.819177627563477, 25.879047393798828, 27.938915252685547, 29.998783111572266, 32.05865478515625, 34.11852264404297, 36.17839050292969, 38.238258361816406, 40.298126220703125, 42.35799789428711, 44.41786575317383, 46.47773361206055, 48.53760528564453, 50.59747314453125, 52.65734100341797, 54.71720886230469, 56.777076721191406, 58.83694839477539, 60.89681625366211, 62.95668411254883, 65.01655578613281, 67.07642364501953, 69.13629150390625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 5.0, 5.0, 8.0, 5.0, 13.0, 15.0, 20.0, 32.0, 17.0, 25.0, 24.0, 28.0, 36.0, 28.0, 36.0, 33.0, 42.0, 29.0, 41.0, 43.0, 42.0, 53.0, 30.0, 32.0, 49.0, 30.0, 40.0, 24.0, 33.0, 16.0, 27.0, 19.0, 11.0, 20.0, 17.0, 15.0, 5.0, 4.0, 4.0, 6.0, 7.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.1326904296875, -8.843505859375, -8.5543212890625, -8.26513671875, -7.9759521484375, -7.686767578125, -7.3975830078125, -7.1083984375, -6.8192138671875, -6.530029296875, -6.2408447265625, -5.95166015625, -5.6624755859375, -5.373291015625, -5.0841064453125, -4.794921875, -4.5057373046875, -4.216552734375, -3.9273681640625, -3.63818359375, -3.3489990234375, -3.059814453125, -2.7706298828125, -2.4814453125, -2.1922607421875, -1.903076171875, -1.6138916015625, -1.32470703125, -1.0355224609375, -0.746337890625, -0.4571533203125, -0.16796875, 0.1212158203125, 0.410400390625, 0.6995849609375, 0.98876953125, 1.2779541015625, 1.567138671875, 1.8563232421875, 2.1455078125, 2.4346923828125, 2.723876953125, 3.0130615234375, 3.30224609375, 3.5914306640625, 3.880615234375, 4.1697998046875, 4.458984375, 4.7481689453125, 5.037353515625, 5.3265380859375, 5.61572265625, 5.9049072265625, 6.194091796875, 6.4832763671875, 6.7724609375, 7.0616455078125, 7.350830078125, 7.6400146484375, 7.92919921875, 8.2183837890625, 8.507568359375, 8.7967529296875, 9.0859375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 7.0, 12.0, 14.0, 27.0, 35.0, 57.0, 78.0, 109.0, 165.0, 240.0, 346.0, 426.0, 651.0, 931.0, 1311.0, 1797.0, 2549.0, 3584.0, 5271.0, 7434.0, 10469.0, 15384.0, 22389.0, 32905.0, 49800.0, 76164.0, 116095.0, 164584.0, 169189.0, 121949.0, 80336.0, 52438.0, 34949.0, 23638.0, 16095.0, 11065.0, 7680.0, 5387.0, 3757.0, 2774.0, 1891.0, 1378.0, 947.0, 646.0, 500.0, 358.0, 250.0, 173.0, 102.0, 83.0, 49.0, 35.0, 22.0, 21.0, 6.0, 7.0, 5.0, 2.0, 2.0, 2.0], "bins": [-0.30419921875, -0.2947120666503906, -0.28522491455078125, -0.2757377624511719, -0.2662506103515625, -0.2567634582519531, -0.24727630615234375, -0.23778915405273438, -0.228302001953125, -0.21881484985351562, -0.20932769775390625, -0.19984054565429688, -0.1903533935546875, -0.18086624145507812, -0.17137908935546875, -0.16189193725585938, -0.15240478515625, -0.14291763305664062, -0.13343048095703125, -0.12394332885742188, -0.1144561767578125, -0.10496902465820312, -0.09548187255859375, -0.08599472045898438, -0.076507568359375, -0.06702041625976562, -0.05753326416015625, -0.048046112060546875, -0.0385589599609375, -0.029071807861328125, -0.01958465576171875, -0.010097503662109375, -0.0006103515625, 0.008876800537109375, 0.01836395263671875, 0.027851104736328125, 0.0373382568359375, 0.046825408935546875, 0.05631256103515625, 0.06579971313476562, 0.075286865234375, 0.08477401733398438, 0.09426116943359375, 0.10374832153320312, 0.1132354736328125, 0.12272262573242188, 0.13220977783203125, 0.14169692993164062, 0.15118408203125, 0.16067123413085938, 0.17015838623046875, 0.17964553833007812, 0.1891326904296875, 0.19861984252929688, 0.20810699462890625, 0.21759414672851562, 0.227081298828125, 0.23656845092773438, 0.24605560302734375, 0.2555427551269531, 0.2650299072265625, 0.2745170593261719, 0.28400421142578125, 0.2934913635253906, 0.302978515625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 6.0, 12.0, 5.0, 8.0, 21.0, 17.0, 20.0, 23.0, 18.0, 31.0, 29.0, 29.0, 41.0, 30.0, 45.0, 39.0, 26.0, 42.0, 1061.0, 31.0, 36.0, 41.0, 33.0, 43.0, 41.0, 29.0, 38.0, 28.0, 27.0, 20.0, 21.0, 18.0, 16.0, 16.0, 12.0, 11.0, 14.0, 9.0, 4.0, 6.0, 2.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.0703125, -5.88568115234375, -5.7010498046875, -5.51641845703125, -5.331787109375, -5.14715576171875, -4.9625244140625, -4.77789306640625, -4.59326171875, -4.40863037109375, -4.2239990234375, -4.03936767578125, -3.854736328125, -3.67010498046875, -3.4854736328125, -3.30084228515625, -3.1162109375, -2.93157958984375, -2.7469482421875, -2.56231689453125, -2.377685546875, -2.19305419921875, -2.0084228515625, -1.82379150390625, -1.63916015625, -1.45452880859375, -1.2698974609375, -1.08526611328125, -0.900634765625, -0.71600341796875, -0.5313720703125, -0.34674072265625, -0.162109375, 0.02252197265625, 0.2071533203125, 0.39178466796875, 0.576416015625, 0.76104736328125, 0.9456787109375, 1.13031005859375, 1.31494140625, 1.49957275390625, 1.6842041015625, 1.86883544921875, 2.053466796875, 2.23809814453125, 2.4227294921875, 2.60736083984375, 2.7919921875, 2.97662353515625, 3.1612548828125, 3.34588623046875, 3.530517578125, 3.71514892578125, 3.8997802734375, 4.08441162109375, 4.26904296875, 4.45367431640625, 4.6383056640625, 4.82293701171875, 5.007568359375, 5.19219970703125, 5.3768310546875, 5.56146240234375, 5.74609375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 5.0, 7.0, 6.0, 13.0, 20.0, 29.0, 44.0, 86.0, 122.0, 156.0, 247.0, 376.0, 502.0, 676.0, 1001.0, 1489.0, 2280.0, 3205.0, 4817.0, 7302.0, 10858.0, 16323.0, 25263.0, 38603.0, 60031.0, 92251.0, 136799.0, 1220205.0, 155112.0, 110102.0, 72708.0, 46972.0, 30314.0, 19834.0, 12804.0, 8510.0, 5806.0, 3863.0, 2602.0, 1854.0, 1255.0, 878.0, 584.0, 390.0, 271.0, 188.0, 129.0, 87.0, 53.0, 35.0, 30.0, 12.0, 17.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.31201171875, -0.3024749755859375, -0.292938232421875, -0.2834014892578125, -0.27386474609375, -0.2643280029296875, -0.254791259765625, -0.2452545166015625, -0.2357177734375, -0.2261810302734375, -0.216644287109375, -0.2071075439453125, -0.19757080078125, -0.1880340576171875, -0.178497314453125, -0.1689605712890625, -0.159423828125, -0.1498870849609375, -0.140350341796875, -0.1308135986328125, -0.12127685546875, -0.1117401123046875, -0.102203369140625, -0.0926666259765625, -0.0831298828125, -0.0735931396484375, -0.064056396484375, -0.0545196533203125, -0.04498291015625, -0.0354461669921875, -0.025909423828125, -0.0163726806640625, -0.0068359375, 0.0027008056640625, 0.012237548828125, 0.0217742919921875, 0.03131103515625, 0.0408477783203125, 0.050384521484375, 0.0599212646484375, 0.0694580078125, 0.0789947509765625, 0.088531494140625, 0.0980682373046875, 0.10760498046875, 0.1171417236328125, 0.126678466796875, 0.1362152099609375, 0.145751953125, 0.1552886962890625, 0.164825439453125, 0.1743621826171875, 0.18389892578125, 0.1934356689453125, 0.202972412109375, 0.2125091552734375, 0.2220458984375, 0.2315826416015625, 0.241119384765625, 0.2506561279296875, 0.26019287109375, 0.2697296142578125, 0.279266357421875, 0.2888031005859375, 0.29833984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 9.0, 7.0, 10.0, 17.0, 19.0, 16.0, 24.0, 27.0, 32.0, 34.0, 38.0, 38.0, 51.0, 43.0, 37.0, 43.0, 58.0, 48.0, 37.0, 55.0, 50.0, 37.0, 31.0, 28.0, 35.0, 27.0, 22.0, 27.0, 14.0, 12.0, 8.0, 15.0, 9.0, 7.0, 1.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0015077590942382812, -0.0014654546976089478, -0.0014231503009796143, -0.0013808459043502808, -0.0013385415077209473, -0.0012962371110916138, -0.0012539327144622803, -0.0012116283178329468, -0.0011693239212036133, -0.0011270195245742798, -0.0010847151279449463, -0.0010424107313156128, -0.0010001063346862793, -0.0009578019380569458, -0.0009154975414276123, -0.0008731931447982788, -0.0008308887481689453, -0.0007885843515396118, -0.0007462799549102783, -0.0007039755582809448, -0.0006616711616516113, -0.0006193667650222778, -0.0005770623683929443, -0.0005347579717636108, -0.0004924535751342773, -0.00045014917850494385, -0.00040784478187561035, -0.00036554038524627686, -0.00032323598861694336, -0.00028093159198760986, -0.00023862719535827637, -0.00019632279872894287, -0.00015401840209960938, -0.00011171400547027588, -6.940960884094238e-05, -2.7105212211608887e-05, 1.519918441772461e-05, 5.7503581047058105e-05, 9.98079776763916e-05, 0.0001421123743057251, 0.0001844167709350586, 0.0002267211675643921, 0.0002690255641937256, 0.0003113299608230591, 0.0003536343574523926, 0.0003959387540817261, 0.00043824315071105957, 0.00048054754734039307, 0.0005228519439697266, 0.0005651563405990601, 0.0006074607372283936, 0.000649765133857727, 0.0006920695304870605, 0.000734373927116394, 0.0007766783237457275, 0.000818982720375061, 0.0008612871170043945, 0.000903591513633728, 0.0009458959102630615, 0.000988200306892395, 0.0010305047035217285, 0.001072809100151062, 0.0011151134967803955, 0.001157417893409729, 0.0011997222900390625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 4.0, 5.0, 9.0, 10.0, 17.0, 21.0, 25.0, 35.0, 42.0, 53.0, 73.0, 84.0, 139.0, 170.0, 277.0, 448.0, 1160.0, 60596.0, 979262.0, 4140.0, 703.0, 379.0, 218.0, 146.0, 124.0, 91.0, 68.0, 50.0, 34.0, 37.0, 29.0, 28.0, 14.0, 16.0, 6.0, 8.0, 10.0, 6.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0264434814453125, -0.02554011344909668, -0.02463674545288086, -0.02373337745666504, -0.02283000946044922, -0.0219266414642334, -0.021023273468017578, -0.020119905471801758, -0.019216537475585938, -0.018313169479370117, -0.017409801483154297, -0.016506433486938477, -0.015603065490722656, -0.014699697494506836, -0.013796329498291016, -0.012892961502075195, -0.011989593505859375, -0.011086225509643555, -0.010182857513427734, -0.009279489517211914, -0.008376121520996094, -0.0074727535247802734, -0.006569385528564453, -0.005666017532348633, -0.0047626495361328125, -0.003859281539916992, -0.002955913543701172, -0.0020525455474853516, -0.0011491775512695312, -0.00024580955505371094, 0.0006575584411621094, 0.0015609264373779297, 0.00246429443359375, 0.0033676624298095703, 0.004271030426025391, 0.005174398422241211, 0.006077766418457031, 0.0069811344146728516, 0.007884502410888672, 0.008787870407104492, 0.009691238403320312, 0.010594606399536133, 0.011497974395751953, 0.012401342391967773, 0.013304710388183594, 0.014208078384399414, 0.015111446380615234, 0.016014814376831055, 0.016918182373046875, 0.017821550369262695, 0.018724918365478516, 0.019628286361694336, 0.020531654357910156, 0.021435022354125977, 0.022338390350341797, 0.023241758346557617, 0.024145126342773438, 0.025048494338989258, 0.025951862335205078, 0.0268552303314209, 0.02775859832763672, 0.02866196632385254, 0.02956533432006836, 0.03046870231628418, 0.0313720703125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 126.0, 879.0, 11.0, 0.0, 1.0, 1.0], "bins": [-0.020500371232628822, -0.020154595375061035, -0.019808819517493248, -0.01946304365992546, -0.019117267802357674, -0.018771493807435036, -0.01842571794986725, -0.01807994209229946, -0.017734166234731674, -0.017388390377163887, -0.0170426145195961, -0.016696838662028313, -0.016351062804460526, -0.016005288809537888, -0.0156595129519701, -0.015313737094402313, -0.014967961236834526, -0.014622185379266739, -0.014276409521698952, -0.01393063459545374, -0.013584858737885952, -0.013239082880318165, -0.012893307022750378, -0.012547532096505165, -0.012201755307614803, -0.011855979450047016, -0.011510203592479229, -0.011164428666234016, -0.01081865280866623, -0.010472876951098442, -0.010127101093530655, -0.009781325235962868, -0.00943555124104023, -0.009089775383472443, -0.008743999525904655, -0.008398224599659443, -0.008052448742091656, -0.0077066728845238686, -0.007360897026956081, -0.0070151216350495815, -0.006669345311820507, -0.00632356945425272, -0.00597779406234622, -0.005632018204778433, -0.005286242812871933, -0.004940466955304146, -0.004594691097736359, -0.004248915705829859, -0.003903140313923359, -0.0035573646891862154, -0.003211589064449072, -0.0028658132068812847, -0.002520037814974785, -0.0021742619574069977, -0.0018284863326698542, -0.0014827107079327106, -0.0011369350831955671, -0.0007911594584584236, -0.0004453837755136192, -9.960809256881475e-05, 0.00024616753216832876, 0.0005919431569054723, 0.0009377188980579376, 0.0012834945227950811, 0.0016292701475322247]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 5.0, 6.0, 8.0, 6.0, 5.0, 11.0, 10.0, 17.0, 20.0, 27.0, 27.0, 23.0, 26.0, 45.0, 43.0, 43.0, 46.0, 51.0, 43.0, 58.0, 39.0, 46.0, 45.0, 36.0, 41.0, 31.0, 34.0, 32.0, 29.0, 21.0, 19.0, 19.0, 18.0, 14.0, 11.0, 6.0, 6.0, 4.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008199214935302734, -0.0007931860163807869, -0.0007664505392313004, -0.0007397150620818138, -0.0007129795849323273, -0.0006862441077828407, -0.0006595086306333542, -0.0006327731534838676, -0.0006060376763343811, -0.0005793021991848946, -0.000552566722035408, -0.0005258312448859215, -0.0004990957677364349, -0.0004723602905869484, -0.00044562481343746185, -0.0004188893362879753, -0.00039215385913848877, -0.00036541838198900223, -0.0003386829048395157, -0.00031194742769002914, -0.0002852119505405426, -0.00025847647339105606, -0.00023174099624156952, -0.00020500551909208298, -0.00017827004194259644, -0.0001515345647931099, -0.00012479908764362335, -9.806361049413681e-05, -7.132813334465027e-05, -4.459265619516373e-05, -1.7857179045677185e-05, 8.878298103809357e-06, 3.56137752532959e-05, 6.234925240278244e-05, 8.908472955226898e-05, 0.00011582020670175552, 0.00014255568385124207, 0.0001692911610007286, 0.00019602663815021515, 0.0002227621152997017, 0.00024949759244918823, 0.0002762330695986748, 0.0003029685467481613, 0.00032970402389764786, 0.0003564395010471344, 0.00038317497819662094, 0.0004099104553461075, 0.000436645932495594, 0.00046338140964508057, 0.0004901168867945671, 0.0005168523639440536, 0.0005435878410935402, 0.0005703233182430267, 0.0005970587953925133, 0.0006237942725419998, 0.0006505297496914864, 0.0006772652268409729, 0.0007040007039904594, 0.000730736181139946, 0.0007574716582894325, 0.0007842071354389191, 0.0008109426125884056, 0.0008376780897378922, 0.0008644135668873787, 0.0008911490440368652]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 5.0, 5.0, 8.0, 5.0, 13.0, 15.0, 20.0, 32.0, 17.0, 25.0, 24.0, 28.0, 36.0, 28.0, 36.0, 33.0, 42.0, 29.0, 41.0, 43.0, 42.0, 53.0, 30.0, 32.0, 49.0, 30.0, 40.0, 24.0, 33.0, 17.0, 26.0, 19.0, 11.0, 20.0, 17.0, 15.0, 5.0, 4.0, 4.0, 6.0, 7.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.1326904296875, -8.843505859375, -8.5543212890625, -8.26513671875, -7.9759521484375, -7.686767578125, -7.3975830078125, -7.1083984375, -6.8192138671875, -6.530029296875, -6.2408447265625, -5.95166015625, -5.6624755859375, -5.373291015625, -5.0841064453125, -4.794921875, -4.5057373046875, -4.216552734375, -3.9273681640625, -3.63818359375, -3.3489990234375, -3.059814453125, -2.7706298828125, -2.4814453125, -2.1922607421875, -1.903076171875, -1.6138916015625, -1.32470703125, -1.0355224609375, -0.746337890625, -0.4571533203125, -0.16796875, 0.1212158203125, 0.410400390625, 0.6995849609375, 0.98876953125, 1.2779541015625, 1.567138671875, 1.8563232421875, 2.1455078125, 2.4346923828125, 2.723876953125, 3.0130615234375, 3.30224609375, 3.5914306640625, 3.880615234375, 4.1697998046875, 4.458984375, 4.7481689453125, 5.037353515625, 5.3265380859375, 5.61572265625, 5.9049072265625, 6.194091796875, 6.4832763671875, 6.7724609375, 7.0616455078125, 7.350830078125, 7.6400146484375, 7.92919921875, 8.2183837890625, 8.507568359375, 8.7967529296875, 9.0859375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 4.0, 6.0, 7.0, 11.0, 14.0, 17.0, 23.0, 27.0, 34.0, 57.0, 83.0, 134.0, 164.0, 295.0, 395.0, 551.0, 921.0, 1661.0, 3291.0, 8071.0, 26162.0, 121753.0, 624358.0, 202548.0, 37870.0, 10895.0, 4191.0, 1956.0, 1062.0, 604.0, 393.0, 298.0, 207.0, 142.0, 94.0, 73.0, 46.0, 31.0, 31.0, 17.0, 14.0, 10.0, 8.0, 10.0, 6.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.979248046875, -15.47412109375, -14.968994140625, -14.4638671875, -13.958740234375, -13.45361328125, -12.948486328125, -12.443359375, -11.938232421875, -11.43310546875, -10.927978515625, -10.4228515625, -9.917724609375, -9.41259765625, -8.907470703125, -8.40234375, -7.897216796875, -7.39208984375, -6.886962890625, -6.3818359375, -5.876708984375, -5.37158203125, -4.866455078125, -4.361328125, -3.856201171875, -3.35107421875, -2.845947265625, -2.3408203125, -1.835693359375, -1.33056640625, -0.825439453125, -0.3203125, 0.184814453125, 0.68994140625, 1.195068359375, 1.7001953125, 2.205322265625, 2.71044921875, 3.215576171875, 3.720703125, 4.225830078125, 4.73095703125, 5.236083984375, 5.7412109375, 6.246337890625, 6.75146484375, 7.256591796875, 7.76171875, 8.266845703125, 8.77197265625, 9.277099609375, 9.7822265625, 10.287353515625, 10.79248046875, 11.297607421875, 11.802734375, 12.307861328125, 12.81298828125, 13.318115234375, 13.8232421875, 14.328369140625, 14.83349609375, 15.338623046875, 15.84375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 11.0, 15.0, 18.0, 13.0, 16.0, 28.0, 29.0, 27.0, 31.0, 46.0, 57.0, 70.0, 98.0, 249.0, 1735.0, 159.0, 70.0, 57.0, 54.0, 45.0, 33.0, 24.0, 28.0, 24.0, 18.0, 13.0, 12.0, 10.0, 11.0, 12.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.0625, -25.22998046875, -24.3974609375, -23.56494140625, -22.732421875, -21.89990234375, -21.0673828125, -20.23486328125, -19.40234375, -18.56982421875, -17.7373046875, -16.90478515625, -16.072265625, -15.23974609375, -14.4072265625, -13.57470703125, -12.7421875, -11.90966796875, -11.0771484375, -10.24462890625, -9.412109375, -8.57958984375, -7.7470703125, -6.91455078125, -6.08203125, -5.24951171875, -4.4169921875, -3.58447265625, -2.751953125, -1.91943359375, -1.0869140625, -0.25439453125, 0.578125, 1.41064453125, 2.2431640625, 3.07568359375, 3.908203125, 4.74072265625, 5.5732421875, 6.40576171875, 7.23828125, 8.07080078125, 8.9033203125, 9.73583984375, 10.568359375, 11.40087890625, 12.2333984375, 13.06591796875, 13.8984375, 14.73095703125, 15.5634765625, 16.39599609375, 17.228515625, 18.06103515625, 18.8935546875, 19.72607421875, 20.55859375, 21.39111328125, 22.2236328125, 23.05615234375, 23.888671875, 24.72119140625, 25.5537109375, 26.38623046875, 27.21875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 7.0, 9.0, 7.0, 10.0, 9.0, 15.0, 19.0, 25.0, 30.0, 49.0, 72.0, 105.0, 173.0, 323.0, 627.0, 1851.0, 2923237.0, 216453.0, 1351.0, 537.0, 301.0, 154.0, 98.0, 55.0, 41.0, 39.0, 20.0, 21.0, 15.0, 12.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.625, -72.357421875, -70.08984375, -67.822265625, -65.5546875, -63.287109375, -61.01953125, -58.751953125, -56.484375, -54.216796875, -51.94921875, -49.681640625, -47.4140625, -45.146484375, -42.87890625, -40.611328125, -38.34375, -36.076171875, -33.80859375, -31.541015625, -29.2734375, -27.005859375, -24.73828125, -22.470703125, -20.203125, -17.935546875, -15.66796875, -13.400390625, -11.1328125, -8.865234375, -6.59765625, -4.330078125, -2.0625, 0.205078125, 2.47265625, 4.740234375, 7.0078125, 9.275390625, 11.54296875, 13.810546875, 16.078125, 18.345703125, 20.61328125, 22.880859375, 25.1484375, 27.416015625, 29.68359375, 31.951171875, 34.21875, 36.486328125, 38.75390625, 41.021484375, 43.2890625, 45.556640625, 47.82421875, 50.091796875, 52.359375, 54.626953125, 56.89453125, 59.162109375, 61.4296875, 63.697265625, 65.96484375, 68.232421875, 70.5]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 35.0, 488.0, 465.0, 21.0, 0.0, 1.0], "bins": [-351.5297546386719, -345.6678466796875, -339.8059387207031, -333.94403076171875, -328.0821228027344, -322.22021484375, -316.3583068847656, -310.49639892578125, -304.63446044921875, -298.7725524902344, -292.91064453125, -287.0487365722656, -281.18682861328125, -275.3249206542969, -269.4630126953125, -263.60107421875, -257.73919677734375, -251.87728881835938, -246.015380859375, -240.15347290039062, -234.29156494140625, -228.4296417236328, -222.56773376464844, -216.70582580566406, -210.8439178466797, -204.9820098876953, -199.12010192871094, -193.25819396972656, -187.39627075195312, -181.53436279296875, -175.67245483398438, -169.810546875, -163.94863891601562, -158.08673095703125, -152.22482299804688, -146.3629150390625, -140.50100708007812, -134.6390838623047, -128.7771759033203, -122.91526794433594, -117.0533676147461, -111.19145965576172, -105.32954406738281, -99.46763610839844, -93.60572814941406, -87.74382019042969, -81.88191223144531, -76.0199966430664, -70.15808868408203, -64.29618072509766, -58.434268951416016, -52.572357177734375, -46.71044921875, -40.848541259765625, -34.986629486083984, -29.124717712402344, -23.26280975341797, -17.40089988708496, -11.538990020751953, -5.677080154418945, 0.1848297119140625, 6.04673957824707, 11.908649444580078, 17.77056121826172, 23.632469177246094]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 8.0, 4.0, 8.0, 7.0, 4.0, 13.0, 4.0, 12.0, 20.0, 23.0, 31.0, 21.0, 28.0, 29.0, 31.0, 42.0, 44.0, 47.0, 34.0, 47.0, 42.0, 45.0, 39.0, 35.0, 46.0, 32.0, 31.0, 41.0, 33.0, 27.0, 35.0, 25.0, 20.0, 20.0, 17.0, 17.0, 9.0, 14.0, 4.0, 6.0, 2.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.50165939331055, -56.80950927734375, -55.11735916137695, -53.425209045410156, -51.73305892944336, -50.04090881347656, -48.348758697509766, -46.65660858154297, -44.96445846557617, -43.272308349609375, -41.58015823364258, -39.88800811767578, -38.195858001708984, -36.50370788574219, -34.81155776977539, -33.119407653808594, -31.427257537841797, -29.735107421875, -28.042957305908203, -26.350807189941406, -24.65865707397461, -22.966506958007812, -21.274356842041016, -19.58220672607422, -17.890056610107422, -16.197906494140625, -14.505756378173828, -12.813606262207031, -11.121456146240234, -9.429306030273438, -7.737155914306641, -6.045005798339844, -4.352851867675781, -2.6607017517089844, -0.9685516357421875, 0.7235984802246094, 2.4157485961914062, 4.107898712158203, 5.800048828125, 7.492198944091797, 9.184349060058594, 10.87649917602539, 12.568649291992188, 14.260799407958984, 15.952949523925781, 17.645099639892578, 19.337249755859375, 21.029399871826172, 22.72154998779297, 24.413700103759766, 26.105850219726562, 27.79800033569336, 29.490150451660156, 31.182300567626953, 32.87445068359375, 34.56660079956055, 36.258750915527344, 37.95090103149414, 39.64305114746094, 41.335201263427734, 43.02735137939453, 44.71950149536133, 46.411651611328125, 48.10380172729492, 49.79595184326172]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 6.0, 8.0, 5.0, 7.0, 14.0, 9.0, 18.0, 22.0, 23.0, 23.0, 25.0, 30.0, 27.0, 46.0, 43.0, 43.0, 37.0, 31.0, 40.0, 50.0, 38.0, 45.0, 35.0, 37.0, 30.0, 39.0, 40.0, 26.0, 29.0, 36.0, 22.0, 24.0, 11.0, 7.0, 18.0, 12.0, 8.0, 5.0, 4.0, 3.0, 1.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.375, -11.0362548828125, -10.697509765625, -10.3587646484375, -10.02001953125, -9.6812744140625, -9.342529296875, -9.0037841796875, -8.6650390625, -8.3262939453125, -7.987548828125, -7.6488037109375, -7.31005859375, -6.9713134765625, -6.632568359375, -6.2938232421875, -5.955078125, -5.6163330078125, -5.277587890625, -4.9388427734375, -4.60009765625, -4.2613525390625, -3.922607421875, -3.5838623046875, -3.2451171875, -2.9063720703125, -2.567626953125, -2.2288818359375, -1.89013671875, -1.5513916015625, -1.212646484375, -0.8739013671875, -0.53515625, -0.1964111328125, 0.142333984375, 0.4810791015625, 0.81982421875, 1.1585693359375, 1.497314453125, 1.8360595703125, 2.1748046875, 2.5135498046875, 2.852294921875, 3.1910400390625, 3.52978515625, 3.8685302734375, 4.207275390625, 4.5460205078125, 4.884765625, 5.2235107421875, 5.562255859375, 5.9010009765625, 6.23974609375, 6.5784912109375, 6.917236328125, 7.2559814453125, 7.5947265625, 7.9334716796875, 8.272216796875, 8.6109619140625, 8.94970703125, 9.2884521484375, 9.627197265625, 9.9659423828125, 10.3046875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 8.0, 6.0, 11.0, 6.0, 8.0, 21.0, 33.0, 33.0, 33.0, 54.0, 64.0, 82.0, 109.0, 135.0, 192.0, 225.0, 287.0, 457.0, 734.0, 1295.0, 3056.0, 10923.0, 80078.0, 2468469.0, 1563615.0, 50297.0, 8067.0, 2526.0, 1160.0, 637.0, 452.0, 261.0, 197.0, 140.0, 127.0, 120.0, 85.0, 74.0, 45.0, 44.0, 27.0, 26.0, 13.0, 8.0, 14.0, 7.0, 9.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.3125, -47.81396484375, -46.3154296875, -44.81689453125, -43.318359375, -41.81982421875, -40.3212890625, -38.82275390625, -37.32421875, -35.82568359375, -34.3271484375, -32.82861328125, -31.330078125, -29.83154296875, -28.3330078125, -26.83447265625, -25.3359375, -23.83740234375, -22.3388671875, -20.84033203125, -19.341796875, -17.84326171875, -16.3447265625, -14.84619140625, -13.34765625, -11.84912109375, -10.3505859375, -8.85205078125, -7.353515625, -5.85498046875, -4.3564453125, -2.85791015625, -1.359375, 0.13916015625, 1.6376953125, 3.13623046875, 4.634765625, 6.13330078125, 7.6318359375, 9.13037109375, 10.62890625, 12.12744140625, 13.6259765625, 15.12451171875, 16.623046875, 18.12158203125, 19.6201171875, 21.11865234375, 22.6171875, 24.11572265625, 25.6142578125, 27.11279296875, 28.611328125, 30.10986328125, 31.6083984375, 33.10693359375, 34.60546875, 36.10400390625, 37.6025390625, 39.10107421875, 40.599609375, 42.09814453125, 43.5966796875, 45.09521484375, 46.59375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 13.0, 10.0, 8.0, 18.0, 25.0, 39.0, 52.0, 62.0, 96.0, 141.0, 228.0, 380.0, 558.0, 642.0, 635.0, 383.0, 263.0, 164.0, 97.0, 93.0, 52.0, 39.0, 24.0, 16.0, 15.0, 7.0, 9.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.15625, -36.304443359375, -35.45263671875, -34.600830078125, -33.7490234375, -32.897216796875, -32.04541015625, -31.193603515625, -30.341796875, -29.489990234375, -28.63818359375, -27.786376953125, -26.9345703125, -26.082763671875, -25.23095703125, -24.379150390625, -23.52734375, -22.675537109375, -21.82373046875, -20.971923828125, -20.1201171875, -19.268310546875, -18.41650390625, -17.564697265625, -16.712890625, -15.861083984375, -15.00927734375, -14.157470703125, -13.3056640625, -12.453857421875, -11.60205078125, -10.750244140625, -9.8984375, -9.046630859375, -8.19482421875, -7.343017578125, -6.4912109375, -5.639404296875, -4.78759765625, -3.935791015625, -3.083984375, -2.232177734375, -1.38037109375, -0.528564453125, 0.3232421875, 1.175048828125, 2.02685546875, 2.878662109375, 3.73046875, 4.582275390625, 5.43408203125, 6.285888671875, 7.1376953125, 7.989501953125, 8.84130859375, 9.693115234375, 10.544921875, 11.396728515625, 12.24853515625, 13.100341796875, 13.9521484375, 14.803955078125, 15.65576171875, 16.507568359375, 17.359375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 6.0, 10.0, 19.0, 32.0, 32.0, 58.0, 119.0, 177.0, 312.0, 655.0, 1372.0, 3263.0, 9224.0, 40262.0, 348103.0, 3352239.0, 380523.0, 42133.0, 9619.0, 3283.0, 1329.0, 693.0, 353.0, 189.0, 119.0, 51.0, 38.0, 25.0, 14.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.8642578125, -31.853515625, -30.8427734375, -29.83203125, -28.8212890625, -27.810546875, -26.7998046875, -25.7890625, -24.7783203125, -23.767578125, -22.7568359375, -21.74609375, -20.7353515625, -19.724609375, -18.7138671875, -17.703125, -16.6923828125, -15.681640625, -14.6708984375, -13.66015625, -12.6494140625, -11.638671875, -10.6279296875, -9.6171875, -8.6064453125, -7.595703125, -6.5849609375, -5.57421875, -4.5634765625, -3.552734375, -2.5419921875, -1.53125, -0.5205078125, 0.490234375, 1.5009765625, 2.51171875, 3.5224609375, 4.533203125, 5.5439453125, 6.5546875, 7.5654296875, 8.576171875, 9.5869140625, 10.59765625, 11.6083984375, 12.619140625, 13.6298828125, 14.640625, 15.6513671875, 16.662109375, 17.6728515625, 18.68359375, 19.6943359375, 20.705078125, 21.7158203125, 22.7265625, 23.7373046875, 24.748046875, 25.7587890625, 26.76953125, 27.7802734375, 28.791015625, 29.8017578125, 30.8125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 14.0, 14.0, 23.0, 40.0, 42.0, 77.0, 88.0, 127.0, 151.0, 124.0, 92.0, 71.0, 59.0, 24.0, 19.0, 12.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.2210235595703, -168.93338012695312, -162.64573669433594, -156.35809326171875, -150.07044982910156, -143.78280639648438, -137.49514770507812, -131.20751953125, -124.91986846923828, -118.6322250366211, -112.3445816040039, -106.05693054199219, -99.769287109375, -93.48164367675781, -87.19400024414062, -80.90635681152344, -74.61871337890625, -68.33106994628906, -62.043426513671875, -55.75577926635742, -49.468135833740234, -43.18049240112305, -36.892845153808594, -30.605201721191406, -24.31755828857422, -18.02991485595703, -11.742269515991211, -5.454624176025391, 0.8330192565917969, 7.120662689208984, 13.408309936523438, 19.695953369140625, 25.983596801757812, 32.271240234375, 38.55888366699219, 44.84653091430664, 51.13417434692383, 57.421817779541016, 63.70946502685547, 69.99710845947266, 76.28475189208984, 82.57239532470703, 88.86003875732422, 95.14768981933594, 101.43533325195312, 107.72297668457031, 114.0106201171875, 120.29826354980469, 126.58590698242188, 132.87355041503906, 139.16119384765625, 145.44883728027344, 151.73648071289062, 158.0241241455078, 164.311767578125, 170.59942626953125, 176.88705444335938, 183.17469787597656, 189.46234130859375, 195.74998474121094, 202.03762817382812, 208.3252716064453, 214.6129150390625, 220.90057373046875, 227.18821716308594]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 5.0, 8.0, 9.0, 14.0, 9.0, 16.0, 15.0, 17.0, 22.0, 31.0, 30.0, 25.0, 26.0, 31.0, 32.0, 35.0, 37.0, 38.0, 43.0, 34.0, 40.0, 40.0, 39.0, 53.0, 41.0, 43.0, 29.0, 26.0, 24.0, 32.0, 30.0, 20.0, 16.0, 15.0, 15.0, 7.0, 14.0, 5.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-90.97396087646484, -88.21078491210938, -85.4476089477539, -82.68443298339844, -79.9212646484375, -77.15808868408203, -74.39491271972656, -71.6317367553711, -68.86856079101562, -66.10538482666016, -63.34221267700195, -60.579036712646484, -57.815860748291016, -55.05268859863281, -52.289512634277344, -49.526336669921875, -46.76316452026367, -43.9999885559082, -41.23681640625, -38.47364044189453, -35.71046447753906, -32.947288513183594, -30.18411636352539, -27.420940399169922, -24.657766342163086, -21.89459228515625, -19.13141632080078, -16.368242263793945, -13.605067253112793, -10.84189224243164, -8.078718185424805, -5.315542221069336, -2.5523681640625, 0.21080660820007324, 2.9739813804626465, 5.737155914306641, 8.500330924987793, 11.263505935668945, 14.026679992675781, 16.78985595703125, 19.553030014038086, 22.316204071044922, 25.07938003540039, 27.842554092407227, 30.605728149414062, 33.36890411376953, 36.132080078125, 38.89525604248047, 41.65842819213867, 44.42160415649414, 47.184776306152344, 49.94795227050781, 52.71112823486328, 55.47430419921875, 58.23747634887695, 61.00065231323242, 63.763824462890625, 66.5270004272461, 69.29017639160156, 72.0533447265625, 74.81652069091797, 77.57969665527344, 80.3428726196289, 83.10604858398438, 85.86922454833984]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 10.0, 11.0, 10.0, 13.0, 14.0, 16.0, 22.0, 28.0, 24.0, 35.0, 31.0, 34.0, 45.0, 44.0, 30.0, 45.0, 50.0, 50.0, 45.0, 56.0, 50.0, 36.0, 42.0, 33.0, 38.0, 40.0, 29.0, 23.0, 12.0, 16.0, 17.0, 7.0, 7.0, 3.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.75, -129.58984375, -125.4296875, -121.26953125, -117.109375, -112.94921875, -108.7890625, -104.62890625, -100.46875, -96.30859375, -92.1484375, -87.98828125, -83.828125, -79.66796875, -75.5078125, -71.34765625, -67.1875, -63.02734375, -58.8671875, -54.70703125, -50.546875, -46.38671875, -42.2265625, -38.06640625, -33.90625, -29.74609375, -25.5859375, -21.42578125, -17.265625, -13.10546875, -8.9453125, -4.78515625, -0.625, 3.53515625, 7.6953125, 11.85546875, 16.015625, 20.17578125, 24.3359375, 28.49609375, 32.65625, 36.81640625, 40.9765625, 45.13671875, 49.296875, 53.45703125, 57.6171875, 61.77734375, 65.9375, 70.09765625, 74.2578125, 78.41796875, 82.578125, 86.73828125, 90.8984375, 95.05859375, 99.21875, 103.37890625, 107.5390625, 111.69921875, 115.859375, 120.01953125, 124.1796875, 128.33984375, 132.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 11.0, 10.0, 10.0, 18.0, 23.0, 35.0, 50.0, 71.0, 100.0, 157.0, 237.0, 298.0, 451.0, 623.0, 899.0, 1399.0, 2017.0, 3131.0, 4743.0, 7023.0, 11072.0, 17977.0, 28613.0, 47999.0, 83655.0, 149370.0, 226427.0, 191091.0, 109987.0, 62286.0, 36235.0, 22257.0, 14005.0, 8890.0, 5771.0, 3836.0, 2541.0, 1663.0, 1104.0, 789.0, 530.0, 323.0, 272.0, 175.0, 122.0, 79.0, 58.0, 35.0, 25.0, 24.0, 13.0, 14.0, 8.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0], "bins": [-5.46875, -5.29644775390625, -5.1241455078125, -4.95184326171875, -4.779541015625, -4.60723876953125, -4.4349365234375, -4.26263427734375, -4.09033203125, -3.91802978515625, -3.7457275390625, -3.57342529296875, -3.401123046875, -3.22882080078125, -3.0565185546875, -2.88421630859375, -2.7119140625, -2.53961181640625, -2.3673095703125, -2.19500732421875, -2.022705078125, -1.85040283203125, -1.6781005859375, -1.50579833984375, -1.33349609375, -1.16119384765625, -0.9888916015625, -0.81658935546875, -0.644287109375, -0.47198486328125, -0.2996826171875, -0.12738037109375, 0.044921875, 0.21722412109375, 0.3895263671875, 0.56182861328125, 0.734130859375, 0.90643310546875, 1.0787353515625, 1.25103759765625, 1.42333984375, 1.59564208984375, 1.7679443359375, 1.94024658203125, 2.112548828125, 2.28485107421875, 2.4571533203125, 2.62945556640625, 2.8017578125, 2.97406005859375, 3.1463623046875, 3.31866455078125, 3.490966796875, 3.66326904296875, 3.8355712890625, 4.00787353515625, 4.18017578125, 4.35247802734375, 4.5247802734375, 4.69708251953125, 4.869384765625, 5.04168701171875, 5.2139892578125, 5.38629150390625, 5.55859375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 8.0, 9.0, 10.0, 14.0, 16.0, 12.0, 12.0, 21.0, 25.0, 23.0, 20.0, 28.0, 41.0, 32.0, 25.0, 41.0, 28.0, 29.0, 36.0, 42.0, 1060.0, 40.0, 43.0, 35.0, 36.0, 27.0, 36.0, 29.0, 24.0, 25.0, 38.0, 31.0, 23.0, 22.0, 12.0, 16.0, 7.0, 6.0, 8.0, 9.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.125, -63.9345703125, -61.744140625, -59.5537109375, -57.36328125, -55.1728515625, -52.982421875, -50.7919921875, -48.6015625, -46.4111328125, -44.220703125, -42.0302734375, -39.83984375, -37.6494140625, -35.458984375, -33.2685546875, -31.078125, -28.8876953125, -26.697265625, -24.5068359375, -22.31640625, -20.1259765625, -17.935546875, -15.7451171875, -13.5546875, -11.3642578125, -9.173828125, -6.9833984375, -4.79296875, -2.6025390625, -0.412109375, 1.7783203125, 3.96875, 6.1591796875, 8.349609375, 10.5400390625, 12.73046875, 14.9208984375, 17.111328125, 19.3017578125, 21.4921875, 23.6826171875, 25.873046875, 28.0634765625, 30.25390625, 32.4443359375, 34.634765625, 36.8251953125, 39.015625, 41.2060546875, 43.396484375, 45.5869140625, 47.77734375, 49.9677734375, 52.158203125, 54.3486328125, 56.5390625, 58.7294921875, 60.919921875, 63.1103515625, 65.30078125, 67.4912109375, 69.681640625, 71.8720703125, 74.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 9.0, 4.0, 11.0, 9.0, 36.0, 36.0, 54.0, 82.0, 134.0, 191.0, 290.0, 404.0, 532.0, 896.0, 1296.0, 1832.0, 2645.0, 3897.0, 5800.0, 8434.0, 12402.0, 18884.0, 28225.0, 43105.0, 66192.0, 101898.0, 150273.0, 1223297.0, 144147.0, 97254.0, 62367.0, 40579.0, 26744.0, 17869.0, 12065.0, 8006.0, 5462.0, 3776.0, 2515.0, 1698.0, 1218.0, 787.0, 580.0, 391.0, 272.0, 188.0, 119.0, 87.0, 57.0, 33.0, 22.0, 24.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.44140625, -3.328338623046875, -3.21527099609375, -3.102203369140625, -2.9891357421875, -2.876068115234375, -2.76300048828125, -2.649932861328125, -2.536865234375, -2.423797607421875, -2.31072998046875, -2.197662353515625, -2.0845947265625, -1.971527099609375, -1.85845947265625, -1.745391845703125, -1.63232421875, -1.519256591796875, -1.40618896484375, -1.293121337890625, -1.1800537109375, -1.066986083984375, -0.95391845703125, -0.840850830078125, -0.727783203125, -0.614715576171875, -0.50164794921875, -0.388580322265625, -0.2755126953125, -0.162445068359375, -0.04937744140625, 0.063690185546875, 0.1767578125, 0.289825439453125, 0.40289306640625, 0.515960693359375, 0.6290283203125, 0.742095947265625, 0.85516357421875, 0.968231201171875, 1.081298828125, 1.194366455078125, 1.30743408203125, 1.420501708984375, 1.5335693359375, 1.646636962890625, 1.75970458984375, 1.872772216796875, 1.98583984375, 2.098907470703125, 2.21197509765625, 2.325042724609375, 2.4381103515625, 2.551177978515625, 2.66424560546875, 2.777313232421875, 2.890380859375, 3.003448486328125, 3.11651611328125, 3.229583740234375, 3.3426513671875, 3.455718994140625, 3.56878662109375, 3.681854248046875, 3.794921875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 10.0, 14.0, 22.0, 31.0, 38.0, 30.0, 59.0, 55.0, 84.0, 71.0, 74.0, 76.0, 67.0, 73.0, 45.0, 48.0, 38.0, 34.0, 17.0, 24.0, 24.0, 8.0, 16.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0285797119140625, -0.02771306037902832, -0.02684640884399414, -0.02597975730895996, -0.02511310577392578, -0.0242464542388916, -0.023379802703857422, -0.022513151168823242, -0.021646499633789062, -0.020779848098754883, -0.019913196563720703, -0.019046545028686523, -0.018179893493652344, -0.017313241958618164, -0.016446590423583984, -0.015579938888549805, -0.014713287353515625, -0.013846635818481445, -0.012979984283447266, -0.012113332748413086, -0.011246681213378906, -0.010380029678344727, -0.009513378143310547, -0.008646726608276367, -0.0077800750732421875, -0.006913423538208008, -0.006046772003173828, -0.0051801204681396484, -0.004313468933105469, -0.003446817398071289, -0.0025801658630371094, -0.0017135143280029297, -0.00084686279296875, 1.9788742065429688e-05, 0.0008864402770996094, 0.001753091812133789, 0.0026197433471679688, 0.0034863948822021484, 0.004353046417236328, 0.005219697952270508, 0.0060863494873046875, 0.006953001022338867, 0.007819652557373047, 0.008686304092407227, 0.009552955627441406, 0.010419607162475586, 0.011286258697509766, 0.012152910232543945, 0.013019561767578125, 0.013886213302612305, 0.014752864837646484, 0.015619516372680664, 0.016486167907714844, 0.017352819442749023, 0.018219470977783203, 0.019086122512817383, 0.019952774047851562, 0.020819425582885742, 0.021686077117919922, 0.0225527286529541, 0.02341938018798828, 0.02428603172302246, 0.02515268325805664, 0.02601933479309082, 0.026885986328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 6.0, 13.0, 10.0, 12.0, 20.0, 47.0, 52.0, 62.0, 103.0, 168.0, 239.0, 450.0, 759.0, 1369.0, 2810.0, 6393.0, 17359.0, 55117.0, 218030.0, 464328.0, 201055.0, 52024.0, 16240.0, 6031.0, 2684.0, 1304.0, 737.0, 401.0, 261.0, 156.0, 93.0, 71.0, 34.0, 27.0, 23.0, 14.0, 13.0, 12.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1341552734375, -0.12989234924316406, -0.12562942504882812, -0.12136650085449219, -0.11710357666015625, -0.11284065246582031, -0.10857772827148438, -0.10431480407714844, -0.1000518798828125, -0.09578895568847656, -0.09152603149414062, -0.08726310729980469, -0.08300018310546875, -0.07873725891113281, -0.07447433471679688, -0.07021141052246094, -0.065948486328125, -0.06168556213378906, -0.057422637939453125, -0.05315971374511719, -0.04889678955078125, -0.04463386535644531, -0.040370941162109375, -0.03610801696777344, -0.0318450927734375, -0.027582168579101562, -0.023319244384765625, -0.019056320190429688, -0.01479339599609375, -0.010530471801757812, -0.006267547607421875, -0.0020046234130859375, 0.00225830078125, 0.0065212249755859375, 0.010784149169921875, 0.015047073364257812, 0.01930999755859375, 0.023572921752929688, 0.027835845947265625, 0.03209877014160156, 0.0363616943359375, 0.04062461853027344, 0.044887542724609375, 0.04915046691894531, 0.05341339111328125, 0.05767631530761719, 0.061939239501953125, 0.06620216369628906, 0.070465087890625, 0.07472801208496094, 0.07899093627929688, 0.08325386047363281, 0.08751678466796875, 0.09177970886230469, 0.09604263305664062, 0.10030555725097656, 0.1045684814453125, 0.10883140563964844, 0.11309432983398438, 0.11735725402832031, 0.12162017822265625, 0.1258831024169922, 0.13014602661132812, 0.13440895080566406, 0.138671875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 18.0, 20.0, 41.0, 69.0, 86.0, 117.0, 163.0, 145.0, 106.0, 77.0, 47.0, 45.0, 27.0, 16.0, 10.0, 12.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020172372460365295, -0.01910342648625374, -0.01803448237478733, -0.016965538263320923, -0.015896592289209366, -0.014827647246420383, -0.013758702203631401, -0.012689757160842419, -0.011620812118053436, -0.010551867075264454, -0.009482922032475471, -0.008413976989686489, -0.007345031946897507, -0.006276086904108524, -0.005207141861319542, -0.0041381968185305595, -0.003069251775741577, -0.0020003067329525948, -0.0009313616901636124, 0.00013758335262537003, 0.0012065283954143524, 0.002275473438203335, 0.003344418480992317, 0.0044133635237813, 0.005482308566570282, 0.006551253609359264, 0.007620198652148247, 0.00868914369493723, 0.009758088737726212, 0.010827033780515194, 0.011895978823304176, 0.012964923866093159, 0.014033865183591843, 0.015102810226380825, 0.016171755269169807, 0.017240699380636215, 0.018309645354747772, 0.01937859132885933, 0.020447535440325737, 0.021516479551792145, 0.022585425525903702, 0.02365437150001526, 0.024723315611481667, 0.025792259722948074, 0.02686120569705963, 0.02793015167117119, 0.028999095782637596, 0.030068039894104004, 0.03113698586821556, 0.03220593184232712, 0.033274874091148376, 0.034343820065259933, 0.03541276603937149, 0.03648171201348305, 0.037550657987594604, 0.03861960023641586, 0.03968854621052742, 0.04075749218463898, 0.041826434433460236, 0.04289538040757179, 0.04396432638168335, 0.04503327235579491, 0.046102218329906464, 0.04717116057872772, 0.04824010655283928]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 2.0, 5.0, 9.0, 10.0, 14.0, 10.0, 13.0, 19.0, 22.0, 17.0, 28.0, 22.0, 25.0, 34.0, 34.0, 34.0, 30.0, 44.0, 29.0, 36.0, 37.0, 37.0, 38.0, 42.0, 35.0, 38.0, 37.0, 30.0, 32.0, 34.0, 25.0, 29.0, 16.0, 13.0, 18.0, 13.0, 22.0, 6.0, 17.0, 6.0, 8.0, 2.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.01125270128250122, -0.010897240601480007, -0.010541779920458794, -0.01018631923943758, -0.009830858558416367, -0.009475397877395153, -0.00911993719637394, -0.008764476515352726, -0.008409015834331512, -0.008053555153310299, -0.007698094472289085, -0.007342633791267872, -0.006987173110246658, -0.006631712429225445, -0.006276251748204231, -0.005920791067183018, -0.005565330386161804, -0.005209869705140591, -0.004854409024119377, -0.004498948343098164, -0.00414348766207695, -0.0037880269810557365, -0.003432566300034523, -0.0030771056190133095, -0.002721644937992096, -0.0023661842569708824, -0.002010723575949669, -0.0016552628949284554, -0.0012998022139072418, -0.0009443415328860283, -0.0005888808518648148, -0.00023342017084360123, 0.0001220405101776123, 0.00047750119119882584, 0.0008329618722200394, 0.001188422553241253, 0.0015438832342624664, 0.00189934391528368, 0.0022548045963048935, 0.002610265277326107, 0.0029657259583473206, 0.003321186639368534, 0.0036766473203897476, 0.004032108001410961, 0.004387568682432175, 0.004743029363453388, 0.005098490044474602, 0.005453950725495815, 0.005809411406517029, 0.006164872087538242, 0.006520332768559456, 0.006875793449580669, 0.007231254130601883, 0.0075867148116230965, 0.00794217549264431, 0.008297636173665524, 0.008653096854686737, 0.00900855753570795, 0.009364018216729164, 0.009719478897750378, 0.010074939578771591, 0.010430400259792805, 0.010785860940814018, 0.011141321621835232, 0.011496782302856445]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 10.0, 11.0, 10.0, 13.0, 14.0, 16.0, 22.0, 28.0, 23.0, 35.0, 31.0, 35.0, 45.0, 43.0, 31.0, 42.0, 52.0, 49.0, 46.0, 56.0, 51.0, 36.0, 42.0, 32.0, 39.0, 39.0, 30.0, 22.0, 13.0, 15.0, 17.0, 8.0, 7.0, 3.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.75, -129.591796875, -125.43359375, -121.275390625, -117.1171875, -112.958984375, -108.80078125, -104.642578125, -100.484375, -96.326171875, -92.16796875, -88.009765625, -83.8515625, -79.693359375, -75.53515625, -71.376953125, -67.21875, -63.060546875, -58.90234375, -54.744140625, -50.5859375, -46.427734375, -42.26953125, -38.111328125, -33.953125, -29.794921875, -25.63671875, -21.478515625, -17.3203125, -13.162109375, -9.00390625, -4.845703125, -0.6875, 3.470703125, 7.62890625, 11.787109375, 15.9453125, 20.103515625, 24.26171875, 28.419921875, 32.578125, 36.736328125, 40.89453125, 45.052734375, 49.2109375, 53.369140625, 57.52734375, 61.685546875, 65.84375, 70.001953125, 74.16015625, 78.318359375, 82.4765625, 86.634765625, 90.79296875, 94.951171875, 99.109375, 103.267578125, 107.42578125, 111.583984375, 115.7421875, 119.900390625, 124.05859375, 128.216796875, 132.375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 8.0, 14.0, 15.0, 23.0, 33.0, 53.0, 75.0, 116.0, 141.0, 251.0, 371.0, 572.0, 921.0, 1761.0, 3429.0, 7585.0, 19954.0, 65237.0, 263575.0, 479184.0, 142629.0, 38226.0, 13078.0, 5353.0, 2517.0, 1356.0, 751.0, 449.0, 270.0, 184.0, 130.0, 79.0, 48.0, 44.0, 25.0, 22.0, 18.0, 12.0, 8.0, 5.0, 3.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.59375, -21.87158203125, -21.1494140625, -20.42724609375, -19.705078125, -18.98291015625, -18.2607421875, -17.53857421875, -16.81640625, -16.09423828125, -15.3720703125, -14.64990234375, -13.927734375, -13.20556640625, -12.4833984375, -11.76123046875, -11.0390625, -10.31689453125, -9.5947265625, -8.87255859375, -8.150390625, -7.42822265625, -6.7060546875, -5.98388671875, -5.26171875, -4.53955078125, -3.8173828125, -3.09521484375, -2.373046875, -1.65087890625, -0.9287109375, -0.20654296875, 0.515625, 1.23779296875, 1.9599609375, 2.68212890625, 3.404296875, 4.12646484375, 4.8486328125, 5.57080078125, 6.29296875, 7.01513671875, 7.7373046875, 8.45947265625, 9.181640625, 9.90380859375, 10.6259765625, 11.34814453125, 12.0703125, 12.79248046875, 13.5146484375, 14.23681640625, 14.958984375, 15.68115234375, 16.4033203125, 17.12548828125, 17.84765625, 18.56982421875, 19.2919921875, 20.01416015625, 20.736328125, 21.45849609375, 22.1806640625, 22.90283203125, 23.625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 10.0, 17.0, 37.0, 55.0, 61.0, 74.0, 78.0, 92.0, 2131.0, 114.0, 80.0, 87.0, 49.0, 52.0, 30.0, 26.0, 18.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.0, -247.08984375, -238.1796875, -229.26953125, -220.359375, -211.44921875, -202.5390625, -193.62890625, -184.71875, -175.80859375, -166.8984375, -157.98828125, -149.078125, -140.16796875, -131.2578125, -122.34765625, -113.4375, -104.52734375, -95.6171875, -86.70703125, -77.796875, -68.88671875, -59.9765625, -51.06640625, -42.15625, -33.24609375, -24.3359375, -15.42578125, -6.515625, 2.39453125, 11.3046875, 20.21484375, 29.125, 38.03515625, 46.9453125, 55.85546875, 64.765625, 73.67578125, 82.5859375, 91.49609375, 100.40625, 109.31640625, 118.2265625, 127.13671875, 136.046875, 144.95703125, 153.8671875, 162.77734375, 171.6875, 180.59765625, 189.5078125, 198.41796875, 207.328125, 216.23828125, 225.1484375, 234.05859375, 242.96875, 251.87890625, 260.7890625, 269.69921875, 278.609375, 287.51953125, 296.4296875, 305.33984375, 314.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 2.0, 9.0, 6.0, 15.0, 23.0, 27.0, 57.0, 116.0, 175.0, 310.0, 648.0, 1496.0, 6167.0, 102532.0, 2958692.0, 67746.0, 5014.0, 1325.0, 615.0, 290.0, 186.0, 104.0, 50.0, 32.0, 23.0, 13.0, 9.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.21875, -52.68896484375, -51.1591796875, -49.62939453125, -48.099609375, -46.56982421875, -45.0400390625, -43.51025390625, -41.98046875, -40.45068359375, -38.9208984375, -37.39111328125, -35.861328125, -34.33154296875, -32.8017578125, -31.27197265625, -29.7421875, -28.21240234375, -26.6826171875, -25.15283203125, -23.623046875, -22.09326171875, -20.5634765625, -19.03369140625, -17.50390625, -15.97412109375, -14.4443359375, -12.91455078125, -11.384765625, -9.85498046875, -8.3251953125, -6.79541015625, -5.265625, -3.73583984375, -2.2060546875, -0.67626953125, 0.853515625, 2.38330078125, 3.9130859375, 5.44287109375, 6.97265625, 8.50244140625, 10.0322265625, 11.56201171875, 13.091796875, 14.62158203125, 16.1513671875, 17.68115234375, 19.2109375, 20.74072265625, 22.2705078125, 23.80029296875, 25.330078125, 26.85986328125, 28.3896484375, 29.91943359375, 31.44921875, 32.97900390625, 34.5087890625, 36.03857421875, 37.568359375, 39.09814453125, 40.6279296875, 42.15771484375, 43.6875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 28.0, 44.0, 102.0, 209.0, 290.0, 172.0, 81.0, 32.0, 15.0, 13.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.83074951171875, -236.20213317871094, -222.57351684570312, -208.94491577148438, -195.31629943847656, -181.68768310546875, -168.05906677246094, -154.43045043945312, -140.80184936523438, -127.17323303222656, -113.54462432861328, -99.91600799560547, -86.28739929199219, -72.65878295898438, -59.03016662597656, -45.40155792236328, -31.772933959960938, -18.14432144165039, -4.515707015991211, 9.112907409667969, 22.741519927978516, 36.37013244628906, 49.998748779296875, 63.627357482910156, 77.25597381591797, 90.88459014892578, 104.51319885253906, 118.14181518554688, 131.7704315185547, 145.3990478515625, 159.02764892578125, 172.65626525878906, 186.28488159179688, 199.9134979248047, 213.5421142578125, 227.17071533203125, 240.79933166503906, 254.42794799804688, 268.05657958984375, 281.6851806640625, 295.31378173828125, 308.9423828125, 322.5710144042969, 336.1996154785156, 349.8282470703125, 363.45684814453125, 377.08544921875, 390.7140808105469, 404.34271240234375, 417.9713134765625, 431.5999450683594, 445.2285461425781, 458.857177734375, 472.48577880859375, 486.1143798828125, 499.7430114746094, 513.37158203125, 527.0001831054688, 540.6287841796875, 554.2574462890625, 567.8860473632812, 581.5146484375, 595.1432495117188, 608.7718505859375, 622.4005126953125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 6.0, 6.0, 9.0, 8.0, 14.0, 8.0, 17.0, 18.0, 17.0, 26.0, 33.0, 38.0, 42.0, 31.0, 38.0, 41.0, 34.0, 60.0, 54.0, 45.0, 53.0, 55.0, 45.0, 49.0, 30.0, 33.0, 29.0, 27.0, 29.0, 19.0, 11.0, 10.0, 9.0, 9.0, 16.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-183.43011474609375, -177.02760314941406, -170.62509155273438, -164.2225799560547, -157.820068359375, -151.4175567626953, -145.01504516601562, -138.61251831054688, -132.21002197265625, -125.80751037597656, -119.40499877929688, -113.00248718261719, -106.5999755859375, -100.19746398925781, -93.7949447631836, -87.3924331665039, -80.98991394042969, -74.58740234375, -68.18489074707031, -61.78237533569336, -55.37986373901367, -48.977352142333984, -42.57483673095703, -36.172325134277344, -29.769813537597656, -23.36730194091797, -16.96478843688965, -10.562274932861328, -4.159763336181641, 2.242748260498047, 8.645263671875, 15.047775268554688, 21.450286865234375, 27.852798461914062, 34.25531005859375, 40.6578254699707, 47.06033706665039, 53.46284866333008, 59.86536407470703, 66.26787567138672, 72.6703872680664, 79.0728988647461, 85.47541046142578, 91.8779296875, 98.28044128417969, 104.68295288085938, 111.08546447753906, 117.48797607421875, 123.89048767089844, 130.29299926757812, 136.6955108642578, 143.0980224609375, 149.5005340576172, 155.90304565429688, 162.30557250976562, 168.70806884765625, 175.110595703125, 181.5131072998047, 187.91561889648438, 194.31813049316406, 200.72064208984375, 207.12315368652344, 213.52566528320312, 219.92819213867188, 226.3306884765625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 7.0, 8.0, 17.0, 22.0, 22.0, 48.0, 65.0, 83.0, 104.0, 168.0, 261.0, 406.0, 614.0, 870.0, 1170.0, 1040704.0, 1163.0, 910.0, 633.0, 420.0, 274.0, 174.0, 117.0, 73.0, 55.0, 35.0, 23.0, 22.0, 20.0, 10.0, 7.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-105.2955322265625, -102.24687957763672, -99.19823455810547, -96.14958190917969, -93.1009292602539, -90.05228424072266, -87.00363159179688, -83.95498657226562, -80.90633392333984, -77.85768127441406, -74.80903625488281, -71.76038360595703, -68.71173095703125, -65.6630859375, -62.61443328857422, -59.5657844543457, -56.51713180541992, -53.468482971191406, -50.419830322265625, -47.37118148803711, -44.322532653808594, -41.27388000488281, -38.2252311706543, -35.17658233642578, -32.1279296875, -29.07927894592285, -26.030630111694336, -22.981979370117188, -19.933330535888672, -16.884679794311523, -13.836029052734375, -10.78738021850586, -7.738731384277344, -4.690081596374512, -1.6414313316345215, 1.4072189331054688, 4.455868721008301, 7.504518508911133, 10.553169250488281, 13.601818084716797, 16.650468826293945, 19.699119567871094, 22.74776840209961, 25.796419143676758, 28.845069885253906, 31.893718719482422, 34.94236755371094, 37.99102020263672, 41.039669036865234, 44.08831787109375, 47.13697052001953, 50.18561935424805, 53.23426818847656, 56.282920837402344, 59.33156967163086, 62.380218505859375, 65.42887115478516, 68.47752380371094, 71.52616882324219, 74.57482147216797, 77.62347412109375, 80.672119140625, 83.72077178955078, 86.76942443847656, 89.81806945800781]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 7.0, 6.0, 26.0, 53.0, 119.0, 7956.0, 51454864.0, 85.0, 39.0, 10.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2810.0, -2670.123046875, -2530.246337890625, -2390.36962890625, -2250.49267578125, -2110.61572265625, -1970.739013671875, -1830.8621826171875, -1690.9853515625, -1551.1085205078125, -1411.231689453125, -1271.3548583984375, -1131.47802734375, -991.6011962890625, -851.724365234375, -711.8475341796875, -571.970703125, -432.0938720703125, -292.217041015625, -152.3402099609375, -12.46337890625, 127.4134521484375, 267.290283203125, 407.1671142578125, 547.0439453125, 686.9207763671875, 826.797607421875, 966.6744384765625, 1106.55126953125, 1246.4281005859375, 1386.304931640625, 1526.1817626953125, 1666.05859375, 1805.9354248046875, 1945.812255859375, 2085.68896484375, 2225.56591796875, 2365.44287109375, 2505.319580078125, 2645.1962890625, 2785.0732421875, 2924.9501953125, 3064.826904296875, 3204.70361328125, 3344.58056640625, 3484.45751953125, 3624.334228515625, 3764.2109375, 3904.087890625, 4043.96484375, 4183.841796875, 4323.71826171875, 4463.59521484375, 4603.47216796875, 4743.3486328125, 4883.2255859375, 5023.1025390625, 5162.9794921875, 5302.8564453125, 5442.73291015625, 5582.60986328125, 5722.48681640625, 5862.36328125, 6002.240234375, 6142.1171875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 8.0, 18.0, 32.0, 43.0, 55.0, 75.0, 122.0, 189.0, 278.0, 409.0, 600.0, 851.0, 1220.0, 1739.0, 2481.0, 3480.0, 5293.0, 7561.0, 11132.0, 16421.0, 24864.0, 38634.0, 59873.0, 94265.0, 151870.0, 247438.0, 388395.0, 2682661.0, 1525645.0, 377116.0, 239910.0, 147972.0, 91381.0, 57795.0, 36890.0, 24329.0, 15866.0, 10636.0, 7398.0, 4968.0, 3577.0, 2524.0, 1716.0, 1186.0, 806.0, 542.0, 405.0, 266.0, 186.0, 119.0, 84.0, 39.0, 34.0, 16.0, 12.0, 11.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.5029296875, -1.4543914794921875, -1.405853271484375, -1.3573150634765625, -1.30877685546875, -1.2602386474609375, -1.211700439453125, -1.1631622314453125, -1.1146240234375, -1.0660858154296875, -1.017547607421875, -0.9690093994140625, -0.92047119140625, -0.8719329833984375, -0.823394775390625, -0.7748565673828125, -0.726318359375, -0.6777801513671875, -0.629241943359375, -0.5807037353515625, -0.53216552734375, -0.4836273193359375, -0.435089111328125, -0.3865509033203125, -0.3380126953125, -0.2894744873046875, -0.240936279296875, -0.1923980712890625, -0.14385986328125, -0.0953216552734375, -0.046783447265625, 0.0017547607421875, 0.05029296875, 0.0988311767578125, 0.147369384765625, 0.1959075927734375, 0.24444580078125, 0.2929840087890625, 0.341522216796875, 0.3900604248046875, 0.4385986328125, 0.4871368408203125, 0.535675048828125, 0.5842132568359375, 0.63275146484375, 0.6812896728515625, 0.729827880859375, 0.7783660888671875, 0.826904296875, 0.8754425048828125, 0.923980712890625, 0.9725189208984375, 1.02105712890625, 1.0695953369140625, 1.118133544921875, 1.1666717529296875, 1.2152099609375, 1.2637481689453125, 1.312286376953125, 1.3608245849609375, 1.40936279296875, 1.4579010009765625, 1.506439208984375, 1.5549774169921875, 1.603515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 6.0, 5.0, 4.0, 6.0, 5.0, 7.0, 7.0, 8.0, 9.0, 14.0, 18.0, 22.0, 19.0, 19.0, 25.0, 30.0, 38.0, 31.0, 38.0, 43.0, 41.0, 45.0, 37.0, 51.0, 1037.0, 58.0, 50.0, 23.0, 45.0, 24.0, 32.0, 26.0, 29.0, 26.0, 16.0, 20.0, 21.0, 16.0, 11.0, 13.0, 5.0, 13.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.578369140625, -21.81298828125, -21.047607421875, -20.2822265625, -19.516845703125, -18.75146484375, -17.986083984375, -17.220703125, -16.455322265625, -15.68994140625, -14.924560546875, -14.1591796875, -13.393798828125, -12.62841796875, -11.863037109375, -11.09765625, -10.332275390625, -9.56689453125, -8.801513671875, -8.0361328125, -7.270751953125, -6.50537109375, -5.739990234375, -4.974609375, -4.209228515625, -3.44384765625, -2.678466796875, -1.9130859375, -1.147705078125, -0.38232421875, 0.383056640625, 1.1484375, 1.913818359375, 2.67919921875, 3.444580078125, 4.2099609375, 4.975341796875, 5.74072265625, 6.506103515625, 7.271484375, 8.036865234375, 8.80224609375, 9.567626953125, 10.3330078125, 11.098388671875, 11.86376953125, 12.629150390625, 13.39453125, 14.159912109375, 14.92529296875, 15.690673828125, 16.4560546875, 17.221435546875, 17.98681640625, 18.752197265625, 19.517578125, 20.282958984375, 21.04833984375, 21.813720703125, 22.5791015625, 23.344482421875, 24.10986328125, 24.875244140625, 25.640625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 10.0, 14.0, 15.0, 30.0, 48.0, 68.0, 105.0, 130.0, 208.0, 366.0, 540.0, 845.0, 1226.0, 2022.0, 3329.0, 5306.0, 8796.0, 14476.0, 23817.0, 39847.0, 67075.0, 111343.0, 184301.0, 293298.0, 425506.0, 3484430.0, 653498.0, 364267.0, 237377.0, 146329.0, 88561.0, 52790.0, 31936.0, 19333.0, 11821.0, 7108.0, 4275.0, 2732.0, 1566.0, 961.0, 620.0, 416.0, 270.0, 181.0, 91.0, 55.0, 39.0, 18.0, 16.0, 12.0, 12.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.638671875, -1.59014892578125, -1.5416259765625, -1.49310302734375, -1.444580078125, -1.39605712890625, -1.3475341796875, -1.29901123046875, -1.25048828125, -1.20196533203125, -1.1534423828125, -1.10491943359375, -1.056396484375, -1.00787353515625, -0.9593505859375, -0.91082763671875, -0.8623046875, -0.81378173828125, -0.7652587890625, -0.71673583984375, -0.668212890625, -0.61968994140625, -0.5711669921875, -0.52264404296875, -0.47412109375, -0.42559814453125, -0.3770751953125, -0.32855224609375, -0.280029296875, -0.23150634765625, -0.1829833984375, -0.13446044921875, -0.0859375, -0.03741455078125, 0.0111083984375, 0.05963134765625, 0.108154296875, 0.15667724609375, 0.2052001953125, 0.25372314453125, 0.30224609375, 0.35076904296875, 0.3992919921875, 0.44781494140625, 0.496337890625, 0.54486083984375, 0.5933837890625, 0.64190673828125, 0.6904296875, 0.73895263671875, 0.7874755859375, 0.83599853515625, 0.884521484375, 0.93304443359375, 0.9815673828125, 1.03009033203125, 1.07861328125, 1.12713623046875, 1.1756591796875, 1.22418212890625, 1.272705078125, 1.32122802734375, 1.3697509765625, 1.41827392578125, 1.466796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 10.0, 8.0, 12.0, 18.0, 14.0, 15.0, 21.0, 33.0, 33.0, 37.0, 37.0, 27.0, 22.0, 43.0, 31.0, 37.0, 36.0, 365.0, 730.0, 48.0, 38.0, 27.0, 39.0, 34.0, 41.0, 25.0, 34.0, 30.0, 17.0, 19.0, 16.0, 16.0, 15.0, 20.0, 14.0, 12.0, 3.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-17.921875, -17.36328125, -16.8046875, -16.24609375, -15.6875, -15.12890625, -14.5703125, -14.01171875, -13.453125, -12.89453125, -12.3359375, -11.77734375, -11.21875, -10.66015625, -10.1015625, -9.54296875, -8.984375, -8.42578125, -7.8671875, -7.30859375, -6.75, -6.19140625, -5.6328125, -5.07421875, -4.515625, -3.95703125, -3.3984375, -2.83984375, -2.28125, -1.72265625, -1.1640625, -0.60546875, -0.046875, 0.51171875, 1.0703125, 1.62890625, 2.1875, 2.74609375, 3.3046875, 3.86328125, 4.421875, 4.98046875, 5.5390625, 6.09765625, 6.65625, 7.21484375, 7.7734375, 8.33203125, 8.890625, 9.44921875, 10.0078125, 10.56640625, 11.125, 11.68359375, 12.2421875, 12.80078125, 13.359375, 13.91796875, 14.4765625, 15.03515625, 15.59375, 16.15234375, 16.7109375, 17.26953125, 17.828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 9.0, 14.0, 5.0, 13.0, 22.0, 20.0, 32.0, 39.0, 47.0, 72.0, 84.0, 146.0, 241.0, 381.0, 573.0, 1131.0, 2078.0, 4150.0, 8457.0, 17760.0, 36552.0, 78939.0, 206264.0, 5712191.0, 118404.0, 53766.0, 25550.0, 12029.0, 5843.0, 3048.0, 1520.0, 735.0, 436.0, 270.0, 163.0, 126.0, 78.0, 60.0, 48.0, 28.0, 25.0, 17.0, 11.0, 15.0, 10.0, 6.0, 5.0, 3.0, 5.0, 2.0, 7.0, 1.0, 1.0, 1.0], "bins": [-5.19140625, -5.0352783203125, -4.879150390625, -4.7230224609375, -4.56689453125, -4.4107666015625, -4.254638671875, -4.0985107421875, -3.9423828125, -3.7862548828125, -3.630126953125, -3.4739990234375, -3.31787109375, -3.1617431640625, -3.005615234375, -2.8494873046875, -2.693359375, -2.5372314453125, -2.381103515625, -2.2249755859375, -2.06884765625, -1.9127197265625, -1.756591796875, -1.6004638671875, -1.4443359375, -1.2882080078125, -1.132080078125, -0.9759521484375, -0.81982421875, -0.6636962890625, -0.507568359375, -0.3514404296875, -0.1953125, -0.0391845703125, 0.116943359375, 0.2730712890625, 0.42919921875, 0.5853271484375, 0.741455078125, 0.8975830078125, 1.0537109375, 1.2098388671875, 1.365966796875, 1.5220947265625, 1.67822265625, 1.8343505859375, 1.990478515625, 2.1466064453125, 2.302734375, 2.4588623046875, 2.614990234375, 2.7711181640625, 2.92724609375, 3.0833740234375, 3.239501953125, 3.3956298828125, 3.5517578125, 3.7078857421875, 3.864013671875, 4.0201416015625, 4.17626953125, 4.3323974609375, 4.488525390625, 4.6446533203125, 4.80078125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 11.0, 6.0, 11.0, 6.0, 19.0, 15.0, 20.0, 17.0, 25.0, 17.0, 28.0, 36.0, 36.0, 35.0, 32.0, 35.0, 39.0, 28.0, 44.0, 190.0, 899.0, 44.0, 39.0, 37.0, 35.0, 29.0, 31.0, 28.0, 27.0, 21.0, 18.0, 23.0, 22.0, 9.0, 11.0, 16.0, 13.0, 9.0, 7.0, 11.0, 11.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.7578125, -12.3497314453125, -11.941650390625, -11.5335693359375, -11.12548828125, -10.7174072265625, -10.309326171875, -9.9012451171875, -9.4931640625, -9.0850830078125, -8.677001953125, -8.2689208984375, -7.86083984375, -7.4527587890625, -7.044677734375, -6.6365966796875, -6.228515625, -5.8204345703125, -5.412353515625, -5.0042724609375, -4.59619140625, -4.1881103515625, -3.780029296875, -3.3719482421875, -2.9638671875, -2.5557861328125, -2.147705078125, -1.7396240234375, -1.33154296875, -0.9234619140625, -0.515380859375, -0.1072998046875, 0.30078125, 0.7088623046875, 1.116943359375, 1.5250244140625, 1.93310546875, 2.3411865234375, 2.749267578125, 3.1573486328125, 3.5654296875, 3.9735107421875, 4.381591796875, 4.7896728515625, 5.19775390625, 5.6058349609375, 6.013916015625, 6.4219970703125, 6.830078125, 7.2381591796875, 7.646240234375, 8.0543212890625, 8.46240234375, 8.8704833984375, 9.278564453125, 9.6866455078125, 10.0947265625, 10.5028076171875, 10.910888671875, 11.3189697265625, 11.72705078125, 12.1351318359375, 12.543212890625, 12.9512939453125, 13.359375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 5.0, 5.0, 2.0, 9.0, 16.0, 26.0, 48.0, 72.0, 151.0, 186.0, 192.0, 98.0, 73.0, 38.0, 28.0, 22.0, 10.0, 6.0, 7.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.452117919921875, -41.43827438354492, -40.424434661865234, -39.41059112548828, -38.39674758911133, -37.382904052734375, -36.36906433105469, -35.355220794677734, -34.34137725830078, -33.32753372192383, -32.31369400024414, -31.299850463867188, -30.286006927490234, -29.272165298461914, -28.258323669433594, -27.24448013305664, -26.230640411376953, -25.216798782348633, -24.20295524597168, -23.18911361694336, -22.175270080566406, -21.161428451538086, -20.147586822509766, -19.133743286132812, -18.119901657104492, -17.106060028076172, -16.09221649169922, -15.078374862670898, -14.064532279968262, -13.050689697265625, -12.036848068237305, -11.023005485534668, -10.009159088134766, -8.995316505432129, -7.98147439956665, -6.967632293701172, -5.953789710998535, -4.939947128295898, -3.92610502243042, -2.9122629165649414, -1.8984203338623047, -0.8845779895782471, 0.12926435470581055, 1.1431066989898682, 2.156949043273926, 3.1707916259765625, 4.184633731842041, 5.1984758377075195, 6.212318420410156, 7.226161003112793, 8.24000358581543, 9.25384521484375, 10.267687797546387, 11.281530380249023, 12.295372009277344, 13.30921459197998, 14.323057174682617, 15.336899757385254, 16.35074234008789, 17.36458396911621, 18.37842559814453, 19.392269134521484, 20.406110763549805, 21.419952392578125, 22.433795928955078]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 5.0, 16.0, 8.0, 10.0, 7.0, 11.0, 14.0, 14.0, 23.0, 26.0, 30.0, 30.0, 32.0, 38.0, 38.0, 49.0, 38.0, 41.0, 31.0, 42.0, 46.0, 46.0, 28.0, 39.0, 37.0, 42.0, 26.0, 38.0, 28.0, 16.0, 26.0, 30.0, 22.0, 16.0, 11.0, 9.0, 5.0, 3.0, 8.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-33.435340881347656, -32.49299621582031, -31.55065155029297, -30.608306884765625, -29.66596221923828, -28.723617553710938, -27.781272888183594, -26.83892822265625, -25.896583557128906, -24.954238891601562, -24.01189422607422, -23.069549560546875, -22.12720489501953, -21.184860229492188, -20.242515563964844, -19.3001708984375, -18.357826232910156, -17.415481567382812, -16.47313690185547, -15.530792236328125, -14.588447570800781, -13.646102905273438, -12.703758239746094, -11.76141357421875, -10.819068908691406, -9.876724243164062, -8.934379577636719, -7.992034912109375, -7.049690246582031, -6.1073455810546875, -5.165000915527344, -4.22265625, -3.2803096771240234, -2.3379650115966797, -1.395620346069336, -0.4532756805419922, 0.48906898498535156, 1.4314136505126953, 2.373758316040039, 3.316102981567383, 4.258447647094727, 5.20079231262207, 6.143136978149414, 7.085481643676758, 8.027826309204102, 8.970170974731445, 9.912515640258789, 10.854860305786133, 11.797204971313477, 12.73954963684082, 13.681894302368164, 14.624238967895508, 15.566583633422852, 16.508928298950195, 17.45127296447754, 18.393617630004883, 19.335962295532227, 20.27830696105957, 21.220651626586914, 22.162996292114258, 23.1053409576416, 24.047685623168945, 24.99003028869629, 25.932374954223633, 26.874719619750977]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 4.0, 15.0, 17.0, 33.0, 37.0, 49.0, 87.0, 119.0, 144.0, 252.0, 383.0, 642.0, 1114.0, 2277.0, 5082.0, 17427.0, 3833948.0, 304323.0, 17134.0, 5359.0, 2468.0, 1288.0, 745.0, 408.0, 302.0, 163.0, 124.0, 93.0, 53.0, 46.0, 29.0, 22.0, 23.0, 11.0, 5.0, 7.0, 6.0, 9.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.324951171875, -0.3128929138183594, -0.30083465576171875, -0.2887763977050781, -0.2767181396484375, -0.2646598815917969, -0.25260162353515625, -0.24054336547851562, -0.228485107421875, -0.21642684936523438, -0.20436859130859375, -0.19231033325195312, -0.1802520751953125, -0.16819381713867188, -0.15613555908203125, -0.14407730102539062, -0.13201904296875, -0.11996078491210938, -0.10790252685546875, -0.09584426879882812, -0.0837860107421875, -0.07172775268554688, -0.05966949462890625, -0.047611236572265625, -0.035552978515625, -0.023494720458984375, -0.01143646240234375, 0.000621795654296875, 0.0126800537109375, 0.024738311767578125, 0.03679656982421875, 0.048854827880859375, 0.0609130859375, 0.07297134399414062, 0.08502960205078125, 0.09708786010742188, 0.1091461181640625, 0.12120437622070312, 0.13326263427734375, 0.14532089233398438, 0.157379150390625, 0.16943740844726562, 0.18149566650390625, 0.19355392456054688, 0.2056121826171875, 0.21767044067382812, 0.22972869873046875, 0.24178695678710938, 0.25384521484375, 0.2659034729003906, 0.27796173095703125, 0.2900199890136719, 0.3020782470703125, 0.3141365051269531, 0.32619476318359375, 0.3382530212402344, 0.350311279296875, 0.3623695373535156, 0.37442779541015625, 0.3864860534667969, 0.3985443115234375, 0.4106025695800781, 0.42266082763671875, 0.4347190856933594, 0.44677734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 2.0, 2.0, 8.0, 10.0, 6.0, 4.0, 7.0, 5.0, 22.0, 17.0, 682.0, 122.0, 15.0, 13.0, 10.0, 13.0, 9.0, 6.0, 6.0, 3.0, 9.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.136962890625, -0.13256072998046875, -0.1281585693359375, -0.12375640869140625, -0.119354248046875, -0.11495208740234375, -0.1105499267578125, -0.10614776611328125, -0.10174560546875, -0.09734344482421875, -0.0929412841796875, -0.08853912353515625, -0.084136962890625, -0.07973480224609375, -0.0753326416015625, -0.07093048095703125, -0.0665283203125, -0.06212615966796875, -0.0577239990234375, -0.05332183837890625, -0.048919677734375, -0.04451751708984375, -0.0401153564453125, -0.03571319580078125, -0.03131103515625, -0.02690887451171875, -0.0225067138671875, -0.01810455322265625, -0.013702392578125, -0.00930023193359375, -0.0048980712890625, -0.00049591064453125, 0.00390625, 0.00830841064453125, 0.0127105712890625, 0.01711273193359375, 0.021514892578125, 0.02591705322265625, 0.0303192138671875, 0.03472137451171875, 0.03912353515625, 0.04352569580078125, 0.0479278564453125, 0.05233001708984375, 0.056732177734375, 0.06113433837890625, 0.0655364990234375, 0.06993865966796875, 0.0743408203125, 0.07874298095703125, 0.0831451416015625, 0.08754730224609375, 0.091949462890625, 0.09635162353515625, 0.1007537841796875, 0.10515594482421875, 0.10955810546875, 0.11396026611328125, 0.1183624267578125, 0.12276458740234375, 0.127166748046875, 0.13156890869140625, 0.1359710693359375, 0.14037322998046875, 0.144775390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 5.0, 8.0, 8.0, 13.0, 15.0, 21.0, 30.0, 21.0, 50.0, 64.0, 95.0, 157.0, 241.0, 407.0, 694.0, 1248.0, 2399.0, 5460.0, 14331.0, 54357.0, 896162.0, 3105309.0, 80455.0, 19373.0, 7052.0, 3017.0, 1448.0, 773.0, 404.0, 231.0, 130.0, 96.0, 59.0, 43.0, 31.0, 21.0, 18.0, 5.0, 5.0, 8.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.32763671875, -0.3174324035644531, -0.30722808837890625, -0.2970237731933594, -0.2868194580078125, -0.2766151428222656, -0.26641082763671875, -0.2562065124511719, -0.246002197265625, -0.23579788208007812, -0.22559356689453125, -0.21538925170898438, -0.2051849365234375, -0.19498062133789062, -0.18477630615234375, -0.17457199096679688, -0.16436767578125, -0.15416336059570312, -0.14395904541015625, -0.13375473022460938, -0.1235504150390625, -0.11334609985351562, -0.10314178466796875, -0.09293746948242188, -0.082733154296875, -0.07252883911132812, -0.06232452392578125, -0.052120208740234375, -0.0419158935546875, -0.031711578369140625, -0.02150726318359375, -0.011302947998046875, -0.0010986328125, 0.009105682373046875, 0.01930999755859375, 0.029514312744140625, 0.0397186279296875, 0.049922943115234375, 0.06012725830078125, 0.07033157348632812, 0.080535888671875, 0.09074020385742188, 0.10094451904296875, 0.11114883422851562, 0.1213531494140625, 0.13155746459960938, 0.14176177978515625, 0.15196609497070312, 0.16217041015625, 0.17237472534179688, 0.18257904052734375, 0.19278335571289062, 0.2029876708984375, 0.21319198608398438, 0.22339630126953125, 0.23360061645507812, 0.243804931640625, 0.2540092468261719, 0.26421356201171875, 0.2744178771972656, 0.2846221923828125, 0.2948265075683594, 0.30503082275390625, 0.3152351379394531, 0.325439453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 7.0, 7.0, 10.0, 15.0, 13.0, 22.0, 32.0, 47.0, 106.0, 238.0, 951.0, 1881.0, 376.0, 142.0, 73.0, 35.0, 23.0, 18.0, 14.0, 6.0, 7.0, 7.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16455078125, -0.15850448608398438, -0.15245819091796875, -0.14641189575195312, -0.1403656005859375, -0.13431930541992188, -0.12827301025390625, -0.12222671508789062, -0.116180419921875, -0.11013412475585938, -0.10408782958984375, -0.09804153442382812, -0.0919952392578125, -0.08594894409179688, -0.07990264892578125, -0.07385635375976562, -0.06781005859375, -0.061763763427734375, -0.05571746826171875, -0.049671173095703125, -0.0436248779296875, -0.037578582763671875, -0.03153228759765625, -0.025485992431640625, -0.019439697265625, -0.013393402099609375, -0.00734710693359375, -0.001300811767578125, 0.0047454833984375, 0.010791778564453125, 0.01683807373046875, 0.022884368896484375, 0.0289306640625, 0.034976959228515625, 0.04102325439453125, 0.047069549560546875, 0.0531158447265625, 0.059162139892578125, 0.06520843505859375, 0.07125473022460938, 0.077301025390625, 0.08334732055664062, 0.08939361572265625, 0.09543991088867188, 0.1014862060546875, 0.10753250122070312, 0.11357879638671875, 0.11962509155273438, 0.12567138671875, 0.13171768188476562, 0.13776397705078125, 0.14381027221679688, 0.1498565673828125, 0.15590286254882812, 0.16194915771484375, 0.16799545288085938, 0.174041748046875, 0.18008804321289062, 0.18613433837890625, 0.19218063354492188, 0.1982269287109375, 0.20427322387695312, 0.21031951904296875, 0.21636581420898438, 0.222412109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 34.0, 686.0, 271.0, 13.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.102365016937256, -5.991053104400635, -5.8797407150268555, -5.768428802490234, -5.657116889953613, -5.545804977416992, -5.434492588043213, -5.323180675506592, -5.2118682861328125, -5.100556373596191, -4.989243984222412, -4.877932071685791, -4.76662015914917, -4.655307769775391, -4.5439958572387695, -4.432683944702148, -4.321372032165527, -4.210060119628906, -4.098747730255127, -3.987435817718506, -3.8761239051818848, -3.7648117542266846, -3.6534996032714844, -3.5421876907348633, -3.430875539779663, -3.319563388824463, -3.208251476287842, -3.0969393253326416, -2.9856271743774414, -2.8743152618408203, -2.76300311088562, -2.65169095993042, -2.540379285812378, -2.4290671348571777, -2.3177552223205566, -2.2064430713653564, -2.0951309204101562, -1.9838190078735352, -1.872506856918335, -1.7611948251724243, -1.6498827934265137, -1.538570761680603, -1.4272587299346924, -1.3159465789794922, -1.2046345472335815, -1.093322515487671, -0.9820104241371155, -0.8706983327865601, -0.7593863010406494, -0.6480742692947388, -0.5367621779441833, -0.4254501163959503, -0.3141380548477173, -0.20282602310180664, -0.09151393175125122, 0.0197981595993042, 0.13111019134521484, 0.24242225289344788, 0.3537343144416809, 0.46504637598991394, 0.576358437538147, 0.6876704692840576, 0.798982560634613, 0.9102946519851685, 1.021606683731079]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 5.0, 20.0, 19.0, 13.0, 31.0, 30.0, 48.0, 71.0, 61.0, 82.0, 82.0, 93.0, 71.0, 70.0, 46.0, 62.0, 53.0, 35.0, 16.0, 12.0, 16.0, 13.0, 4.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7848069667816162, -0.7634256482124329, -0.7420442700386047, -0.7206629514694214, -0.6992815732955933, -0.6779002547264099, -0.6565189361572266, -0.6351375579833984, -0.6137562394142151, -0.5923749208450317, -0.5709935426712036, -0.5496122241020203, -0.5282309055328369, -0.5068495273590088, -0.48546820878982544, -0.4640868604183197, -0.44270551204681396, -0.4213241636753082, -0.3999428153038025, -0.37856149673461914, -0.3571801483631134, -0.33579879999160767, -0.3144174814224243, -0.2930361330509186, -0.27165478467941284, -0.2502734363079071, -0.22889210283756256, -0.20751076936721802, -0.18612942099571228, -0.16474807262420654, -0.143366739153862, -0.12198540568351746, -0.1006041169166565, -0.07922277599573135, -0.05784143507480621, -0.03646009415388107, -0.015078753232955933, 0.006302587687969208, 0.027683928608894348, 0.04906526207923889, 0.07044661045074463, 0.09182795137166977, 0.11320929229259491, 0.13459062576293945, 0.1559719741344452, 0.17735332250595093, 0.19873465597629547, 0.22011598944664001, 0.24149733781814575, 0.2628786861896515, 0.2842600345611572, 0.3056413531303406, 0.3270227015018463, 0.34840404987335205, 0.3697853684425354, 0.39116671681404114, 0.4125480651855469, 0.4339294135570526, 0.45531076192855835, 0.4766920804977417, 0.49807342886924744, 0.5194547772407532, 0.5408360958099365, 0.5622174739837646, 0.583598792552948]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 6.0, 13.0, 8.0, 13.0, 25.0, 21.0, 38.0, 72.0, 86.0, 108.0, 160.0, 259.0, 338.0, 560.0, 923.0, 1427.0, 2408.0, 4179.0, 7769.0, 16047.0, 38189.0, 881625.0, 52500.0, 19903.0, 9573.0, 4851.0, 2870.0, 1632.0, 972.0, 677.0, 425.0, 257.0, 195.0, 125.0, 83.0, 66.0, 43.0, 25.0, 33.0, 23.0, 9.0, 3.0, 4.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61572265625, -0.59344482421875, -0.5711669921875, -0.54888916015625, -0.526611328125, -0.50433349609375, -0.4820556640625, -0.45977783203125, -0.4375, -0.41522216796875, -0.3929443359375, -0.37066650390625, -0.348388671875, -0.32611083984375, -0.3038330078125, -0.28155517578125, -0.25927734375, -0.23699951171875, -0.2147216796875, -0.19244384765625, -0.170166015625, -0.14788818359375, -0.1256103515625, -0.10333251953125, -0.0810546875, -0.05877685546875, -0.0364990234375, -0.01422119140625, 0.008056640625, 0.03033447265625, 0.0526123046875, 0.07489013671875, 0.09716796875, 0.11944580078125, 0.1417236328125, 0.16400146484375, 0.186279296875, 0.20855712890625, 0.2308349609375, 0.25311279296875, 0.275390625, 0.29766845703125, 0.3199462890625, 0.34222412109375, 0.364501953125, 0.38677978515625, 0.4090576171875, 0.43133544921875, 0.45361328125, 0.47589111328125, 0.4981689453125, 0.52044677734375, 0.542724609375, 0.56500244140625, 0.5872802734375, 0.60955810546875, 0.6318359375, 0.65411376953125, 0.6763916015625, 0.69866943359375, 0.720947265625, 0.74322509765625, 0.7655029296875, 0.78778076171875, 0.81005859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 2.0, 9.0, 8.0, 22.0, 19.0, 481.0, 313.0, 15.0, 16.0, 10.0, 13.0, 5.0, 11.0, 6.0, 2.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.1248779296875, -0.1207275390625, -0.1165771484375, -0.1124267578125, -0.1082763671875, -0.1041259765625, -0.0999755859375, -0.0958251953125, -0.0916748046875, -0.0875244140625, -0.0833740234375, -0.0792236328125, -0.0750732421875, -0.0709228515625, -0.0667724609375, -0.0626220703125, -0.0584716796875, -0.0543212890625, -0.0501708984375, -0.0460205078125, -0.0418701171875, -0.0377197265625, -0.0335693359375, -0.0294189453125, -0.0252685546875, -0.0211181640625, -0.0169677734375, -0.0128173828125, -0.0086669921875, -0.0045166015625, -0.0003662109375, 0.0037841796875, 0.0079345703125, 0.0120849609375, 0.0162353515625, 0.0203857421875, 0.0245361328125, 0.0286865234375, 0.0328369140625, 0.0369873046875, 0.0411376953125, 0.0452880859375, 0.0494384765625, 0.0535888671875, 0.0577392578125, 0.0618896484375, 0.0660400390625, 0.0701904296875, 0.0743408203125, 0.0784912109375, 0.0826416015625, 0.0867919921875, 0.0909423828125, 0.0950927734375, 0.0992431640625, 0.1033935546875, 0.1075439453125, 0.1116943359375, 0.1158447265625, 0.1199951171875, 0.1241455078125, 0.1282958984375, 0.1324462890625, 0.1365966796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 5.0, 6.0, 11.0, 9.0, 17.0, 15.0, 22.0, 32.0, 39.0, 66.0, 66.0, 91.0, 110.0, 175.0, 230.0, 371.0, 521.0, 999.0, 1880.0, 3993.0, 9593.0, 26680.0, 85742.0, 349238.0, 416782.0, 101143.0, 30403.0, 10965.0, 4372.0, 2009.0, 1016.0, 577.0, 379.0, 279.0, 188.0, 113.0, 110.0, 67.0, 51.0, 46.0, 39.0, 31.0, 23.0, 12.0, 12.0, 9.0, 2.0, 2.0, 7.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.419189453125, -0.40723419189453125, -0.3952789306640625, -0.38332366943359375, -0.371368408203125, -0.35941314697265625, -0.3474578857421875, -0.33550262451171875, -0.32354736328125, -0.31159210205078125, -0.2996368408203125, -0.28768157958984375, -0.275726318359375, -0.26377105712890625, -0.2518157958984375, -0.23986053466796875, -0.2279052734375, -0.21595001220703125, -0.2039947509765625, -0.19203948974609375, -0.180084228515625, -0.16812896728515625, -0.1561737060546875, -0.14421844482421875, -0.13226318359375, -0.12030792236328125, -0.1083526611328125, -0.09639739990234375, -0.084442138671875, -0.07248687744140625, -0.0605316162109375, -0.04857635498046875, -0.03662109375, -0.02466583251953125, -0.0127105712890625, -0.00075531005859375, 0.011199951171875, 0.02315521240234375, 0.0351104736328125, 0.04706573486328125, 0.05902099609375, 0.07097625732421875, 0.0829315185546875, 0.09488677978515625, 0.106842041015625, 0.11879730224609375, 0.1307525634765625, 0.14270782470703125, 0.1546630859375, 0.16661834716796875, 0.1785736083984375, 0.19052886962890625, 0.202484130859375, 0.21443939208984375, 0.2263946533203125, 0.23834991455078125, 0.25030517578125, 0.26226043701171875, 0.2742156982421875, 0.28617095947265625, 0.298126220703125, 0.31008148193359375, 0.3220367431640625, 0.33399200439453125, 0.345947265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 15.0, 13.0, 9.0, 10.0, 15.0, 18.0, 18.0, 29.0, 25.0, 39.0, 29.0, 34.0, 41.0, 41.0, 42.0, 31.0, 43.0, 50.0, 48.0, 44.0, 41.0, 28.0, 32.0, 45.0, 39.0, 26.0, 16.0, 25.0, 19.0, 21.0, 14.0, 11.0, 15.0, 15.0, 13.0, 6.0, 5.0, 2.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4716796875, -0.45647430419921875, -0.4412689208984375, -0.42606353759765625, -0.410858154296875, -0.39565277099609375, -0.3804473876953125, -0.36524200439453125, -0.35003662109375, -0.33483123779296875, -0.3196258544921875, -0.30442047119140625, -0.289215087890625, -0.27400970458984375, -0.2588043212890625, -0.24359893798828125, -0.2283935546875, -0.21318817138671875, -0.1979827880859375, -0.18277740478515625, -0.167572021484375, -0.15236663818359375, -0.1371612548828125, -0.12195587158203125, -0.10675048828125, -0.09154510498046875, -0.0763397216796875, -0.06113433837890625, -0.045928955078125, -0.03072357177734375, -0.0155181884765625, -0.00031280517578125, 0.014892578125, 0.03009796142578125, 0.0453033447265625, 0.06050872802734375, 0.075714111328125, 0.09091949462890625, 0.1061248779296875, 0.12133026123046875, 0.13653564453125, 0.15174102783203125, 0.1669464111328125, 0.18215179443359375, 0.197357177734375, 0.21256256103515625, 0.2277679443359375, 0.24297332763671875, 0.2581787109375, 0.27338409423828125, 0.2885894775390625, 0.30379486083984375, 0.319000244140625, 0.33420562744140625, 0.3494110107421875, 0.36461639404296875, 0.37982177734375, 0.39502716064453125, 0.4102325439453125, 0.42543792724609375, 0.440643310546875, 0.45584869384765625, 0.4710540771484375, 0.48625946044921875, 0.50146484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 14.0, 13.0, 28.0, 22.0, 23.0, 45.0, 88.0, 130.0, 215.0, 333.0, 754.0, 1747.0, 4580.0, 15593.0, 122661.0, 830998.0, 54888.0, 10422.0, 3257.0, 1320.0, 634.0, 305.0, 164.0, 89.0, 73.0, 38.0, 31.0, 22.0, 11.0, 12.0, 8.0, 5.0, 7.0, 0.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.45849609375, -0.44654083251953125, -0.4345855712890625, -0.42263031005859375, -0.410675048828125, -0.39871978759765625, -0.3867645263671875, -0.37480926513671875, -0.36285400390625, -0.35089874267578125, -0.3389434814453125, -0.32698822021484375, -0.315032958984375, -0.30307769775390625, -0.2911224365234375, -0.27916717529296875, -0.2672119140625, -0.25525665283203125, -0.2433013916015625, -0.23134613037109375, -0.219390869140625, -0.20743560791015625, -0.1954803466796875, -0.18352508544921875, -0.17156982421875, -0.15961456298828125, -0.1476593017578125, -0.13570404052734375, -0.123748779296875, -0.11179351806640625, -0.0998382568359375, -0.08788299560546875, -0.075927734375, -0.06397247314453125, -0.0520172119140625, -0.04006195068359375, -0.028106689453125, -0.01615142822265625, -0.0041961669921875, 0.00775909423828125, 0.01971435546875, 0.03166961669921875, 0.0436248779296875, 0.05558013916015625, 0.067535400390625, 0.07949066162109375, 0.0914459228515625, 0.10340118408203125, 0.1153564453125, 0.12731170654296875, 0.1392669677734375, 0.15122222900390625, 0.163177490234375, 0.17513275146484375, 0.1870880126953125, 0.19904327392578125, 0.21099853515625, 0.22295379638671875, 0.2349090576171875, 0.24686431884765625, 0.258819580078125, 0.27077484130859375, 0.2827301025390625, 0.29468536376953125, 0.306640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 8.0, 10.0, 9.0, 17.0, 22.0, 32.0, 59.0, 78.0, 107.0, 152.0, 140.0, 131.0, 75.0, 56.0, 30.0, 27.0, 20.0, 8.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.698204040527344e-05, -5.565676838159561e-05, -5.4331496357917786e-05, -5.300622433423996e-05, -5.1680952310562134e-05, -5.035568028688431e-05, -4.903040826320648e-05, -4.7705136239528656e-05, -4.637986421585083e-05, -4.5054592192173004e-05, -4.372932016849518e-05, -4.240404814481735e-05, -4.1078776121139526e-05, -3.97535040974617e-05, -3.8428232073783875e-05, -3.710296005010605e-05, -3.577768802642822e-05, -3.44524160027504e-05, -3.312714397907257e-05, -3.1801871955394745e-05, -3.047659993171692e-05, -2.9151327908039093e-05, -2.7826055884361267e-05, -2.650078386068344e-05, -2.5175511837005615e-05, -2.385023981332779e-05, -2.2524967789649963e-05, -2.1199695765972137e-05, -1.987442374229431e-05, -1.8549151718616486e-05, -1.722387969493866e-05, -1.5898607671260834e-05, -1.4573335647583008e-05, -1.3248063623905182e-05, -1.1922791600227356e-05, -1.059751957654953e-05, -9.272247552871704e-06, -7.946975529193878e-06, -6.621703505516052e-06, -5.296431481838226e-06, -3.9711594581604e-06, -2.6458874344825745e-06, -1.3206154108047485e-06, 4.6566128730773926e-09, 1.3299286365509033e-06, 2.6552006602287292e-06, 3.980472683906555e-06, 5.305744707584381e-06, 6.631016731262207e-06, 7.956288754940033e-06, 9.281560778617859e-06, 1.0606832802295685e-05, 1.193210482597351e-05, 1.3257376849651337e-05, 1.4582648873329163e-05, 1.590792089700699e-05, 1.7233192920684814e-05, 1.855846494436264e-05, 1.9883736968040466e-05, 2.1209008991718292e-05, 2.2534281015396118e-05, 2.3859553039073944e-05, 2.518482506275177e-05, 2.6510097086429596e-05, 2.7835369110107422e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 9.0, 5.0, 12.0, 16.0, 21.0, 39.0, 68.0, 100.0, 181.0, 395.0, 869.0, 2573.0, 10074.0, 69350.0, 789254.0, 153373.0, 16353.0, 3701.0, 1165.0, 454.0, 232.0, 118.0, 78.0, 41.0, 32.0, 13.0, 8.0, 11.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4582099914550781, -0.44498443603515625, -0.4317588806152344, -0.4185333251953125, -0.4053077697753906, -0.39208221435546875, -0.3788566589355469, -0.365631103515625, -0.3524055480957031, -0.33917999267578125, -0.3259544372558594, -0.3127288818359375, -0.2995033264160156, -0.28627777099609375, -0.2730522155761719, -0.25982666015625, -0.24660110473632812, -0.23337554931640625, -0.22014999389648438, -0.2069244384765625, -0.19369888305664062, -0.18047332763671875, -0.16724777221679688, -0.154022216796875, -0.14079666137695312, -0.12757110595703125, -0.11434555053710938, -0.1011199951171875, -0.08789443969726562, -0.07466888427734375, -0.061443328857421875, -0.0482177734375, -0.034992218017578125, -0.02176666259765625, -0.008541107177734375, 0.0046844482421875, 0.017910003662109375, 0.03113555908203125, 0.044361114501953125, 0.057586669921875, 0.07081222534179688, 0.08403778076171875, 0.09726333618164062, 0.1104888916015625, 0.12371444702148438, 0.13694000244140625, 0.15016555786132812, 0.16339111328125, 0.17661666870117188, 0.18984222412109375, 0.20306777954101562, 0.2162933349609375, 0.22951889038085938, 0.24274444580078125, 0.2559700012207031, 0.269195556640625, 0.2824211120605469, 0.29564666748046875, 0.3088722229003906, 0.3220977783203125, 0.3353233337402344, 0.34854888916015625, 0.3617744445800781, 0.375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 7.0, 2.0, 5.0, 11.0, 7.0, 14.0, 20.0, 21.0, 26.0, 27.0, 32.0, 50.0, 57.0, 57.0, 77.0, 62.0, 64.0, 74.0, 57.0, 59.0, 55.0, 37.0, 25.0, 32.0, 25.0, 21.0, 19.0, 10.0, 10.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.251220703125, -0.24225997924804688, -0.23329925537109375, -0.22433853149414062, -0.2153778076171875, -0.20641708374023438, -0.19745635986328125, -0.18849563598632812, -0.179534912109375, -0.17057418823242188, -0.16161346435546875, -0.15265274047851562, -0.1436920166015625, -0.13473129272460938, -0.12577056884765625, -0.11680984497070312, -0.10784912109375, -0.09888839721679688, -0.08992767333984375, -0.08096694946289062, -0.0720062255859375, -0.06304550170898438, -0.05408477783203125, -0.045124053955078125, -0.036163330078125, -0.027202606201171875, -0.01824188232421875, -0.009281158447265625, -0.0003204345703125, 0.008640289306640625, 0.01760101318359375, 0.026561737060546875, 0.0355224609375, 0.044483184814453125, 0.05344390869140625, 0.062404632568359375, 0.0713653564453125, 0.08032608032226562, 0.08928680419921875, 0.09824752807617188, 0.107208251953125, 0.11616897583007812, 0.12512969970703125, 0.13409042358398438, 0.1430511474609375, 0.15201187133789062, 0.16097259521484375, 0.16993331909179688, 0.17889404296875, 0.18785476684570312, 0.19681549072265625, 0.20577621459960938, 0.2147369384765625, 0.22369766235351562, 0.23265838623046875, 0.24161911010742188, 0.250579833984375, 0.2595405578613281, 0.26850128173828125, 0.2774620056152344, 0.2864227294921875, 0.2953834533691406, 0.30434417724609375, 0.3133049011230469, 0.322265625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 16.0, 52.0, 246.0, 532.0, 104.0, 30.0, 11.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.320096015930176, -9.954046249389648, -9.587996482849121, -9.221946716308594, -8.855896949768066, -8.489847183227539, -8.123798370361328, -7.757748603820801, -7.391698837280273, -7.025649070739746, -6.659599304199219, -6.293549537658691, -5.927500247955322, -5.561450481414795, -5.195400714874268, -4.829351425170898, -4.463301181793213, -4.0972514152526855, -3.7312018871307373, -3.36515212059021, -2.9991025924682617, -2.6330528259277344, -2.267003059387207, -1.9009535312652588, -1.5349037647247314, -1.1688541173934937, -0.8028044104576111, -0.4367547035217285, -0.07070505619049072, 0.29534459114074707, 0.6613943576812744, 1.0274438858032227, 1.39349365234375, 1.7595432996749878, 2.1255929470062256, 2.491642713546753, 2.857692241668701, 3.2237420082092285, 3.589791774749756, 3.955841302871704, 4.321890830993652, 4.68794059753418, 5.053990364074707, 5.420040130615234, 5.7860894203186035, 6.152139186859131, 6.518188953399658, 6.884238243103027, 7.250288486480713, 7.61633825302124, 7.982388019561768, 8.348437309265137, 8.714487075805664, 9.080536842346191, 9.446586608886719, 9.812636375427246, 10.178686141967773, 10.5447359085083, 10.910785675048828, 11.276835441589355, 11.642885208129883, 12.008934020996094, 12.374984741210938, 12.741033554077148, 13.107083320617676]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 3.0, 5.0, 11.0, 8.0, 8.0, 12.0, 16.0, 21.0, 34.0, 77.0, 124.0, 148.0, 171.0, 137.0, 81.0, 51.0, 21.0, 15.0, 14.0, 5.0, 10.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.580841064453125, -10.227663040161133, -9.874485969543457, -9.521307945251465, -9.168130874633789, -8.814952850341797, -8.461774826049805, -8.108597755432129, -7.755420207977295, -7.402242660522461, -7.049065113067627, -6.695887565612793, -6.342709541320801, -5.989532470703125, -5.636354446411133, -5.283176898956299, -4.929999351501465, -4.576821804046631, -4.223644256591797, -3.870466470718384, -3.51728892326355, -3.164111375808716, -2.8109335899353027, -2.4577560424804688, -2.1045784950256348, -1.7514009475708008, -1.3982232809066772, -1.0450456142425537, -0.6918680667877197, -0.33869051933288574, 0.014487266540527344, 0.36766481399536133, 0.7208414077758789, 1.074018955230713, 1.4271966218948364, 1.78037428855896, 2.133551836013794, 2.486729383468628, 2.839907169342041, 3.193084716796875, 3.546262264251709, 3.899439811706543, 4.252617359161377, 4.605794906616211, 4.958972930908203, 5.312150001525879, 5.665328025817871, 6.018505573272705, 6.371683120727539, 6.724860668182373, 7.078038215637207, 7.431216239929199, 7.784393310546875, 8.137571334838867, 8.49074935913086, 8.843926429748535, 9.197103500366211, 9.550281524658203, 9.903458595275879, 10.256636619567871, 10.609813690185547, 10.962991714477539, 11.316169738769531, 11.669346809387207, 12.0225248336792]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 9.0, 9.0, 21.0, 24.0, 49.0, 57.0, 142.0, 270.0, 473.0, 1133.0, 2389.0, 5900.0, 17000.0, 66682.0, 3840788.0, 212236.0, 29859.0, 9585.0, 3885.0, 1820.0, 875.0, 449.0, 270.0, 129.0, 79.0, 44.0, 26.0, 18.0, 10.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1025390625, -1.066680908203125, -1.03082275390625, -0.994964599609375, -0.9591064453125, -0.923248291015625, -0.88739013671875, -0.851531982421875, -0.815673828125, -0.779815673828125, -0.74395751953125, -0.708099365234375, -0.6722412109375, -0.636383056640625, -0.60052490234375, -0.564666748046875, -0.52880859375, -0.492950439453125, -0.45709228515625, -0.421234130859375, -0.3853759765625, -0.349517822265625, -0.31365966796875, -0.277801513671875, -0.241943359375, -0.206085205078125, -0.17022705078125, -0.134368896484375, -0.0985107421875, -0.062652587890625, -0.02679443359375, 0.009063720703125, 0.044921875, 0.080780029296875, 0.11663818359375, 0.152496337890625, 0.1883544921875, 0.224212646484375, 0.26007080078125, 0.295928955078125, 0.331787109375, 0.367645263671875, 0.40350341796875, 0.439361572265625, 0.4752197265625, 0.511077880859375, 0.54693603515625, 0.582794189453125, 0.61865234375, 0.654510498046875, 0.69036865234375, 0.726226806640625, 0.7620849609375, 0.797943115234375, 0.83380126953125, 0.869659423828125, 0.905517578125, 0.941375732421875, 0.97723388671875, 1.013092041015625, 1.0489501953125, 1.084808349609375, 1.12066650390625, 1.156524658203125, 1.1923828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 6.0, 6.0, 7.0, 7.0, 5.0, 9.0, 7.0, 23.0, 48.0, 133.0, 276.0, 236.0, 93.0, 25.0, 9.0, 7.0, 7.0, 10.0, 6.0, 7.0, 5.0, 7.0, 9.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0748291015625, -0.07239627838134766, -0.06996345520019531, -0.06753063201904297, -0.06509780883789062, -0.06266498565673828, -0.06023216247558594, -0.057799339294433594, -0.05536651611328125, -0.052933692932128906, -0.05050086975097656, -0.04806804656982422, -0.045635223388671875, -0.04320240020751953, -0.04076957702636719, -0.038336753845214844, -0.0359039306640625, -0.033471107482910156, -0.031038284301757812, -0.02860546112060547, -0.026172637939453125, -0.02373981475830078, -0.021306991577148438, -0.018874168395996094, -0.01644134521484375, -0.014008522033691406, -0.011575698852539062, -0.009142875671386719, -0.006710052490234375, -0.004277229309082031, -0.0018444061279296875, 0.0005884170532226562, 0.003021240234375, 0.005454063415527344, 0.007886886596679688, 0.010319709777832031, 0.012752532958984375, 0.015185356140136719, 0.017618179321289062, 0.020051002502441406, 0.02248382568359375, 0.024916648864746094, 0.027349472045898438, 0.02978229522705078, 0.032215118408203125, 0.03464794158935547, 0.03708076477050781, 0.039513587951660156, 0.0419464111328125, 0.044379234313964844, 0.04681205749511719, 0.04924488067626953, 0.051677703857421875, 0.05411052703857422, 0.05654335021972656, 0.058976173400878906, 0.06140899658203125, 0.0638418197631836, 0.06627464294433594, 0.06870746612548828, 0.07114028930664062, 0.07357311248779297, 0.07600593566894531, 0.07843875885009766, 0.08087158203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 14.0, 8.0, 8.0, 19.0, 19.0, 26.0, 52.0, 64.0, 108.0, 161.0, 278.0, 527.0, 1028.0, 2179.0, 5672.0, 18005.0, 98117.0, 3149473.0, 843045.0, 54921.0, 12414.0, 4304.0, 1770.0, 880.0, 425.0, 249.0, 155.0, 112.0, 72.0, 47.0, 33.0, 31.0, 13.0, 9.0, 12.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.576171875, -0.5554885864257812, -0.5348052978515625, -0.5141220092773438, -0.493438720703125, -0.47275543212890625, -0.4520721435546875, -0.43138885498046875, -0.41070556640625, -0.39002227783203125, -0.3693389892578125, -0.34865570068359375, -0.327972412109375, -0.30728912353515625, -0.2866058349609375, -0.26592254638671875, -0.2452392578125, -0.22455596923828125, -0.2038726806640625, -0.18318939208984375, -0.162506103515625, -0.14182281494140625, -0.1211395263671875, -0.10045623779296875, -0.07977294921875, -0.05908966064453125, -0.0384063720703125, -0.01772308349609375, 0.002960205078125, 0.02364349365234375, 0.0443267822265625, 0.06501007080078125, 0.085693359375, 0.10637664794921875, 0.1270599365234375, 0.14774322509765625, 0.168426513671875, 0.18910980224609375, 0.2097930908203125, 0.23047637939453125, 0.25115966796875, 0.27184295654296875, 0.2925262451171875, 0.31320953369140625, 0.333892822265625, 0.35457611083984375, 0.3752593994140625, 0.39594268798828125, 0.4166259765625, 0.43730926513671875, 0.4579925537109375, 0.47867584228515625, 0.499359130859375, 0.5200424194335938, 0.5407257080078125, 0.5614089965820312, 0.58209228515625, 0.6027755737304688, 0.6234588623046875, 0.6441421508789062, 0.664825439453125, 0.6855087280273438, 0.7061920166015625, 0.7268753051757812, 0.74755859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 5.0, 8.0, 13.0, 24.0, 29.0, 34.0, 45.0, 86.0, 143.0, 250.0, 779.0, 1627.0, 492.0, 231.0, 110.0, 50.0, 35.0, 27.0, 21.0, 11.0, 8.0, 7.0, 7.0, 3.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12465667724609375, -0.1199188232421875, -0.11518096923828125, -0.110443115234375, -0.10570526123046875, -0.1009674072265625, -0.09622955322265625, -0.09149169921875, -0.08675384521484375, -0.0820159912109375, -0.07727813720703125, -0.072540283203125, -0.06780242919921875, -0.0630645751953125, -0.05832672119140625, -0.0535888671875, -0.04885101318359375, -0.0441131591796875, -0.03937530517578125, -0.034637451171875, -0.02989959716796875, -0.0251617431640625, -0.02042388916015625, -0.01568603515625, -0.01094818115234375, -0.0062103271484375, -0.00147247314453125, 0.003265380859375, 0.00800323486328125, 0.0127410888671875, 0.01747894287109375, 0.022216796875, 0.02695465087890625, 0.0316925048828125, 0.03643035888671875, 0.041168212890625, 0.04590606689453125, 0.0506439208984375, 0.05538177490234375, 0.06011962890625, 0.06485748291015625, 0.0695953369140625, 0.07433319091796875, 0.079071044921875, 0.08380889892578125, 0.0885467529296875, 0.09328460693359375, 0.0980224609375, 0.10276031494140625, 0.1074981689453125, 0.11223602294921875, 0.116973876953125, 0.12171173095703125, 0.1264495849609375, 0.13118743896484375, 0.13592529296875, 0.14066314697265625, 0.1454010009765625, 0.15013885498046875, 0.154876708984375, 0.15961456298828125, 0.1643524169921875, 0.16909027099609375, 0.173828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 12.0, 205.0, 717.0, 58.0, 7.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1674286127090454, -1.0536460876464844, -0.9398636817932129, -0.8260812163352966, -0.7122987508773804, -0.5985162854194641, -0.48473381996154785, -0.3709513545036316, -0.25716888904571533, -0.14338642358779907, -0.029603958129882812, 0.08417850732803345, 0.1979609727859497, 0.31174343824386597, 0.4255259037017822, 0.5393083691596985, 0.6530908346176147, 0.766873300075531, 0.8806557655334473, 0.9944382309913635, 1.1082206964492798, 1.2220032215118408, 1.3357856273651123, 1.4495680332183838, 1.5633505582809448, 1.6771330833435059, 1.7909154891967773, 1.9046978950500488, 2.0184803009033203, 2.132262945175171, 2.2460453510284424, 2.359827756881714, 2.4736104011535645, 2.587392807006836, 2.7011752128601074, 2.814957857131958, 2.9287402629852295, 3.042522668838501, 3.1563053131103516, 3.270087718963623, 3.3838701248168945, 3.497652530670166, 3.6114349365234375, 3.725217580795288, 3.8389999866485596, 3.952782392501831, 4.066565036773682, 4.180347442626953, 4.294129848480225, 4.407912254333496, 4.521694660186768, 4.635477066040039, 4.749259948730469, 4.86304235458374, 4.976824760437012, 5.090607166290283, 5.204389572143555, 5.318171977996826, 5.431954383850098, 5.545736789703369, 5.659519195556641, 5.77330207824707, 5.887084484100342, 6.000866889953613, 6.114649295806885]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 5.0, 4.0, 10.0, 9.0, 17.0, 20.0, 32.0, 33.0, 49.0, 58.0, 61.0, 75.0, 81.0, 92.0, 94.0, 72.0, 68.0, 37.0, 42.0, 25.0, 22.0, 13.0, 12.0, 15.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7323246598243713, -0.7118960022926331, -0.69146728515625, -0.6710386276245117, -0.6506099104881287, -0.6301812529563904, -0.6097525358200073, -0.589323878288269, -0.5688952207565308, -0.5484665632247925, -0.5280378460884094, -0.5076091885566711, -0.4871804714202881, -0.4667518138885498, -0.44632312655448914, -0.42589443922042847, -0.4054657220840454, -0.38503703474998474, -0.3646083474159241, -0.3441796600818634, -0.32375097274780273, -0.30332231521606445, -0.2828936278820038, -0.2624649405479431, -0.24203625321388245, -0.22160756587982178, -0.2011788785457611, -0.18075020611286163, -0.16032151877880096, -0.1398928314447403, -0.11946415156126022, -0.09903547167778015, -0.07860672473907471, -0.05817804113030434, -0.037749357521533966, -0.017320673912763596, 0.003108009696006775, 0.023536697030067444, 0.043965376913547516, 0.06439405679702759, 0.08482274413108826, 0.10525143146514893, 0.1256801187992096, 0.14610879123210907, 0.16653747856616974, 0.1869661659002304, 0.20739483833312988, 0.22782352566719055, 0.24825221300125122, 0.2686809003353119, 0.28910958766937256, 0.3095382750034332, 0.3299669623374939, 0.3503956198692322, 0.37082430720329285, 0.3912529945373535, 0.4116816818714142, 0.43211036920547485, 0.4525390565395355, 0.4729677438735962, 0.4933964014053345, 0.5138251185417175, 0.5342537760734558, 0.5546824932098389, 0.5751111507415771]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 8.0, 5.0, 14.0, 19.0, 26.0, 36.0, 35.0, 78.0, 108.0, 134.0, 212.0, 345.0, 563.0, 804.0, 1341.0, 2185.0, 3612.0, 6290.0, 11164.0, 21350.0, 60020.0, 583635.0, 278218.0, 38795.0, 16775.0, 9222.0, 5275.0, 3092.0, 1899.0, 1190.0, 699.0, 483.0, 304.0, 180.0, 123.0, 87.0, 57.0, 44.0, 30.0, 28.0, 11.0, 14.0, 17.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.45849609375, -0.4449462890625, -0.431396484375, -0.4178466796875, -0.404296875, -0.3907470703125, -0.377197265625, -0.3636474609375, -0.35009765625, -0.3365478515625, -0.322998046875, -0.3094482421875, -0.2958984375, -0.2823486328125, -0.268798828125, -0.2552490234375, -0.24169921875, -0.2281494140625, -0.214599609375, -0.2010498046875, -0.1875, -0.1739501953125, -0.160400390625, -0.1468505859375, -0.13330078125, -0.1197509765625, -0.106201171875, -0.0926513671875, -0.0791015625, -0.0655517578125, -0.052001953125, -0.0384521484375, -0.02490234375, -0.0113525390625, 0.002197265625, 0.0157470703125, 0.029296875, 0.0428466796875, 0.056396484375, 0.0699462890625, 0.08349609375, 0.0970458984375, 0.110595703125, 0.1241455078125, 0.1376953125, 0.1512451171875, 0.164794921875, 0.1783447265625, 0.19189453125, 0.2054443359375, 0.218994140625, 0.2325439453125, 0.24609375, 0.2596435546875, 0.273193359375, 0.2867431640625, 0.30029296875, 0.3138427734375, 0.327392578125, 0.3409423828125, 0.3544921875, 0.3680419921875, 0.381591796875, 0.3951416015625, 0.40869140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 7.0, 8.0, 6.0, 11.0, 8.0, 11.0, 29.0, 48.0, 115.0, 171.0, 215.0, 146.0, 67.0, 37.0, 18.0, 8.0, 10.0, 7.0, 6.0, 6.0, 9.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0814208984375, -0.07910823822021484, -0.07679557800292969, -0.07448291778564453, -0.07217025756835938, -0.06985759735107422, -0.06754493713378906, -0.0652322769165039, -0.06291961669921875, -0.060606956481933594, -0.05829429626464844, -0.05598163604736328, -0.053668975830078125, -0.05135631561279297, -0.04904365539550781, -0.046730995178222656, -0.0444183349609375, -0.042105674743652344, -0.03979301452636719, -0.03748035430908203, -0.035167694091796875, -0.03285503387451172, -0.030542373657226562, -0.028229713439941406, -0.02591705322265625, -0.023604393005371094, -0.021291732788085938, -0.01897907257080078, -0.016666412353515625, -0.014353752136230469, -0.012041091918945312, -0.009728431701660156, -0.007415771484375, -0.005103111267089844, -0.0027904510498046875, -0.00047779083251953125, 0.001834869384765625, 0.004147529602050781, 0.0064601898193359375, 0.008772850036621094, 0.01108551025390625, 0.013398170471191406, 0.015710830688476562, 0.01802349090576172, 0.020336151123046875, 0.02264881134033203, 0.024961471557617188, 0.027274131774902344, 0.0295867919921875, 0.031899452209472656, 0.03421211242675781, 0.03652477264404297, 0.038837432861328125, 0.04115009307861328, 0.04346275329589844, 0.045775413513183594, 0.04808807373046875, 0.050400733947753906, 0.05271339416503906, 0.05502605438232422, 0.057338714599609375, 0.05965137481689453, 0.06196403503417969, 0.06427669525146484, 0.06658935546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 7.0, 13.0, 33.0, 67.0, 139.0, 425.0, 2250.0, 103426.0, 925337.0, 15523.0, 890.0, 245.0, 96.0, 56.0, 14.0, 14.0, 6.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.306640625, -1.2661895751953125, -1.225738525390625, -1.1852874755859375, -1.14483642578125, -1.1043853759765625, -1.063934326171875, -1.0234832763671875, -0.9830322265625, -0.9425811767578125, -0.902130126953125, -0.8616790771484375, -0.82122802734375, -0.7807769775390625, -0.740325927734375, -0.6998748779296875, -0.659423828125, -0.6189727783203125, -0.578521728515625, -0.5380706787109375, -0.49761962890625, -0.4571685791015625, -0.416717529296875, -0.3762664794921875, -0.3358154296875, -0.2953643798828125, -0.254913330078125, -0.2144622802734375, -0.17401123046875, -0.1335601806640625, -0.093109130859375, -0.0526580810546875, -0.01220703125, 0.0282440185546875, 0.068695068359375, 0.1091461181640625, 0.14959716796875, 0.1900482177734375, 0.230499267578125, 0.2709503173828125, 0.3114013671875, 0.3518524169921875, 0.392303466796875, 0.4327545166015625, 0.47320556640625, 0.5136566162109375, 0.554107666015625, 0.5945587158203125, 0.635009765625, 0.6754608154296875, 0.715911865234375, 0.7563629150390625, 0.79681396484375, 0.8372650146484375, 0.877716064453125, 0.9181671142578125, 0.9586181640625, 0.9990692138671875, 1.039520263671875, 1.0799713134765625, 1.12042236328125, 1.1608734130859375, 1.201324462890625, 1.2417755126953125, 1.2822265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 10.0, 4.0, 7.0, 17.0, 11.0, 12.0, 14.0, 13.0, 24.0, 29.0, 25.0, 26.0, 33.0, 37.0, 43.0, 38.0, 39.0, 48.0, 24.0, 39.0, 44.0, 33.0, 39.0, 36.0, 38.0, 36.0, 23.0, 27.0, 33.0, 24.0, 26.0, 18.0, 20.0, 8.0, 21.0, 12.0, 12.0, 13.0, 11.0, 5.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.250244140625, -0.24298667907714844, -0.23572921752929688, -0.2284717559814453, -0.22121429443359375, -0.2139568328857422, -0.20669937133789062, -0.19944190979003906, -0.1921844482421875, -0.18492698669433594, -0.17766952514648438, -0.1704120635986328, -0.16315460205078125, -0.1558971405029297, -0.14863967895507812, -0.14138221740722656, -0.134124755859375, -0.12686729431152344, -0.11960983276367188, -0.11235237121582031, -0.10509490966796875, -0.09783744812011719, -0.09057998657226562, -0.08332252502441406, -0.0760650634765625, -0.06880760192871094, -0.061550140380859375, -0.05429267883300781, -0.04703521728515625, -0.03977775573730469, -0.032520294189453125, -0.025262832641601562, -0.01800537109375, -0.010747909545898438, -0.003490447998046875, 0.0037670135498046875, 0.01102447509765625, 0.018281936645507812, 0.025539398193359375, 0.03279685974121094, 0.0400543212890625, 0.04731178283691406, 0.054569244384765625, 0.06182670593261719, 0.06908416748046875, 0.07634162902832031, 0.08359909057617188, 0.09085655212402344, 0.098114013671875, 0.10537147521972656, 0.11262893676757812, 0.11988639831542969, 0.12714385986328125, 0.1344013214111328, 0.14165878295898438, 0.14891624450683594, 0.1561737060546875, 0.16343116760253906, 0.17068862915039062, 0.1779460906982422, 0.18520355224609375, 0.1924610137939453, 0.19971847534179688, 0.20697593688964844, 0.2142333984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 6.0, 8.0, 10.0, 19.0, 21.0, 60.0, 75.0, 130.0, 339.0, 924.0, 3095.0, 23499.0, 903449.0, 108373.0, 6174.0, 1341.0, 506.0, 227.0, 111.0, 69.0, 33.0, 26.0, 17.0, 9.0, 10.0, 8.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.724609375, -0.7002182006835938, -0.6758270263671875, -0.6514358520507812, -0.627044677734375, -0.6026535034179688, -0.5782623291015625, -0.5538711547851562, -0.52947998046875, -0.5050888061523438, -0.4806976318359375, -0.45630645751953125, -0.431915283203125, -0.40752410888671875, -0.3831329345703125, -0.35874176025390625, -0.3343505859375, -0.30995941162109375, -0.2855682373046875, -0.26117706298828125, -0.236785888671875, -0.21239471435546875, -0.1880035400390625, -0.16361236572265625, -0.13922119140625, -0.11483001708984375, -0.0904388427734375, -0.06604766845703125, -0.041656494140625, -0.01726531982421875, 0.0071258544921875, 0.03151702880859375, 0.055908203125, 0.08029937744140625, 0.1046905517578125, 0.12908172607421875, 0.153472900390625, 0.17786407470703125, 0.2022552490234375, 0.22664642333984375, 0.25103759765625, 0.27542877197265625, 0.2998199462890625, 0.32421112060546875, 0.348602294921875, 0.37299346923828125, 0.3973846435546875, 0.42177581787109375, 0.4461669921875, 0.47055816650390625, 0.4949493408203125, 0.5193405151367188, 0.543731689453125, 0.5681228637695312, 0.5925140380859375, 0.6169052124023438, 0.64129638671875, 0.6656875610351562, 0.6900787353515625, 0.7144699096679688, 0.738861083984375, 0.7632522583007812, 0.7876434326171875, 0.8120346069335938, 0.83642578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 9.0, 29.0, 26.0, 37.0, 27.0, 52.0, 71.0, 95.0, 95.0, 104.0, 121.0, 75.0, 73.0, 50.0, 30.0, 16.0, 15.0, 23.0, 17.0, 8.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.841278910636902e-05, -2.755969762802124e-05, -2.6706606149673462e-05, -2.5853514671325684e-05, -2.5000423192977905e-05, -2.4147331714630127e-05, -2.329424023628235e-05, -2.244114875793457e-05, -2.1588057279586792e-05, -2.0734965801239014e-05, -1.9881874322891235e-05, -1.9028782844543457e-05, -1.817569136619568e-05, -1.73225998878479e-05, -1.6469508409500122e-05, -1.5616416931152344e-05, -1.4763325452804565e-05, -1.3910233974456787e-05, -1.3057142496109009e-05, -1.220405101776123e-05, -1.1350959539413452e-05, -1.0497868061065674e-05, -9.644776582717896e-06, -8.791685104370117e-06, -7.938593626022339e-06, -7.0855021476745605e-06, -6.232410669326782e-06, -5.379319190979004e-06, -4.526227712631226e-06, -3.6731362342834473e-06, -2.820044755935669e-06, -1.9669532775878906e-06, -1.1138617992401123e-06, -2.60770320892334e-07, 5.923211574554443e-07, 1.4454126358032227e-06, 2.298504114151001e-06, 3.1515955924987793e-06, 4.004687070846558e-06, 4.857778549194336e-06, 5.710870027542114e-06, 6.563961505889893e-06, 7.417052984237671e-06, 8.27014446258545e-06, 9.123235940933228e-06, 9.976327419281006e-06, 1.0829418897628784e-05, 1.1682510375976562e-05, 1.253560185432434e-05, 1.3388693332672119e-05, 1.4241784811019897e-05, 1.5094876289367676e-05, 1.5947967767715454e-05, 1.6801059246063232e-05, 1.765415072441101e-05, 1.850724220275879e-05, 1.9360333681106567e-05, 2.0213425159454346e-05, 2.1066516637802124e-05, 2.1919608116149902e-05, 2.277269959449768e-05, 2.362579107284546e-05, 2.4478882551193237e-05, 2.5331974029541016e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 12.0, 21.0, 15.0, 25.0, 69.0, 121.0, 248.0, 727.0, 2511.0, 14365.0, 390224.0, 616979.0, 18847.0, 2878.0, 854.0, 346.0, 148.0, 76.0, 23.0, 20.0, 14.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61865234375, -0.5980758666992188, -0.5774993896484375, -0.5569229125976562, -0.536346435546875, -0.5157699584960938, -0.4951934814453125, -0.47461700439453125, -0.45404052734375, -0.43346405029296875, -0.4128875732421875, -0.39231109619140625, -0.371734619140625, -0.35115814208984375, -0.3305816650390625, -0.31000518798828125, -0.2894287109375, -0.26885223388671875, -0.2482757568359375, -0.22769927978515625, -0.207122802734375, -0.18654632568359375, -0.1659698486328125, -0.14539337158203125, -0.12481689453125, -0.10424041748046875, -0.0836639404296875, -0.06308746337890625, -0.042510986328125, -0.02193450927734375, -0.0013580322265625, 0.01921844482421875, 0.039794921875, 0.06037139892578125, 0.0809478759765625, 0.10152435302734375, 0.122100830078125, 0.14267730712890625, 0.1632537841796875, 0.18383026123046875, 0.20440673828125, 0.22498321533203125, 0.2455596923828125, 0.26613616943359375, 0.286712646484375, 0.30728912353515625, 0.3278656005859375, 0.34844207763671875, 0.3690185546875, 0.38959503173828125, 0.4101715087890625, 0.43074798583984375, 0.451324462890625, 0.47190093994140625, 0.4924774169921875, 0.5130538940429688, 0.53363037109375, 0.5542068481445312, 0.5747833251953125, 0.5953598022460938, 0.615936279296875, 0.6365127563476562, 0.6570892333984375, 0.6776657104492188, 0.6982421875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 4.0, 4.0, 8.0, 15.0, 15.0, 25.0, 33.0, 50.0, 69.0, 103.0, 105.0, 110.0, 116.0, 100.0, 80.0, 57.0, 40.0, 23.0, 16.0, 14.0, 2.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297607421875, -0.28643035888671875, -0.2752532958984375, -0.26407623291015625, -0.252899169921875, -0.24172210693359375, -0.2305450439453125, -0.21936798095703125, -0.20819091796875, -0.19701385498046875, -0.1858367919921875, -0.17465972900390625, -0.163482666015625, -0.15230560302734375, -0.1411285400390625, -0.12995147705078125, -0.1187744140625, -0.10759735107421875, -0.0964202880859375, -0.08524322509765625, -0.074066162109375, -0.06288909912109375, -0.0517120361328125, -0.04053497314453125, -0.02935791015625, -0.01818084716796875, -0.0070037841796875, 0.00417327880859375, 0.015350341796875, 0.02652740478515625, 0.0377044677734375, 0.04888153076171875, 0.06005859375, 0.07123565673828125, 0.0824127197265625, 0.09358978271484375, 0.104766845703125, 0.11594390869140625, 0.1271209716796875, 0.13829803466796875, 0.14947509765625, 0.16065216064453125, 0.1718292236328125, 0.18300628662109375, 0.194183349609375, 0.20536041259765625, 0.2165374755859375, 0.22771453857421875, 0.2388916015625, 0.25006866455078125, 0.2612457275390625, 0.27242279052734375, 0.283599853515625, 0.29477691650390625, 0.3059539794921875, 0.31713104248046875, 0.32830810546875, 0.33948516845703125, 0.3506622314453125, 0.36183929443359375, 0.373016357421875, 0.38419342041015625, 0.3953704833984375, 0.40654754638671875, 0.417724609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 11.0, 166.0, 702.0, 103.0, 18.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1491875648498535, -4.814847469329834, -4.480506896972656, -4.146166801452637, -3.811826229095459, -3.4774861335754395, -3.143145799636841, -2.808805465698242, -2.4744651317596436, -2.140124797821045, -1.8057844638824463, -1.4714442491531372, -1.1371039152145386, -0.8027635812759399, -0.46842336654663086, -0.13408303260803223, 0.2002573013305664, 0.534597635269165, 0.8689379096031189, 1.2032781839370728, 1.5376185178756714, 1.87195885181427, 2.206299066543579, 2.5406394004821777, 2.8749797344207764, 3.209320068359375, 3.5436604022979736, 3.8780007362365723, 4.212340831756592, 4.5466814041137695, 4.881021499633789, 5.215361595153809, 5.5497026443481445, 5.884042739868164, 6.218383312225342, 6.552723407745361, 6.887063980102539, 7.221404075622559, 7.555744171142578, 7.890084743499756, 8.224425315856934, 8.558765411376953, 8.893105506896973, 9.227446556091309, 9.561786651611328, 9.896126747131348, 10.230466842651367, 10.564807891845703, 10.899147033691406, 11.233487129211426, 11.567827224731445, 11.902168273925781, 12.2365083694458, 12.57084846496582, 12.90518856048584, 13.23952865600586, 13.573869705200195, 13.908209800720215, 14.242549896240234, 14.57689094543457, 14.91123104095459, 15.24557113647461, 15.579911231994629, 15.914251327514648, 16.248592376708984]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 7.0, 5.0, 13.0, 7.0, 15.0, 28.0, 48.0, 55.0, 82.0, 94.0, 105.0, 96.0, 98.0, 95.0, 71.0, 53.0, 30.0, 16.0, 13.0, 8.0, 10.0, 6.0, 8.0, 5.0, 7.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3582828044891357, -3.242628574371338, -3.12697434425354, -3.011320114135742, -2.8956658840179443, -2.7800116539001465, -2.6643576622009277, -2.548703193664551, -2.433049201965332, -2.317394971847534, -2.2017407417297363, -2.0860865116119385, -1.9704322814941406, -1.8547780513763428, -1.7391239404678345, -1.6234697103500366, -1.5078153610229492, -1.3921611309051514, -1.2765069007873535, -1.1608526706695557, -1.0451984405517578, -0.9295442700386047, -0.8138900995254517, -0.6982358694076538, -0.582581639289856, -0.4669274091720581, -0.35127320885658264, -0.23561900854110718, -0.11996477842330933, -0.004310548305511475, 0.1113436222076416, 0.22699785232543945, 0.3426518440246582, 0.45830607414245605, 0.5739603042602539, 0.689614474773407, 0.8052687048912048, 0.9209229350090027, 1.0365771055221558, 1.1522313356399536, 1.2678855657577515, 1.3835397958755493, 1.4991940259933472, 1.6148481369018555, 1.7305023670196533, 1.8461565971374512, 1.961810827255249, 2.077465057373047, 2.1931192874908447, 2.3087735176086426, 2.4244277477264404, 2.5400819778442383, 2.655736207962036, 2.771390438079834, 2.8870444297790527, 3.0026988983154297, 3.1183528900146484, 3.2340071201324463, 3.349661350250244, 3.465315580368042, 3.58096981048584, 3.6966240406036377, 3.8122782707214355, 3.9279322624206543, 4.043586730957031]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 12.0, 18.0, 29.0, 45.0, 60.0, 73.0, 129.0, 213.0, 298.0, 495.0, 794.0, 1473.0, 3052.0, 8055.0, 32916.0, 3292254.0, 814029.0, 26242.0, 7221.0, 2965.0, 1468.0, 822.0, 495.0, 339.0, 221.0, 160.0, 100.0, 85.0, 53.0, 50.0, 28.0, 23.0, 15.0, 12.0, 10.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.3629302978515625, -1.321563720703125, -1.2801971435546875, -1.23883056640625, -1.1974639892578125, -1.156097412109375, -1.1147308349609375, -1.0733642578125, -1.0319976806640625, -0.990631103515625, -0.9492645263671875, -0.90789794921875, -0.8665313720703125, -0.825164794921875, -0.7837982177734375, -0.742431640625, -0.7010650634765625, -0.659698486328125, -0.6183319091796875, -0.57696533203125, -0.5355987548828125, -0.494232177734375, -0.4528656005859375, -0.4114990234375, -0.3701324462890625, -0.328765869140625, -0.2873992919921875, -0.24603271484375, -0.2046661376953125, -0.163299560546875, -0.1219329833984375, -0.08056640625, -0.0391998291015625, 0.002166748046875, 0.0435333251953125, 0.08489990234375, 0.1262664794921875, 0.167633056640625, 0.2089996337890625, 0.2503662109375, 0.2917327880859375, 0.333099365234375, 0.3744659423828125, 0.41583251953125, 0.4571990966796875, 0.498565673828125, 0.5399322509765625, 0.581298828125, 0.6226654052734375, 0.664031982421875, 0.7053985595703125, 0.74676513671875, 0.7881317138671875, 0.829498291015625, 0.8708648681640625, 0.9122314453125, 0.9535980224609375, 0.994964599609375, 1.0363311767578125, 1.07769775390625, 1.1190643310546875, 1.160430908203125, 1.2017974853515625, 1.2431640625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 2.0, 8.0, 2.0, 1.0, 4.0, 8.0, 9.0, 11.0, 11.0, 16.0, 21.0, 39.0, 64.0, 83.0, 121.0, 135.0, 127.0, 114.0, 77.0, 39.0, 21.0, 18.0, 17.0, 8.0, 11.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0545654296875, -0.05260181427001953, -0.05063819885253906, -0.048674583435058594, -0.046710968017578125, -0.044747352600097656, -0.04278373718261719, -0.04082012176513672, -0.03885650634765625, -0.03689289093017578, -0.03492927551269531, -0.032965660095214844, -0.031002044677734375, -0.029038429260253906, -0.027074813842773438, -0.02511119842529297, -0.0231475830078125, -0.02118396759033203, -0.019220352172851562, -0.017256736755371094, -0.015293121337890625, -0.013329505920410156, -0.011365890502929688, -0.009402275085449219, -0.00743865966796875, -0.005475044250488281, -0.0035114288330078125, -0.0015478134155273438, 0.000415802001953125, 0.0023794174194335938, 0.0043430328369140625, 0.006306648254394531, 0.008270263671875, 0.010233879089355469, 0.012197494506835938, 0.014161109924316406, 0.016124725341796875, 0.018088340759277344, 0.020051956176757812, 0.02201557159423828, 0.02397918701171875, 0.02594280242919922, 0.027906417846679688, 0.029870033264160156, 0.031833648681640625, 0.033797264099121094, 0.03576087951660156, 0.03772449493408203, 0.0396881103515625, 0.04165172576904297, 0.04361534118652344, 0.045578956604003906, 0.047542572021484375, 0.049506187438964844, 0.05146980285644531, 0.05343341827392578, 0.05539703369140625, 0.05736064910888672, 0.05932426452636719, 0.061287879943847656, 0.06325149536132812, 0.0652151107788086, 0.06717872619628906, 0.06914234161376953, 0.07110595703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 3.0, 6.0, 11.0, 13.0, 21.0, 22.0, 50.0, 103.0, 205.0, 775.0, 5639.0, 701459.0, 3476860.0, 7752.0, 883.0, 244.0, 91.0, 43.0, 28.0, 18.0, 14.0, 6.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.259765625, -2.18701171875, -2.1142578125, -2.04150390625, -1.96875, -1.89599609375, -1.8232421875, -1.75048828125, -1.677734375, -1.60498046875, -1.5322265625, -1.45947265625, -1.38671875, -1.31396484375, -1.2412109375, -1.16845703125, -1.095703125, -1.02294921875, -0.9501953125, -0.87744140625, -0.8046875, -0.73193359375, -0.6591796875, -0.58642578125, -0.513671875, -0.44091796875, -0.3681640625, -0.29541015625, -0.22265625, -0.14990234375, -0.0771484375, -0.00439453125, 0.068359375, 0.14111328125, 0.2138671875, 0.28662109375, 0.359375, 0.43212890625, 0.5048828125, 0.57763671875, 0.650390625, 0.72314453125, 0.7958984375, 0.86865234375, 0.94140625, 1.01416015625, 1.0869140625, 1.15966796875, 1.232421875, 1.30517578125, 1.3779296875, 1.45068359375, 1.5234375, 1.59619140625, 1.6689453125, 1.74169921875, 1.814453125, 1.88720703125, 1.9599609375, 2.03271484375, 2.10546875, 2.17822265625, 2.2509765625, 2.32373046875, 2.396484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 16.0, 22.0, 33.0, 43.0, 78.0, 179.0, 425.0, 1516.0, 982.0, 326.0, 146.0, 83.0, 54.0, 35.0, 22.0, 22.0, 13.0, 13.0, 3.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.175048828125, -0.1703014373779297, -0.16555404663085938, -0.16080665588378906, -0.15605926513671875, -0.15131187438964844, -0.14656448364257812, -0.1418170928955078, -0.1370697021484375, -0.1323223114013672, -0.12757492065429688, -0.12282752990722656, -0.11808013916015625, -0.11333274841308594, -0.10858535766601562, -0.10383796691894531, -0.099090576171875, -0.09434318542480469, -0.08959579467773438, -0.08484840393066406, -0.08010101318359375, -0.07535362243652344, -0.07060623168945312, -0.06585884094238281, -0.0611114501953125, -0.05636405944824219, -0.051616668701171875, -0.04686927795410156, -0.04212188720703125, -0.03737449645996094, -0.032627105712890625, -0.027879714965820312, -0.02313232421875, -0.018384933471679688, -0.013637542724609375, -0.008890151977539062, -0.00414276123046875, 0.0006046295166015625, 0.005352020263671875, 0.010099411010742188, 0.0148468017578125, 0.019594192504882812, 0.024341583251953125, 0.029088973999023438, 0.03383636474609375, 0.03858375549316406, 0.043331146240234375, 0.04807853698730469, 0.052825927734375, 0.05757331848144531, 0.062320709228515625, 0.06706809997558594, 0.07181549072265625, 0.07656288146972656, 0.08131027221679688, 0.08605766296386719, 0.0908050537109375, 0.09555244445800781, 0.10029983520507812, 0.10504722595214844, 0.10979461669921875, 0.11454200744628906, 0.11928939819335938, 0.12403678894042969, 0.1287841796875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 10.0, 86.0, 853.0, 55.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.395724296569824, -6.24866247177124, -6.101600646972656, -5.9545392990112305, -5.8074774742126465, -5.6604156494140625, -5.5133538246154785, -5.3662919998168945, -5.219230651855469, -5.072168827056885, -4.925107002258301, -4.778045654296875, -4.630983829498291, -4.483922004699707, -4.336860179901123, -4.189798355102539, -4.042736530303955, -3.895674705505371, -3.748613119125366, -3.6015512943267822, -3.4544897079467773, -3.3074278831481934, -3.1603660583496094, -3.0133042335510254, -2.8662426471710205, -2.7191808223724365, -2.5721192359924316, -2.4250574111938477, -2.2779955863952637, -2.130934000015259, -1.9838721752166748, -1.8368104696273804, -1.689748764038086, -1.5426870584487915, -1.395625352859497, -1.248563528060913, -1.1015018224716187, -0.9544401168823242, -0.807378351688385, -0.6603165864944458, -0.5132548809051514, -0.36619314551353455, -0.21913141012191772, -0.0720696747303009, 0.07499206066131592, 0.22205376625061035, 0.36911553144454956, 0.5161772966384888, 0.6632390022277832, 0.8103007078170776, 0.9573624730110168, 1.104424238204956, 1.2514859437942505, 1.398547649383545, 1.545609474182129, 1.6926711797714233, 1.8397328853607178, 1.9867945909500122, 2.1338562965393066, 2.2809181213378906, 2.4279799461364746, 2.5750415325164795, 2.7221033573150635, 2.8691649436950684, 3.0162267684936523]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 13.0, 11.0, 18.0, 33.0, 36.0, 46.0, 65.0, 76.0, 93.0, 85.0, 88.0, 92.0, 83.0, 54.0, 56.0, 37.0, 25.0, 22.0, 11.0, 11.0, 12.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7862330079078674, -0.7607574462890625, -0.7352818250656128, -0.7098062634468079, -0.6843306422233582, -0.6588550806045532, -0.6333794593811035, -0.6079038977622986, -0.5824282765388489, -0.556952714920044, -0.5314770936965942, -0.5060015320777893, -0.4805259108543396, -0.45505034923553467, -0.42957472801208496, -0.40409916639328003, -0.3786235749721527, -0.3531479835510254, -0.32767239212989807, -0.30219680070877075, -0.27672120928764343, -0.2512456178665161, -0.22577004134655, -0.20029444992542267, -0.17481885850429535, -0.14934326708316803, -0.12386767566204071, -0.09839209169149399, -0.07291650027036667, -0.047440916299819946, -0.021965324878692627, 0.0035102665424346924, 0.02898585796356201, 0.05446144938468933, 0.07993704080581665, 0.10541262477636337, 0.1308882236480713, 0.15636380016803741, 0.18183939158916473, 0.20731498301029205, 0.23279057443141937, 0.2582661509513855, 0.2837417423725128, 0.30921733379364014, 0.33469292521476746, 0.3601685166358948, 0.3856441080570221, 0.4111196994781494, 0.43659529089927673, 0.46207088232040405, 0.48754647374153137, 0.5130220651626587, 0.5384976267814636, 0.5639732480049133, 0.5894488096237183, 0.614924430847168, 0.6403999924659729, 0.6658755540847778, 0.6913511753082275, 0.7168267369270325, 0.7423023581504822, 0.7677779197692871, 0.7932535409927368, 0.8187291026115417, 0.8442047238349915]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 12.0, 17.0, 21.0, 32.0, 39.0, 67.0, 73.0, 119.0, 180.0, 289.0, 529.0, 927.0, 1830.0, 3989.0, 10391.0, 36449.0, 224143.0, 638274.0, 97295.0, 20806.0, 7007.0, 2787.0, 1401.0, 678.0, 424.0, 264.0, 155.0, 84.0, 74.0, 56.0, 31.0, 25.0, 17.0, 19.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.399169921875, -0.386810302734375, -0.37445068359375, -0.362091064453125, -0.3497314453125, -0.337371826171875, -0.32501220703125, -0.312652587890625, -0.30029296875, -0.287933349609375, -0.27557373046875, -0.263214111328125, -0.2508544921875, -0.238494873046875, -0.22613525390625, -0.213775634765625, -0.201416015625, -0.189056396484375, -0.17669677734375, -0.164337158203125, -0.1519775390625, -0.139617919921875, -0.12725830078125, -0.114898681640625, -0.1025390625, -0.090179443359375, -0.07781982421875, -0.065460205078125, -0.0531005859375, -0.040740966796875, -0.02838134765625, -0.016021728515625, -0.003662109375, 0.008697509765625, 0.02105712890625, 0.033416748046875, 0.0457763671875, 0.058135986328125, 0.07049560546875, 0.082855224609375, 0.09521484375, 0.107574462890625, 0.11993408203125, 0.132293701171875, 0.1446533203125, 0.157012939453125, 0.16937255859375, 0.181732177734375, 0.194091796875, 0.206451416015625, 0.21881103515625, 0.231170654296875, 0.2435302734375, 0.255889892578125, 0.26824951171875, 0.280609130859375, 0.29296875, 0.305328369140625, 0.31768798828125, 0.330047607421875, 0.3424072265625, 0.354766845703125, 0.36712646484375, 0.379486083984375, 0.391845703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 10.0, 12.0, 14.0, 15.0, 20.0, 29.0, 32.0, 63.0, 77.0, 107.0, 123.0, 95.0, 103.0, 89.0, 57.0, 48.0, 24.0, 21.0, 14.0, 10.0, 8.0, 3.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047607421875, -0.04596376419067383, -0.044320106506347656, -0.042676448822021484, -0.04103279113769531, -0.03938913345336914, -0.03774547576904297, -0.0361018180847168, -0.034458160400390625, -0.03281450271606445, -0.03117084503173828, -0.02952718734741211, -0.027883529663085938, -0.026239871978759766, -0.024596214294433594, -0.022952556610107422, -0.02130889892578125, -0.019665241241455078, -0.018021583557128906, -0.016377925872802734, -0.014734268188476562, -0.01309061050415039, -0.011446952819824219, -0.009803295135498047, -0.008159637451171875, -0.006515979766845703, -0.004872322082519531, -0.0032286643981933594, -0.0015850067138671875, 5.8650970458984375e-05, 0.0017023086547851562, 0.003345966339111328, 0.0049896240234375, 0.006633281707763672, 0.008276939392089844, 0.009920597076416016, 0.011564254760742188, 0.01320791244506836, 0.014851570129394531, 0.016495227813720703, 0.018138885498046875, 0.019782543182373047, 0.02142620086669922, 0.02306985855102539, 0.024713516235351562, 0.026357173919677734, 0.028000831604003906, 0.029644489288330078, 0.03128814697265625, 0.03293180465698242, 0.034575462341308594, 0.036219120025634766, 0.03786277770996094, 0.03950643539428711, 0.04115009307861328, 0.04279375076293945, 0.044437408447265625, 0.0460810661315918, 0.04772472381591797, 0.04936838150024414, 0.05101203918457031, 0.052655696868896484, 0.054299354553222656, 0.05594301223754883, 0.057586669921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 12.0, 7.0, 15.0, 13.0, 23.0, 26.0, 40.0, 56.0, 86.0, 114.0, 167.0, 222.0, 348.0, 544.0, 1107.0, 2686.0, 9351.0, 45346.0, 305762.0, 559168.0, 97435.0, 17761.0, 4516.0, 1620.0, 765.0, 440.0, 239.0, 176.0, 140.0, 101.0, 74.0, 47.0, 34.0, 26.0, 23.0, 13.0, 8.0, 10.0, 6.0, 8.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.36181640625, -0.350921630859375, -0.34002685546875, -0.329132080078125, -0.3182373046875, -0.307342529296875, -0.29644775390625, -0.285552978515625, -0.274658203125, -0.263763427734375, -0.25286865234375, -0.241973876953125, -0.2310791015625, -0.220184326171875, -0.20928955078125, -0.198394775390625, -0.1875, -0.176605224609375, -0.16571044921875, -0.154815673828125, -0.1439208984375, -0.133026123046875, -0.12213134765625, -0.111236572265625, -0.100341796875, -0.089447021484375, -0.07855224609375, -0.067657470703125, -0.0567626953125, -0.045867919921875, -0.03497314453125, -0.024078369140625, -0.01318359375, -0.002288818359375, 0.00860595703125, 0.019500732421875, 0.0303955078125, 0.041290283203125, 0.05218505859375, 0.063079833984375, 0.073974609375, 0.084869384765625, 0.09576416015625, 0.106658935546875, 0.1175537109375, 0.128448486328125, 0.13934326171875, 0.150238037109375, 0.1611328125, 0.172027587890625, 0.18292236328125, 0.193817138671875, 0.2047119140625, 0.215606689453125, 0.22650146484375, 0.237396240234375, 0.248291015625, 0.259185791015625, 0.27008056640625, 0.280975341796875, 0.2918701171875, 0.302764892578125, 0.31365966796875, 0.324554443359375, 0.33544921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 8.0, 13.0, 9.0, 16.0, 23.0, 16.0, 34.0, 27.0, 18.0, 22.0, 38.0, 34.0, 28.0, 43.0, 37.0, 53.0, 43.0, 44.0, 55.0, 43.0, 39.0, 40.0, 32.0, 41.0, 33.0, 23.0, 28.0, 22.0, 24.0, 16.0, 11.0, 11.0, 12.0, 15.0, 7.0, 5.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16162109375, -0.15612411499023438, -0.15062713623046875, -0.14513015747070312, -0.1396331787109375, -0.13413619995117188, -0.12863922119140625, -0.12314224243164062, -0.117645263671875, -0.11214828491210938, -0.10665130615234375, -0.10115432739257812, -0.0956573486328125, -0.09016036987304688, -0.08466339111328125, -0.07916641235351562, -0.07366943359375, -0.06817245483398438, -0.06267547607421875, -0.057178497314453125, -0.0516815185546875, -0.046184539794921875, -0.04068756103515625, -0.035190582275390625, -0.029693603515625, -0.024196624755859375, -0.01869964599609375, -0.013202667236328125, -0.0077056884765625, -0.002208709716796875, 0.00328826904296875, 0.008785247802734375, 0.0142822265625, 0.019779205322265625, 0.02527618408203125, 0.030773162841796875, 0.0362701416015625, 0.041767120361328125, 0.04726409912109375, 0.052761077880859375, 0.058258056640625, 0.06375503540039062, 0.06925201416015625, 0.07474899291992188, 0.0802459716796875, 0.08574295043945312, 0.09123992919921875, 0.09673690795898438, 0.10223388671875, 0.10773086547851562, 0.11322784423828125, 0.11872482299804688, 0.1242218017578125, 0.12971878051757812, 0.13521575927734375, 0.14071273803710938, 0.146209716796875, 0.15170669555664062, 0.15720367431640625, 0.16270065307617188, 0.1681976318359375, 0.17369461059570312, 0.17919158935546875, 0.18468856811523438, 0.190185546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 9.0, 14.0, 14.0, 36.0, 50.0, 111.0, 208.0, 456.0, 1224.0, 5185.0, 58058.0, 840706.0, 131364.0, 8376.0, 1587.0, 566.0, 261.0, 134.0, 51.0, 38.0, 38.0, 16.0, 5.0, 10.0, 11.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.466796875, -0.45331573486328125, -0.4398345947265625, -0.42635345458984375, -0.412872314453125, -0.39939117431640625, -0.3859100341796875, -0.37242889404296875, -0.35894775390625, -0.34546661376953125, -0.3319854736328125, -0.31850433349609375, -0.305023193359375, -0.29154205322265625, -0.2780609130859375, -0.26457977294921875, -0.2510986328125, -0.23761749267578125, -0.2241363525390625, -0.21065521240234375, -0.197174072265625, -0.18369293212890625, -0.1702117919921875, -0.15673065185546875, -0.14324951171875, -0.12976837158203125, -0.1162872314453125, -0.10280609130859375, -0.089324951171875, -0.07584381103515625, -0.0623626708984375, -0.04888153076171875, -0.035400390625, -0.02191925048828125, -0.0084381103515625, 0.00504302978515625, 0.018524169921875, 0.03200531005859375, 0.0454864501953125, 0.05896759033203125, 0.07244873046875, 0.08592987060546875, 0.0994110107421875, 0.11289215087890625, 0.126373291015625, 0.13985443115234375, 0.1533355712890625, 0.16681671142578125, 0.1802978515625, 0.19377899169921875, 0.2072601318359375, 0.22074127197265625, 0.234222412109375, 0.24770355224609375, 0.2611846923828125, 0.27466583251953125, 0.28814697265625, 0.30162811279296875, 0.3151092529296875, 0.32859039306640625, 0.342071533203125, 0.35555267333984375, 0.3690338134765625, 0.38251495361328125, 0.39599609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 7.0, 6.0, 11.0, 19.0, 14.0, 26.0, 44.0, 55.0, 102.0, 112.0, 145.0, 104.0, 96.0, 59.0, 55.0, 34.0, 21.0, 18.0, 22.0, 8.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5643577575683594e-05, -3.466382622718811e-05, -3.368407487869263e-05, -3.2704323530197144e-05, -3.172457218170166e-05, -3.074482083320618e-05, -2.9765069484710693e-05, -2.878531813621521e-05, -2.7805566787719727e-05, -2.6825815439224243e-05, -2.584606409072876e-05, -2.4866312742233276e-05, -2.3886561393737793e-05, -2.290681004524231e-05, -2.1927058696746826e-05, -2.0947307348251343e-05, -1.996755599975586e-05, -1.8987804651260376e-05, -1.8008053302764893e-05, -1.702830195426941e-05, -1.6048550605773926e-05, -1.5068799257278442e-05, -1.4089047908782959e-05, -1.3109296560287476e-05, -1.2129545211791992e-05, -1.1149793863296509e-05, -1.0170042514801025e-05, -9.190291166305542e-06, -8.210539817810059e-06, -7.230788469314575e-06, -6.251037120819092e-06, -5.271285772323608e-06, -4.291534423828125e-06, -3.3117830753326416e-06, -2.332031726837158e-06, -1.3522803783416748e-06, -3.725290298461914e-07, 6.07222318649292e-07, 1.5869736671447754e-06, 2.566725015640259e-06, 3.546476364135742e-06, 4.526227712631226e-06, 5.505979061126709e-06, 6.485730409622192e-06, 7.465481758117676e-06, 8.44523310661316e-06, 9.424984455108643e-06, 1.0404735803604126e-05, 1.138448715209961e-05, 1.2364238500595093e-05, 1.3343989849090576e-05, 1.432374119758606e-05, 1.5303492546081543e-05, 1.6283243894577026e-05, 1.726299524307251e-05, 1.8242746591567993e-05, 1.9222497940063477e-05, 2.020224928855896e-05, 2.1182000637054443e-05, 2.2161751985549927e-05, 2.314150333404541e-05, 2.4121254682540894e-05, 2.5101006031036377e-05, 2.608075737953186e-05, 2.7060508728027344e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 8.0, 5.0, 7.0, 11.0, 12.0, 17.0, 36.0, 42.0, 55.0, 70.0, 110.0, 179.0, 270.0, 493.0, 911.0, 2164.0, 6473.0, 26121.0, 153487.0, 674748.0, 147433.0, 25094.0, 6375.0, 2190.0, 913.0, 501.0, 284.0, 155.0, 128.0, 64.0, 60.0, 43.0, 28.0, 17.0, 12.0, 6.0, 9.0, 8.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.26953125, -0.2603912353515625, -0.251251220703125, -0.2421112060546875, -0.23297119140625, -0.2238311767578125, -0.214691162109375, -0.2055511474609375, -0.1964111328125, -0.1872711181640625, -0.178131103515625, -0.1689910888671875, -0.15985107421875, -0.1507110595703125, -0.141571044921875, -0.1324310302734375, -0.123291015625, -0.1141510009765625, -0.105010986328125, -0.0958709716796875, -0.08673095703125, -0.0775909423828125, -0.068450927734375, -0.0593109130859375, -0.0501708984375, -0.0410308837890625, -0.031890869140625, -0.0227508544921875, -0.01361083984375, -0.0044708251953125, 0.004669189453125, 0.0138092041015625, 0.02294921875, 0.0320892333984375, 0.041229248046875, 0.0503692626953125, 0.05950927734375, 0.0686492919921875, 0.077789306640625, 0.0869293212890625, 0.0960693359375, 0.1052093505859375, 0.114349365234375, 0.1234893798828125, 0.13262939453125, 0.1417694091796875, 0.150909423828125, 0.1600494384765625, 0.169189453125, 0.1783294677734375, 0.187469482421875, 0.1966094970703125, 0.20574951171875, 0.2148895263671875, 0.224029541015625, 0.2331695556640625, 0.2423095703125, 0.2514495849609375, 0.260589599609375, 0.2697296142578125, 0.27886962890625, 0.2880096435546875, 0.297149658203125, 0.3062896728515625, 0.3154296875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 6.0, 12.0, 11.0, 11.0, 9.0, 22.0, 34.0, 49.0, 66.0, 69.0, 107.0, 119.0, 97.0, 104.0, 72.0, 60.0, 38.0, 30.0, 30.0, 8.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1617431640625, -0.15545654296875, -0.149169921875, -0.14288330078125, -0.1365966796875, -0.13031005859375, -0.1240234375, -0.11773681640625, -0.1114501953125, -0.10516357421875, -0.098876953125, -0.09259033203125, -0.0863037109375, -0.08001708984375, -0.07373046875, -0.06744384765625, -0.0611572265625, -0.05487060546875, -0.048583984375, -0.04229736328125, -0.0360107421875, -0.02972412109375, -0.0234375, -0.01715087890625, -0.0108642578125, -0.00457763671875, 0.001708984375, 0.00799560546875, 0.0142822265625, 0.02056884765625, 0.02685546875, 0.03314208984375, 0.0394287109375, 0.04571533203125, 0.052001953125, 0.05828857421875, 0.0645751953125, 0.07086181640625, 0.0771484375, 0.08343505859375, 0.0897216796875, 0.09600830078125, 0.102294921875, 0.10858154296875, 0.1148681640625, 0.12115478515625, 0.12744140625, 0.13372802734375, 0.1400146484375, 0.14630126953125, 0.152587890625, 0.15887451171875, 0.1651611328125, 0.17144775390625, 0.177734375, 0.18402099609375, 0.1903076171875, 0.19659423828125, 0.202880859375, 0.20916748046875, 0.2154541015625, 0.22174072265625, 0.22802734375, 0.23431396484375, 0.2406005859375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 9.0, 24.0, 159.0, 628.0, 167.0, 12.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.105749130249023, -8.886743545532227, -8.66773796081543, -8.448732376098633, -8.229726791381836, -8.010721206665039, -7.791715621948242, -7.572710037231445, -7.353704452514648, -7.134698867797852, -6.915693283081055, -6.696687698364258, -6.477682113647461, -6.258676528930664, -6.039670944213867, -5.82066535949707, -5.601659774780273, -5.382654190063477, -5.16364860534668, -4.944643020629883, -4.725637435913086, -4.506631851196289, -4.287626266479492, -4.068620681762695, -3.8496146202087402, -3.6306090354919434, -3.4116034507751465, -3.1925978660583496, -2.9735922813415527, -2.754586696624756, -2.535581111907959, -2.316575527191162, -2.0975699424743652, -1.8785643577575684, -1.6595587730407715, -1.4405531883239746, -1.2215476036071777, -1.0025418996810913, -0.7835363149642944, -0.5645307302474976, -0.3455251455307007, -0.12651954591274261, 0.09248605370521545, 0.3114916682243347, 0.5304972529411316, 0.7495028972625732, 0.9685084819793701, 1.187514066696167, 1.4065196514129639, 1.6255252361297607, 1.8445308208465576, 2.0635364055633545, 2.2825419902801514, 2.5015478134155273, 2.720553398132324, 2.939558982849121, 3.158564567565918, 3.377570152282715, 3.5965757369995117, 3.8155813217163086, 4.0345869064331055, 4.253592491149902, 4.472598075866699, 4.691603660583496, 4.910609245300293]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 4.0, 8.0, 14.0, 14.0, 23.0, 31.0, 42.0, 50.0, 39.0, 57.0, 59.0, 81.0, 86.0, 75.0, 69.0, 76.0, 46.0, 54.0, 46.0, 25.0, 31.0, 18.0, 18.0, 9.0, 7.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9901975393295288, -1.9276379346847534, -1.8650784492492676, -1.8025188446044922, -1.7399592399597168, -1.6773996353149414, -1.6148401498794556, -1.5522805452346802, -1.4897210597991943, -1.427161455154419, -1.364601969718933, -1.3020423650741577, -1.2394827604293823, -1.1769232749938965, -1.114363670349121, -1.0518040657043457, -0.9892444610595703, -0.9266849160194397, -0.8641253113746643, -0.8015657663345337, -0.7390061616897583, -0.6764466166496277, -0.6138870716094971, -0.5513274669647217, -0.48876792192459106, -0.42620834708213806, -0.36364877223968506, -0.30108922719955444, -0.23852965235710144, -0.17597007751464844, -0.11341053247451782, -0.05085095763206482, 0.011708736419677734, 0.07426830381155014, 0.13682787120342255, 0.19938743114471436, 0.26194700598716736, 0.32450658082962036, 0.387066125869751, 0.449625700712204, 0.512185275554657, 0.5747448205947876, 0.637304425239563, 0.6998639702796936, 0.7624235153198242, 0.8249831199645996, 0.8875426650047302, 0.9501022100448608, 1.0126618146896362, 1.0752214193344116, 1.1377809047698975, 1.2003405094146729, 1.2629001140594482, 1.3254597187042236, 1.3880192041397095, 1.4505788087844849, 1.5131382942199707, 1.575697898864746, 1.638257384300232, 1.7008169889450073, 1.7633765935897827, 1.8259360790252686, 1.888495683670044, 1.9510552883148193, 2.0136148929595947]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 9.0, 12.0, 19.0, 27.0, 64.0, 76.0, 175.0, 639.0, 5105.0, 3930610.0, 253829.0, 2904.0, 456.0, 174.0, 83.0, 33.0, 23.0, 13.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.775390625, -2.69805908203125, -2.6207275390625, -2.54339599609375, -2.466064453125, -2.38873291015625, -2.3114013671875, -2.23406982421875, -2.15673828125, -2.07940673828125, -2.0020751953125, -1.92474365234375, -1.847412109375, -1.77008056640625, -1.6927490234375, -1.61541748046875, -1.5380859375, -1.46075439453125, -1.3834228515625, -1.30609130859375, -1.228759765625, -1.15142822265625, -1.0740966796875, -0.99676513671875, -0.91943359375, -0.84210205078125, -0.7647705078125, -0.68743896484375, -0.610107421875, -0.53277587890625, -0.4554443359375, -0.37811279296875, -0.30078125, -0.22344970703125, -0.1461181640625, -0.06878662109375, 0.008544921875, 0.08587646484375, 0.1632080078125, 0.24053955078125, 0.31787109375, 0.39520263671875, 0.4725341796875, 0.54986572265625, 0.627197265625, 0.70452880859375, 0.7818603515625, 0.85919189453125, 0.9365234375, 1.01385498046875, 1.0911865234375, 1.16851806640625, 1.245849609375, 1.32318115234375, 1.4005126953125, 1.47784423828125, 1.55517578125, 1.63250732421875, 1.7098388671875, 1.78717041015625, 1.864501953125, 1.94183349609375, 2.0191650390625, 2.09649658203125, 2.173828125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 13.0, 12.0, 15.0, 24.0, 45.0, 46.0, 90.0, 98.0, 119.0, 120.0, 100.0, 78.0, 66.0, 57.0, 44.0, 18.0, 16.0, 6.0, 6.0, 6.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0758056640625, -0.07365751266479492, -0.07150936126708984, -0.06936120986938477, -0.06721305847167969, -0.06506490707397461, -0.06291675567626953, -0.06076860427856445, -0.058620452880859375, -0.0564723014831543, -0.05432415008544922, -0.05217599868774414, -0.05002784729003906, -0.047879695892333984, -0.045731544494628906, -0.04358339309692383, -0.04143524169921875, -0.03928709030151367, -0.037138938903808594, -0.034990787506103516, -0.03284263610839844, -0.03069448471069336, -0.02854633331298828, -0.026398181915283203, -0.024250030517578125, -0.022101879119873047, -0.01995372772216797, -0.01780557632446289, -0.015657424926757812, -0.013509273529052734, -0.011361122131347656, -0.009212970733642578, -0.0070648193359375, -0.004916667938232422, -0.0027685165405273438, -0.0006203651428222656, 0.0015277862548828125, 0.0036759376525878906, 0.005824089050292969, 0.007972240447998047, 0.010120391845703125, 0.012268543243408203, 0.014416694641113281, 0.01656484603881836, 0.018712997436523438, 0.020861148834228516, 0.023009300231933594, 0.025157451629638672, 0.02730560302734375, 0.029453754425048828, 0.031601905822753906, 0.033750057220458984, 0.03589820861816406, 0.03804636001586914, 0.04019451141357422, 0.0423426628112793, 0.044490814208984375, 0.04663896560668945, 0.04878711700439453, 0.05093526840209961, 0.05308341979980469, 0.055231571197509766, 0.057379722595214844, 0.05952787399291992, 0.061676025390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 10.0, 19.0, 20.0, 37.0, 73.0, 112.0, 180.0, 495.0, 2692.0, 73641.0, 4080653.0, 34177.0, 1542.0, 339.0, 114.0, 78.0, 47.0, 25.0, 13.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.29058837890625, -1.2481689453125, -1.20574951171875, -1.163330078125, -1.12091064453125, -1.0784912109375, -1.03607177734375, -0.99365234375, -0.95123291015625, -0.9088134765625, -0.86639404296875, -0.823974609375, -0.78155517578125, -0.7391357421875, -0.69671630859375, -0.654296875, -0.61187744140625, -0.5694580078125, -0.52703857421875, -0.484619140625, -0.44219970703125, -0.3997802734375, -0.35736083984375, -0.31494140625, -0.27252197265625, -0.2301025390625, -0.18768310546875, -0.145263671875, -0.10284423828125, -0.0604248046875, -0.01800537109375, 0.0244140625, 0.06683349609375, 0.1092529296875, 0.15167236328125, 0.194091796875, 0.23651123046875, 0.2789306640625, 0.32135009765625, 0.36376953125, 0.40618896484375, 0.4486083984375, 0.49102783203125, 0.533447265625, 0.57586669921875, 0.6182861328125, 0.66070556640625, 0.703125, 0.74554443359375, 0.7879638671875, 0.83038330078125, 0.872802734375, 0.91522216796875, 0.9576416015625, 1.00006103515625, 1.04248046875, 1.08489990234375, 1.1273193359375, 1.16973876953125, 1.212158203125, 1.25457763671875, 1.2969970703125, 1.33941650390625, 1.3818359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 10.0, 21.0, 31.0, 51.0, 83.0, 245.0, 807.0, 2020.0, 501.0, 176.0, 61.0, 30.0, 23.0, 5.0, 5.0, 4.0, 1.0, 2.0], "bins": [-0.326171875, -0.3200550079345703, -0.3139381408691406, -0.30782127380371094, -0.30170440673828125, -0.29558753967285156, -0.2894706726074219, -0.2833538055419922, -0.2772369384765625, -0.2711200714111328, -0.2650032043457031, -0.25888633728027344, -0.25276947021484375, -0.24665260314941406, -0.24053573608398438, -0.2344188690185547, -0.228302001953125, -0.2221851348876953, -0.21606826782226562, -0.20995140075683594, -0.20383453369140625, -0.19771766662597656, -0.19160079956054688, -0.1854839324951172, -0.1793670654296875, -0.1732501983642578, -0.16713333129882812, -0.16101646423339844, -0.15489959716796875, -0.14878273010253906, -0.14266586303710938, -0.1365489959716797, -0.13043212890625, -0.12431526184082031, -0.11819839477539062, -0.11208152770996094, -0.10596466064453125, -0.09984779357910156, -0.09373092651367188, -0.08761405944824219, -0.0814971923828125, -0.07538032531738281, -0.06926345825195312, -0.06314659118652344, -0.05702972412109375, -0.05091285705566406, -0.044795989990234375, -0.03867912292480469, -0.032562255859375, -0.026445388793945312, -0.020328521728515625, -0.014211654663085938, -0.00809478759765625, -0.0019779205322265625, 0.004138946533203125, 0.010255813598632812, 0.0163726806640625, 0.022489547729492188, 0.028606414794921875, 0.03472328186035156, 0.04084014892578125, 0.04695701599121094, 0.053073883056640625, 0.05919075012207031, 0.0653076171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 15.0, 65.0, 310.0, 414.0, 162.0, 31.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.764394760131836, -2.7144267559051514, -2.6644585132598877, -2.614490509033203, -2.5645225048065186, -2.514554262161255, -2.4645862579345703, -2.4146182537078857, -2.364650011062622, -2.3146820068359375, -2.264713764190674, -2.2147457599639893, -2.1647777557373047, -2.114809513092041, -2.0648415088653564, -2.014873504638672, -1.9649055004119873, -1.9149373769760132, -1.8649693727493286, -1.8150012493133545, -1.7650331258773804, -1.7150651216506958, -1.6650969982147217, -1.615128993988037, -1.5651607513427734, -1.5151926279067993, -1.4652246236801147, -1.4152565002441406, -1.3652883768081665, -1.315320372581482, -1.2653522491455078, -1.2153842449188232, -1.1654160022735596, -1.1154478788375854, -1.0654798746109009, -1.0155117511749268, -0.9655436873435974, -0.9155756235122681, -0.865607500076294, -0.8156394362449646, -0.7656713724136353, -0.7157033085823059, -0.6657351851463318, -0.6157671213150024, -0.5657990574836731, -0.5158309936523438, -0.46586287021636963, -0.4158948063850403, -0.36592674255371094, -0.3159586489200592, -0.26599058508872986, -0.21602249145507812, -0.16605441272258759, -0.11608633399009705, -0.06611824035644531, -0.016150176525115967, 0.03381791710853577, 0.0837859958410263, 0.13375407457351685, 0.18372216820716858, 0.23369024693965912, 0.28365832567214966, 0.3336264193058014, 0.38359448313713074, 0.43356257677078247]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 5.0, 7.0, 10.0, 13.0, 12.0, 25.0, 32.0, 31.0, 44.0, 45.0, 37.0, 64.0, 84.0, 59.0, 67.0, 68.0, 67.0, 66.0, 56.0, 41.0, 34.0, 33.0, 25.0, 16.0, 16.0, 10.0, 9.0, 8.0, 6.0, 2.0, 2.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36810165643692017, -0.3520564138889313, -0.3360111713409424, -0.3199659585952759, -0.303920716047287, -0.2878754734992981, -0.2718302607536316, -0.2557850182056427, -0.2397397756576538, -0.22369453310966492, -0.20764930546283722, -0.19160407781600952, -0.17555883526802063, -0.15951359272003174, -0.14346836507320404, -0.12742313742637634, -0.11137789487838745, -0.09533265978097916, -0.07928742468357086, -0.06324218958616257, -0.04719695448875427, -0.031151719391345978, -0.015106484293937683, 0.0009387508034706116, 0.016983985900878906, 0.0330292209982872, 0.049074456095695496, 0.06511969119310379, 0.08116492629051208, 0.09721016138792038, 0.11325539648532867, 0.12930062413215637, 0.1453458070755005, 0.16139104962348938, 0.17743627727031708, 0.19348150491714478, 0.20952674746513367, 0.22557199001312256, 0.24161721765995026, 0.25766244530677795, 0.27370768785476685, 0.28975293040275574, 0.30579817295074463, 0.32184338569641113, 0.3378886282444, 0.3539338707923889, 0.3699790835380554, 0.3860243260860443, 0.4020695686340332, 0.4181148111820221, 0.434160053730011, 0.4502052664756775, 0.4662505090236664, 0.4822957515716553, 0.4983409643173218, 0.5143862366676331, 0.5304314494132996, 0.5464766621589661, 0.5625219345092773, 0.5785671472549438, 0.5946123600006104, 0.6106576323509216, 0.6267028450965881, 0.6427481174468994, 0.6587933301925659]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 4.0, 6.0, 20.0, 15.0, 23.0, 26.0, 44.0, 64.0, 75.0, 144.0, 190.0, 278.0, 454.0, 831.0, 1690.0, 4059.0, 13548.0, 84231.0, 550977.0, 335911.0, 41461.0, 8492.0, 2928.0, 1299.0, 665.0, 384.0, 223.0, 153.0, 91.0, 78.0, 58.0, 33.0, 21.0, 17.0, 13.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.420654296875, -0.40891265869140625, -0.3971710205078125, -0.38542938232421875, -0.373687744140625, -0.36194610595703125, -0.3502044677734375, -0.33846282958984375, -0.32672119140625, -0.31497955322265625, -0.3032379150390625, -0.29149627685546875, -0.279754638671875, -0.26801300048828125, -0.2562713623046875, -0.24452972412109375, -0.2327880859375, -0.22104644775390625, -0.2093048095703125, -0.19756317138671875, -0.185821533203125, -0.17407989501953125, -0.1623382568359375, -0.15059661865234375, -0.13885498046875, -0.12711334228515625, -0.1153717041015625, -0.10363006591796875, -0.091888427734375, -0.08014678955078125, -0.0684051513671875, -0.05666351318359375, -0.044921875, -0.03318023681640625, -0.0214385986328125, -0.00969696044921875, 0.002044677734375, 0.01378631591796875, 0.0255279541015625, 0.03726959228515625, 0.04901123046875, 0.06075286865234375, 0.0724945068359375, 0.08423614501953125, 0.095977783203125, 0.10771942138671875, 0.1194610595703125, 0.13120269775390625, 0.1429443359375, 0.15468597412109375, 0.1664276123046875, 0.17816925048828125, 0.189910888671875, 0.20165252685546875, 0.2133941650390625, 0.22513580322265625, 0.23687744140625, 0.24861907958984375, 0.2603607177734375, 0.27210235595703125, 0.283843994140625, 0.29558563232421875, 0.3073272705078125, 0.31906890869140625, 0.330810546875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 5.0, 8.0, 10.0, 21.0, 26.0, 37.0, 57.0, 76.0, 109.0, 120.0, 117.0, 98.0, 89.0, 62.0, 56.0, 41.0, 26.0, 12.0, 5.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06488800048828125, -0.0629425048828125, -0.06099700927734375, -0.059051513671875, -0.05710601806640625, -0.0551605224609375, -0.05321502685546875, -0.05126953125, -0.04932403564453125, -0.0473785400390625, -0.04543304443359375, -0.043487548828125, -0.04154205322265625, -0.0395965576171875, -0.03765106201171875, -0.03570556640625, -0.03376007080078125, -0.0318145751953125, -0.02986907958984375, -0.027923583984375, -0.02597808837890625, -0.0240325927734375, -0.02208709716796875, -0.0201416015625, -0.01819610595703125, -0.0162506103515625, -0.01430511474609375, -0.012359619140625, -0.01041412353515625, -0.0084686279296875, -0.00652313232421875, -0.00457763671875, -0.00263214111328125, -0.0006866455078125, 0.00125885009765625, 0.003204345703125, 0.00514984130859375, 0.0070953369140625, 0.00904083251953125, 0.010986328125, 0.01293182373046875, 0.0148773193359375, 0.01682281494140625, 0.018768310546875, 0.02071380615234375, 0.0226593017578125, 0.02460479736328125, 0.02655029296875, 0.02849578857421875, 0.0304412841796875, 0.03238677978515625, 0.034332275390625, 0.03627777099609375, 0.0382232666015625, 0.04016876220703125, 0.0421142578125, 0.04405975341796875, 0.0460052490234375, 0.04795074462890625, 0.049896240234375, 0.05184173583984375, 0.0537872314453125, 0.05573272705078125, 0.05767822265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 0.0, 3.0, 7.0, 14.0, 12.0, 18.0, 25.0, 47.0, 52.0, 95.0, 122.0, 178.0, 253.0, 433.0, 760.0, 1567.0, 3454.0, 12037.0, 69362.0, 456594.0, 423872.0, 61989.0, 10846.0, 3372.0, 1451.0, 765.0, 440.0, 238.0, 174.0, 107.0, 63.0, 52.0, 43.0, 28.0, 23.0, 15.0, 11.0, 12.0, 10.0, 1.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.32125091552734375, -0.3112030029296875, -0.30115509033203125, -0.291107177734375, -0.28105926513671875, -0.2710113525390625, -0.26096343994140625, -0.25091552734375, -0.24086761474609375, -0.2308197021484375, -0.22077178955078125, -0.210723876953125, -0.20067596435546875, -0.1906280517578125, -0.18058013916015625, -0.1705322265625, -0.16048431396484375, -0.1504364013671875, -0.14038848876953125, -0.130340576171875, -0.12029266357421875, -0.1102447509765625, -0.10019683837890625, -0.09014892578125, -0.08010101318359375, -0.0700531005859375, -0.06000518798828125, -0.049957275390625, -0.03990936279296875, -0.0298614501953125, -0.01981353759765625, -0.009765625, 0.00028228759765625, 0.0103302001953125, 0.02037811279296875, 0.030426025390625, 0.04047393798828125, 0.0505218505859375, 0.06056976318359375, 0.07061767578125, 0.08066558837890625, 0.0907135009765625, 0.10076141357421875, 0.110809326171875, 0.12085723876953125, 0.1309051513671875, 0.14095306396484375, 0.1510009765625, 0.16104888916015625, 0.1710968017578125, 0.18114471435546875, 0.191192626953125, 0.20124053955078125, 0.2112884521484375, 0.22133636474609375, 0.23138427734375, 0.24143218994140625, 0.2514801025390625, 0.26152801513671875, 0.271575927734375, 0.28162384033203125, 0.2916717529296875, 0.30171966552734375, 0.311767578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 9.0, 13.0, 10.0, 9.0, 11.0, 14.0, 24.0, 23.0, 29.0, 38.0, 34.0, 50.0, 35.0, 49.0, 40.0, 41.0, 54.0, 42.0, 36.0, 48.0, 41.0, 42.0, 48.0, 36.0, 54.0, 25.0, 27.0, 23.0, 19.0, 19.0, 11.0, 10.0, 11.0, 5.0, 8.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2353515625, -0.22888946533203125, -0.2224273681640625, -0.21596527099609375, -0.209503173828125, -0.20304107666015625, -0.1965789794921875, -0.19011688232421875, -0.18365478515625, -0.17719268798828125, -0.1707305908203125, -0.16426849365234375, -0.157806396484375, -0.15134429931640625, -0.1448822021484375, -0.13842010498046875, -0.1319580078125, -0.12549591064453125, -0.1190338134765625, -0.11257171630859375, -0.106109619140625, -0.09964752197265625, -0.0931854248046875, -0.08672332763671875, -0.08026123046875, -0.07379913330078125, -0.0673370361328125, -0.06087493896484375, -0.054412841796875, -0.04795074462890625, -0.0414886474609375, -0.03502655029296875, -0.028564453125, -0.02210235595703125, -0.0156402587890625, -0.00917816162109375, -0.002716064453125, 0.00374603271484375, 0.0102081298828125, 0.01667022705078125, 0.02313232421875, 0.02959442138671875, 0.0360565185546875, 0.04251861572265625, 0.048980712890625, 0.05544281005859375, 0.0619049072265625, 0.06836700439453125, 0.0748291015625, 0.08129119873046875, 0.0877532958984375, 0.09421539306640625, 0.100677490234375, 0.10713958740234375, 0.1136016845703125, 0.12006378173828125, 0.12652587890625, 0.13298797607421875, 0.1394500732421875, 0.14591217041015625, 0.152374267578125, 0.15883636474609375, 0.1652984619140625, 0.17176055908203125, 0.17822265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 5.0, 8.0, 5.0, 12.0, 9.0, 22.0, 14.0, 27.0, 29.0, 53.0, 126.0, 176.0, 392.0, 881.0, 2973.0, 17756.0, 563712.0, 443143.0, 14872.0, 2619.0, 813.0, 384.0, 192.0, 121.0, 69.0, 37.0, 24.0, 10.0, 10.0, 11.0, 15.0, 11.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4631690979003906, -0.44953155517578125, -0.4358940124511719, -0.4222564697265625, -0.4086189270019531, -0.39498138427734375, -0.3813438415527344, -0.367706298828125, -0.3540687561035156, -0.34043121337890625, -0.3267936706542969, -0.3131561279296875, -0.2995185852050781, -0.28588104248046875, -0.2722434997558594, -0.25860595703125, -0.24496841430664062, -0.23133087158203125, -0.21769332885742188, -0.2040557861328125, -0.19041824340820312, -0.17678070068359375, -0.16314315795898438, -0.149505615234375, -0.13586807250976562, -0.12223052978515625, -0.10859298706054688, -0.0949554443359375, -0.08131790161132812, -0.06768035888671875, -0.054042816162109375, -0.0404052734375, -0.026767730712890625, -0.01313018798828125, 0.000507354736328125, 0.0141448974609375, 0.027782440185546875, 0.04141998291015625, 0.055057525634765625, 0.068695068359375, 0.08233261108398438, 0.09597015380859375, 0.10960769653320312, 0.1232452392578125, 0.13688278198242188, 0.15052032470703125, 0.16415786743164062, 0.17779541015625, 0.19143295288085938, 0.20507049560546875, 0.21870803833007812, 0.2323455810546875, 0.24598312377929688, 0.25962066650390625, 0.2732582092285156, 0.286895751953125, 0.3005332946777344, 0.31417083740234375, 0.3278083801269531, 0.3414459228515625, 0.3550834655761719, 0.36872100830078125, 0.3823585510253906, 0.39599609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 5.0, 6.0, 3.0, 10.0, 17.0, 20.0, 25.0, 63.0, 82.0, 125.0, 168.0, 150.0, 108.0, 73.0, 51.0, 31.0, 9.0, 21.0, 13.0, 6.0, 5.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9173831939697266e-05, -4.787743091583252e-05, -4.6581029891967773e-05, -4.528462886810303e-05, -4.398822784423828e-05, -4.2691826820373535e-05, -4.139542579650879e-05, -4.009902477264404e-05, -3.88026237487793e-05, -3.750622272491455e-05, -3.6209821701049805e-05, -3.491342067718506e-05, -3.361701965332031e-05, -3.2320618629455566e-05, -3.102421760559082e-05, -2.9727816581726074e-05, -2.8431415557861328e-05, -2.7135014533996582e-05, -2.5838613510131836e-05, -2.454221248626709e-05, -2.3245811462402344e-05, -2.1949410438537598e-05, -2.065300941467285e-05, -1.9356608390808105e-05, -1.806020736694336e-05, -1.6763806343078613e-05, -1.5467405319213867e-05, -1.4171004295349121e-05, -1.2874603271484375e-05, -1.1578202247619629e-05, -1.0281801223754883e-05, -8.985400199890137e-06, -7.68899917602539e-06, -6.3925981521606445e-06, -5.0961971282958984e-06, -3.7997961044311523e-06, -2.5033950805664062e-06, -1.2069940567016602e-06, 8.940696716308594e-08, 1.385807991027832e-06, 2.682209014892578e-06, 3.978610038757324e-06, 5.27501106262207e-06, 6.571412086486816e-06, 7.867813110351562e-06, 9.164214134216309e-06, 1.0460615158081055e-05, 1.17570161819458e-05, 1.3053417205810547e-05, 1.4349818229675293e-05, 1.564621925354004e-05, 1.6942620277404785e-05, 1.823902130126953e-05, 1.9535422325134277e-05, 2.0831823348999023e-05, 2.212822437286377e-05, 2.3424625396728516e-05, 2.4721026420593262e-05, 2.6017427444458008e-05, 2.7313828468322754e-05, 2.86102294921875e-05, 2.9906630516052246e-05, 3.120303153991699e-05, 3.249943256378174e-05, 3.3795833587646484e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 4.0, 6.0, 11.0, 15.0, 16.0, 36.0, 60.0, 157.0, 426.0, 1198.0, 6955.0, 227340.0, 793024.0, 16142.0, 2094.0, 619.0, 234.0, 93.0, 51.0, 28.0, 15.0, 7.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4548301696777344, -0.43675994873046875, -0.4186897277832031, -0.4006195068359375, -0.3825492858886719, -0.36447906494140625, -0.3464088439941406, -0.328338623046875, -0.3102684020996094, -0.29219818115234375, -0.2741279602050781, -0.2560577392578125, -0.23798751831054688, -0.21991729736328125, -0.20184707641601562, -0.18377685546875, -0.16570663452148438, -0.14763641357421875, -0.12956619262695312, -0.1114959716796875, -0.09342575073242188, -0.07535552978515625, -0.057285308837890625, -0.039215087890625, -0.021144866943359375, -0.00307464599609375, 0.014995574951171875, 0.0330657958984375, 0.051136016845703125, 0.06920623779296875, 0.08727645874023438, 0.1053466796875, 0.12341690063476562, 0.14148712158203125, 0.15955734252929688, 0.1776275634765625, 0.19569778442382812, 0.21376800537109375, 0.23183822631835938, 0.249908447265625, 0.2679786682128906, 0.28604888916015625, 0.3041191101074219, 0.3221893310546875, 0.3402595520019531, 0.35832977294921875, 0.3763999938964844, 0.39447021484375, 0.4125404357910156, 0.43061065673828125, 0.4486808776855469, 0.4667510986328125, 0.4848213195800781, 0.5028915405273438, 0.5209617614746094, 0.539031982421875, 0.5571022033691406, 0.5751724243164062, 0.5932426452636719, 0.6113128662109375, 0.6293830871582031, 0.6474533081054688, 0.6655235290527344, 0.68359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 7.0, 13.0, 23.0, 28.0, 32.0, 51.0, 52.0, 77.0, 89.0, 86.0, 101.0, 86.0, 78.0, 74.0, 50.0, 41.0, 17.0, 17.0, 15.0, 13.0, 11.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12359619140625, -0.11888599395751953, -0.11417579650878906, -0.1094655990600586, -0.10475540161132812, -0.10004520416259766, -0.09533500671386719, -0.09062480926513672, -0.08591461181640625, -0.08120441436767578, -0.07649421691894531, -0.07178401947021484, -0.06707382202148438, -0.062363624572753906, -0.05765342712402344, -0.05294322967529297, -0.0482330322265625, -0.04352283477783203, -0.03881263732910156, -0.034102439880371094, -0.029392242431640625, -0.024682044982910156, -0.019971847534179688, -0.015261650085449219, -0.01055145263671875, -0.005841255187988281, -0.0011310577392578125, 0.0035791397094726562, 0.008289337158203125, 0.012999534606933594, 0.017709732055664062, 0.02241992950439453, 0.027130126953125, 0.03184032440185547, 0.03655052185058594, 0.041260719299316406, 0.045970916748046875, 0.050681114196777344, 0.05539131164550781, 0.06010150909423828, 0.06481170654296875, 0.06952190399169922, 0.07423210144042969, 0.07894229888916016, 0.08365249633789062, 0.0883626937866211, 0.09307289123535156, 0.09778308868408203, 0.1024932861328125, 0.10720348358154297, 0.11191368103027344, 0.1166238784790039, 0.12133407592773438, 0.12604427337646484, 0.1307544708251953, 0.13546466827392578, 0.14017486572265625, 0.14488506317138672, 0.1495952606201172, 0.15430545806884766, 0.15901565551757812, 0.1637258529663086, 0.16843605041503906, 0.17314624786376953, 0.1778564453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 11.0, 92.0, 480.0, 358.0, 54.0, 8.0, 3.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.306140899658203, -5.115708827972412, -4.925276756286621, -4.734844207763672, -4.544412136077881, -4.35398006439209, -4.163547992706299, -3.973115921020508, -3.782683849334717, -3.592251777648926, -3.4018194675445557, -3.2113873958587646, -3.0209553241729736, -2.8305230140686035, -2.6400909423828125, -2.4496588706970215, -2.2592265605926514, -2.0687944889068604, -1.8783622980117798, -1.6879301071166992, -1.4974980354309082, -1.3070658445358276, -1.116633653640747, -0.926201581954956, -0.7357693910598755, -0.5453372597694397, -0.3549050986766815, -0.16447293758392334, 0.02595919370651245, 0.21639132499694824, 0.4068235158920288, 0.5972555875778198, 0.7876877784729004, 0.9781199097633362, 1.168552041053772, 1.3589842319488525, 1.5494163036346436, 1.7398484945297241, 1.9302806854248047, 2.1207127571105957, 2.3111448287963867, 2.5015769004821777, 2.692009210586548, 2.882441282272339, 3.07287335395813, 3.2633056640625, 3.453737735748291, 3.644169807434082, 3.834602117538452, 4.025034427642822, 4.215466499328613, 4.405898571014404, 4.596330642700195, 4.786762714385986, 4.977194786071777, 5.167627334594727, 5.358059406280518, 5.548491477966309, 5.7389235496521, 5.929355621337891, 6.11978816986084, 6.310220241546631, 6.500652313232422, 6.691084384918213, 6.881516456604004]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 8.0, 7.0, 15.0, 14.0, 10.0, 13.0, 21.0, 21.0, 29.0, 42.0, 39.0, 43.0, 38.0, 40.0, 39.0, 49.0, 55.0, 44.0, 43.0, 53.0, 43.0, 54.0, 40.0, 37.0, 30.0, 33.0, 29.0, 22.0, 20.0, 18.0, 10.0, 5.0, 6.0, 4.0, 3.0, 0.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3532865047454834, -1.3094385862350464, -1.2655906677246094, -1.2217426300048828, -1.1778947114944458, -1.1340467929840088, -1.0901988744735718, -1.0463509559631348, -1.0025029182434082, -0.9586549997329712, -0.9148070216178894, -0.8709591031074524, -0.8271111249923706, -0.7832632064819336, -0.7394152879714966, -0.6955673694610596, -0.6517194509506226, -0.6078715324401855, -0.5640235543251038, -0.5201756358146667, -0.47632768750190735, -0.43247973918914795, -0.38863182067871094, -0.34478387236595154, -0.30093592405319214, -0.25708797574043274, -0.21324004232883453, -0.16939210891723633, -0.12554416060447693, -0.08169621229171753, -0.03784829378128052, 0.005999654531478882, 0.04984772205352783, 0.09369566291570663, 0.13754360377788544, 0.18139153718948364, 0.22523948550224304, 0.26908743381500244, 0.31293535232543945, 0.35678330063819885, 0.40063124895095825, 0.44447919726371765, 0.48832714557647705, 0.5321750640869141, 0.5760229825973511, 0.6198709607124329, 0.6637188792228699, 0.7075668573379517, 0.7514147758483887, 0.7952626943588257, 0.8391106724739075, 0.8829585909843445, 0.9268065690994263, 0.9706544876098633, 1.0145024061203003, 1.0583503246307373, 1.1021983623504639, 1.1460462808609009, 1.189894199371338, 1.2337422370910645, 1.2775901556015015, 1.3214380741119385, 1.3652859926223755, 1.4091339111328125, 1.4529818296432495]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 10.0, 15.0, 23.0, 22.0, 46.0, 66.0, 80.0, 166.0, 268.0, 664.0, 1486.0, 4589.0, 21898.0, 298717.0, 3760895.0, 88488.0, 11304.0, 3045.0, 1175.0, 578.0, 324.0, 169.0, 98.0, 42.0, 31.0, 19.0, 16.0, 10.0, 6.0, 7.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.625, -0.6082496643066406, -0.5914993286132812, -0.5747489929199219, -0.5579986572265625, -0.5412483215332031, -0.5244979858398438, -0.5077476501464844, -0.490997314453125, -0.4742469787597656, -0.45749664306640625, -0.4407463073730469, -0.4239959716796875, -0.4072456359863281, -0.39049530029296875, -0.3737449645996094, -0.35699462890625, -0.3402442932128906, -0.32349395751953125, -0.3067436218261719, -0.2899932861328125, -0.2732429504394531, -0.25649261474609375, -0.23974227905273438, -0.222991943359375, -0.20624160766601562, -0.18949127197265625, -0.17274093627929688, -0.1559906005859375, -0.13924026489257812, -0.12248992919921875, -0.10573959350585938, -0.0889892578125, -0.07223892211914062, -0.05548858642578125, -0.038738250732421875, -0.0219879150390625, -0.005237579345703125, 0.01151275634765625, 0.028263092041015625, 0.045013427734375, 0.061763763427734375, 0.07851409912109375, 0.09526443481445312, 0.1120147705078125, 0.12876510620117188, 0.14551544189453125, 0.16226577758789062, 0.17901611328125, 0.19576644897460938, 0.21251678466796875, 0.22926712036132812, 0.2460174560546875, 0.2627677917480469, 0.27951812744140625, 0.2962684631347656, 0.313018798828125, 0.3297691345214844, 0.34651947021484375, 0.3632698059082031, 0.3800201416015625, 0.3967704772949219, 0.41352081298828125, 0.4302711486816406, 0.447021484375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 9.0, 8.0, 17.0, 17.0, 23.0, 24.0, 37.0, 55.0, 70.0, 82.0, 85.0, 89.0, 86.0, 85.0, 60.0, 41.0, 61.0, 48.0, 27.0, 23.0, 12.0, 11.0, 5.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.061187744140625, -0.05932426452636719, -0.057460784912109375, -0.05559730529785156, -0.05373382568359375, -0.05187034606933594, -0.050006866455078125, -0.04814338684082031, -0.0462799072265625, -0.04441642761230469, -0.042552947998046875, -0.04068946838378906, -0.03882598876953125, -0.03696250915527344, -0.035099029541015625, -0.03323554992675781, -0.0313720703125, -0.029508590698242188, -0.027645111083984375, -0.025781631469726562, -0.02391815185546875, -0.022054672241210938, -0.020191192626953125, -0.018327713012695312, -0.0164642333984375, -0.014600753784179688, -0.012737274169921875, -0.010873794555664062, -0.00901031494140625, -0.0071468353271484375, -0.005283355712890625, -0.0034198760986328125, -0.001556396484375, 0.0003070831298828125, 0.002170562744140625, 0.0040340423583984375, 0.00589752197265625, 0.0077610015869140625, 0.009624481201171875, 0.011487960815429688, 0.0133514404296875, 0.015214920043945312, 0.017078399658203125, 0.018941879272460938, 0.02080535888671875, 0.022668838500976562, 0.024532318115234375, 0.026395797729492188, 0.02825927734375, 0.030122756958007812, 0.031986236572265625, 0.03384971618652344, 0.03571319580078125, 0.03757667541503906, 0.039440155029296875, 0.04130363464355469, 0.0431671142578125, 0.04503059387207031, 0.046894073486328125, 0.04875755310058594, 0.05062103271484375, 0.05248451232910156, 0.054347991943359375, 0.05621147155761719, 0.058074951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 10.0, 8.0, 9.0, 15.0, 19.0, 33.0, 70.0, 122.0, 299.0, 638.0, 1864.0, 9278.0, 115953.0, 3854047.0, 196406.0, 11823.0, 2331.0, 700.0, 283.0, 136.0, 83.0, 53.0, 38.0, 24.0, 7.0, 10.0, 4.0, 2.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5162353515625, -0.498779296875, -0.4813232421875, -0.4638671875, -0.4464111328125, -0.428955078125, -0.4114990234375, -0.39404296875, -0.3765869140625, -0.359130859375, -0.3416748046875, -0.32421875, -0.3067626953125, -0.289306640625, -0.2718505859375, -0.25439453125, -0.2369384765625, -0.219482421875, -0.2020263671875, -0.1845703125, -0.1671142578125, -0.149658203125, -0.1322021484375, -0.11474609375, -0.0972900390625, -0.079833984375, -0.0623779296875, -0.044921875, -0.0274658203125, -0.010009765625, 0.0074462890625, 0.02490234375, 0.0423583984375, 0.059814453125, 0.0772705078125, 0.0947265625, 0.1121826171875, 0.129638671875, 0.1470947265625, 0.16455078125, 0.1820068359375, 0.199462890625, 0.2169189453125, 0.234375, 0.2518310546875, 0.269287109375, 0.2867431640625, 0.30419921875, 0.3216552734375, 0.339111328125, 0.3565673828125, 0.3740234375, 0.3914794921875, 0.408935546875, 0.4263916015625, 0.44384765625, 0.4613037109375, 0.478759765625, 0.4962158203125, 0.513671875, 0.5311279296875, 0.548583984375, 0.5660400390625, 0.58349609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 6.0, 6.0, 4.0, 14.0, 13.0, 18.0, 24.0, 27.0, 47.0, 73.0, 94.0, 179.0, 281.0, 597.0, 1315.0, 583.0, 283.0, 190.0, 114.0, 64.0, 42.0, 33.0, 13.0, 12.0, 7.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08587646484375, -0.08338642120361328, -0.08089637756347656, -0.07840633392333984, -0.07591629028320312, -0.0734262466430664, -0.07093620300292969, -0.06844615936279297, -0.06595611572265625, -0.06346607208251953, -0.06097602844238281, -0.058485984802246094, -0.055995941162109375, -0.053505897521972656, -0.05101585388183594, -0.04852581024169922, -0.0460357666015625, -0.04354572296142578, -0.04105567932128906, -0.038565635681152344, -0.036075592041015625, -0.033585548400878906, -0.031095504760742188, -0.02860546112060547, -0.02611541748046875, -0.02362537384033203, -0.021135330200195312, -0.018645286560058594, -0.016155242919921875, -0.013665199279785156, -0.011175155639648438, -0.008685111999511719, -0.006195068359375, -0.0037050247192382812, -0.0012149810791015625, 0.0012750625610351562, 0.003765106201171875, 0.006255149841308594, 0.008745193481445312, 0.011235237121582031, 0.01372528076171875, 0.01621532440185547, 0.018705368041992188, 0.021195411682128906, 0.023685455322265625, 0.026175498962402344, 0.028665542602539062, 0.03115558624267578, 0.0336456298828125, 0.03613567352294922, 0.03862571716308594, 0.041115760803222656, 0.043605804443359375, 0.046095848083496094, 0.04858589172363281, 0.05107593536376953, 0.05356597900390625, 0.05605602264404297, 0.05854606628417969, 0.061036109924316406, 0.06352615356445312, 0.06601619720458984, 0.06850624084472656, 0.07099628448486328, 0.073486328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 15.0, 26.0, 105.0, 210.0, 305.0, 221.0, 85.0, 31.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1512868404388428, -1.1198092699050903, -1.0883318185806274, -1.056854248046875, -1.025376796722412, -0.9938992261886597, -0.962421715259552, -0.9309442043304443, -0.8994666337966919, -0.8679891228675842, -0.8365116119384766, -0.8050340414047241, -0.7735565304756165, -0.7420790195465088, -0.7106015086174011, -0.6791239976882935, -0.6476464867591858, -0.6161689758300781, -0.5846914649009705, -0.5532139539718628, -0.5217363834381104, -0.4902588725090027, -0.458781361579895, -0.42730385065078735, -0.3958263099193573, -0.36434879899024963, -0.3328712582588196, -0.3013937473297119, -0.26991623640060425, -0.2384386956691742, -0.20696118474006653, -0.17548365890979767, -0.1440061330795288, -0.11252860724925995, -0.08105108886957169, -0.04957357048988342, -0.018096044659614563, 0.013381481170654297, 0.04485899209976196, 0.07633651793003082, 0.10781404376029968, 0.13929156959056854, 0.1707690954208374, 0.20224660634994507, 0.23372413218021393, 0.2652016580104828, 0.29667916893959045, 0.3281567096710205, 0.3596342206001282, 0.39111173152923584, 0.4225892722606659, 0.45406678318977356, 0.4855443239212036, 0.5170218348503113, 0.548499345779419, 0.5799768567085266, 0.6114543676376343, 0.6429318785667419, 0.6744093894958496, 0.705886960029602, 0.7373644709587097, 0.7688419818878174, 0.800319492816925, 0.8317970037460327, 0.8632745742797852]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 5.0, 11.0, 9.0, 17.0, 11.0, 30.0, 19.0, 19.0, 49.0, 43.0, 47.0, 58.0, 51.0, 60.0, 57.0, 60.0, 50.0, 65.0, 41.0, 63.0, 34.0, 47.0, 33.0, 35.0, 18.0, 15.0, 19.0, 10.0, 11.0, 2.0, 6.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25104695558547974, -0.2399238795042038, -0.22880080342292786, -0.21767771244049072, -0.20655465126037598, -0.19543156027793884, -0.1843084841966629, -0.17318540811538696, -0.16206233203411102, -0.15093925595283508, -0.13981617987155914, -0.1286931037902832, -0.11757002025842667, -0.10644694417715073, -0.09532386064529419, -0.08420078456401825, -0.07307770848274231, -0.06195463240146637, -0.05083155259490013, -0.03970847278833389, -0.028585396707057953, -0.017462320625782013, -0.006339237093925476, 0.004783838987350464, 0.015906915068626404, 0.027029993012547493, 0.03815307095646858, 0.04927615076303482, 0.06039922684431076, 0.0715223029255867, 0.08264538645744324, 0.09376846253871918, 0.10489153861999512, 0.11601461470127106, 0.127137690782547, 0.13826078176498413, 0.14938384294509888, 0.160506933927536, 0.17163001000881195, 0.1827530860900879, 0.19387616217136383, 0.20499923825263977, 0.2161223143339157, 0.22724539041519165, 0.23836848139762878, 0.24949154257774353, 0.26061463356018066, 0.2717376947402954, 0.28286078572273254, 0.2939838767051697, 0.3051069378852844, 0.31623002886772156, 0.3273530900478363, 0.33847618103027344, 0.3495992422103882, 0.3607223331928253, 0.37184542417526245, 0.3829685151576996, 0.39409157633781433, 0.40521466732025146, 0.4163377285003662, 0.42746081948280334, 0.4385839104652405, 0.4497069716453552, 0.46083003282546997]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 2.0, 3.0, 5.0, 12.0, 6.0, 14.0, 20.0, 34.0, 35.0, 73.0, 96.0, 135.0, 238.0, 412.0, 704.0, 1308.0, 3202.0, 10608.0, 49300.0, 276013.0, 525649.0, 143641.0, 26111.0, 6278.0, 2156.0, 1063.0, 540.0, 310.0, 202.0, 113.0, 84.0, 59.0, 36.0, 28.0, 18.0, 17.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2502861022949219, -0.24202728271484375, -0.23376846313476562, -0.2255096435546875, -0.21725082397460938, -0.20899200439453125, -0.20073318481445312, -0.192474365234375, -0.18421554565429688, -0.17595672607421875, -0.16769790649414062, -0.1594390869140625, -0.15118026733398438, -0.14292144775390625, -0.13466262817382812, -0.12640380859375, -0.11814498901367188, -0.10988616943359375, -0.10162734985351562, -0.0933685302734375, -0.08510971069335938, -0.07685089111328125, -0.06859207153320312, -0.060333251953125, -0.052074432373046875, -0.04381561279296875, -0.035556793212890625, -0.0272979736328125, -0.019039154052734375, -0.01078033447265625, -0.002521514892578125, 0.0057373046875, 0.013996124267578125, 0.02225494384765625, 0.030513763427734375, 0.0387725830078125, 0.047031402587890625, 0.05529022216796875, 0.06354904174804688, 0.071807861328125, 0.08006668090820312, 0.08832550048828125, 0.09658432006835938, 0.1048431396484375, 0.11310195922851562, 0.12136077880859375, 0.12961959838867188, 0.13787841796875, 0.14613723754882812, 0.15439605712890625, 0.16265487670898438, 0.1709136962890625, 0.17917251586914062, 0.18743133544921875, 0.19569015502929688, 0.203948974609375, 0.21220779418945312, 0.22046661376953125, 0.22872543334960938, 0.2369842529296875, 0.24524307250976562, 0.25350189208984375, 0.2617607116699219, 0.27001953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 9.0, 14.0, 23.0, 15.0, 29.0, 53.0, 84.0, 90.0, 99.0, 100.0, 87.0, 91.0, 67.0, 62.0, 56.0, 32.0, 29.0, 16.0, 8.0, 6.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06402587890625, -0.06195068359375, -0.05987548828125, -0.05780029296875, -0.05572509765625, -0.05364990234375, -0.05157470703125, -0.04949951171875, -0.04742431640625, -0.04534912109375, -0.04327392578125, -0.04119873046875, -0.03912353515625, -0.03704833984375, -0.03497314453125, -0.03289794921875, -0.03082275390625, -0.02874755859375, -0.02667236328125, -0.02459716796875, -0.02252197265625, -0.02044677734375, -0.01837158203125, -0.01629638671875, -0.01422119140625, -0.01214599609375, -0.01007080078125, -0.00799560546875, -0.00592041015625, -0.00384521484375, -0.00177001953125, 0.00030517578125, 0.00238037109375, 0.00445556640625, 0.00653076171875, 0.00860595703125, 0.01068115234375, 0.01275634765625, 0.01483154296875, 0.01690673828125, 0.01898193359375, 0.02105712890625, 0.02313232421875, 0.02520751953125, 0.02728271484375, 0.02935791015625, 0.03143310546875, 0.03350830078125, 0.03558349609375, 0.03765869140625, 0.03973388671875, 0.04180908203125, 0.04388427734375, 0.04595947265625, 0.04803466796875, 0.05010986328125, 0.05218505859375, 0.05426025390625, 0.05633544921875, 0.05841064453125, 0.06048583984375, 0.06256103515625, 0.06463623046875, 0.06671142578125, 0.06878662109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 14.0, 6.0, 17.0, 27.0, 26.0, 36.0, 41.0, 48.0, 74.0, 104.0, 191.0, 243.0, 380.0, 715.0, 1220.0, 2428.0, 6462.0, 23213.0, 116931.0, 453676.0, 345451.0, 72468.0, 15438.0, 4793.0, 1981.0, 978.0, 555.0, 320.0, 210.0, 143.0, 92.0, 74.0, 63.0, 35.0, 22.0, 16.0, 19.0, 12.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.244140625, -0.23647689819335938, -0.22881317138671875, -0.22114944458007812, -0.2134857177734375, -0.20582199096679688, -0.19815826416015625, -0.19049453735351562, -0.182830810546875, -0.17516708374023438, -0.16750335693359375, -0.15983963012695312, -0.1521759033203125, -0.14451217651367188, -0.13684844970703125, -0.12918472290039062, -0.12152099609375, -0.11385726928710938, -0.10619354248046875, -0.09852981567382812, -0.0908660888671875, -0.08320236206054688, -0.07553863525390625, -0.06787490844726562, -0.060211181640625, -0.052547454833984375, -0.04488372802734375, -0.037220001220703125, -0.0295562744140625, -0.021892547607421875, -0.01422882080078125, -0.006565093994140625, 0.0010986328125, 0.008762359619140625, 0.01642608642578125, 0.024089813232421875, 0.0317535400390625, 0.039417266845703125, 0.04708099365234375, 0.054744720458984375, 0.062408447265625, 0.07007217407226562, 0.07773590087890625, 0.08539962768554688, 0.0930633544921875, 0.10072708129882812, 0.10839080810546875, 0.11605453491210938, 0.12371826171875, 0.13138198852539062, 0.13904571533203125, 0.14670944213867188, 0.1543731689453125, 0.16203689575195312, 0.16970062255859375, 0.17736434936523438, 0.185028076171875, 0.19269180297851562, 0.20035552978515625, 0.20801925659179688, 0.2156829833984375, 0.22334671020507812, 0.23101043701171875, 0.23867416381835938, 0.246337890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 7.0, 15.0, 20.0, 24.0, 16.0, 25.0, 30.0, 30.0, 42.0, 39.0, 39.0, 55.0, 46.0, 41.0, 52.0, 50.0, 45.0, 46.0, 34.0, 53.0, 32.0, 39.0, 32.0, 32.0, 22.0, 16.0, 17.0, 16.0, 11.0, 14.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.239990234375, -0.2331085205078125, -0.226226806640625, -0.2193450927734375, -0.21246337890625, -0.2055816650390625, -0.198699951171875, -0.1918182373046875, -0.1849365234375, -0.1780548095703125, -0.171173095703125, -0.1642913818359375, -0.15740966796875, -0.1505279541015625, -0.143646240234375, -0.1367645263671875, -0.1298828125, -0.1230010986328125, -0.116119384765625, -0.1092376708984375, -0.10235595703125, -0.0954742431640625, -0.088592529296875, -0.0817108154296875, -0.0748291015625, -0.0679473876953125, -0.061065673828125, -0.0541839599609375, -0.04730224609375, -0.0404205322265625, -0.033538818359375, -0.0266571044921875, -0.019775390625, -0.0128936767578125, -0.006011962890625, 0.0008697509765625, 0.00775146484375, 0.0146331787109375, 0.021514892578125, 0.0283966064453125, 0.0352783203125, 0.0421600341796875, 0.049041748046875, 0.0559234619140625, 0.06280517578125, 0.0696868896484375, 0.076568603515625, 0.0834503173828125, 0.09033203125, 0.0972137451171875, 0.104095458984375, 0.1109771728515625, 0.11785888671875, 0.1247406005859375, 0.131622314453125, 0.1385040283203125, 0.1453857421875, 0.1522674560546875, 0.159149169921875, 0.1660308837890625, 0.17291259765625, 0.1797943115234375, 0.186676025390625, 0.1935577392578125, 0.200439453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 11.0, 17.0, 24.0, 27.0, 54.0, 83.0, 135.0, 278.0, 467.0, 1027.0, 2692.0, 9393.0, 50923.0, 469536.0, 450985.0, 49273.0, 8872.0, 2577.0, 1059.0, 465.0, 263.0, 135.0, 90.0, 55.0, 34.0, 20.0, 15.0, 11.0, 10.0, 3.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1629638671875, -0.15802383422851562, -0.15308380126953125, -0.14814376831054688, -0.1432037353515625, -0.13826370239257812, -0.13332366943359375, -0.12838363647460938, -0.123443603515625, -0.11850357055664062, -0.11356353759765625, -0.10862350463867188, -0.1036834716796875, -0.09874343872070312, -0.09380340576171875, -0.08886337280273438, -0.08392333984375, -0.07898330688476562, -0.07404327392578125, -0.06910324096679688, -0.0641632080078125, -0.059223175048828125, -0.05428314208984375, -0.049343109130859375, -0.044403076171875, -0.039463043212890625, -0.03452301025390625, -0.029582977294921875, -0.0246429443359375, -0.019702911376953125, -0.01476287841796875, -0.009822845458984375, -0.0048828125, 5.7220458984375e-05, 0.00499725341796875, 0.009937286376953125, 0.0148773193359375, 0.019817352294921875, 0.02475738525390625, 0.029697418212890625, 0.034637451171875, 0.039577484130859375, 0.04451751708984375, 0.049457550048828125, 0.0543975830078125, 0.059337615966796875, 0.06427764892578125, 0.06921768188476562, 0.07415771484375, 0.07909774780273438, 0.08403778076171875, 0.08897781372070312, 0.0939178466796875, 0.09885787963867188, 0.10379791259765625, 0.10873794555664062, 0.113677978515625, 0.11861801147460938, 0.12355804443359375, 0.12849807739257812, 0.1334381103515625, 0.13837814331054688, 0.14331817626953125, 0.14825820922851562, 0.1531982421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 11.0, 9.0, 12.0, 15.0, 12.0, 20.0, 29.0, 51.0, 38.0, 74.0, 83.0, 97.0, 101.0, 105.0, 66.0, 76.0, 43.0, 37.0, 25.0, 15.0, 15.0, 10.0, 14.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.3365020751953125e-05, -2.2739171981811523e-05, -2.2113323211669922e-05, -2.148747444152832e-05, -2.086162567138672e-05, -2.0235776901245117e-05, -1.9609928131103516e-05, -1.8984079360961914e-05, -1.8358230590820312e-05, -1.773238182067871e-05, -1.710653305053711e-05, -1.6480684280395508e-05, -1.5854835510253906e-05, -1.5228986740112305e-05, -1.4603137969970703e-05, -1.3977289199829102e-05, -1.33514404296875e-05, -1.2725591659545898e-05, -1.2099742889404297e-05, -1.1473894119262695e-05, -1.0848045349121094e-05, -1.0222196578979492e-05, -9.59634780883789e-06, -8.970499038696289e-06, -8.344650268554688e-06, -7.718801498413086e-06, -7.092952728271484e-06, -6.467103958129883e-06, -5.841255187988281e-06, -5.21540641784668e-06, -4.589557647705078e-06, -3.9637088775634766e-06, -3.337860107421875e-06, -2.7120113372802734e-06, -2.086162567138672e-06, -1.4603137969970703e-06, -8.344650268554688e-07, -2.086162567138672e-07, 4.172325134277344e-07, 1.043081283569336e-06, 1.6689300537109375e-06, 2.294778823852539e-06, 2.9206275939941406e-06, 3.546476364135742e-06, 4.172325134277344e-06, 4.798173904418945e-06, 5.424022674560547e-06, 6.0498714447021484e-06, 6.67572021484375e-06, 7.3015689849853516e-06, 7.927417755126953e-06, 8.553266525268555e-06, 9.179115295410156e-06, 9.804964065551758e-06, 1.043081283569336e-05, 1.1056661605834961e-05, 1.1682510375976562e-05, 1.2308359146118164e-05, 1.2934207916259766e-05, 1.3560056686401367e-05, 1.4185905456542969e-05, 1.481175422668457e-05, 1.5437602996826172e-05, 1.6063451766967773e-05, 1.6689300537109375e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 3.0, 8.0, 11.0, 19.0, 13.0, 22.0, 43.0, 62.0, 100.0, 169.0, 290.0, 534.0, 1139.0, 3012.0, 10969.0, 59976.0, 496515.0, 413129.0, 48432.0, 9258.0, 2608.0, 1022.0, 512.0, 266.0, 164.0, 94.0, 52.0, 35.0, 24.0, 18.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15185546875, -0.14694786071777344, -0.14204025268554688, -0.1371326446533203, -0.13222503662109375, -0.1273174285888672, -0.12240982055664062, -0.11750221252441406, -0.1125946044921875, -0.10768699645996094, -0.10277938842773438, -0.09787178039550781, -0.09296417236328125, -0.08805656433105469, -0.08314895629882812, -0.07824134826660156, -0.073333740234375, -0.06842613220214844, -0.06351852416992188, -0.05861091613769531, -0.05370330810546875, -0.04879570007324219, -0.043888092041015625, -0.03898048400878906, -0.0340728759765625, -0.029165267944335938, -0.024257659912109375, -0.019350051879882812, -0.01444244384765625, -0.009534835815429688, -0.004627227783203125, 0.0002803802490234375, 0.00518798828125, 0.010095596313476562, 0.015003204345703125, 0.019910812377929688, 0.02481842041015625, 0.029726028442382812, 0.034633636474609375, 0.03954124450683594, 0.0444488525390625, 0.04935646057128906, 0.054264068603515625, 0.05917167663574219, 0.06407928466796875, 0.06898689270019531, 0.07389450073242188, 0.07880210876464844, 0.083709716796875, 0.08861732482910156, 0.09352493286132812, 0.09843254089355469, 0.10334014892578125, 0.10824775695800781, 0.11315536499023438, 0.11806297302246094, 0.1229705810546875, 0.12787818908691406, 0.13278579711914062, 0.1376934051513672, 0.14260101318359375, 0.1475086212158203, 0.15241622924804688, 0.15732383728027344, 0.1622314453125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 10.0, 11.0, 14.0, 14.0, 16.0, 42.0, 33.0, 57.0, 91.0, 100.0, 108.0, 93.0, 90.0, 93.0, 65.0, 49.0, 39.0, 22.0, 16.0, 8.0, 10.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102783203125, -0.09895896911621094, -0.09513473510742188, -0.09131050109863281, -0.08748626708984375, -0.08366203308105469, -0.07983779907226562, -0.07601356506347656, -0.0721893310546875, -0.06836509704589844, -0.06454086303710938, -0.06071662902832031, -0.05689239501953125, -0.05306816101074219, -0.049243927001953125, -0.04541969299316406, -0.041595458984375, -0.03777122497558594, -0.033946990966796875, -0.030122756958007812, -0.02629852294921875, -0.022474288940429688, -0.018650054931640625, -0.014825820922851562, -0.0110015869140625, -0.0071773529052734375, -0.003353118896484375, 0.0004711151123046875, 0.00429534912109375, 0.008119583129882812, 0.011943817138671875, 0.015768051147460938, 0.01959228515625, 0.023416519165039062, 0.027240753173828125, 0.031064987182617188, 0.03488922119140625, 0.03871345520019531, 0.042537689208984375, 0.04636192321777344, 0.0501861572265625, 0.05401039123535156, 0.057834625244140625, 0.06165885925292969, 0.06548309326171875, 0.06930732727050781, 0.07313156127929688, 0.07695579528808594, 0.080780029296875, 0.08460426330566406, 0.08842849731445312, 0.09225273132324219, 0.09607696533203125, 0.09990119934082031, 0.10372543334960938, 0.10754966735839844, 0.1113739013671875, 0.11519813537597656, 0.11902236938476562, 0.12284660339355469, 0.12667083740234375, 0.1304950714111328, 0.13431930541992188, 0.13814353942871094, 0.1419677734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 15.0, 15.0, 75.0, 161.0, 250.0, 255.0, 116.0, 56.0, 24.0, 15.0, 13.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.98941969871521, -1.9183576107025146, -1.8472955226898193, -1.776233434677124, -1.7051713466644287, -1.6341092586517334, -1.5630472898483276, -1.4919852018356323, -1.420923113822937, -1.3498610258102417, -1.2787989377975464, -1.207736849784851, -1.1366748809814453, -1.06561279296875, -0.9945507049560547, -0.9234886169433594, -0.8524265289306641, -0.7813644409179688, -0.7103023529052734, -0.6392403244972229, -0.5681782364845276, -0.4971161484718323, -0.42605409026145935, -0.3549920320510864, -0.2839299440383911, -0.212867870926857, -0.14180579781532288, -0.07074372470378876, 0.00031834840774536133, 0.07138043642044067, 0.1424424946308136, 0.21350455284118652, 0.28456687927246094, 0.35562896728515625, 0.4266910254955292, 0.4977530837059021, 0.5688151717185974, 0.6398772597312927, 0.7109392881393433, 0.7820013761520386, 0.8530634641647339, 0.9241255521774292, 0.9951876401901245, 1.0662497282028198, 1.1373116970062256, 1.208373785018921, 1.2794358730316162, 1.3504979610443115, 1.4215600490570068, 1.4926221370697021, 1.5636842250823975, 1.6347463130950928, 1.705808401107788, 1.7768704891204834, 1.8479324579238892, 1.9189945459365845, 1.9900566339492798, 2.0611186027526855, 2.132180690765381, 2.203242778778076, 2.2743048667907715, 2.345366954803467, 2.416429042816162, 2.4874911308288574, 2.5585532188415527]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 4.0, 7.0, 12.0, 13.0, 19.0, 21.0, 31.0, 32.0, 49.0, 42.0, 35.0, 46.0, 45.0, 53.0, 47.0, 46.0, 51.0, 62.0, 47.0, 54.0, 40.0, 43.0, 29.0, 19.0, 25.0, 17.0, 22.0, 16.0, 13.0, 9.0, 7.0, 6.0, 1.0, 4.0, 7.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4216700792312622, -1.3776602745056152, -1.3336503505706787, -1.2896405458450317, -1.2456307411193848, -1.2016208171844482, -1.1576110124588013, -1.1136012077331543, -1.0695912837982178, -1.0255814790725708, -0.9815715551376343, -0.9375617504119873, -0.8935518860816956, -0.8495420217514038, -0.8055322170257568, -0.7615223526954651, -0.7175124883651733, -0.6735026240348816, -0.6294927597045898, -0.5854829549789429, -0.5414730906486511, -0.4974632263183594, -0.45345339179039, -0.40944355726242065, -0.3654336929321289, -0.32142382860183716, -0.2774139940738678, -0.23340414464473724, -0.1893942952156067, -0.14538444578647614, -0.10137459635734558, -0.05736476182937622, -0.013354778289794922, 0.030655071139335632, 0.07466492056846619, 0.11867476999759674, 0.1626846194267273, 0.20669446885585785, 0.2507043182849884, 0.29471415281295776, 0.3387240171432495, 0.38273388147354126, 0.4267437160015106, 0.47075355052948, 0.5147634148597717, 0.5587732791900635, 0.6027830839157104, 0.6467929482460022, 0.690802812576294, 0.7348126769065857, 0.7788225412368774, 0.8228323459625244, 0.8668422102928162, 0.9108520746231079, 0.9548618793487549, 0.9988717436790466, 1.0428816080093384, 1.0868914127349854, 1.1309013366699219, 1.1749111413955688, 1.2189209461212158, 1.2629308700561523, 1.3069406747817993, 1.3509504795074463, 1.3949604034423828]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 8.0, 8.0, 11.0, 12.0, 17.0, 22.0, 44.0, 88.0, 129.0, 206.0, 460.0, 915.0, 2429.0, 8204.0, 42957.0, 1172054.0, 2898862.0, 53431.0, 9621.0, 2701.0, 959.0, 495.0, 246.0, 160.0, 84.0, 50.0, 31.0, 23.0, 17.0, 11.0, 6.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.422607421875, -0.4117851257324219, -0.40096282958984375, -0.3901405334472656, -0.3793182373046875, -0.3684959411621094, -0.35767364501953125, -0.3468513488769531, -0.336029052734375, -0.3252067565917969, -0.31438446044921875, -0.3035621643066406, -0.2927398681640625, -0.2819175720214844, -0.27109527587890625, -0.2602729797363281, -0.24945068359375, -0.23862838745117188, -0.22780609130859375, -0.21698379516601562, -0.2061614990234375, -0.19533920288085938, -0.18451690673828125, -0.17369461059570312, -0.162872314453125, -0.15205001831054688, -0.14122772216796875, -0.13040542602539062, -0.1195831298828125, -0.10876083374023438, -0.09793853759765625, -0.08711624145507812, -0.0762939453125, -0.06547164916992188, -0.05464935302734375, -0.043827056884765625, -0.0330047607421875, -0.022182464599609375, -0.01136016845703125, -0.000537872314453125, 0.010284423828125, 0.021106719970703125, 0.03192901611328125, 0.042751312255859375, 0.0535736083984375, 0.06439590454101562, 0.07521820068359375, 0.08604049682617188, 0.09686279296875, 0.10768508911132812, 0.11850738525390625, 0.12932968139648438, 0.1401519775390625, 0.15097427368164062, 0.16179656982421875, 0.17261886596679688, 0.183441162109375, 0.19426345825195312, 0.20508575439453125, 0.21590805053710938, 0.2267303466796875, 0.23755264282226562, 0.24837493896484375, 0.2591972351074219, 0.27001953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 8.0, 8.0, 10.0, 17.0, 22.0, 33.0, 39.0, 46.0, 59.0, 73.0, 86.0, 82.0, 82.0, 86.0, 65.0, 62.0, 59.0, 38.0, 29.0, 26.0, 24.0, 18.0, 4.0, 7.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06036376953125, -0.05842304229736328, -0.05648231506347656, -0.054541587829589844, -0.052600860595703125, -0.050660133361816406, -0.04871940612792969, -0.04677867889404297, -0.04483795166015625, -0.04289722442626953, -0.04095649719238281, -0.039015769958496094, -0.037075042724609375, -0.035134315490722656, -0.03319358825683594, -0.03125286102294922, -0.0293121337890625, -0.02737140655517578, -0.025430679321289062, -0.023489952087402344, -0.021549224853515625, -0.019608497619628906, -0.017667770385742188, -0.01572704315185547, -0.01378631591796875, -0.011845588684082031, -0.009904861450195312, -0.007964134216308594, -0.006023406982421875, -0.004082679748535156, -0.0021419525146484375, -0.00020122528076171875, 0.001739501953125, 0.0036802291870117188, 0.0056209564208984375, 0.007561683654785156, 0.009502410888671875, 0.011443138122558594, 0.013383865356445312, 0.015324592590332031, 0.01726531982421875, 0.01920604705810547, 0.021146774291992188, 0.023087501525878906, 0.025028228759765625, 0.026968955993652344, 0.028909683227539062, 0.03085041046142578, 0.0327911376953125, 0.03473186492919922, 0.03667259216308594, 0.038613319396972656, 0.040554046630859375, 0.042494773864746094, 0.04443550109863281, 0.04637622833251953, 0.04831695556640625, 0.05025768280029297, 0.05219841003417969, 0.054139137268066406, 0.056079864501953125, 0.058020591735839844, 0.05996131896972656, 0.06190204620361328, 0.0638427734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 17.0, 26.0, 43.0, 70.0, 176.0, 372.0, 1073.0, 4245.0, 39961.0, 3484412.0, 641991.0, 17930.0, 2609.0, 747.0, 285.0, 144.0, 74.0, 40.0, 13.0, 13.0, 11.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3955078125, -0.38077545166015625, -0.3660430908203125, -0.35131072998046875, -0.336578369140625, -0.32184600830078125, -0.3071136474609375, -0.29238128662109375, -0.27764892578125, -0.26291656494140625, -0.2481842041015625, -0.23345184326171875, -0.218719482421875, -0.20398712158203125, -0.1892547607421875, -0.17452239990234375, -0.1597900390625, -0.14505767822265625, -0.1303253173828125, -0.11559295654296875, -0.100860595703125, -0.08612823486328125, -0.0713958740234375, -0.05666351318359375, -0.04193115234375, -0.02719879150390625, -0.0124664306640625, 0.00226593017578125, 0.016998291015625, 0.03173065185546875, 0.0464630126953125, 0.06119537353515625, 0.075927734375, 0.09066009521484375, 0.1053924560546875, 0.12012481689453125, 0.134857177734375, 0.14958953857421875, 0.1643218994140625, 0.17905426025390625, 0.19378662109375, 0.20851898193359375, 0.2232513427734375, 0.23798370361328125, 0.252716064453125, 0.26744842529296875, 0.2821807861328125, 0.29691314697265625, 0.3116455078125, 0.32637786865234375, 0.3411102294921875, 0.35584259033203125, 0.370574951171875, 0.38530731201171875, 0.4000396728515625, 0.41477203369140625, 0.42950439453125, 0.44423675537109375, 0.4589691162109375, 0.47370147705078125, 0.488433837890625, 0.5031661987304688, 0.5178985595703125, 0.5326309204101562, 0.54736328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 6.0, 8.0, 24.0, 29.0, 43.0, 97.0, 115.0, 274.0, 650.0, 1564.0, 613.0, 280.0, 151.0, 67.0, 62.0, 33.0, 11.0, 16.0, 11.0, 3.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07269287109375, -0.06994915008544922, -0.06720542907714844, -0.06446170806884766, -0.061717987060546875, -0.058974266052246094, -0.05623054504394531, -0.05348682403564453, -0.05074310302734375, -0.04799938201904297, -0.04525566101074219, -0.042511940002441406, -0.039768218994140625, -0.037024497985839844, -0.03428077697753906, -0.03153705596923828, -0.0287933349609375, -0.02604961395263672, -0.023305892944335938, -0.020562171936035156, -0.017818450927734375, -0.015074729919433594, -0.012331008911132812, -0.009587287902832031, -0.00684356689453125, -0.004099845886230469, -0.0013561248779296875, 0.0013875961303710938, 0.004131317138671875, 0.006875038146972656, 0.009618759155273438, 0.012362480163574219, 0.015106201171875, 0.01784992218017578, 0.020593643188476562, 0.023337364196777344, 0.026081085205078125, 0.028824806213378906, 0.03156852722167969, 0.03431224822998047, 0.03705596923828125, 0.03979969024658203, 0.04254341125488281, 0.045287132263183594, 0.048030853271484375, 0.050774574279785156, 0.05351829528808594, 0.05626201629638672, 0.0590057373046875, 0.06174945831298828, 0.06449317932128906, 0.06723690032958984, 0.06998062133789062, 0.0727243423461914, 0.07546806335449219, 0.07821178436279297, 0.08095550537109375, 0.08369922637939453, 0.08644294738769531, 0.0891866683959961, 0.09193038940429688, 0.09467411041259766, 0.09741783142089844, 0.10016155242919922, 0.1029052734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 39.0, 86.0, 223.0, 307.0, 225.0, 81.0, 33.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8218624591827393, -0.7957729697227478, -0.7696834206581116, -0.7435939311981201, -0.7175044417381287, -0.6914149522781372, -0.665325403213501, -0.6392359137535095, -0.6131464242935181, -0.5870569348335266, -0.5609673857688904, -0.5348778963088989, -0.5087884068489075, -0.48269888758659363, -0.4566093683242798, -0.43051987886428833, -0.4044303596019745, -0.37834084033966064, -0.3522513508796692, -0.32616183161735535, -0.3000723421573639, -0.27398282289505005, -0.2478933185338974, -0.22180381417274475, -0.1957143098115921, -0.16962480545043945, -0.1435353010892868, -0.11744578927755356, -0.09135628491640091, -0.06526677310466766, -0.039177268743515015, -0.013087764382362366, 0.013001739978790283, 0.03909124433994293, 0.06518074870109558, 0.09127026051282883, 0.11735976487398148, 0.14344927668571472, 0.16953878104686737, 0.19562828540802002, 0.22171778976917267, 0.24780729413032532, 0.27389681339263916, 0.2999863028526306, 0.32607582211494446, 0.3521653413772583, 0.37825483083724976, 0.4043443202972412, 0.43043383955955505, 0.4565233588218689, 0.48261284828186035, 0.5087023377418518, 0.534791886806488, 0.5608813762664795, 0.586970865726471, 0.6130603551864624, 0.6391499042510986, 0.6652393937110901, 0.6913289427757263, 0.7174184322357178, 0.7435079216957092, 0.7695974111557007, 0.7956869602203369, 0.8217764496803284, 0.8478659391403198]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 7.0, 3.0, 5.0, 11.0, 10.0, 11.0, 9.0, 18.0, 14.0, 30.0, 30.0, 24.0, 38.0, 29.0, 34.0, 39.0, 43.0, 40.0, 51.0, 37.0, 51.0, 52.0, 38.0, 41.0, 36.0, 40.0, 36.0, 38.0, 24.0, 30.0, 18.0, 18.0, 15.0, 14.0, 15.0, 10.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2156888246536255, -0.2089981883764267, -0.2023075520992279, -0.1956169307231903, -0.18892629444599152, -0.18223565816879272, -0.17554502189159393, -0.16885438561439514, -0.16216376423835754, -0.15547312796115875, -0.14878249168395996, -0.14209187030792236, -0.13540123403072357, -0.12871059775352478, -0.12201996147632599, -0.1153293251991272, -0.1086386889219284, -0.10194805264472961, -0.09525742381811142, -0.08856678754091263, -0.08187615871429443, -0.07518552243709564, -0.06849488615989685, -0.06180425360798836, -0.055113621056079865, -0.04842298850417137, -0.04173235595226288, -0.03504171967506409, -0.028351087123155594, -0.0216604545712471, -0.01496981829404831, -0.008279185742139816, -0.0015885531902313232, 0.005102080292999744, 0.011792713776230812, 0.018483348190784454, 0.025173980742692947, 0.03186461329460144, 0.03855524957180023, 0.045245882123708725, 0.05193651467561722, 0.05862714722752571, 0.0653177797794342, 0.072008416056633, 0.07869905233383179, 0.08538968116044998, 0.09208031743764877, 0.09877094626426697, 0.10546158254146576, 0.11215221881866455, 0.11884284764528275, 0.12553349137306213, 0.13222411274909973, 0.13891474902629852, 0.14560538530349731, 0.1522960215806961, 0.1589866578578949, 0.1656772941350937, 0.17236793041229248, 0.17905855178833008, 0.18574918806552887, 0.19243982434272766, 0.19913046061992645, 0.20582109689712524, 0.21251171827316284]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 8.0, 9.0, 11.0, 7.0, 13.0, 17.0, 29.0, 37.0, 56.0, 79.0, 111.0, 210.0, 281.0, 505.0, 882.0, 1592.0, 3475.0, 9205.0, 32732.0, 146280.0, 453460.0, 300554.0, 70508.0, 17511.0, 5617.0, 2428.0, 1189.0, 685.0, 351.0, 238.0, 137.0, 103.0, 56.0, 45.0, 45.0, 18.0, 14.0, 21.0, 4.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.20089149475097656, -0.19414138793945312, -0.1873912811279297, -0.18064117431640625, -0.1738910675048828, -0.16714096069335938, -0.16039085388183594, -0.1536407470703125, -0.14689064025878906, -0.14014053344726562, -0.1333904266357422, -0.12664031982421875, -0.11989021301269531, -0.11314010620117188, -0.10638999938964844, -0.099639892578125, -0.09288978576660156, -0.08613967895507812, -0.07938957214355469, -0.07263946533203125, -0.06588935852050781, -0.059139251708984375, -0.05238914489746094, -0.0456390380859375, -0.03888893127441406, -0.032138824462890625, -0.025388717651367188, -0.01863861083984375, -0.011888504028320312, -0.005138397216796875, 0.0016117095947265625, 0.00836181640625, 0.015111923217773438, 0.021862030029296875, 0.028612136840820312, 0.03536224365234375, 0.04211235046386719, 0.048862457275390625, 0.05561256408691406, 0.0623626708984375, 0.06911277770996094, 0.07586288452148438, 0.08261299133300781, 0.08936309814453125, 0.09611320495605469, 0.10286331176757812, 0.10961341857910156, 0.116363525390625, 0.12311363220214844, 0.12986373901367188, 0.1366138458251953, 0.14336395263671875, 0.1501140594482422, 0.15686416625976562, 0.16361427307128906, 0.1703643798828125, 0.17711448669433594, 0.18386459350585938, 0.1906147003173828, 0.19736480712890625, 0.2041149139404297, 0.21086502075195312, 0.21761512756347656, 0.224365234375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 11.0, 10.0, 8.0, 16.0, 27.0, 30.0, 46.0, 41.0, 58.0, 61.0, 84.0, 78.0, 81.0, 90.0, 77.0, 59.0, 47.0, 47.0, 37.0, 30.0, 23.0, 17.0, 5.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056732177734375, -0.05479097366333008, -0.052849769592285156, -0.050908565521240234, -0.04896736145019531, -0.04702615737915039, -0.04508495330810547, -0.04314374923706055, -0.041202545166015625, -0.0392613410949707, -0.03732013702392578, -0.03537893295288086, -0.03343772888183594, -0.031496524810791016, -0.029555320739746094, -0.027614116668701172, -0.02567291259765625, -0.023731708526611328, -0.021790504455566406, -0.019849300384521484, -0.017908096313476562, -0.01596689224243164, -0.014025688171386719, -0.012084484100341797, -0.010143280029296875, -0.008202075958251953, -0.006260871887207031, -0.004319667816162109, -0.0023784637451171875, -0.0004372596740722656, 0.0015039443969726562, 0.003445148468017578, 0.0053863525390625, 0.007327556610107422, 0.009268760681152344, 0.011209964752197266, 0.013151168823242188, 0.01509237289428711, 0.01703357696533203, 0.018974781036376953, 0.020915985107421875, 0.022857189178466797, 0.02479839324951172, 0.02673959732055664, 0.028680801391601562, 0.030622005462646484, 0.032563209533691406, 0.03450441360473633, 0.03644561767578125, 0.03838682174682617, 0.040328025817871094, 0.042269229888916016, 0.04421043395996094, 0.04615163803100586, 0.04809284210205078, 0.0500340461730957, 0.051975250244140625, 0.05391645431518555, 0.05585765838623047, 0.05779886245727539, 0.05974006652832031, 0.061681270599365234, 0.06362247467041016, 0.06556367874145508, 0.0675048828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 6.0, 15.0, 11.0, 9.0, 19.0, 33.0, 43.0, 48.0, 82.0, 135.0, 173.0, 266.0, 377.0, 708.0, 1090.0, 2069.0, 4748.0, 13639.0, 51018.0, 231135.0, 486850.0, 192391.0, 42885.0, 11865.0, 4125.0, 1955.0, 1032.0, 634.0, 381.0, 250.0, 147.0, 120.0, 78.0, 57.0, 38.0, 31.0, 20.0, 20.0, 11.0, 11.0, 10.0, 3.0, 0.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1763916015625, -0.17018890380859375, -0.1639862060546875, -0.15778350830078125, -0.151580810546875, -0.14537811279296875, -0.1391754150390625, -0.13297271728515625, -0.12677001953125, -0.12056732177734375, -0.1143646240234375, -0.10816192626953125, -0.101959228515625, -0.09575653076171875, -0.0895538330078125, -0.08335113525390625, -0.0771484375, -0.07094573974609375, -0.0647430419921875, -0.05854034423828125, -0.052337646484375, -0.04613494873046875, -0.0399322509765625, -0.03372955322265625, -0.02752685546875, -0.02132415771484375, -0.0151214599609375, -0.00891876220703125, -0.002716064453125, 0.00348663330078125, 0.0096893310546875, 0.01589202880859375, 0.0220947265625, 0.02829742431640625, 0.0345001220703125, 0.04070281982421875, 0.046905517578125, 0.05310821533203125, 0.0593109130859375, 0.06551361083984375, 0.07171630859375, 0.07791900634765625, 0.0841217041015625, 0.09032440185546875, 0.096527099609375, 0.10272979736328125, 0.1089324951171875, 0.11513519287109375, 0.121337890625, 0.12754058837890625, 0.1337432861328125, 0.13994598388671875, 0.146148681640625, 0.15235137939453125, 0.1585540771484375, 0.16475677490234375, 0.17095947265625, 0.17716217041015625, 0.1833648681640625, 0.18956756591796875, 0.195770263671875, 0.20197296142578125, 0.2081756591796875, 0.21437835693359375, 0.2205810546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 6.0, 12.0, 11.0, 18.0, 20.0, 24.0, 22.0, 28.0, 33.0, 39.0, 28.0, 39.0, 32.0, 49.0, 42.0, 60.0, 45.0, 40.0, 32.0, 43.0, 37.0, 37.0, 36.0, 38.0, 23.0, 33.0, 29.0, 21.0, 24.0, 21.0, 11.0, 15.0, 8.0, 11.0, 4.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.2097148895263672, -0.20348739624023438, -0.19725990295410156, -0.19103240966796875, -0.18480491638183594, -0.17857742309570312, -0.1723499298095703, -0.1661224365234375, -0.1598949432373047, -0.15366744995117188, -0.14743995666503906, -0.14121246337890625, -0.13498497009277344, -0.12875747680664062, -0.12252998352050781, -0.116302490234375, -0.11007499694824219, -0.10384750366210938, -0.09762001037597656, -0.09139251708984375, -0.08516502380371094, -0.07893753051757812, -0.07271003723144531, -0.0664825439453125, -0.06025505065917969, -0.054027557373046875, -0.04780006408691406, -0.04157257080078125, -0.03534507751464844, -0.029117584228515625, -0.022890090942382812, -0.01666259765625, -0.010435104370117188, -0.004207611083984375, 0.0020198822021484375, 0.00824737548828125, 0.014474868774414062, 0.020702362060546875, 0.026929855346679688, 0.0331573486328125, 0.03938484191894531, 0.045612335205078125, 0.05183982849121094, 0.05806732177734375, 0.06429481506347656, 0.07052230834960938, 0.07674980163574219, 0.082977294921875, 0.08920478820800781, 0.09543228149414062, 0.10165977478027344, 0.10788726806640625, 0.11411476135253906, 0.12034225463867188, 0.1265697479248047, 0.1327972412109375, 0.1390247344970703, 0.14525222778320312, 0.15147972106933594, 0.15770721435546875, 0.16393470764160156, 0.17016220092773438, 0.1763896942138672, 0.1826171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 6.0, 11.0, 16.0, 24.0, 31.0, 48.0, 76.0, 138.0, 219.0, 387.0, 949.0, 2079.0, 6875.0, 31005.0, 280290.0, 630033.0, 77040.0, 13174.0, 3555.0, 1271.0, 561.0, 320.0, 152.0, 93.0, 59.0, 41.0, 21.0, 29.0, 16.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17236328125, -0.16747093200683594, -0.16257858276367188, -0.1576862335205078, -0.15279388427734375, -0.1479015350341797, -0.14300918579101562, -0.13811683654785156, -0.1332244873046875, -0.12833213806152344, -0.12343978881835938, -0.11854743957519531, -0.11365509033203125, -0.10876274108886719, -0.10387039184570312, -0.09897804260253906, -0.094085693359375, -0.08919334411621094, -0.08430099487304688, -0.07940864562988281, -0.07451629638671875, -0.06962394714355469, -0.06473159790039062, -0.05983924865722656, -0.0549468994140625, -0.05005455017089844, -0.045162200927734375, -0.04026985168457031, -0.03537750244140625, -0.030485153198242188, -0.025592803955078125, -0.020700454711914062, -0.01580810546875, -0.010915756225585938, -0.006023406982421875, -0.0011310577392578125, 0.00376129150390625, 0.008653640747070312, 0.013545989990234375, 0.018438339233398438, 0.0233306884765625, 0.028223037719726562, 0.033115386962890625, 0.03800773620605469, 0.04290008544921875, 0.04779243469238281, 0.052684783935546875, 0.05757713317871094, 0.062469482421875, 0.06736183166503906, 0.07225418090820312, 0.07714653015136719, 0.08203887939453125, 0.08693122863769531, 0.09182357788085938, 0.09671592712402344, 0.1016082763671875, 0.10650062561035156, 0.11139297485351562, 0.11628532409667969, 0.12117767333984375, 0.1260700225830078, 0.13096237182617188, 0.13585472106933594, 0.1407470703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 6.0, 9.0, 9.0, 14.0, 23.0, 49.0, 56.0, 95.0, 124.0, 131.0, 133.0, 115.0, 72.0, 53.0, 36.0, 16.0, 11.0, 7.0, 3.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6464462280273438e-05, -2.556759864091873e-05, -2.4670735001564026e-05, -2.377387136220932e-05, -2.2877007722854614e-05, -2.198014408349991e-05, -2.1083280444145203e-05, -2.0186416804790497e-05, -1.928955316543579e-05, -1.8392689526081085e-05, -1.749582588672638e-05, -1.6598962247371674e-05, -1.5702098608016968e-05, -1.4805234968662262e-05, -1.3908371329307556e-05, -1.301150768995285e-05, -1.2114644050598145e-05, -1.1217780411243439e-05, -1.0320916771888733e-05, -9.424053132534027e-06, -8.527189493179321e-06, -7.630325853824615e-06, -6.73346221446991e-06, -5.836598575115204e-06, -4.939734935760498e-06, -4.042871296405792e-06, -3.1460076570510864e-06, -2.2491440176963806e-06, -1.3522803783416748e-06, -4.55416738986969e-07, 4.414469003677368e-07, 1.3383105397224426e-06, 2.2351741790771484e-06, 3.1320378184318542e-06, 4.02890145778656e-06, 4.925765097141266e-06, 5.822628736495972e-06, 6.7194923758506775e-06, 7.616356015205383e-06, 8.513219654560089e-06, 9.410083293914795e-06, 1.03069469332695e-05, 1.1203810572624207e-05, 1.2100674211978912e-05, 1.2997537851333618e-05, 1.3894401490688324e-05, 1.479126513004303e-05, 1.5688128769397736e-05, 1.658499240875244e-05, 1.7481856048107147e-05, 1.8378719687461853e-05, 1.927558332681656e-05, 2.0172446966171265e-05, 2.106931060552597e-05, 2.1966174244880676e-05, 2.2863037884235382e-05, 2.3759901523590088e-05, 2.4656765162944794e-05, 2.55536288022995e-05, 2.6450492441654205e-05, 2.734735608100891e-05, 2.8244219720363617e-05, 2.9141083359718323e-05, 3.003794699907303e-05, 3.0934810638427734e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 18.0, 33.0, 46.0, 104.0, 205.0, 529.0, 1915.0, 12139.0, 343530.0, 666972.0, 19293.0, 2564.0, 688.0, 254.0, 108.0, 57.0, 28.0, 30.0, 11.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4248046875, -0.414947509765625, -0.40509033203125, -0.395233154296875, -0.3853759765625, -0.375518798828125, -0.36566162109375, -0.355804443359375, -0.345947265625, -0.336090087890625, -0.32623291015625, -0.316375732421875, -0.3065185546875, -0.296661376953125, -0.28680419921875, -0.276947021484375, -0.26708984375, -0.257232666015625, -0.24737548828125, -0.237518310546875, -0.2276611328125, -0.217803955078125, -0.20794677734375, -0.198089599609375, -0.188232421875, -0.178375244140625, -0.16851806640625, -0.158660888671875, -0.1488037109375, -0.138946533203125, -0.12908935546875, -0.119232177734375, -0.109375, -0.099517822265625, -0.08966064453125, -0.079803466796875, -0.0699462890625, -0.060089111328125, -0.05023193359375, -0.040374755859375, -0.030517578125, -0.020660400390625, -0.01080322265625, -0.000946044921875, 0.0089111328125, 0.018768310546875, 0.02862548828125, 0.038482666015625, 0.04833984375, 0.058197021484375, 0.06805419921875, 0.077911376953125, 0.0877685546875, 0.097625732421875, 0.10748291015625, 0.117340087890625, 0.127197265625, 0.137054443359375, 0.14691162109375, 0.156768798828125, 0.1666259765625, 0.176483154296875, 0.18634033203125, 0.196197509765625, 0.2060546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 13.0, 14.0, 20.0, 42.0, 34.0, 63.0, 110.0, 102.0, 131.0, 105.0, 107.0, 72.0, 45.0, 32.0, 25.0, 27.0, 13.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16576671600341797, -0.16124534606933594, -0.1567239761352539, -0.15220260620117188, -0.14768123626708984, -0.1431598663330078, -0.13863849639892578, -0.13411712646484375, -0.12959575653076172, -0.1250743865966797, -0.12055301666259766, -0.11603164672851562, -0.1115102767944336, -0.10698890686035156, -0.10246753692626953, -0.0979461669921875, -0.09342479705810547, -0.08890342712402344, -0.0843820571899414, -0.07986068725585938, -0.07533931732177734, -0.07081794738769531, -0.06629657745361328, -0.06177520751953125, -0.05725383758544922, -0.05273246765136719, -0.048211097717285156, -0.043689727783203125, -0.039168357849121094, -0.03464698791503906, -0.03012561798095703, -0.025604248046875, -0.02108287811279297, -0.016561508178710938, -0.012040138244628906, -0.007518768310546875, -0.0029973983764648438, 0.0015239715576171875, 0.006045341491699219, 0.01056671142578125, 0.015088081359863281, 0.019609451293945312, 0.024130821228027344, 0.028652191162109375, 0.033173561096191406, 0.03769493103027344, 0.04221630096435547, 0.0467376708984375, 0.05125904083251953, 0.05578041076660156, 0.060301780700683594, 0.06482315063476562, 0.06934452056884766, 0.07386589050292969, 0.07838726043701172, 0.08290863037109375, 0.08743000030517578, 0.09195137023925781, 0.09647274017333984, 0.10099411010742188, 0.1055154800415039, 0.11003684997558594, 0.11455821990966797, 0.11907958984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 25.0, 56.0, 136.0, 282.0, 263.0, 137.0, 64.0, 23.0, 9.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.8246986865997314, -3.739745616912842, -3.654792308807373, -3.5698392391204834, -3.4848861694335938, -3.399932861328125, -3.3149797916412354, -3.2300267219543457, -3.145073413848877, -3.0601203441619873, -2.9751670360565186, -2.890213966369629, -2.8052608966827393, -2.7203078269958496, -2.635354518890381, -2.550401449203491, -2.4654483795166016, -2.380495309829712, -2.295542001724243, -2.2105889320373535, -2.125635862350464, -2.040682792663574, -1.9557294845581055, -1.8707764148712158, -1.7858232259750366, -1.7008700370788574, -1.6159169673919678, -1.5309637784957886, -1.4460105895996094, -1.3610575199127197, -1.2761043310165405, -1.1911511421203613, -1.1061981916427612, -1.021245002746582, -0.9362919330596924, -0.8513387441635132, -0.7663856148719788, -0.6814324855804443, -0.5964792966842651, -0.5115261673927307, -0.4265730381011963, -0.34161990880966187, -0.25666674971580505, -0.17171359062194824, -0.08676046133041382, -0.0018073320388793945, 0.0831458568572998, 0.16809898614883423, 0.25305211544036865, 0.3380052447319031, 0.4229584038257599, 0.5079115629196167, 0.5928646922111511, 0.6778178215026855, 0.7627710103988647, 0.8477241396903992, 0.9326772689819336, 1.0176304578781128, 1.1025835275650024, 1.1875367164611816, 1.2724897861480713, 1.3574429750442505, 1.4423961639404297, 1.5273492336273193, 1.6123024225234985]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 5.0, 9.0, 10.0, 14.0, 21.0, 27.0, 18.0, 29.0, 39.0, 27.0, 40.0, 44.0, 45.0, 43.0, 62.0, 55.0, 45.0, 53.0, 54.0, 45.0, 43.0, 49.0, 36.0, 23.0, 30.0, 19.0, 22.0, 14.0, 14.0, 12.0, 13.0, 6.0, 10.0, 1.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.460639238357544, -1.4199659824371338, -1.3792927265167236, -1.3386194705963135, -1.2979462146759033, -1.2572729587554932, -1.216599702835083, -1.1759264469146729, -1.1352531909942627, -1.0945799350738525, -1.0539066791534424, -1.0132334232330322, -0.9725601673126221, -0.9318869113922119, -0.8912137150764465, -0.8505404591560364, -0.809867262840271, -0.7691940069198608, -0.7285207509994507, -0.6878474950790405, -0.6471742391586304, -0.6065009832382202, -0.5658277869224548, -0.5251545310020447, -0.4844812750816345, -0.44380801916122437, -0.4031347632408142, -0.36246153712272644, -0.3217882812023163, -0.28111502528190613, -0.24044178426265717, -0.1997685432434082, -0.15909528732299805, -0.11842203885316849, -0.07774879038333893, -0.03707554191350937, 0.0035977065563201904, 0.04427096247673035, 0.08494420349597931, 0.12561744451522827, 0.16629070043563843, 0.20696395635604858, 0.24763719737529755, 0.2883104383945465, 0.32898369431495667, 0.3696569502353668, 0.4103301763534546, 0.45100343227386475, 0.4916766881942749, 0.5323499441146851, 0.5730232000350952, 0.6136964559555054, 0.6543697118759155, 0.6950429677963257, 0.7357161641120911, 0.7763894200325012, 0.8170626759529114, 0.8577359318733215, 0.8984091877937317, 0.9390824437141418, 0.9797556400299072, 1.0204288959503174, 1.0611021518707275, 1.1017754077911377, 1.1424486637115479]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 10.0, 11.0, 16.0, 28.0, 41.0, 86.0, 143.0, 322.0, 810.0, 2101.0, 8620.0, 80361.0, 3741173.0, 337139.0, 17930.0, 3580.0, 1035.0, 445.0, 216.0, 90.0, 53.0, 33.0, 16.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.58392333984375, -0.5692138671875, -0.55450439453125, -0.539794921875, -0.52508544921875, -0.5103759765625, -0.49566650390625, -0.48095703125, -0.46624755859375, -0.4515380859375, -0.43682861328125, -0.422119140625, -0.40740966796875, -0.3927001953125, -0.37799072265625, -0.36328125, -0.34857177734375, -0.3338623046875, -0.31915283203125, -0.304443359375, -0.28973388671875, -0.2750244140625, -0.26031494140625, -0.24560546875, -0.23089599609375, -0.2161865234375, -0.20147705078125, -0.186767578125, -0.17205810546875, -0.1573486328125, -0.14263916015625, -0.1279296875, -0.11322021484375, -0.0985107421875, -0.08380126953125, -0.069091796875, -0.05438232421875, -0.0396728515625, -0.02496337890625, -0.01025390625, 0.00445556640625, 0.0191650390625, 0.03387451171875, 0.048583984375, 0.06329345703125, 0.0780029296875, 0.09271240234375, 0.107421875, 0.12213134765625, 0.1368408203125, 0.15155029296875, 0.166259765625, 0.18096923828125, 0.1956787109375, 0.21038818359375, 0.22509765625, 0.23980712890625, 0.2545166015625, 0.26922607421875, 0.283935546875, 0.29864501953125, 0.3133544921875, 0.32806396484375, 0.3427734375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 10.0, 8.0, 20.0, 22.0, 32.0, 21.0, 35.0, 49.0, 56.0, 76.0, 77.0, 78.0, 83.0, 88.0, 72.0, 71.0, 46.0, 43.0, 31.0, 24.0, 9.0, 13.0, 6.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06488037109375, -0.06290817260742188, -0.06093597412109375, -0.058963775634765625, -0.0569915771484375, -0.055019378662109375, -0.05304718017578125, -0.051074981689453125, -0.049102783203125, -0.047130584716796875, -0.04515838623046875, -0.043186187744140625, -0.0412139892578125, -0.039241790771484375, -0.03726959228515625, -0.035297393798828125, -0.0333251953125, -0.031352996826171875, -0.02938079833984375, -0.027408599853515625, -0.0254364013671875, -0.023464202880859375, -0.02149200439453125, -0.019519805908203125, -0.017547607421875, -0.015575408935546875, -0.01360321044921875, -0.011631011962890625, -0.0096588134765625, -0.007686614990234375, -0.00571441650390625, -0.003742218017578125, -0.00177001953125, 0.000202178955078125, 0.00217437744140625, 0.004146575927734375, 0.0061187744140625, 0.008090972900390625, 0.01006317138671875, 0.012035369873046875, 0.014007568359375, 0.015979766845703125, 0.01795196533203125, 0.019924163818359375, 0.0218963623046875, 0.023868560791015625, 0.02584075927734375, 0.027812957763671875, 0.02978515625, 0.031757354736328125, 0.03372955322265625, 0.035701751708984375, 0.0376739501953125, 0.039646148681640625, 0.04161834716796875, 0.043590545654296875, 0.045562744140625, 0.047534942626953125, 0.04950714111328125, 0.051479339599609375, 0.0534515380859375, 0.055423736572265625, 0.05739593505859375, 0.059368133544921875, 0.06134033203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 3.0, 3.0, 2.0, 6.0, 6.0, 4.0, 13.0, 19.0, 28.0, 30.0, 36.0, 73.0, 148.0, 278.0, 690.0, 1941.0, 6553.0, 38265.0, 879182.0, 3172580.0, 80562.0, 9921.0, 2405.0, 798.0, 327.0, 159.0, 87.0, 56.0, 29.0, 20.0, 11.0, 16.0, 11.0, 1.0, 6.0, 5.0, 9.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298583984375, -0.28717041015625, -0.2757568359375, -0.26434326171875, -0.2529296875, -0.24151611328125, -0.2301025390625, -0.21868896484375, -0.207275390625, -0.19586181640625, -0.1844482421875, -0.17303466796875, -0.16162109375, -0.15020751953125, -0.1387939453125, -0.12738037109375, -0.115966796875, -0.10455322265625, -0.0931396484375, -0.08172607421875, -0.0703125, -0.05889892578125, -0.0474853515625, -0.03607177734375, -0.024658203125, -0.01324462890625, -0.0018310546875, 0.00958251953125, 0.02099609375, 0.03240966796875, 0.0438232421875, 0.05523681640625, 0.066650390625, 0.07806396484375, 0.0894775390625, 0.10089111328125, 0.1123046875, 0.12371826171875, 0.1351318359375, 0.14654541015625, 0.157958984375, 0.16937255859375, 0.1807861328125, 0.19219970703125, 0.20361328125, 0.21502685546875, 0.2264404296875, 0.23785400390625, 0.249267578125, 0.26068115234375, 0.2720947265625, 0.28350830078125, 0.294921875, 0.30633544921875, 0.3177490234375, 0.32916259765625, 0.340576171875, 0.35198974609375, 0.3634033203125, 0.37481689453125, 0.38623046875, 0.39764404296875, 0.4090576171875, 0.42047119140625, 0.431884765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 5.0, 12.0, 11.0, 8.0, 12.0, 20.0, 33.0, 48.0, 73.0, 106.0, 143.0, 213.0, 410.0, 629.0, 968.0, 535.0, 308.0, 170.0, 119.0, 65.0, 48.0, 30.0, 34.0, 14.0, 11.0, 8.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09844589233398438, -0.09557342529296875, -0.09270095825195312, -0.0898284912109375, -0.08695602416992188, -0.08408355712890625, -0.08121109008789062, -0.078338623046875, -0.07546615600585938, -0.07259368896484375, -0.06972122192382812, -0.0668487548828125, -0.06397628784179688, -0.06110382080078125, -0.058231353759765625, -0.05535888671875, -0.052486419677734375, -0.04961395263671875, -0.046741485595703125, -0.0438690185546875, -0.040996551513671875, -0.03812408447265625, -0.035251617431640625, -0.032379150390625, -0.029506683349609375, -0.02663421630859375, -0.023761749267578125, -0.0208892822265625, -0.018016815185546875, -0.01514434814453125, -0.012271881103515625, -0.0093994140625, -0.006526947021484375, -0.00365447998046875, -0.000782012939453125, 0.0020904541015625, 0.004962921142578125, 0.00783538818359375, 0.010707855224609375, 0.013580322265625, 0.016452789306640625, 0.01932525634765625, 0.022197723388671875, 0.0250701904296875, 0.027942657470703125, 0.03081512451171875, 0.033687591552734375, 0.03656005859375, 0.039432525634765625, 0.04230499267578125, 0.045177459716796875, 0.0480499267578125, 0.050922393798828125, 0.05379486083984375, 0.056667327880859375, 0.059539794921875, 0.062412261962890625, 0.06528472900390625, 0.06815719604492188, 0.0710296630859375, 0.07390213012695312, 0.07677459716796875, 0.07964706420898438, 0.08251953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 17.0, 43.0, 132.0, 284.0, 296.0, 156.0, 56.0, 12.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0190787315368652, -1.9753565788269043, -1.931634545326233, -1.887912392616272, -1.8441903591156006, -1.8004682064056396, -1.7567460536956787, -1.7130240201950073, -1.669301986694336, -1.625579833984375, -1.5818578004837036, -1.5381356477737427, -1.4944136142730713, -1.4506914615631104, -1.4069693088531494, -1.363247275352478, -1.319525122642517, -1.2758029699325562, -1.2320809364318848, -1.1883587837219238, -1.1446367502212524, -1.1009145975112915, -1.0571925640106201, -1.0134704113006592, -0.969748318195343, -0.9260262250900269, -0.8823041319847107, -0.8385820388793945, -0.7948598861694336, -0.7511378526687622, -0.7074156999588013, -0.6636936068534851, -0.6199716329574585, -0.5762495398521423, -0.5325274467468262, -0.4888053238391876, -0.44508323073387146, -0.4013611376285553, -0.35763901472091675, -0.3139169216156006, -0.2701948285102844, -0.22647273540496826, -0.1827506273984909, -0.13902851939201355, -0.09530642628669739, -0.051584333181381226, -0.007862210273742676, 0.035859882831573486, 0.07958197593688965, 0.12330407649278641, 0.16702617704868317, 0.21074828505516052, 0.2544703781604767, 0.29819247126579285, 0.3419145941734314, 0.38563668727874756, 0.4293587803840637, 0.4730808734893799, 0.516802966594696, 0.5605250597000122, 0.6042472124099731, 0.6479692459106445, 0.6916913986206055, 0.7354134917259216, 0.7791355848312378]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 14.0, 14.0, 16.0, 17.0, 22.0, 29.0, 42.0, 29.0, 43.0, 37.0, 40.0, 51.0, 65.0, 65.0, 63.0, 52.0, 53.0, 58.0, 45.0, 54.0, 18.0, 27.0, 17.0, 30.0, 18.0, 9.0, 17.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3626059889793396, -0.3488750755786896, -0.33514416217803955, -0.3214132487773895, -0.3076823353767395, -0.2939514219760895, -0.28022050857543945, -0.26648956537246704, -0.2527586817741394, -0.23902776837348938, -0.22529685497283936, -0.21156594157218933, -0.1978350281715393, -0.18410411477088928, -0.17037318646907806, -0.15664227306842804, -0.14291134476661682, -0.1291804313659668, -0.11544951796531677, -0.10171859711408615, -0.08798768371343613, -0.0742567703127861, -0.06052584946155548, -0.04679493606090546, -0.03306402266025543, -0.01933310739696026, -0.005602192133665085, 0.008128724992275238, 0.021859638392925262, 0.03559055179357529, 0.04932147264480591, 0.06305238604545593, 0.07678329944610596, 0.09051421284675598, 0.104245126247406, 0.11797604709863663, 0.13170695304870605, 0.14543786644935608, 0.1591687947511673, 0.17289970815181732, 0.18663062155246735, 0.20036153495311737, 0.2140924483537674, 0.2278233766555786, 0.24155429005622864, 0.25528520345687866, 0.2690161168575287, 0.2827470302581787, 0.29647794365882874, 0.31020885705947876, 0.3239397704601288, 0.3376706838607788, 0.35140159726142883, 0.36513251066207886, 0.37886345386505127, 0.3925943374633789, 0.4063252806663513, 0.42005619406700134, 0.43378710746765137, 0.4475180208683014, 0.4612489342689514, 0.47497984766960144, 0.48871076107025146, 0.5024417042732239, 0.5161725878715515]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 14.0, 12.0, 15.0, 20.0, 22.0, 32.0, 45.0, 87.0, 145.0, 226.0, 391.0, 665.0, 1200.0, 2571.0, 6826.0, 24448.0, 120433.0, 474428.0, 326749.0, 66676.0, 14814.0, 4581.0, 1851.0, 896.0, 505.0, 302.0, 183.0, 140.0, 92.0, 56.0, 36.0, 27.0, 19.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.245361328125, -0.23740005493164062, -0.22943878173828125, -0.22147750854492188, -0.2135162353515625, -0.20555496215820312, -0.19759368896484375, -0.18963241577148438, -0.181671142578125, -0.17370986938476562, -0.16574859619140625, -0.15778732299804688, -0.1498260498046875, -0.14186477661132812, -0.13390350341796875, -0.12594223022460938, -0.11798095703125, -0.11001968383789062, -0.10205841064453125, -0.09409713745117188, -0.0861358642578125, -0.07817459106445312, -0.07021331787109375, -0.062252044677734375, -0.054290771484375, -0.046329498291015625, -0.03836822509765625, -0.030406951904296875, -0.0224456787109375, -0.014484405517578125, -0.00652313232421875, 0.001438140869140625, 0.0093994140625, 0.017360687255859375, 0.02532196044921875, 0.033283233642578125, 0.0412445068359375, 0.049205780029296875, 0.05716705322265625, 0.06512832641601562, 0.073089599609375, 0.08105087280273438, 0.08901214599609375, 0.09697341918945312, 0.1049346923828125, 0.11289596557617188, 0.12085723876953125, 0.12881851196289062, 0.13677978515625, 0.14474105834960938, 0.15270233154296875, 0.16066360473632812, 0.1686248779296875, 0.17658615112304688, 0.18454742431640625, 0.19250869750976562, 0.200469970703125, 0.20843124389648438, 0.21639251708984375, 0.22435379028320312, 0.2323150634765625, 0.24027633666992188, 0.24823760986328125, 0.2561988830566406, 0.26416015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 10.0, 17.0, 15.0, 26.0, 29.0, 30.0, 48.0, 64.0, 67.0, 76.0, 78.0, 88.0, 95.0, 75.0, 61.0, 45.0, 36.0, 39.0, 27.0, 18.0, 12.0, 12.0, 7.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0631103515625, -0.061145782470703125, -0.05918121337890625, -0.057216644287109375, -0.0552520751953125, -0.053287506103515625, -0.05132293701171875, -0.049358367919921875, -0.047393798828125, -0.045429229736328125, -0.04346466064453125, -0.041500091552734375, -0.0395355224609375, -0.037570953369140625, -0.03560638427734375, -0.033641815185546875, -0.03167724609375, -0.029712677001953125, -0.02774810791015625, -0.025783538818359375, -0.0238189697265625, -0.021854400634765625, -0.01988983154296875, -0.017925262451171875, -0.015960693359375, -0.013996124267578125, -0.01203155517578125, -0.010066986083984375, -0.0081024169921875, -0.006137847900390625, -0.00417327880859375, -0.002208709716796875, -0.000244140625, 0.001720428466796875, 0.00368499755859375, 0.005649566650390625, 0.0076141357421875, 0.009578704833984375, 0.01154327392578125, 0.013507843017578125, 0.015472412109375, 0.017436981201171875, 0.01940155029296875, 0.021366119384765625, 0.0233306884765625, 0.025295257568359375, 0.02725982666015625, 0.029224395751953125, 0.03118896484375, 0.033153533935546875, 0.03511810302734375, 0.037082672119140625, 0.0390472412109375, 0.041011810302734375, 0.04297637939453125, 0.044940948486328125, 0.046905517578125, 0.048870086669921875, 0.05083465576171875, 0.052799224853515625, 0.0547637939453125, 0.056728363037109375, 0.05869293212890625, 0.060657501220703125, 0.0626220703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 9.0, 10.0, 17.0, 25.0, 38.0, 56.0, 83.0, 132.0, 190.0, 319.0, 582.0, 1210.0, 2835.0, 8584.0, 32686.0, 160327.0, 491354.0, 271913.0, 56771.0, 13506.0, 4393.0, 1657.0, 763.0, 425.0, 239.0, 155.0, 74.0, 53.0, 52.0, 27.0, 19.0, 13.0, 13.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191650390625, -0.184967041015625, -0.17828369140625, -0.171600341796875, -0.1649169921875, -0.158233642578125, -0.15155029296875, -0.144866943359375, -0.13818359375, -0.131500244140625, -0.12481689453125, -0.118133544921875, -0.1114501953125, -0.104766845703125, -0.09808349609375, -0.091400146484375, -0.084716796875, -0.078033447265625, -0.07135009765625, -0.064666748046875, -0.0579833984375, -0.051300048828125, -0.04461669921875, -0.037933349609375, -0.03125, -0.024566650390625, -0.01788330078125, -0.011199951171875, -0.0045166015625, 0.002166748046875, 0.00885009765625, 0.015533447265625, 0.022216796875, 0.028900146484375, 0.03558349609375, 0.042266845703125, 0.0489501953125, 0.055633544921875, 0.06231689453125, 0.069000244140625, 0.07568359375, 0.082366943359375, 0.08905029296875, 0.095733642578125, 0.1024169921875, 0.109100341796875, 0.11578369140625, 0.122467041015625, 0.129150390625, 0.135833740234375, 0.14251708984375, 0.149200439453125, 0.1558837890625, 0.162567138671875, 0.16925048828125, 0.175933837890625, 0.1826171875, 0.189300537109375, 0.19598388671875, 0.202667236328125, 0.2093505859375, 0.216033935546875, 0.22271728515625, 0.229400634765625, 0.236083984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 8.0, 6.0, 13.0, 18.0, 12.0, 24.0, 21.0, 38.0, 36.0, 41.0, 34.0, 42.0, 52.0, 56.0, 67.0, 65.0, 52.0, 66.0, 39.0, 41.0, 51.0, 46.0, 29.0, 32.0, 27.0, 14.0, 13.0, 13.0, 11.0, 6.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.1993255615234375, -0.192108154296875, -0.1848907470703125, -0.17767333984375, -0.1704559326171875, -0.163238525390625, -0.1560211181640625, -0.1488037109375, -0.1415863037109375, -0.134368896484375, -0.1271514892578125, -0.11993408203125, -0.1127166748046875, -0.105499267578125, -0.0982818603515625, -0.091064453125, -0.0838470458984375, -0.076629638671875, -0.0694122314453125, -0.06219482421875, -0.0549774169921875, -0.047760009765625, -0.0405426025390625, -0.0333251953125, -0.0261077880859375, -0.018890380859375, -0.0116729736328125, -0.00445556640625, 0.0027618408203125, 0.009979248046875, 0.0171966552734375, 0.0244140625, 0.0316314697265625, 0.038848876953125, 0.0460662841796875, 0.05328369140625, 0.0605010986328125, 0.067718505859375, 0.0749359130859375, 0.0821533203125, 0.0893707275390625, 0.096588134765625, 0.1038055419921875, 0.11102294921875, 0.1182403564453125, 0.125457763671875, 0.1326751708984375, 0.139892578125, 0.1471099853515625, 0.154327392578125, 0.1615447998046875, 0.16876220703125, 0.1759796142578125, 0.183197021484375, 0.1904144287109375, 0.1976318359375, 0.2048492431640625, 0.212066650390625, 0.2192840576171875, 0.22650146484375, 0.2337188720703125, 0.240936279296875, 0.2481536865234375, 0.25537109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 0.0, 4.0, 6.0, 7.0, 4.0, 20.0, 8.0, 17.0, 29.0, 31.0, 43.0, 68.0, 96.0, 130.0, 247.0, 355.0, 583.0, 1135.0, 2348.0, 5808.0, 16995.0, 62612.0, 299064.0, 480243.0, 132158.0, 29986.0, 9328.0, 3565.0, 1607.0, 798.0, 407.0, 275.0, 167.0, 135.0, 80.0, 51.0, 36.0, 37.0, 16.0, 20.0, 8.0, 11.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0853271484375, -0.08219432830810547, -0.07906150817871094, -0.0759286880493164, -0.07279586791992188, -0.06966304779052734, -0.06653022766113281, -0.06339740753173828, -0.06026458740234375, -0.05713176727294922, -0.05399894714355469, -0.050866127014160156, -0.047733306884765625, -0.044600486755371094, -0.04146766662597656, -0.03833484649658203, -0.0352020263671875, -0.03206920623779297, -0.028936386108398438, -0.025803565979003906, -0.022670745849609375, -0.019537925720214844, -0.016405105590820312, -0.013272285461425781, -0.01013946533203125, -0.007006645202636719, -0.0038738250732421875, -0.0007410049438476562, 0.002391815185546875, 0.005524635314941406, 0.008657455444335938, 0.011790275573730469, 0.014923095703125, 0.01805591583251953, 0.021188735961914062, 0.024321556091308594, 0.027454376220703125, 0.030587196350097656, 0.03372001647949219, 0.03685283660888672, 0.03998565673828125, 0.04311847686767578, 0.04625129699707031, 0.049384117126464844, 0.052516937255859375, 0.055649757385253906, 0.05878257751464844, 0.06191539764404297, 0.0650482177734375, 0.06818103790283203, 0.07131385803222656, 0.0744466781616211, 0.07757949829101562, 0.08071231842041016, 0.08384513854980469, 0.08697795867919922, 0.09011077880859375, 0.09324359893798828, 0.09637641906738281, 0.09950923919677734, 0.10264205932617188, 0.1057748794555664, 0.10890769958496094, 0.11204051971435547, 0.11517333984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 20.0, 20.0, 38.0, 60.0, 71.0, 124.0, 87.0, 126.0, 111.0, 108.0, 64.0, 49.0, 36.0, 27.0, 20.0, 12.0, 7.0, 3.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6106834411621094e-05, -2.537202090024948e-05, -2.463720738887787e-05, -2.3902393877506256e-05, -2.3167580366134644e-05, -2.243276685476303e-05, -2.169795334339142e-05, -2.0963139832019806e-05, -2.0228326320648193e-05, -1.949351280927658e-05, -1.8758699297904968e-05, -1.8023885786533356e-05, -1.7289072275161743e-05, -1.655425876379013e-05, -1.5819445252418518e-05, -1.5084631741046906e-05, -1.4349818229675293e-05, -1.361500471830368e-05, -1.2880191206932068e-05, -1.2145377695560455e-05, -1.1410564184188843e-05, -1.067575067281723e-05, -9.940937161445618e-06, -9.206123650074005e-06, -8.471310138702393e-06, -7.73649662733078e-06, -7.0016831159591675e-06, -6.266869604587555e-06, -5.532056093215942e-06, -4.79724258184433e-06, -4.062429070472717e-06, -3.3276155591011047e-06, -2.592802047729492e-06, -1.8579885363578796e-06, -1.123175024986267e-06, -3.8836151361465454e-07, 3.46451997756958e-07, 1.0812655091285706e-06, 1.816079020500183e-06, 2.5508925318717957e-06, 3.285706043243408e-06, 4.020519554615021e-06, 4.755333065986633e-06, 5.490146577358246e-06, 6.224960088729858e-06, 6.959773600101471e-06, 7.694587111473083e-06, 8.429400622844696e-06, 9.164214134216309e-06, 9.899027645587921e-06, 1.0633841156959534e-05, 1.1368654668331146e-05, 1.2103468179702759e-05, 1.2838281691074371e-05, 1.3573095202445984e-05, 1.4307908713817596e-05, 1.5042722225189209e-05, 1.577753573656082e-05, 1.6512349247932434e-05, 1.7247162759304047e-05, 1.798197627067566e-05, 1.8716789782047272e-05, 1.9451603293418884e-05, 2.0186416804790497e-05, 2.092123031616211e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 13.0, 14.0, 12.0, 16.0, 34.0, 64.0, 86.0, 168.0, 361.0, 650.0, 1429.0, 4018.0, 14319.0, 78103.0, 470668.0, 399863.0, 60835.0, 11802.0, 3495.0, 1309.0, 598.0, 298.0, 163.0, 91.0, 37.0, 24.0, 24.0, 21.0, 11.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10516357421875, -0.10152912139892578, -0.09789466857910156, -0.09426021575927734, -0.09062576293945312, -0.0869913101196289, -0.08335685729980469, -0.07972240447998047, -0.07608795166015625, -0.07245349884033203, -0.06881904602050781, -0.0651845932006836, -0.061550140380859375, -0.057915687561035156, -0.05428123474121094, -0.05064678192138672, -0.0470123291015625, -0.04337787628173828, -0.03974342346191406, -0.036108970642089844, -0.032474517822265625, -0.028840065002441406, -0.025205612182617188, -0.02157115936279297, -0.01793670654296875, -0.014302253723144531, -0.010667800903320312, -0.007033348083496094, -0.003398895263671875, 0.00023555755615234375, 0.0038700103759765625, 0.007504463195800781, 0.011138916015625, 0.014773368835449219, 0.018407821655273438, 0.022042274475097656, 0.025676727294921875, 0.029311180114746094, 0.03294563293457031, 0.03658008575439453, 0.04021453857421875, 0.04384899139404297, 0.04748344421386719, 0.051117897033691406, 0.054752349853515625, 0.058386802673339844, 0.06202125549316406, 0.06565570831298828, 0.0692901611328125, 0.07292461395263672, 0.07655906677246094, 0.08019351959228516, 0.08382797241210938, 0.0874624252319336, 0.09109687805175781, 0.09473133087158203, 0.09836578369140625, 0.10200023651123047, 0.10563468933105469, 0.1092691421508789, 0.11290359497070312, 0.11653804779052734, 0.12017250061035156, 0.12380695343017578, 0.12744140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 6.0, 10.0, 10.0, 13.0, 15.0, 24.0, 45.0, 29.0, 68.0, 74.0, 64.0, 85.0, 80.0, 86.0, 66.0, 83.0, 61.0, 38.0, 39.0, 27.0, 21.0, 14.0, 9.0, 8.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09466552734375, -0.09191131591796875, -0.0891571044921875, -0.08640289306640625, -0.083648681640625, -0.08089447021484375, -0.0781402587890625, -0.07538604736328125, -0.0726318359375, -0.06987762451171875, -0.0671234130859375, -0.06436920166015625, -0.061614990234375, -0.05886077880859375, -0.0561065673828125, -0.05335235595703125, -0.05059814453125, -0.04784393310546875, -0.0450897216796875, -0.04233551025390625, -0.039581298828125, -0.03682708740234375, -0.0340728759765625, -0.03131866455078125, -0.028564453125, -0.02581024169921875, -0.0230560302734375, -0.02030181884765625, -0.017547607421875, -0.01479339599609375, -0.0120391845703125, -0.00928497314453125, -0.00653076171875, -0.00377655029296875, -0.0010223388671875, 0.00173187255859375, 0.004486083984375, 0.00724029541015625, 0.0099945068359375, 0.01274871826171875, 0.0155029296875, 0.01825714111328125, 0.0210113525390625, 0.02376556396484375, 0.026519775390625, 0.02927398681640625, 0.0320281982421875, 0.03478240966796875, 0.03753662109375, 0.04029083251953125, 0.0430450439453125, 0.04579925537109375, 0.048553466796875, 0.05130767822265625, 0.0540618896484375, 0.05681610107421875, 0.0595703125, 0.06232452392578125, 0.0650787353515625, 0.06783294677734375, 0.070587158203125, 0.07334136962890625, 0.0760955810546875, 0.07884979248046875, 0.08160400390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 32.0, 108.0, 306.0, 354.0, 157.0, 30.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2423827648162842, -1.13003408908844, -1.0176854133605957, -0.9053367972373962, -0.792988121509552, -0.6806394457817078, -0.5682908296585083, -0.45594215393066406, -0.3435934782028198, -0.23124481737613678, -0.11889615654945374, -0.006547510623931885, 0.10580116510391235, 0.2181498408317566, 0.33049845695495605, 0.4428471326828003, 0.5551958084106445, 0.6675444841384888, 0.779893159866333, 0.8922417759895325, 1.0045905113220215, 1.1169390678405762, 1.2292877435684204, 1.3416364192962646, 1.4539850950241089, 1.5663337707519531, 1.6786824464797974, 1.7910311222076416, 1.9033796787261963, 2.01572847366333, 2.1280770301818848, 2.2404255867004395, 2.352774143218994, 2.465122699737549, 2.5774714946746826, 2.6898200511932373, 2.802168846130371, 2.914517402648926, 3.0268659591674805, 3.1392147541046143, 3.251563549041748, 3.3639121055603027, 3.4762609004974365, 3.588609457015991, 3.700958251953125, 3.8133068084716797, 3.9256553649902344, 4.038003921508789, 4.150352478027344, 4.262701034545898, 4.375049591064453, 4.487398624420166, 4.599747180938721, 4.712095737457275, 4.82444429397583, 4.936793327331543, 5.049141883850098, 5.161490440368652, 5.273838996887207, 5.38618803024292, 5.498536586761475, 5.610885143280029, 5.723233699798584, 5.835582733154297, 5.947931289672852]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 8.0, 2.0, 3.0, 7.0, 7.0, 18.0, 8.0, 13.0, 21.0, 17.0, 22.0, 33.0, 35.0, 62.0, 56.0, 55.0, 49.0, 52.0, 56.0, 56.0, 41.0, 42.0, 52.0, 58.0, 41.0, 37.0, 31.0, 27.0, 27.0, 14.0, 13.0, 14.0, 7.0, 7.0, 4.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2890863418579102, -1.2471674680709839, -1.2052485942840576, -1.1633297204971313, -1.121410846710205, -1.0794919729232788, -1.0375730991363525, -0.9956542253494263, -0.9537353515625, -0.9118164777755737, -0.8698976039886475, -0.8279787302017212, -0.7860598564147949, -0.7441409826278687, -0.7022221088409424, -0.6603032350540161, -0.6183843612670898, -0.5764654874801636, -0.5345466136932373, -0.49262773990631104, -0.45070886611938477, -0.4087899923324585, -0.3668711185455322, -0.32495224475860596, -0.2830333709716797, -0.24111449718475342, -0.19919562339782715, -0.15727674961090088, -0.11535787582397461, -0.07343900203704834, -0.03152012825012207, 0.0103987455368042, 0.05231761932373047, 0.09423649311065674, 0.136155366897583, 0.17807424068450928, 0.21999311447143555, 0.2619119882583618, 0.3038308620452881, 0.34574973583221436, 0.3876686096191406, 0.4295874834060669, 0.47150635719299316, 0.5134252309799194, 0.5553441047668457, 0.597262978553772, 0.6391818523406982, 0.6811007261276245, 0.7230195999145508, 0.764938473701477, 0.8068573474884033, 0.8487762212753296, 0.8906950950622559, 0.9326139688491821, 0.9745328426361084, 1.0164517164230347, 1.058370590209961, 1.1002894639968872, 1.1422083377838135, 1.1841272115707397, 1.226046085357666, 1.2679649591445923, 1.3098838329315186, 1.3518027067184448, 1.393721580505371]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 1.0, 7.0, 11.0, 31.0, 46.0, 115.0, 251.0, 791.0, 3708.0, 50113.0, 4032544.0, 100048.0, 5126.0, 968.0, 277.0, 125.0, 52.0, 28.0, 15.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.69970703125, -0.6828804016113281, -0.6660537719726562, -0.6492271423339844, -0.6324005126953125, -0.6155738830566406, -0.5987472534179688, -0.5819206237792969, -0.565093994140625, -0.5482673645019531, -0.5314407348632812, -0.5146141052246094, -0.4977874755859375, -0.4809608459472656, -0.46413421630859375, -0.4473075866699219, -0.43048095703125, -0.4136543273925781, -0.39682769775390625, -0.3800010681152344, -0.3631744384765625, -0.3463478088378906, -0.32952117919921875, -0.3126945495605469, -0.295867919921875, -0.2790412902832031, -0.26221466064453125, -0.24538803100585938, -0.2285614013671875, -0.21173477172851562, -0.19490814208984375, -0.17808151245117188, -0.1612548828125, -0.14442825317382812, -0.12760162353515625, -0.11077499389648438, -0.0939483642578125, -0.07712173461914062, -0.06029510498046875, -0.043468475341796875, -0.026641845703125, -0.009815216064453125, 0.00701141357421875, 0.023838043212890625, 0.0406646728515625, 0.057491302490234375, 0.07431793212890625, 0.09114456176757812, 0.10797119140625, 0.12479782104492188, 0.14162445068359375, 0.15845108032226562, 0.1752777099609375, 0.19210433959960938, 0.20893096923828125, 0.22575759887695312, 0.242584228515625, 0.2594108581542969, 0.27623748779296875, 0.2930641174316406, 0.3098907470703125, 0.3267173767089844, 0.34354400634765625, 0.3603706359863281, 0.377197265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 7.0, 20.0, 31.0, 39.0, 32.0, 44.0, 67.0, 69.0, 72.0, 104.0, 89.0, 75.0, 84.0, 57.0, 55.0, 36.0, 29.0, 21.0, 17.0, 16.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08197021484375, -0.07968902587890625, -0.0774078369140625, -0.07512664794921875, -0.072845458984375, -0.07056427001953125, -0.0682830810546875, -0.06600189208984375, -0.063720703125, -0.06143951416015625, -0.0591583251953125, -0.05687713623046875, -0.054595947265625, -0.05231475830078125, -0.0500335693359375, -0.04775238037109375, -0.04547119140625, -0.04319000244140625, -0.0409088134765625, -0.03862762451171875, -0.036346435546875, -0.03406524658203125, -0.0317840576171875, -0.02950286865234375, -0.0272216796875, -0.02494049072265625, -0.0226593017578125, -0.02037811279296875, -0.018096923828125, -0.01581573486328125, -0.0135345458984375, -0.01125335693359375, -0.00897216796875, -0.00669097900390625, -0.0044097900390625, -0.00212860107421875, 0.000152587890625, 0.00243377685546875, 0.0047149658203125, 0.00699615478515625, 0.00927734375, 0.01155853271484375, 0.0138397216796875, 0.01612091064453125, 0.018402099609375, 0.02068328857421875, 0.0229644775390625, 0.02524566650390625, 0.02752685546875, 0.02980804443359375, 0.0320892333984375, 0.03437042236328125, 0.036651611328125, 0.03893280029296875, 0.0412139892578125, 0.04349517822265625, 0.0457763671875, 0.04805755615234375, 0.0503387451171875, 0.05261993408203125, 0.054901123046875, 0.05718231201171875, 0.0594635009765625, 0.06174468994140625, 0.06402587890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 18.0, 17.0, 34.0, 89.0, 223.0, 740.0, 4089.0, 49327.0, 3568302.0, 551828.0, 16922.0, 1939.0, 439.0, 151.0, 70.0, 27.0, 17.0, 7.0, 15.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.2562408447265625, -0.243927001953125, -0.2316131591796875, -0.21929931640625, -0.2069854736328125, -0.194671630859375, -0.1823577880859375, -0.1700439453125, -0.1577301025390625, -0.145416259765625, -0.1331024169921875, -0.12078857421875, -0.1084747314453125, -0.096160888671875, -0.0838470458984375, -0.071533203125, -0.0592193603515625, -0.046905517578125, -0.0345916748046875, -0.02227783203125, -0.0099639892578125, 0.002349853515625, 0.0146636962890625, 0.0269775390625, 0.0392913818359375, 0.051605224609375, 0.0639190673828125, 0.07623291015625, 0.0885467529296875, 0.100860595703125, 0.1131744384765625, 0.12548828125, 0.1378021240234375, 0.150115966796875, 0.1624298095703125, 0.17474365234375, 0.1870574951171875, 0.199371337890625, 0.2116851806640625, 0.2239990234375, 0.2363128662109375, 0.248626708984375, 0.2609405517578125, 0.27325439453125, 0.2855682373046875, 0.297882080078125, 0.3101959228515625, 0.322509765625, 0.3348236083984375, 0.347137451171875, 0.3594512939453125, 0.37176513671875, 0.3840789794921875, 0.396392822265625, 0.4087066650390625, 0.4210205078125, 0.4333343505859375, 0.445648193359375, 0.4579620361328125, 0.47027587890625, 0.4825897216796875, 0.494903564453125, 0.5072174072265625, 0.51953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 9.0, 18.0, 15.0, 27.0, 36.0, 74.0, 84.0, 174.0, 332.0, 615.0, 1343.0, 577.0, 297.0, 161.0, 97.0, 56.0, 42.0, 28.0, 23.0, 11.0, 10.0, 4.0, 9.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0653076171875, -0.06283378601074219, -0.060359954833984375, -0.05788612365722656, -0.05541229248046875, -0.05293846130371094, -0.050464630126953125, -0.04799079895019531, -0.0455169677734375, -0.04304313659667969, -0.040569305419921875, -0.03809547424316406, -0.03562164306640625, -0.03314781188964844, -0.030673980712890625, -0.028200149536132812, -0.025726318359375, -0.023252487182617188, -0.020778656005859375, -0.018304824829101562, -0.01583099365234375, -0.013357162475585938, -0.010883331298828125, -0.008409500122070312, -0.0059356689453125, -0.0034618377685546875, -0.000988006591796875, 0.0014858245849609375, 0.00395965576171875, 0.0064334869384765625, 0.008907318115234375, 0.011381149291992188, 0.01385498046875, 0.016328811645507812, 0.018802642822265625, 0.021276473999023438, 0.02375030517578125, 0.026224136352539062, 0.028697967529296875, 0.031171798706054688, 0.0336456298828125, 0.03611946105957031, 0.038593292236328125, 0.04106712341308594, 0.04354095458984375, 0.04601478576660156, 0.048488616943359375, 0.05096244812011719, 0.053436279296875, 0.05591011047363281, 0.058383941650390625, 0.06085777282714844, 0.06333160400390625, 0.06580543518066406, 0.06827926635742188, 0.07075309753417969, 0.0732269287109375, 0.07570075988769531, 0.07817459106445312, 0.08064842224121094, 0.08312225341796875, 0.08559608459472656, 0.08806991577148438, 0.09054374694824219, 0.093017578125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 11.0, 26.0, 101.0, 225.0, 320.0, 198.0, 81.0, 24.0, 14.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.324871301651001, -1.2955931425094604, -1.26631498336792, -1.2370368242263794, -1.2077586650848389, -1.1784805059432983, -1.1492023468017578, -1.1199240684509277, -1.0906459093093872, -1.0613677501678467, -1.0320895910263062, -1.0028114318847656, -0.9735332131385803, -0.9442550539970398, -0.9149768948554993, -0.8856987357139587, -0.856420636177063, -0.8271424770355225, -0.7978643178939819, -0.7685861587524414, -0.7393079400062561, -0.7100297808647156, -0.680751621723175, -0.6514734625816345, -0.6221952438354492, -0.5929170846939087, -0.5636389255523682, -0.5343607664108276, -0.5050825476646423, -0.4758043885231018, -0.4465262293815613, -0.41724807024002075, -0.3879699110984802, -0.3586917519569397, -0.3294135630130768, -0.30013540387153625, -0.2708572447299957, -0.241579070687294, -0.21230089664459229, -0.18302273750305176, -0.15374456346035004, -0.12446639686822891, -0.09518823027610779, -0.06591005623340607, -0.03663188964128494, -0.007353723049163818, 0.021924450993537903, 0.05120261013507843, 0.08048078417778015, 0.10975895076990128, 0.1390371173620224, 0.16831529140472412, 0.19759345054626465, 0.22687162458896637, 0.2561497986316681, 0.2854279577732086, 0.31470614671707153, 0.34398430585861206, 0.373262494802475, 0.4025406539440155, 0.43181881308555603, 0.46109700202941895, 0.4903751611709595, 0.5196533203125, 0.5489314794540405]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 6.0, 10.0, 4.0, 11.0, 16.0, 18.0, 11.0, 15.0, 27.0, 28.0, 29.0, 38.0, 45.0, 32.0, 47.0, 31.0, 42.0, 39.0, 37.0, 49.0, 42.0, 39.0, 53.0, 41.0, 42.0, 25.0, 25.0, 38.0, 20.0, 28.0, 18.0, 14.0, 17.0, 4.0, 13.0, 10.0, 8.0, 3.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24283915758132935, -0.2355090081691742, -0.22817884385585785, -0.2208486944437027, -0.21351853013038635, -0.2061883807182312, -0.19885823130607605, -0.1915280818939209, -0.18419791758060455, -0.1768677681684494, -0.16953760385513306, -0.1622074544429779, -0.15487730503082275, -0.1475471407175064, -0.14021699130535126, -0.1328868269920349, -0.12555667757987976, -0.11822652071714401, -0.11089636385440826, -0.10356621444225311, -0.09623605757951736, -0.08890590071678162, -0.08157575130462646, -0.07424559444189072, -0.06691543757915497, -0.05958528071641922, -0.05225512757897377, -0.04492497444152832, -0.03759481757879257, -0.030264660716056824, -0.022934507578611374, -0.015604354441165924, -0.008274197578430176, -0.0009440425783395767, 0.006386112421751022, 0.013716267421841621, 0.02104642242193222, 0.02837657928466797, 0.03570673242211342, 0.04303688555955887, 0.05036704242229462, 0.057697199285030365, 0.06502735614776611, 0.07235750555992126, 0.07968766242265701, 0.08701781928539276, 0.09434796869754791, 0.10167812556028366, 0.10900828242301941, 0.11633843928575516, 0.1236685961484909, 0.13099874556064606, 0.1383289098739624, 0.14565905928611755, 0.1529892086982727, 0.16031935811042786, 0.1676495224237442, 0.17497967183589935, 0.1823098361492157, 0.18963998556137085, 0.196970134973526, 0.20430029928684235, 0.2116304486989975, 0.21896061301231384, 0.226290762424469]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 14.0, 9.0, 17.0, 18.0, 18.0, 25.0, 49.0, 63.0, 94.0, 141.0, 178.0, 259.0, 403.0, 646.0, 1116.0, 2165.0, 4878.0, 13733.0, 46143.0, 166882.0, 422936.0, 273269.0, 78909.0, 22288.0, 7481.0, 3008.0, 1444.0, 828.0, 489.0, 284.0, 214.0, 147.0, 95.0, 80.0, 62.0, 39.0, 30.0, 21.0, 16.0, 16.0, 8.0, 6.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.205322265625, -0.19904518127441406, -0.19276809692382812, -0.1864910125732422, -0.18021392822265625, -0.1739368438720703, -0.16765975952148438, -0.16138267517089844, -0.1551055908203125, -0.14882850646972656, -0.14255142211914062, -0.1362743377685547, -0.12999725341796875, -0.12372016906738281, -0.11744308471679688, -0.11116600036621094, -0.104888916015625, -0.09861183166503906, -0.09233474731445312, -0.08605766296386719, -0.07978057861328125, -0.07350349426269531, -0.06722640991210938, -0.06094932556152344, -0.0546722412109375, -0.04839515686035156, -0.042118072509765625, -0.03584098815917969, -0.02956390380859375, -0.023286819458007812, -0.017009735107421875, -0.010732650756835938, -0.00445556640625, 0.0018215179443359375, 0.008098602294921875, 0.014375686645507812, 0.02065277099609375, 0.026929855346679688, 0.033206939697265625, 0.03948402404785156, 0.0457611083984375, 0.05203819274902344, 0.058315277099609375, 0.06459236145019531, 0.07086944580078125, 0.07714653015136719, 0.08342361450195312, 0.08970069885253906, 0.095977783203125, 0.10225486755371094, 0.10853195190429688, 0.11480903625488281, 0.12108612060546875, 0.1273632049560547, 0.13364028930664062, 0.13991737365722656, 0.1461944580078125, 0.15247154235839844, 0.15874862670898438, 0.1650257110595703, 0.17130279541015625, 0.1775798797607422, 0.18385696411132812, 0.19013404846191406, 0.1964111328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 11.0, 13.0, 17.0, 29.0, 33.0, 48.0, 48.0, 68.0, 72.0, 88.0, 91.0, 109.0, 76.0, 73.0, 55.0, 52.0, 30.0, 21.0, 26.0, 14.0, 10.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08685302734375, -0.08447647094726562, -0.08209991455078125, -0.07972335815429688, -0.0773468017578125, -0.07497024536132812, -0.07259368896484375, -0.07021713256835938, -0.067840576171875, -0.06546401977539062, -0.06308746337890625, -0.060710906982421875, -0.0583343505859375, -0.055957794189453125, -0.05358123779296875, -0.051204681396484375, -0.048828125, -0.046451568603515625, -0.04407501220703125, -0.041698455810546875, -0.0393218994140625, -0.036945343017578125, -0.03456878662109375, -0.032192230224609375, -0.029815673828125, -0.027439117431640625, -0.02506256103515625, -0.022686004638671875, -0.0203094482421875, -0.017932891845703125, -0.01555633544921875, -0.013179779052734375, -0.01080322265625, -0.008426666259765625, -0.00605010986328125, -0.003673553466796875, -0.0012969970703125, 0.001079559326171875, 0.00345611572265625, 0.005832672119140625, 0.008209228515625, 0.010585784912109375, 0.01296234130859375, 0.015338897705078125, 0.0177154541015625, 0.020092010498046875, 0.02246856689453125, 0.024845123291015625, 0.0272216796875, 0.029598236083984375, 0.03197479248046875, 0.034351348876953125, 0.0367279052734375, 0.039104461669921875, 0.04148101806640625, 0.043857574462890625, 0.046234130859375, 0.048610687255859375, 0.05098724365234375, 0.053363800048828125, 0.0557403564453125, 0.058116912841796875, 0.06049346923828125, 0.06287002563476562, 0.06524658203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 7.0, 8.0, 3.0, 8.0, 15.0, 19.0, 13.0, 34.0, 35.0, 60.0, 65.0, 95.0, 132.0, 179.0, 243.0, 365.0, 544.0, 862.0, 1515.0, 2773.0, 5910.0, 14933.0, 41415.0, 116927.0, 275820.0, 326346.0, 163049.0, 59433.0, 21299.0, 8098.0, 3576.0, 1835.0, 980.0, 588.0, 377.0, 278.0, 192.0, 147.0, 104.0, 76.0, 58.0, 45.0, 30.0, 16.0, 24.0, 4.0, 8.0, 8.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11431884765625, -0.1102609634399414, -0.10620307922363281, -0.10214519500732422, -0.09808731079101562, -0.09402942657470703, -0.08997154235839844, -0.08591365814208984, -0.08185577392578125, -0.07779788970947266, -0.07374000549316406, -0.06968212127685547, -0.06562423706054688, -0.06156635284423828, -0.05750846862792969, -0.053450584411621094, -0.0493927001953125, -0.045334815979003906, -0.04127693176269531, -0.03721904754638672, -0.033161163330078125, -0.02910327911376953, -0.025045394897460938, -0.020987510681152344, -0.01692962646484375, -0.012871742248535156, -0.008813858032226562, -0.004755973815917969, -0.000698089599609375, 0.0033597946166992188, 0.0074176788330078125, 0.011475563049316406, 0.015533447265625, 0.019591331481933594, 0.023649215698242188, 0.02770709991455078, 0.031764984130859375, 0.03582286834716797, 0.03988075256347656, 0.043938636779785156, 0.04799652099609375, 0.052054405212402344, 0.05611228942871094, 0.06017017364501953, 0.06422805786132812, 0.06828594207763672, 0.07234382629394531, 0.0764017105102539, 0.0804595947265625, 0.0845174789428711, 0.08857536315917969, 0.09263324737548828, 0.09669113159179688, 0.10074901580810547, 0.10480690002441406, 0.10886478424072266, 0.11292266845703125, 0.11698055267333984, 0.12103843688964844, 0.12509632110595703, 0.12915420532226562, 0.13321208953857422, 0.1372699737548828, 0.1413278579711914, 0.1453857421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 13.0, 8.0, 9.0, 13.0, 14.0, 10.0, 17.0, 15.0, 16.0, 19.0, 20.0, 35.0, 33.0, 31.0, 34.0, 36.0, 39.0, 48.0, 31.0, 45.0, 37.0, 37.0, 54.0, 43.0, 26.0, 33.0, 36.0, 32.0, 25.0, 29.0, 28.0, 25.0, 17.0, 15.0, 17.0, 12.0, 11.0, 13.0, 6.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1878662109375, -0.182525634765625, -0.17718505859375, -0.171844482421875, -0.16650390625, -0.161163330078125, -0.15582275390625, -0.150482177734375, -0.1451416015625, -0.139801025390625, -0.13446044921875, -0.129119873046875, -0.123779296875, -0.118438720703125, -0.11309814453125, -0.107757568359375, -0.1024169921875, -0.097076416015625, -0.09173583984375, -0.086395263671875, -0.0810546875, -0.075714111328125, -0.07037353515625, -0.065032958984375, -0.0596923828125, -0.054351806640625, -0.04901123046875, -0.043670654296875, -0.038330078125, -0.032989501953125, -0.02764892578125, -0.022308349609375, -0.0169677734375, -0.011627197265625, -0.00628662109375, -0.000946044921875, 0.00439453125, 0.009735107421875, 0.01507568359375, 0.020416259765625, 0.0257568359375, 0.031097412109375, 0.03643798828125, 0.041778564453125, 0.047119140625, 0.052459716796875, 0.05780029296875, 0.063140869140625, 0.0684814453125, 0.073822021484375, 0.07916259765625, 0.084503173828125, 0.08984375, 0.095184326171875, 0.10052490234375, 0.105865478515625, 0.1112060546875, 0.116546630859375, 0.12188720703125, 0.127227783203125, 0.132568359375, 0.137908935546875, 0.14324951171875, 0.148590087890625, 0.1539306640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 6.0, 5.0, 7.0, 12.0, 13.0, 16.0, 23.0, 44.0, 62.0, 107.0, 172.0, 292.0, 470.0, 869.0, 1714.0, 3530.0, 9608.0, 33697.0, 172691.0, 537914.0, 224714.0, 43057.0, 11228.0, 4097.0, 1941.0, 941.0, 512.0, 307.0, 209.0, 96.0, 66.0, 40.0, 31.0, 16.0, 11.0, 9.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09246826171875, -0.08934211730957031, -0.08621597290039062, -0.08308982849121094, -0.07996368408203125, -0.07683753967285156, -0.07371139526367188, -0.07058525085449219, -0.0674591064453125, -0.06433296203613281, -0.061206817626953125, -0.05808067321777344, -0.05495452880859375, -0.05182838439941406, -0.048702239990234375, -0.04557609558105469, -0.042449951171875, -0.03932380676269531, -0.036197662353515625, -0.03307151794433594, -0.02994537353515625, -0.026819229125976562, -0.023693084716796875, -0.020566940307617188, -0.0174407958984375, -0.014314651489257812, -0.011188507080078125, -0.008062362670898438, -0.00493621826171875, -0.0018100738525390625, 0.001316070556640625, 0.0044422149658203125, 0.007568359375, 0.010694503784179688, 0.013820648193359375, 0.016946792602539062, 0.02007293701171875, 0.023199081420898438, 0.026325225830078125, 0.029451370239257812, 0.0325775146484375, 0.03570365905761719, 0.038829803466796875, 0.04195594787597656, 0.04508209228515625, 0.04820823669433594, 0.051334381103515625, 0.05446052551269531, 0.057586669921875, 0.06071281433105469, 0.06383895874023438, 0.06696510314941406, 0.07009124755859375, 0.07321739196777344, 0.07634353637695312, 0.07946968078613281, 0.0825958251953125, 0.08572196960449219, 0.08884811401367188, 0.09197425842285156, 0.09510040283203125, 0.09822654724121094, 0.10135269165039062, 0.10447883605957031, 0.10760498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 14.0, 12.0, 11.0, 21.0, 19.0, 17.0, 46.0, 42.0, 61.0, 74.0, 86.0, 77.0, 90.0, 92.0, 66.0, 55.0, 55.0, 32.0, 29.0, 21.0, 16.0, 7.0, 13.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7821788787841797e-05, -1.73225998878479e-05, -1.6823410987854004e-05, -1.6324222087860107e-05, -1.582503318786621e-05, -1.5325844287872314e-05, -1.4826655387878418e-05, -1.4327466487884521e-05, -1.3828277587890625e-05, -1.3329088687896729e-05, -1.2829899787902832e-05, -1.2330710887908936e-05, -1.1831521987915039e-05, -1.1332333087921143e-05, -1.0833144187927246e-05, -1.033395528793335e-05, -9.834766387939453e-06, -9.335577487945557e-06, -8.83638858795166e-06, -8.337199687957764e-06, -7.838010787963867e-06, -7.338821887969971e-06, -6.839632987976074e-06, -6.340444087982178e-06, -5.841255187988281e-06, -5.342066287994385e-06, -4.842877388000488e-06, -4.343688488006592e-06, -3.844499588012695e-06, -3.345310688018799e-06, -2.8461217880249023e-06, -2.346932888031006e-06, -1.8477439880371094e-06, -1.3485550880432129e-06, -8.493661880493164e-07, -3.501772880554199e-07, 1.4901161193847656e-07, 6.48200511932373e-07, 1.1473894119262695e-06, 1.646578311920166e-06, 2.1457672119140625e-06, 2.644956111907959e-06, 3.1441450119018555e-06, 3.643333911895752e-06, 4.1425228118896484e-06, 4.641711711883545e-06, 5.140900611877441e-06, 5.640089511871338e-06, 6.139278411865234e-06, 6.638467311859131e-06, 7.137656211853027e-06, 7.636845111846924e-06, 8.13603401184082e-06, 8.635222911834717e-06, 9.134411811828613e-06, 9.63360071182251e-06, 1.0132789611816406e-05, 1.0631978511810303e-05, 1.11311674118042e-05, 1.1630356311798096e-05, 1.2129545211791992e-05, 1.2628734111785889e-05, 1.3127923011779785e-05, 1.3627111911773682e-05, 1.4126300811767578e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 13.0, 13.0, 15.0, 36.0, 66.0, 96.0, 165.0, 318.0, 631.0, 1382.0, 3262.0, 10285.0, 51745.0, 366006.0, 510559.0, 81576.0, 14898.0, 4171.0, 1679.0, 738.0, 382.0, 208.0, 125.0, 65.0, 38.0, 14.0, 19.0, 8.0, 8.0, 4.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.1334085464477539, -0.1296100616455078, -0.12581157684326172, -0.12201309204101562, -0.11821460723876953, -0.11441612243652344, -0.11061763763427734, -0.10681915283203125, -0.10302066802978516, -0.09922218322753906, -0.09542369842529297, -0.09162521362304688, -0.08782672882080078, -0.08402824401855469, -0.0802297592163086, -0.0764312744140625, -0.0726327896118164, -0.06883430480957031, -0.06503582000732422, -0.061237335205078125, -0.05743885040283203, -0.05364036560058594, -0.049841880798339844, -0.04604339599609375, -0.042244911193847656, -0.03844642639160156, -0.03464794158935547, -0.030849456787109375, -0.02705097198486328, -0.023252487182617188, -0.019454002380371094, -0.015655517578125, -0.011857032775878906, -0.008058547973632812, -0.004260063171386719, -0.000461578369140625, 0.0033369064331054688, 0.0071353912353515625, 0.010933876037597656, 0.01473236083984375, 0.018530845642089844, 0.022329330444335938, 0.02612781524658203, 0.029926300048828125, 0.03372478485107422, 0.03752326965332031, 0.041321754455566406, 0.0451202392578125, 0.048918724060058594, 0.05271720886230469, 0.05651569366455078, 0.060314178466796875, 0.06411266326904297, 0.06791114807128906, 0.07170963287353516, 0.07550811767578125, 0.07930660247802734, 0.08310508728027344, 0.08690357208251953, 0.09070205688476562, 0.09450054168701172, 0.09829902648925781, 0.1020975112915039, 0.10589599609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 13.0, 20.0, 10.0, 22.0, 34.0, 27.0, 45.0, 63.0, 72.0, 74.0, 86.0, 86.0, 79.0, 81.0, 49.0, 55.0, 38.0, 32.0, 19.0, 21.0, 21.0, 17.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.09210872650146484, -0.08912467956542969, -0.08614063262939453, -0.08315658569335938, -0.08017253875732422, -0.07718849182128906, -0.0742044448852539, -0.07122039794921875, -0.0682363510131836, -0.06525230407714844, -0.06226825714111328, -0.059284210205078125, -0.05630016326904297, -0.05331611633300781, -0.050332069396972656, -0.0473480224609375, -0.044363975524902344, -0.04137992858886719, -0.03839588165283203, -0.035411834716796875, -0.03242778778076172, -0.029443740844726562, -0.026459693908691406, -0.02347564697265625, -0.020491600036621094, -0.017507553100585938, -0.014523506164550781, -0.011539459228515625, -0.008555412292480469, -0.0055713653564453125, -0.0025873184204101562, 0.000396728515625, 0.0033807754516601562, 0.0063648223876953125, 0.009348869323730469, 0.012332916259765625, 0.015316963195800781, 0.018301010131835938, 0.021285057067871094, 0.02426910400390625, 0.027253150939941406, 0.030237197875976562, 0.03322124481201172, 0.036205291748046875, 0.03918933868408203, 0.04217338562011719, 0.045157432556152344, 0.0481414794921875, 0.051125526428222656, 0.05410957336425781, 0.05709362030029297, 0.060077667236328125, 0.06306171417236328, 0.06604576110839844, 0.0690298080444336, 0.07201385498046875, 0.0749979019165039, 0.07798194885253906, 0.08096599578857422, 0.08395004272460938, 0.08693408966064453, 0.08991813659667969, 0.09290218353271484, 0.09588623046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 6.0, 4.0, 0.0, 9.0, 16.0, 18.0, 32.0, 50.0, 88.0, 123.0, 173.0, 131.0, 137.0, 82.0, 56.0, 43.0, 12.0, 9.0, 2.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6538020372390747, -1.6111658811569214, -1.568529725074768, -1.5258935689926147, -1.4832572937011719, -1.4406211376190186, -1.3979849815368652, -1.355348825454712, -1.3127126693725586, -1.2700765132904053, -1.227440357208252, -1.1848042011260986, -1.1421680450439453, -1.0995317697525024, -1.0568956136703491, -1.0142594575881958, -0.9716233015060425, -0.9289871454238892, -0.8863509893417358, -0.8437147736549377, -0.8010786175727844, -0.7584424614906311, -0.715806245803833, -0.6731700897216797, -0.6305339336395264, -0.587897777557373, -0.5452616214752197, -0.5026254057884216, -0.4599892497062683, -0.417353093624115, -0.3747169077396393, -0.3320807218551636, -0.2894444465637207, -0.2468082755804062, -0.20417210459709167, -0.16153593361377716, -0.11889976263046265, -0.07626359164714813, -0.03362742066383362, 0.00900876522064209, 0.05164492130279541, 0.09428109228610992, 0.13691726326942444, 0.17955343425273895, 0.22218960523605347, 0.2648257613182068, 0.3074619472026825, 0.3500981330871582, 0.3927342891693115, 0.43537044525146484, 0.47800663113594055, 0.5206428170204163, 0.5632789731025696, 0.6059151291847229, 0.648551344871521, 0.6911875009536743, 0.7338236570358276, 0.776459813117981, 0.8190959692001343, 0.8617321848869324, 0.9043683409690857, 0.947004497051239, 0.9896407127380371, 1.0322768688201904, 1.0749130249023438]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 5.0, 11.0, 16.0, 10.0, 19.0, 29.0, 34.0, 30.0, 36.0, 37.0, 52.0, 57.0, 81.0, 54.0, 59.0, 72.0, 64.0, 50.0, 38.0, 40.0, 40.0, 37.0, 26.0, 29.0, 13.0, 13.0, 17.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.642538070678711, -1.6005433797836304, -1.5585488080978394, -1.5165541172027588, -1.4745595455169678, -1.4325648546218872, -1.3905701637268066, -1.3485755920410156, -1.3065810203552246, -1.264586329460144, -1.222591757774353, -1.1805970668792725, -1.1386024951934814, -1.0966078042984009, -1.0546131134033203, -1.0126185417175293, -0.9706238508224487, -0.9286292195320129, -0.8866345882415771, -0.8446398973464966, -0.8026453256607056, -0.760650634765625, -0.7186560034751892, -0.6766613721847534, -0.6346667408943176, -0.5926721096038818, -0.550677478313446, -0.5086828470230103, -0.4666881859302521, -0.4246935546398163, -0.3826988935470581, -0.3407042622566223, -0.2987097501754761, -0.2567151188850403, -0.2147204726934433, -0.1727258265018463, -0.13073119521141052, -0.08873656392097473, -0.04674190282821655, -0.004747271537780762, 0.03724735975265503, 0.07924199849367142, 0.1212366372346878, 0.1632312834262848, 0.20522591471672058, 0.24722054600715637, 0.28921520709991455, 0.33120983839035034, 0.37320446968078613, 0.4151991009712219, 0.4571937322616577, 0.4991883933544159, 0.5411829948425293, 0.5831776857376099, 0.6251723170280457, 0.6671669483184814, 0.7091615796089172, 0.751156210899353, 0.7931508421897888, 0.8351454734802246, 0.8771401643753052, 0.9191347360610962, 0.9611294269561768, 1.0031239986419678, 1.0451186895370483]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 3.0, 8.0, 13.0, 22.0, 36.0, 48.0, 84.0, 133.0, 290.0, 598.0, 1421.0, 4167.0, 17498.0, 157521.0, 3763590.0, 219802.0, 21175.0, 4894.0, 1560.0, 668.0, 341.0, 162.0, 82.0, 59.0, 45.0, 18.0, 17.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252685546875, -0.2435150146484375, -0.234344482421875, -0.2251739501953125, -0.21600341796875, -0.2068328857421875, -0.197662353515625, -0.1884918212890625, -0.1793212890625, -0.1701507568359375, -0.160980224609375, -0.1518096923828125, -0.14263916015625, -0.1334686279296875, -0.124298095703125, -0.1151275634765625, -0.10595703125, -0.0967864990234375, -0.087615966796875, -0.0784454345703125, -0.06927490234375, -0.0601043701171875, -0.050933837890625, -0.0417633056640625, -0.0325927734375, -0.0234222412109375, -0.014251708984375, -0.0050811767578125, 0.00408935546875, 0.0132598876953125, 0.022430419921875, 0.0316009521484375, 0.040771484375, 0.0499420166015625, 0.059112548828125, 0.0682830810546875, 0.07745361328125, 0.0866241455078125, 0.095794677734375, 0.1049652099609375, 0.1141357421875, 0.1233062744140625, 0.132476806640625, 0.1416473388671875, 0.15081787109375, 0.1599884033203125, 0.169158935546875, 0.1783294677734375, 0.1875, 0.1966705322265625, 0.205841064453125, 0.2150115966796875, 0.22418212890625, 0.2333526611328125, 0.242523193359375, 0.2516937255859375, 0.2608642578125, 0.2700347900390625, 0.279205322265625, 0.2883758544921875, 0.29754638671875, 0.3067169189453125, 0.315887451171875, 0.3250579833984375, 0.334228515625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 20.0, 23.0, 32.0, 58.0, 69.0, 79.0, 95.0, 96.0, 93.0, 94.0, 86.0, 68.0, 55.0, 43.0, 24.0, 11.0, 7.0, 7.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10906982421875, -0.10633659362792969, -0.10360336303710938, -0.10087013244628906, -0.09813690185546875, -0.09540367126464844, -0.09267044067382812, -0.08993721008300781, -0.0872039794921875, -0.08447074890136719, -0.08173751831054688, -0.07900428771972656, -0.07627105712890625, -0.07353782653808594, -0.07080459594726562, -0.06807136535644531, -0.065338134765625, -0.06260490417480469, -0.059871673583984375, -0.05713844299316406, -0.05440521240234375, -0.05167198181152344, -0.048938751220703125, -0.04620552062988281, -0.0434722900390625, -0.04073905944824219, -0.038005828857421875, -0.03527259826660156, -0.03253936767578125, -0.029806137084960938, -0.027072906494140625, -0.024339675903320312, -0.0216064453125, -0.018873214721679688, -0.016139984130859375, -0.013406753540039062, -0.01067352294921875, -0.007940292358398438, -0.005207061767578125, -0.0024738311767578125, 0.0002593994140625, 0.0029926300048828125, 0.005725860595703125, 0.008459091186523438, 0.01119232177734375, 0.013925552368164062, 0.016658782958984375, 0.019392013549804688, 0.022125244140625, 0.024858474731445312, 0.027591705322265625, 0.030324935913085938, 0.03305816650390625, 0.03579139709472656, 0.038524627685546875, 0.04125785827636719, 0.0439910888671875, 0.04672431945800781, 0.049457550048828125, 0.05219078063964844, 0.05492401123046875, 0.05765724182128906, 0.060390472412109375, 0.06312370300292969, 0.06585693359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 1.0, 7.0, 8.0, 7.0, 16.0, 23.0, 37.0, 93.0, 228.0, 689.0, 2039.0, 7547.0, 40853.0, 573869.0, 3402561.0, 143075.0, 17336.0, 3978.0, 1170.0, 414.0, 184.0, 65.0, 33.0, 14.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2533721923828125, -0.245269775390625, -0.2371673583984375, -0.22906494140625, -0.2209625244140625, -0.212860107421875, -0.2047576904296875, -0.1966552734375, -0.1885528564453125, -0.180450439453125, -0.1723480224609375, -0.16424560546875, -0.1561431884765625, -0.148040771484375, -0.1399383544921875, -0.1318359375, -0.1237335205078125, -0.115631103515625, -0.1075286865234375, -0.09942626953125, -0.0913238525390625, -0.083221435546875, -0.0751190185546875, -0.0670166015625, -0.0589141845703125, -0.050811767578125, -0.0427093505859375, -0.03460693359375, -0.0265045166015625, -0.018402099609375, -0.0102996826171875, -0.002197265625, 0.0059051513671875, 0.014007568359375, 0.0221099853515625, 0.03021240234375, 0.0383148193359375, 0.046417236328125, 0.0545196533203125, 0.0626220703125, 0.0707244873046875, 0.078826904296875, 0.0869293212890625, 0.09503173828125, 0.1031341552734375, 0.111236572265625, 0.1193389892578125, 0.12744140625, 0.1355438232421875, 0.143646240234375, 0.1517486572265625, 0.15985107421875, 0.1679534912109375, 0.176055908203125, 0.1841583251953125, 0.1922607421875, 0.2003631591796875, 0.208465576171875, 0.2165679931640625, 0.22467041015625, 0.2327728271484375, 0.240875244140625, 0.2489776611328125, 0.257080078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 3.0, 4.0, 11.0, 14.0, 20.0, 25.0, 26.0, 35.0, 62.0, 101.0, 159.0, 193.0, 349.0, 607.0, 1131.0, 477.0, 245.0, 195.0, 130.0, 93.0, 52.0, 34.0, 27.0, 20.0, 10.0, 7.0, 8.0, 6.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0650634765625, -0.06268978118896484, -0.06031608581542969, -0.05794239044189453, -0.055568695068359375, -0.05319499969482422, -0.05082130432128906, -0.048447608947753906, -0.04607391357421875, -0.043700218200683594, -0.04132652282714844, -0.03895282745361328, -0.036579132080078125, -0.03420543670654297, -0.03183174133300781, -0.029458045959472656, -0.0270843505859375, -0.024710655212402344, -0.022336959838867188, -0.01996326446533203, -0.017589569091796875, -0.015215873718261719, -0.012842178344726562, -0.010468482971191406, -0.00809478759765625, -0.005721092224121094, -0.0033473968505859375, -0.0009737014770507812, 0.001399993896484375, 0.0037736892700195312, 0.0061473846435546875, 0.008521080017089844, 0.010894775390625, 0.013268470764160156, 0.015642166137695312, 0.01801586151123047, 0.020389556884765625, 0.02276325225830078, 0.025136947631835938, 0.027510643005371094, 0.02988433837890625, 0.032258033752441406, 0.03463172912597656, 0.03700542449951172, 0.039379119873046875, 0.04175281524658203, 0.04412651062011719, 0.046500205993652344, 0.0488739013671875, 0.051247596740722656, 0.05362129211425781, 0.05599498748779297, 0.058368682861328125, 0.06074237823486328, 0.06311607360839844, 0.0654897689819336, 0.06786346435546875, 0.0702371597290039, 0.07261085510253906, 0.07498455047607422, 0.07735824584960938, 0.07973194122314453, 0.08210563659667969, 0.08447933197021484, 0.08685302734375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 10.0, 30.0, 73.0, 159.0, 259.0, 256.0, 132.0, 57.0, 17.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6587209701538086, -1.6280401945114136, -1.597359538078308, -1.566678762435913, -1.5359981060028076, -1.5053173303604126, -1.4746365547180176, -1.443955898284912, -1.413275122642517, -1.382594347000122, -1.3519136905670166, -1.3212329149246216, -1.2905522584915161, -1.259871482849121, -1.2291908264160156, -1.1985100507736206, -1.1678292751312256, -1.1371484994888306, -1.106467843055725, -1.07578706741333, -1.0451064109802246, -1.0144256353378296, -0.9837449193000793, -0.9530642032623291, -0.9223835468292236, -0.8917028307914734, -0.8610221147537231, -0.8303413391113281, -0.7996606230735779, -0.7689799070358276, -0.7382991909980774, -0.7076184749603271, -0.6769376993179321, -0.6462569832801819, -0.6155762672424316, -0.5848954916000366, -0.5542147755622864, -0.5235340595245361, -0.4928533434867859, -0.46217262744903564, -0.4314918518066406, -0.4008111357688904, -0.37013038992881775, -0.3394496738910675, -0.3087689280509949, -0.27808821201324463, -0.24740749597549438, -0.21672676503658295, -0.1860460340976715, -0.15536530315876007, -0.12468457967042923, -0.09400385618209839, -0.06332312524318695, -0.03264239430427551, -0.0019616782665252686, 0.02871905267238617, 0.05939978361129761, 0.09008051455020905, 0.12076123803853989, 0.15144196152687073, 0.18212269246578217, 0.2128034234046936, 0.24348413944244385, 0.2741648554801941, 0.3048456013202667]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 3.0, 11.0, 6.0, 5.0, 11.0, 14.0, 17.0, 21.0, 27.0, 26.0, 37.0, 42.0, 56.0, 46.0, 50.0, 52.0, 51.0, 47.0, 46.0, 46.0, 46.0, 40.0, 38.0, 53.0, 32.0, 32.0, 34.0, 20.0, 13.0, 21.0, 11.0, 17.0, 14.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4095225930213928, -0.39907369017601013, -0.38862475752830505, -0.37817585468292236, -0.3677269220352173, -0.3572780191898346, -0.3468290865421295, -0.3363801836967468, -0.32593125104904175, -0.31548234820365906, -0.305033415555954, -0.2945845127105713, -0.2841355800628662, -0.2736866772174835, -0.26323774456977844, -0.25278884172439575, -0.24233992397785187, -0.23189100623130798, -0.2214420884847641, -0.21099317073822021, -0.20054425299167633, -0.19009533524513245, -0.17964643239974976, -0.16919749975204468, -0.158748596906662, -0.1482996791601181, -0.13785076141357422, -0.12740184366703033, -0.11695292592048645, -0.10650400817394257, -0.09605509787797928, -0.0856061801314354, -0.07515725493431091, -0.06470833718776703, -0.054259419441223145, -0.04381050541996956, -0.033361587673425674, -0.02291266992688179, -0.012463755905628204, -0.00201483815908432, 0.008434079587459564, 0.01888299733400345, 0.029331913217902184, 0.03978082910180092, 0.0502297468483448, 0.06067866459488869, 0.07112757861614227, 0.08157649636268616, 0.09202541410923004, 0.10247433185577393, 0.11292324960231781, 0.1233721673488617, 0.13382108509540558, 0.14427000284194946, 0.15471890568733215, 0.16516783833503723, 0.17561674118041992, 0.1860656589269638, 0.1965145766735077, 0.20696349442005157, 0.21741241216659546, 0.22786132991313934, 0.23831024765968323, 0.24875915050506592, 0.259208083152771]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 8.0, 7.0, 18.0, 22.0, 25.0, 42.0, 90.0, 128.0, 212.0, 407.0, 808.0, 1630.0, 4293.0, 16354.0, 107881.0, 658357.0, 218826.0, 28770.0, 6345.0, 2195.0, 963.0, 489.0, 263.0, 146.0, 92.0, 55.0, 39.0, 22.0, 17.0, 20.0, 7.0, 9.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.318603515625, -0.3088493347167969, -0.29909515380859375, -0.2893409729003906, -0.2795867919921875, -0.2698326110839844, -0.26007843017578125, -0.2503242492675781, -0.240570068359375, -0.23081588745117188, -0.22106170654296875, -0.21130752563476562, -0.2015533447265625, -0.19179916381835938, -0.18204498291015625, -0.17229080200195312, -0.16253662109375, -0.15278244018554688, -0.14302825927734375, -0.13327407836914062, -0.1235198974609375, -0.11376571655273438, -0.10401153564453125, -0.09425735473632812, -0.084503173828125, -0.07474899291992188, -0.06499481201171875, -0.055240631103515625, -0.0454864501953125, -0.035732269287109375, -0.02597808837890625, -0.016223907470703125, -0.0064697265625, 0.003284454345703125, 0.01303863525390625, 0.022792816162109375, 0.0325469970703125, 0.042301177978515625, 0.05205535888671875, 0.061809539794921875, 0.071563720703125, 0.08131790161132812, 0.09107208251953125, 0.10082626342773438, 0.1105804443359375, 0.12033462524414062, 0.13008880615234375, 0.13984298706054688, 0.14959716796875, 0.15935134887695312, 0.16910552978515625, 0.17885971069335938, 0.1886138916015625, 0.19836807250976562, 0.20812225341796875, 0.21787643432617188, 0.227630615234375, 0.23738479614257812, 0.24713897705078125, 0.2568931579589844, 0.2666473388671875, 0.2764015197753906, 0.28615570068359375, 0.2959098815917969, 0.3056640625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 11.0, 15.0, 33.0, 35.0, 55.0, 66.0, 87.0, 116.0, 102.0, 105.0, 93.0, 71.0, 70.0, 53.0, 32.0, 12.0, 13.0, 11.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11896324157714844, -0.11603927612304688, -0.11311531066894531, -0.11019134521484375, -0.10726737976074219, -0.10434341430664062, -0.10141944885253906, -0.0984954833984375, -0.09557151794433594, -0.09264755249023438, -0.08972358703613281, -0.08679962158203125, -0.08387565612792969, -0.08095169067382812, -0.07802772521972656, -0.075103759765625, -0.07217979431152344, -0.06925582885742188, -0.06633186340332031, -0.06340789794921875, -0.06048393249511719, -0.057559967041015625, -0.05463600158691406, -0.0517120361328125, -0.04878807067871094, -0.045864105224609375, -0.04294013977050781, -0.04001617431640625, -0.03709220886230469, -0.034168243408203125, -0.031244277954101562, -0.0283203125, -0.025396347045898438, -0.022472381591796875, -0.019548416137695312, -0.01662445068359375, -0.013700485229492188, -0.010776519775390625, -0.007852554321289062, -0.0049285888671875, -0.0020046234130859375, 0.000919342041015625, 0.0038433074951171875, 0.00676727294921875, 0.009691238403320312, 0.012615203857421875, 0.015539169311523438, 0.018463134765625, 0.021387100219726562, 0.024311065673828125, 0.027235031127929688, 0.03015899658203125, 0.03308296203613281, 0.036006927490234375, 0.03893089294433594, 0.0418548583984375, 0.04477882385253906, 0.047702789306640625, 0.05062675476074219, 0.05355072021484375, 0.05647468566894531, 0.059398651123046875, 0.06232261657714844, 0.06524658203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 13.0, 7.0, 20.0, 25.0, 29.0, 37.0, 53.0, 81.0, 112.0, 169.0, 272.0, 437.0, 713.0, 1330.0, 2862.0, 7662.0, 25026.0, 98741.0, 381293.0, 388917.0, 101055.0, 25705.0, 7696.0, 2939.0, 1396.0, 698.0, 417.0, 241.0, 188.0, 104.0, 100.0, 54.0, 35.0, 28.0, 24.0, 15.0, 14.0, 10.0, 7.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14501953125, -0.14002037048339844, -0.13502120971679688, -0.1300220489501953, -0.12502288818359375, -0.12002372741699219, -0.11502456665039062, -0.11002540588378906, -0.1050262451171875, -0.10002708435058594, -0.09502792358398438, -0.09002876281738281, -0.08502960205078125, -0.08003044128417969, -0.07503128051757812, -0.07003211975097656, -0.065032958984375, -0.06003379821777344, -0.055034637451171875, -0.05003547668457031, -0.04503631591796875, -0.04003715515136719, -0.035037994384765625, -0.030038833618164062, -0.0250396728515625, -0.020040512084960938, -0.015041351318359375, -0.010042190551757812, -0.00504302978515625, -4.38690185546875e-05, 0.004955291748046875, 0.009954452514648438, 0.01495361328125, 0.019952774047851562, 0.024951934814453125, 0.029951095581054688, 0.03495025634765625, 0.03994941711425781, 0.044948577880859375, 0.04994773864746094, 0.0549468994140625, 0.05994606018066406, 0.06494522094726562, 0.06994438171386719, 0.07494354248046875, 0.07994270324707031, 0.08494186401367188, 0.08994102478027344, 0.094940185546875, 0.09993934631347656, 0.10493850708007812, 0.10993766784667969, 0.11493682861328125, 0.11993598937988281, 0.12493515014648438, 0.12993431091308594, 0.1349334716796875, 0.13993263244628906, 0.14493179321289062, 0.1499309539794922, 0.15493011474609375, 0.1599292755126953, 0.16492843627929688, 0.16992759704589844, 0.1749267578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 14.0, 15.0, 12.0, 20.0, 20.0, 28.0, 35.0, 45.0, 48.0, 48.0, 43.0, 38.0, 56.0, 54.0, 47.0, 51.0, 47.0, 51.0, 58.0, 45.0, 37.0, 31.0, 18.0, 18.0, 16.0, 19.0, 19.0, 14.0, 10.0, 4.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1962890625, -0.1897411346435547, -0.18319320678710938, -0.17664527893066406, -0.17009735107421875, -0.16354942321777344, -0.15700149536132812, -0.1504535675048828, -0.1439056396484375, -0.1373577117919922, -0.13080978393554688, -0.12426185607910156, -0.11771392822265625, -0.11116600036621094, -0.10461807250976562, -0.09807014465332031, -0.091522216796875, -0.08497428894042969, -0.07842636108398438, -0.07187843322753906, -0.06533050537109375, -0.05878257751464844, -0.052234649658203125, -0.04568672180175781, -0.0391387939453125, -0.03259086608886719, -0.026042938232421875, -0.019495010375976562, -0.01294708251953125, -0.0063991546630859375, 0.000148773193359375, 0.0066967010498046875, 0.01324462890625, 0.019792556762695312, 0.026340484619140625, 0.03288841247558594, 0.03943634033203125, 0.04598426818847656, 0.052532196044921875, 0.05908012390136719, 0.0656280517578125, 0.07217597961425781, 0.07872390747070312, 0.08527183532714844, 0.09181976318359375, 0.09836769104003906, 0.10491561889648438, 0.11146354675292969, 0.118011474609375, 0.12455940246582031, 0.13110733032226562, 0.13765525817871094, 0.14420318603515625, 0.15075111389160156, 0.15729904174804688, 0.1638469696044922, 0.1703948974609375, 0.1769428253173828, 0.18349075317382812, 0.19003868103027344, 0.19658660888671875, 0.20313453674316406, 0.20968246459960938, 0.2162303924560547, 0.2227783203125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 13.0, 10.0, 28.0, 31.0, 57.0, 93.0, 134.0, 242.0, 370.0, 740.0, 1985.0, 7533.0, 44640.0, 435762.0, 492111.0, 52365.0, 8475.0, 2146.0, 776.0, 426.0, 220.0, 140.0, 81.0, 71.0, 36.0, 20.0, 14.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12411308288574219, -0.11968612670898438, -0.11525917053222656, -0.11083221435546875, -0.10640525817871094, -0.10197830200195312, -0.09755134582519531, -0.0931243896484375, -0.08869743347167969, -0.08427047729492188, -0.07984352111816406, -0.07541656494140625, -0.07098960876464844, -0.06656265258789062, -0.06213569641113281, -0.057708740234375, -0.05328178405761719, -0.048854827880859375, -0.04442787170410156, -0.04000091552734375, -0.03557395935058594, -0.031147003173828125, -0.026720046997070312, -0.0222930908203125, -0.017866134643554688, -0.013439178466796875, -0.009012222290039062, -0.00458526611328125, -0.0001583099365234375, 0.004268646240234375, 0.008695602416992188, 0.01312255859375, 0.017549514770507812, 0.021976470947265625, 0.026403427124023438, 0.03083038330078125, 0.03525733947753906, 0.039684295654296875, 0.04411125183105469, 0.0485382080078125, 0.05296516418457031, 0.057392120361328125, 0.06181907653808594, 0.06624603271484375, 0.07067298889160156, 0.07509994506835938, 0.07952690124511719, 0.083953857421875, 0.08838081359863281, 0.09280776977539062, 0.09723472595214844, 0.10166168212890625, 0.10608863830566406, 0.11051559448242188, 0.11494255065917969, 0.1193695068359375, 0.12379646301269531, 0.12822341918945312, 0.13265037536621094, 0.13707733154296875, 0.14150428771972656, 0.14593124389648438, 0.1503582000732422, 0.15478515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 9.0, 22.0, 27.0, 43.0, 113.0, 146.0, 179.0, 144.0, 123.0, 58.0, 35.0, 27.0, 20.0, 14.0, 9.0, 4.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0994415283203125e-05, -3.0013732612133026e-05, -2.9033049941062927e-05, -2.805236726999283e-05, -2.707168459892273e-05, -2.609100192785263e-05, -2.5110319256782532e-05, -2.4129636585712433e-05, -2.3148953914642334e-05, -2.2168271243572235e-05, -2.1187588572502136e-05, -2.0206905901432037e-05, -1.922622323036194e-05, -1.824554055929184e-05, -1.726485788822174e-05, -1.6284175217151642e-05, -1.5303492546081543e-05, -1.4322809875011444e-05, -1.3342127203941345e-05, -1.2361444532871246e-05, -1.1380761861801147e-05, -1.0400079190731049e-05, -9.41939651966095e-06, -8.43871384859085e-06, -7.458031177520752e-06, -6.477348506450653e-06, -5.496665835380554e-06, -4.515983164310455e-06, -3.5353004932403564e-06, -2.5546178221702576e-06, -1.5739351511001587e-06, -5.932524800300598e-07, 3.8743019104003906e-07, 1.368112862110138e-06, 2.348795533180237e-06, 3.3294782042503357e-06, 4.3101608753204346e-06, 5.2908435463905334e-06, 6.271526217460632e-06, 7.252208888530731e-06, 8.23289155960083e-06, 9.213574230670929e-06, 1.0194256901741028e-05, 1.1174939572811127e-05, 1.2155622243881226e-05, 1.3136304914951324e-05, 1.4116987586021423e-05, 1.5097670257091522e-05, 1.607835292816162e-05, 1.705903559923172e-05, 1.803971827030182e-05, 1.9020400941371918e-05, 2.0001083612442017e-05, 2.0981766283512115e-05, 2.1962448954582214e-05, 2.2943131625652313e-05, 2.3923814296722412e-05, 2.490449696779251e-05, 2.588517963886261e-05, 2.686586230993271e-05, 2.7846544981002808e-05, 2.8827227652072906e-05, 2.9807910323143005e-05, 3.0788592994213104e-05, 3.17692756652832e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 15.0, 22.0, 32.0, 69.0, 115.0, 201.0, 389.0, 612.0, 1254.0, 2581.0, 6187.0, 22014.0, 153519.0, 701201.0, 129972.0, 19626.0, 5736.0, 2394.0, 1201.0, 620.0, 354.0, 191.0, 90.0, 52.0, 32.0, 21.0, 18.0, 13.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14111328125, -0.1367664337158203, -0.13241958618164062, -0.12807273864746094, -0.12372589111328125, -0.11937904357910156, -0.11503219604492188, -0.11068534851074219, -0.1063385009765625, -0.10199165344238281, -0.09764480590820312, -0.09329795837402344, -0.08895111083984375, -0.08460426330566406, -0.08025741577148438, -0.07591056823730469, -0.071563720703125, -0.06721687316894531, -0.06287002563476562, -0.05852317810058594, -0.05417633056640625, -0.04982948303222656, -0.045482635498046875, -0.04113578796386719, -0.0367889404296875, -0.03244209289550781, -0.028095245361328125, -0.023748397827148438, -0.01940155029296875, -0.015054702758789062, -0.010707855224609375, -0.0063610076904296875, -0.00201416015625, 0.0023326873779296875, 0.006679534912109375, 0.011026382446289062, 0.01537322998046875, 0.019720077514648438, 0.024066925048828125, 0.028413772583007812, 0.0327606201171875, 0.03710746765136719, 0.041454315185546875, 0.04580116271972656, 0.05014801025390625, 0.05449485778808594, 0.058841705322265625, 0.06318855285644531, 0.067535400390625, 0.07188224792480469, 0.07622909545898438, 0.08057594299316406, 0.08492279052734375, 0.08926963806152344, 0.09361648559570312, 0.09796333312988281, 0.1023101806640625, 0.10665702819824219, 0.11100387573242188, 0.11535072326660156, 0.11969757080078125, 0.12404441833496094, 0.12839126586914062, 0.1327381134033203, 0.1370849609375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 7.0, 9.0, 7.0, 7.0, 17.0, 34.0, 44.0, 60.0, 83.0, 107.0, 121.0, 115.0, 123.0, 81.0, 60.0, 48.0, 30.0, 17.0, 13.0, 9.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1279296875, -0.12381553649902344, -0.11970138549804688, -0.11558723449707031, -0.11147308349609375, -0.10735893249511719, -0.10324478149414062, -0.09913063049316406, -0.0950164794921875, -0.09090232849121094, -0.08678817749023438, -0.08267402648925781, -0.07855987548828125, -0.07444572448730469, -0.07033157348632812, -0.06621742248535156, -0.062103271484375, -0.05798912048339844, -0.053874969482421875, -0.04976081848144531, -0.04564666748046875, -0.04153251647949219, -0.037418365478515625, -0.03330421447753906, -0.0291900634765625, -0.025075912475585938, -0.020961761474609375, -0.016847610473632812, -0.01273345947265625, -0.008619308471679688, -0.004505157470703125, -0.0003910064697265625, 0.00372314453125, 0.007837295532226562, 0.011951446533203125, 0.016065597534179688, 0.02017974853515625, 0.024293899536132812, 0.028408050537109375, 0.03252220153808594, 0.0366363525390625, 0.04075050354003906, 0.044864654541015625, 0.04897880554199219, 0.05309295654296875, 0.05720710754394531, 0.061321258544921875, 0.06543540954589844, 0.069549560546875, 0.07366371154785156, 0.07777786254882812, 0.08189201354980469, 0.08600616455078125, 0.09012031555175781, 0.09423446655273438, 0.09834861755371094, 0.1024627685546875, 0.10657691955566406, 0.11069107055664062, 0.11480522155761719, 0.11891937255859375, 0.12303352355957031, 0.12714767456054688, 0.13126182556152344, 0.1353759765625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 11.0, 24.0, 137.0, 305.0, 319.0, 148.0, 40.0, 8.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.199532985687256, -5.095624923706055, -4.991716384887695, -4.887808322906494, -4.783900260925293, -4.679991722106934, -4.576083660125732, -4.472175121307373, -4.368267059326172, -4.264358997344971, -4.160450458526611, -4.05654239654541, -3.95263409614563, -3.8487257957458496, -3.7448177337646484, -3.640909433364868, -3.537001132965088, -3.4330928325653076, -3.3291845321655273, -3.225276470184326, -3.121368169784546, -3.0174598693847656, -2.9135518074035645, -2.809643507003784, -2.705735206604004, -2.6018269062042236, -2.4979186058044434, -2.394010543823242, -2.290102243423462, -2.1861939430236816, -2.0822858810424805, -1.9783775806427002, -1.874469518661499, -1.7705612182617188, -1.666653037071228, -1.5627448558807373, -1.458836555480957, -1.3549282550811768, -1.251020073890686, -1.1471118927001953, -1.043203592300415, -0.9392953515052795, -0.835387110710144, -0.7314788699150085, -0.627570629119873, -0.5236623883247375, -0.41975414752960205, -0.31584590673446655, -0.21193766593933105, -0.10802942514419556, -0.004121184349060059, 0.09978705644607544, 0.20369529724121094, 0.30760353803634644, 0.41151177883148193, 0.5154200196266174, 0.6193282604217529, 0.7232365012168884, 0.8271447420120239, 0.9310529828071594, 1.034961223602295, 1.1388695240020752, 1.242777705192566, 1.3466858863830566, 1.450594186782837]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 4.0, 8.0, 10.0, 7.0, 9.0, 10.0, 14.0, 17.0, 21.0, 23.0, 18.0, 27.0, 29.0, 35.0, 41.0, 35.0, 36.0, 41.0, 33.0, 44.0, 48.0, 47.0, 44.0, 34.0, 36.0, 40.0, 32.0, 31.0, 28.0, 37.0, 23.0, 27.0, 24.0, 18.0, 20.0, 13.0, 10.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8141882419586182, -0.7876115441322327, -0.7610348463058472, -0.7344581484794617, -0.7078814506530762, -0.6813047528266907, -0.6547280550003052, -0.6281514167785645, -0.6015746593475342, -0.5749979615211487, -0.5484212636947632, -0.5218445658683777, -0.4952678680419922, -0.4686911702156067, -0.4421145021915436, -0.4155378043651581, -0.38896113634109497, -0.3623844385147095, -0.335807740688324, -0.3092310428619385, -0.282654345035553, -0.2560776472091675, -0.22950097918510437, -0.20292428135871887, -0.17634758353233337, -0.14977088570594788, -0.12319419533014297, -0.09661750495433807, -0.07004080712795258, -0.04346410930156708, -0.016887426376342773, 0.009689271450042725, 0.03626596927642822, 0.06284266710281372, 0.08941935747861862, 0.11599604785442352, 0.14257274568080902, 0.16914944350719452, 0.19572612643241882, 0.22230282425880432, 0.24887952208518982, 0.2754562199115753, 0.3020329177379608, 0.3286095857620239, 0.3551862835884094, 0.3817629814147949, 0.4083396792411804, 0.4349163770675659, 0.4614930748939514, 0.4880697727203369, 0.5146464705467224, 0.5412231683731079, 0.5677998661994934, 0.5943765640258789, 0.6209532022476196, 0.6475299596786499, 0.6741065979003906, 0.7006832957267761, 0.7272599935531616, 0.7538366913795471, 0.7804133892059326, 0.8069900870323181, 0.8335667848587036, 0.8601434230804443, 0.8867201805114746]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 10.0, 12.0, 22.0, 23.0, 39.0, 67.0, 95.0, 153.0, 259.0, 486.0, 865.0, 1582.0, 3674.0, 9785.0, 36924.0, 271969.0, 3633790.0, 189509.0, 29941.0, 8412.0, 3189.0, 1537.0, 767.0, 450.0, 286.0, 149.0, 93.0, 70.0, 41.0, 19.0, 17.0, 6.0, 11.0, 9.0, 3.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.2237262725830078, -0.21722793579101562, -0.21072959899902344, -0.20423126220703125, -0.19773292541503906, -0.19123458862304688, -0.1847362518310547, -0.1782379150390625, -0.1717395782470703, -0.16524124145507812, -0.15874290466308594, -0.15224456787109375, -0.14574623107910156, -0.13924789428710938, -0.1327495574951172, -0.126251220703125, -0.11975288391113281, -0.11325454711914062, -0.10675621032714844, -0.10025787353515625, -0.09375953674316406, -0.08726119995117188, -0.08076286315917969, -0.0742645263671875, -0.06776618957519531, -0.061267852783203125, -0.05476951599121094, -0.04827117919921875, -0.04177284240722656, -0.035274505615234375, -0.028776168823242188, -0.02227783203125, -0.015779495239257812, -0.009281158447265625, -0.0027828216552734375, 0.00371551513671875, 0.010213851928710938, 0.016712188720703125, 0.023210525512695312, 0.0297088623046875, 0.03620719909667969, 0.042705535888671875, 0.04920387268066406, 0.05570220947265625, 0.06220054626464844, 0.06869888305664062, 0.07519721984863281, 0.081695556640625, 0.08819389343261719, 0.09469223022460938, 0.10119056701660156, 0.10768890380859375, 0.11418724060058594, 0.12068557739257812, 0.1271839141845703, 0.1336822509765625, 0.1401805877685547, 0.14667892456054688, 0.15317726135253906, 0.15967559814453125, 0.16617393493652344, 0.17267227172851562, 0.1791706085205078, 0.1856689453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 13.0, 21.0, 38.0, 59.0, 51.0, 90.0, 95.0, 115.0, 104.0, 105.0, 84.0, 73.0, 43.0, 23.0, 28.0, 18.0, 8.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12432861328125, -0.12136650085449219, -0.11840438842773438, -0.11544227600097656, -0.11248016357421875, -0.10951805114746094, -0.10655593872070312, -0.10359382629394531, -0.1006317138671875, -0.09766960144042969, -0.09470748901367188, -0.09174537658691406, -0.08878326416015625, -0.08582115173339844, -0.08285903930664062, -0.07989692687988281, -0.076934814453125, -0.07397270202636719, -0.07101058959960938, -0.06804847717285156, -0.06508636474609375, -0.06212425231933594, -0.059162139892578125, -0.05620002746582031, -0.0532379150390625, -0.05027580261230469, -0.047313690185546875, -0.04435157775878906, -0.04138946533203125, -0.03842735290527344, -0.035465240478515625, -0.03250312805175781, -0.029541015625, -0.026578903198242188, -0.023616790771484375, -0.020654678344726562, -0.01769256591796875, -0.014730453491210938, -0.011768341064453125, -0.008806228637695312, -0.0058441162109375, -0.0028820037841796875, 8.0108642578125e-05, 0.0030422210693359375, 0.00600433349609375, 0.008966445922851562, 0.011928558349609375, 0.014890670776367188, 0.017852783203125, 0.020814895629882812, 0.023777008056640625, 0.026739120483398438, 0.02970123291015625, 0.03266334533691406, 0.035625457763671875, 0.03858757019042969, 0.0415496826171875, 0.04451179504394531, 0.047473907470703125, 0.05043601989746094, 0.05339813232421875, 0.05636024475097656, 0.059322357177734375, 0.06228446960449219, 0.06524658203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 21.0, 37.0, 71.0, 180.0, 515.0, 2245.0, 13973.0, 223524.0, 3853332.0, 90227.0, 8075.0, 1451.0, 358.0, 127.0, 67.0, 37.0, 15.0, 11.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.2300395965576172, -0.21874618530273438, -0.20745277404785156, -0.19615936279296875, -0.18486595153808594, -0.17357254028320312, -0.1622791290283203, -0.1509857177734375, -0.1396923065185547, -0.12839889526367188, -0.11710548400878906, -0.10581207275390625, -0.09451866149902344, -0.08322525024414062, -0.07193183898925781, -0.060638427734375, -0.04934501647949219, -0.038051605224609375, -0.026758193969726562, -0.01546478271484375, -0.0041713714599609375, 0.007122039794921875, 0.018415451049804688, 0.0297088623046875, 0.04100227355957031, 0.052295684814453125, 0.06358909606933594, 0.07488250732421875, 0.08617591857910156, 0.09746932983398438, 0.10876274108886719, 0.12005615234375, 0.1313495635986328, 0.14264297485351562, 0.15393638610839844, 0.16522979736328125, 0.17652320861816406, 0.18781661987304688, 0.1991100311279297, 0.2104034423828125, 0.2216968536376953, 0.23299026489257812, 0.24428367614746094, 0.25557708740234375, 0.26687049865722656, 0.2781639099121094, 0.2894573211669922, 0.300750732421875, 0.3120441436767578, 0.3233375549316406, 0.33463096618652344, 0.34592437744140625, 0.35721778869628906, 0.3685111999511719, 0.3798046112060547, 0.3910980224609375, 0.4023914337158203, 0.4136848449707031, 0.42497825622558594, 0.43627166748046875, 0.44756507873535156, 0.4588584899902344, 0.4701519012451172, 0.4814453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 13.0, 24.0, 33.0, 47.0, 68.0, 124.0, 264.0, 588.0, 1852.0, 524.0, 246.0, 117.0, 57.0, 41.0, 22.0, 15.0, 10.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062408447265625, -0.05919790267944336, -0.05598735809326172, -0.05277681350708008, -0.04956626892089844, -0.0463557243347168, -0.043145179748535156, -0.039934635162353516, -0.036724090576171875, -0.033513545989990234, -0.030303001403808594, -0.027092456817626953, -0.023881912231445312, -0.020671367645263672, -0.01746082305908203, -0.01425027847290039, -0.01103973388671875, -0.00782918930053711, -0.004618644714355469, -0.0014081001281738281, 0.0018024444580078125, 0.005012989044189453, 0.008223533630371094, 0.011434078216552734, 0.014644622802734375, 0.017855167388916016, 0.021065711975097656, 0.024276256561279297, 0.027486801147460938, 0.030697345733642578, 0.03390789031982422, 0.03711843490600586, 0.0403289794921875, 0.04353952407836914, 0.04675006866455078, 0.04996061325073242, 0.05317115783691406, 0.0563817024230957, 0.059592247009277344, 0.06280279159545898, 0.06601333618164062, 0.06922388076782227, 0.0724344253540039, 0.07564496994018555, 0.07885551452636719, 0.08206605911254883, 0.08527660369873047, 0.08848714828491211, 0.09169769287109375, 0.09490823745727539, 0.09811878204345703, 0.10132932662963867, 0.10453987121582031, 0.10775041580200195, 0.1109609603881836, 0.11417150497436523, 0.11738204956054688, 0.12059259414672852, 0.12380313873291016, 0.1270136833190918, 0.13022422790527344, 0.13343477249145508, 0.13664531707763672, 0.13985586166381836, 0.14306640625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 13.0, 25.0, 95.0, 201.0, 279.0, 229.0, 100.0, 46.0, 10.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.324263334274292, -1.295900583267212, -1.2675378322601318, -1.2391750812530518, -1.2108123302459717, -1.1824495792388916, -1.1540868282318115, -1.125724196434021, -1.097361445426941, -1.0689986944198608, -1.0406359434127808, -1.0122731924057007, -0.9839105010032654, -0.9555477499961853, -0.9271849989891052, -0.8988222479820251, -0.8704594969749451, -0.842096745967865, -0.8137339949607849, -0.7853713035583496, -0.7570085525512695, -0.7286458015441895, -0.7002830505371094, -0.6719202995300293, -0.6435575485229492, -0.6151947975158691, -0.5868320465087891, -0.558469295501709, -0.5301066040992737, -0.5017438530921936, -0.4733811020851135, -0.44501835107803345, -0.41665568947792053, -0.38829293847084045, -0.35993021726608276, -0.3315674662590027, -0.3032047152519226, -0.2748419940471649, -0.24647924304008484, -0.21811650693416595, -0.18975377082824707, -0.16139103472232819, -0.1330282986164093, -0.10466554760932922, -0.07630281150341034, -0.047940075397491455, -0.019577324390411377, 0.008785411715507507, 0.03714814782142639, 0.06551088392734528, 0.09387362748384476, 0.12223637104034424, 0.15059910714626312, 0.178961843252182, 0.20732459425926208, 0.23568733036518097, 0.26405006647109985, 0.29241281747817993, 0.3207755386829376, 0.3491382896900177, 0.3775010108947754, 0.40586376190185547, 0.43422651290893555, 0.4625892639160156, 0.4909519851207733]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 6.0, 7.0, 9.0, 5.0, 12.0, 16.0, 20.0, 25.0, 30.0, 28.0, 38.0, 42.0, 46.0, 41.0, 36.0, 46.0, 55.0, 57.0, 50.0, 48.0, 55.0, 50.0, 35.0, 29.0, 32.0, 29.0, 32.0, 26.0, 16.0, 13.0, 15.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.23632711172103882, -0.22833795845508575, -0.2203487902879715, -0.21235963702201843, -0.20437048375606537, -0.1963813304901123, -0.18839216232299805, -0.18040300905704498, -0.17241385579109192, -0.16442470252513885, -0.1564355343580246, -0.14844638109207153, -0.14045722782611847, -0.1324680745601654, -0.12447890639305115, -0.11648975312709808, -0.10850058495998383, -0.10051142424345016, -0.0925222709774971, -0.08453311026096344, -0.07654395699501038, -0.06855479627847672, -0.060565635561943054, -0.05257647857069969, -0.04458732157945633, -0.03659816458821297, -0.028609005734324455, -0.020619846880435944, -0.012630689889192581, -0.004641532897949219, 0.003347627818584442, 0.011336784809827805, 0.019325941801071167, 0.02731509879231453, 0.03530425578355789, 0.04329341650009155, 0.051282573491334915, 0.05927173048257828, 0.06726089119911194, 0.075250044465065, 0.08323920518159866, 0.09122836589813232, 0.09921751916408539, 0.10720667988061905, 0.11519584059715271, 0.12318499386310577, 0.13117414712905884, 0.1391633152961731, 0.14715246856212616, 0.15514162182807922, 0.16313078999519348, 0.17111994326114655, 0.1791090965270996, 0.18709826469421387, 0.19508741796016693, 0.20307657122612, 0.21106573939323425, 0.21905489265918732, 0.22704406082630157, 0.23503321409225464, 0.2430223673582077, 0.25101152062416077, 0.259000688791275, 0.2669898569583893, 0.27497899532318115]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 6.0, 10.0, 10.0, 22.0, 41.0, 68.0, 149.0, 278.0, 465.0, 1063.0, 2566.0, 7903.0, 39949.0, 337970.0, 568138.0, 72046.0, 11774.0, 3480.0, 1298.0, 591.0, 354.0, 157.0, 99.0, 48.0, 29.0, 14.0, 12.0, 7.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33203125, -0.322845458984375, -0.31365966796875, -0.304473876953125, -0.2952880859375, -0.286102294921875, -0.27691650390625, -0.267730712890625, -0.258544921875, -0.249359130859375, -0.24017333984375, -0.230987548828125, -0.2218017578125, -0.212615966796875, -0.20343017578125, -0.194244384765625, -0.18505859375, -0.175872802734375, -0.16668701171875, -0.157501220703125, -0.1483154296875, -0.139129638671875, -0.12994384765625, -0.120758056640625, -0.111572265625, -0.102386474609375, -0.09320068359375, -0.084014892578125, -0.0748291015625, -0.065643310546875, -0.05645751953125, -0.047271728515625, -0.0380859375, -0.028900146484375, -0.01971435546875, -0.010528564453125, -0.0013427734375, 0.007843017578125, 0.01702880859375, 0.026214599609375, 0.035400390625, 0.044586181640625, 0.05377197265625, 0.062957763671875, 0.0721435546875, 0.081329345703125, 0.09051513671875, 0.099700927734375, 0.10888671875, 0.118072509765625, 0.12725830078125, 0.136444091796875, 0.1456298828125, 0.154815673828125, 0.16400146484375, 0.173187255859375, 0.182373046875, 0.191558837890625, 0.20074462890625, 0.209930419921875, 0.2191162109375, 0.228302001953125, 0.23748779296875, 0.246673583984375, 0.255859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 11.0, 19.0, 18.0, 25.0, 56.0, 69.0, 80.0, 97.0, 121.0, 106.0, 114.0, 76.0, 69.0, 46.0, 28.0, 36.0, 8.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1295166015625, -0.12643051147460938, -0.12334442138671875, -0.12025833129882812, -0.1171722412109375, -0.11408615112304688, -0.11100006103515625, -0.10791397094726562, -0.104827880859375, -0.10174179077148438, -0.09865570068359375, -0.09556961059570312, -0.0924835205078125, -0.08939743041992188, -0.08631134033203125, -0.08322525024414062, -0.08013916015625, -0.07705307006835938, -0.07396697998046875, -0.07088088989257812, -0.0677947998046875, -0.06470870971679688, -0.06162261962890625, -0.058536529541015625, -0.055450439453125, -0.052364349365234375, -0.04927825927734375, -0.046192169189453125, -0.0431060791015625, -0.040019989013671875, -0.03693389892578125, -0.033847808837890625, -0.03076171875, -0.027675628662109375, -0.02458953857421875, -0.021503448486328125, -0.0184173583984375, -0.015331268310546875, -0.01224517822265625, -0.009159088134765625, -0.006072998046875, -0.002986907958984375, 9.918212890625e-05, 0.003185272216796875, 0.0062713623046875, 0.009357452392578125, 0.01244354248046875, 0.015529632568359375, 0.01861572265625, 0.021701812744140625, 0.02478790283203125, 0.027873992919921875, 0.0309600830078125, 0.034046173095703125, 0.03713226318359375, 0.040218353271484375, 0.043304443359375, 0.046390533447265625, 0.04947662353515625, 0.052562713623046875, 0.0556488037109375, 0.058734893798828125, 0.06182098388671875, 0.06490707397460938, 0.0679931640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 15.0, 10.0, 16.0, 19.0, 21.0, 26.0, 32.0, 48.0, 61.0, 94.0, 120.0, 181.0, 299.0, 475.0, 903.0, 1872.0, 4084.0, 10702.0, 30067.0, 91277.0, 287334.0, 397060.0, 149025.0, 47172.0, 16156.0, 5978.0, 2616.0, 1127.0, 600.0, 358.0, 237.0, 144.0, 116.0, 64.0, 53.0, 43.0, 22.0, 28.0, 11.0, 9.0, 7.0, 14.0, 10.0, 5.0, 9.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.1177978515625, -0.11402320861816406, -0.11024856567382812, -0.10647392272949219, -0.10269927978515625, -0.09892463684082031, -0.09514999389648438, -0.09137535095214844, -0.0876007080078125, -0.08382606506347656, -0.08005142211914062, -0.07627677917480469, -0.07250213623046875, -0.06872749328613281, -0.06495285034179688, -0.06117820739746094, -0.057403564453125, -0.05362892150878906, -0.049854278564453125, -0.04607963562011719, -0.04230499267578125, -0.03853034973144531, -0.034755706787109375, -0.030981063842773438, -0.0272064208984375, -0.023431777954101562, -0.019657135009765625, -0.015882492065429688, -0.01210784912109375, -0.008333206176757812, -0.004558563232421875, -0.0007839202880859375, 0.00299072265625, 0.0067653656005859375, 0.010540008544921875, 0.014314651489257812, 0.01808929443359375, 0.021863937377929688, 0.025638580322265625, 0.029413223266601562, 0.0331878662109375, 0.03696250915527344, 0.040737152099609375, 0.04451179504394531, 0.04828643798828125, 0.05206108093261719, 0.055835723876953125, 0.05961036682128906, 0.063385009765625, 0.06715965270996094, 0.07093429565429688, 0.07470893859863281, 0.07848358154296875, 0.08225822448730469, 0.08603286743164062, 0.08980751037597656, 0.0935821533203125, 0.09735679626464844, 0.10113143920898438, 0.10490608215332031, 0.10868072509765625, 0.11245536804199219, 0.11623001098632812, 0.12000465393066406, 0.123779296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 10.0, 5.0, 9.0, 10.0, 9.0, 19.0, 16.0, 18.0, 23.0, 17.0, 32.0, 29.0, 38.0, 39.0, 41.0, 38.0, 40.0, 46.0, 36.0, 42.0, 40.0, 33.0, 34.0, 28.0, 36.0, 42.0, 40.0, 24.0, 37.0, 19.0, 21.0, 14.0, 17.0, 10.0, 13.0, 15.0, 8.0, 3.0, 10.0, 11.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.14769363403320312, -0.14267730712890625, -0.13766098022460938, -0.1326446533203125, -0.12762832641601562, -0.12261199951171875, -0.11759567260742188, -0.112579345703125, -0.10756301879882812, -0.10254669189453125, -0.09753036499023438, -0.0925140380859375, -0.08749771118164062, -0.08248138427734375, -0.07746505737304688, -0.07244873046875, -0.06743240356445312, -0.06241607666015625, -0.057399749755859375, -0.0523834228515625, -0.047367095947265625, -0.04235076904296875, -0.037334442138671875, -0.032318115234375, -0.027301788330078125, -0.02228546142578125, -0.017269134521484375, -0.0122528076171875, -0.007236480712890625, -0.00222015380859375, 0.002796173095703125, 0.0078125, 0.012828826904296875, 0.01784515380859375, 0.022861480712890625, 0.0278778076171875, 0.032894134521484375, 0.03791046142578125, 0.042926788330078125, 0.047943115234375, 0.052959442138671875, 0.05797576904296875, 0.06299209594726562, 0.0680084228515625, 0.07302474975585938, 0.07804107666015625, 0.08305740356445312, 0.08807373046875, 0.09309005737304688, 0.09810638427734375, 0.10312271118164062, 0.1081390380859375, 0.11315536499023438, 0.11817169189453125, 0.12318801879882812, 0.128204345703125, 0.13322067260742188, 0.13823699951171875, 0.14325332641601562, 0.1482696533203125, 0.15328598022460938, 0.15830230712890625, 0.16331863403320312, 0.1683349609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 6.0, 13.0, 24.0, 17.0, 24.0, 39.0, 47.0, 87.0, 119.0, 187.0, 376.0, 732.0, 1737.0, 4872.0, 20312.0, 146005.0, 660552.0, 180181.0, 24055.0, 5588.0, 1838.0, 769.0, 385.0, 202.0, 95.0, 65.0, 44.0, 38.0, 23.0, 24.0, 24.0, 13.0, 9.0, 7.0, 11.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11248779296875, -0.10913467407226562, -0.10578155517578125, -0.10242843627929688, -0.0990753173828125, -0.09572219848632812, -0.09236907958984375, -0.08901596069335938, -0.085662841796875, -0.08230972290039062, -0.07895660400390625, -0.07560348510742188, -0.0722503662109375, -0.06889724731445312, -0.06554412841796875, -0.062191009521484375, -0.058837890625, -0.055484771728515625, -0.05213165283203125, -0.048778533935546875, -0.0454254150390625, -0.042072296142578125, -0.03871917724609375, -0.035366058349609375, -0.032012939453125, -0.028659820556640625, -0.02530670166015625, -0.021953582763671875, -0.0186004638671875, -0.015247344970703125, -0.01189422607421875, -0.008541107177734375, -0.00518798828125, -0.001834869384765625, 0.00151824951171875, 0.004871368408203125, 0.0082244873046875, 0.011577606201171875, 0.01493072509765625, 0.018283843994140625, 0.021636962890625, 0.024990081787109375, 0.02834320068359375, 0.031696319580078125, 0.0350494384765625, 0.038402557373046875, 0.04175567626953125, 0.045108795166015625, 0.0484619140625, 0.051815032958984375, 0.05516815185546875, 0.058521270751953125, 0.0618743896484375, 0.06522750854492188, 0.06858062744140625, 0.07193374633789062, 0.075286865234375, 0.07863998413085938, 0.08199310302734375, 0.08534622192382812, 0.0886993408203125, 0.09205245971679688, 0.09540557861328125, 0.09875869750976562, 0.10211181640625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 7.0, 11.0, 25.0, 28.0, 55.0, 64.0, 89.0, 139.0, 122.0, 140.0, 112.0, 78.0, 49.0, 22.0, 16.0, 15.0, 10.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5451183319091797e-05, -2.4788081645965576e-05, -2.4124979972839355e-05, -2.3461878299713135e-05, -2.2798776626586914e-05, -2.2135674953460693e-05, -2.1472573280334473e-05, -2.0809471607208252e-05, -2.014636993408203e-05, -1.948326826095581e-05, -1.882016658782959e-05, -1.815706491470337e-05, -1.749396324157715e-05, -1.6830861568450928e-05, -1.6167759895324707e-05, -1.5504658222198486e-05, -1.4841556549072266e-05, -1.4178454875946045e-05, -1.3515353202819824e-05, -1.2852251529693604e-05, -1.2189149856567383e-05, -1.1526048183441162e-05, -1.0862946510314941e-05, -1.019984483718872e-05, -9.5367431640625e-06, -8.87364149093628e-06, -8.210539817810059e-06, -7.547438144683838e-06, -6.884336471557617e-06, -6.2212347984313965e-06, -5.558133125305176e-06, -4.895031452178955e-06, -4.231929779052734e-06, -3.5688281059265137e-06, -2.905726432800293e-06, -2.2426247596740723e-06, -1.5795230865478516e-06, -9.164214134216309e-07, -2.5331974029541016e-07, 4.0978193283081055e-07, 1.0728836059570312e-06, 1.735985279083252e-06, 2.3990869522094727e-06, 3.0621886253356934e-06, 3.725290298461914e-06, 4.388391971588135e-06, 5.0514936447143555e-06, 5.714595317840576e-06, 6.377696990966797e-06, 7.040798664093018e-06, 7.703900337219238e-06, 8.367002010345459e-06, 9.03010368347168e-06, 9.6932053565979e-06, 1.0356307029724121e-05, 1.1019408702850342e-05, 1.1682510375976562e-05, 1.2345612049102783e-05, 1.3008713722229004e-05, 1.3671815395355225e-05, 1.4334917068481445e-05, 1.4998018741607666e-05, 1.5661120414733887e-05, 1.6324222087860107e-05, 1.6987323760986328e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 9.0, 14.0, 17.0, 26.0, 35.0, 71.0, 148.0, 286.0, 601.0, 1649.0, 6070.0, 42842.0, 570048.0, 391338.0, 28316.0, 4632.0, 1331.0, 541.0, 258.0, 113.0, 72.0, 46.0, 30.0, 16.0, 10.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10443115234375, -0.10055065155029297, -0.09667015075683594, -0.0927896499633789, -0.08890914916992188, -0.08502864837646484, -0.08114814758300781, -0.07726764678955078, -0.07338714599609375, -0.06950664520263672, -0.06562614440917969, -0.061745643615722656, -0.057865142822265625, -0.053984642028808594, -0.05010414123535156, -0.04622364044189453, -0.0423431396484375, -0.03846263885498047, -0.03458213806152344, -0.030701637268066406, -0.026821136474609375, -0.022940635681152344, -0.019060134887695312, -0.015179634094238281, -0.01129913330078125, -0.007418632507324219, -0.0035381317138671875, 0.00034236907958984375, 0.004222869873046875, 0.008103370666503906, 0.011983871459960938, 0.01586437225341797, 0.019744873046875, 0.02362537384033203, 0.027505874633789062, 0.031386375427246094, 0.035266876220703125, 0.039147377014160156, 0.04302787780761719, 0.04690837860107422, 0.05078887939453125, 0.05466938018798828, 0.05854988098144531, 0.062430381774902344, 0.06631088256835938, 0.0701913833618164, 0.07407188415527344, 0.07795238494873047, 0.0818328857421875, 0.08571338653564453, 0.08959388732910156, 0.0934743881225586, 0.09735488891601562, 0.10123538970947266, 0.10511589050292969, 0.10899639129638672, 0.11287689208984375, 0.11675739288330078, 0.12063789367675781, 0.12451839447021484, 0.12839889526367188, 0.1322793960571289, 0.13615989685058594, 0.14004039764404297, 0.1439208984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 18.0, 29.0, 53.0, 85.0, 136.0, 207.0, 201.0, 121.0, 61.0, 35.0, 18.0, 16.0, 10.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140625, -0.13537979125976562, -0.13013458251953125, -0.12488937377929688, -0.1196441650390625, -0.11439895629882812, -0.10915374755859375, -0.10390853881835938, -0.098663330078125, -0.09341812133789062, -0.08817291259765625, -0.08292770385742188, -0.0776824951171875, -0.07243728637695312, -0.06719207763671875, -0.061946868896484375, -0.05670166015625, -0.051456451416015625, -0.04621124267578125, -0.040966033935546875, -0.0357208251953125, -0.030475616455078125, -0.02523040771484375, -0.019985198974609375, -0.014739990234375, -0.009494781494140625, -0.00424957275390625, 0.000995635986328125, 0.0062408447265625, 0.011486053466796875, 0.01673126220703125, 0.021976470947265625, 0.0272216796875, 0.032466888427734375, 0.03771209716796875, 0.042957305908203125, 0.0482025146484375, 0.053447723388671875, 0.05869293212890625, 0.06393814086914062, 0.069183349609375, 0.07442855834960938, 0.07967376708984375, 0.08491897583007812, 0.0901641845703125, 0.09540939331054688, 0.10065460205078125, 0.10589981079101562, 0.11114501953125, 0.11639022827148438, 0.12163543701171875, 0.12688064575195312, 0.1321258544921875, 0.13737106323242188, 0.14261627197265625, 0.14786148071289062, 0.153106689453125, 0.15835189819335938, 0.16359710693359375, 0.16884231567382812, 0.1740875244140625, 0.17933273315429688, 0.18457794189453125, 0.18982315063476562, 0.195068359375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 14.0, 36.0, 156.0, 322.0, 268.0, 138.0, 48.0, 18.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.185859680175781, -4.106629371643066, -4.027399063110352, -3.9481687545776367, -3.868938446044922, -3.789708375930786, -3.7104780673980713, -3.6312477588653564, -3.5520174503326416, -3.4727871417999268, -3.393556833267212, -3.314326524734497, -3.2350964546203613, -3.1558661460876465, -3.0766358375549316, -2.997405529022217, -2.918175220489502, -2.838944911956787, -2.7597146034240723, -2.6804842948913574, -2.6012539863586426, -2.522023916244507, -2.442793607711792, -2.363563299179077, -2.2843329906463623, -2.2051026821136475, -2.1258723735809326, -2.0466420650482178, -1.9674118757247925, -1.8881815671920776, -1.8089513778686523, -1.7297210693359375, -1.6504907608032227, -1.5712604522705078, -1.492030143737793, -1.4127999544143677, -1.3335696458816528, -1.254339337348938, -1.1751091480255127, -1.0958788394927979, -1.016648530960083, -0.9374182224273682, -0.8581879734992981, -0.778957724571228, -0.6997274160385132, -0.6204971075057983, -0.5412668585777283, -0.4620366096496582, -0.38280630111694336, -0.3035760223865509, -0.22434574365615845, -0.145115464925766, -0.06588518619537354, 0.013345092535018921, 0.09257537126541138, 0.17180562019348145, 0.2510359287261963, 0.33026620745658875, 0.4094964861869812, 0.48872676491737366, 0.5679570436477661, 0.647187352180481, 0.726417601108551, 0.8056478500366211, 0.8848781585693359]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 7.0, 5.0, 18.0, 17.0, 21.0, 16.0, 23.0, 18.0, 21.0, 29.0, 38.0, 41.0, 33.0, 33.0, 49.0, 39.0, 40.0, 43.0, 38.0, 57.0, 32.0, 46.0, 36.0, 33.0, 33.0, 31.0, 37.0, 24.0, 22.0, 17.0, 15.0, 16.0, 15.0, 9.0, 8.0, 10.0, 3.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.905797004699707, -0.8790604472160339, -0.8523238897323608, -0.8255873322486877, -0.7988507747650146, -0.7721142172813416, -0.7453776597976685, -0.7186411619186401, -0.6919045448303223, -0.6651679873466492, -0.6384314298629761, -0.611694872379303, -0.5849583148956299, -0.5582217574119568, -0.5314851999282837, -0.5047487020492554, -0.4780121445655823, -0.4512755870819092, -0.4245390295982361, -0.397802472114563, -0.3710659146308899, -0.3443293571472168, -0.3175928294658661, -0.290856271982193, -0.2641197144985199, -0.2373831570148468, -0.2106465995311737, -0.1839100569486618, -0.1571734994649887, -0.1304369419813156, -0.10370039939880371, -0.07696384191513062, -0.05022728443145752, -0.023490730673074722, 0.003245823085308075, 0.029982373118400574, 0.05671893060207367, 0.08345548808574677, 0.11019203066825867, 0.13692858815193176, 0.16366514563560486, 0.19040170311927795, 0.21713826060295105, 0.24387480318546295, 0.27061134576797485, 0.29734790325164795, 0.32408446073532104, 0.35082101821899414, 0.37755757570266724, 0.40429413318634033, 0.4310306906700134, 0.4577672481536865, 0.4845038056373596, 0.5112403631210327, 0.537976861000061, 0.5647134780883789, 0.5914499759674072, 0.6181865334510803, 0.6449230909347534, 0.6716596484184265, 0.6983962059020996, 0.7251327633857727, 0.7518693208694458, 0.7786058187484741, 0.805342435836792]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 10.0, 7.0, 9.0, 18.0, 16.0, 11.0, 27.0, 31.0, 38.0, 46.0, 59.0, 104.0, 160.0, 286.0, 533.0, 982.0, 2318.0, 6047.0, 23613.0, 280052.0, 3796885.0, 64468.0, 11587.0, 3703.0, 1485.0, 718.0, 419.0, 205.0, 144.0, 90.0, 64.0, 48.0, 31.0, 18.0, 15.0, 8.0, 10.0, 3.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.36279296875, -0.3530540466308594, -0.34331512451171875, -0.3335762023925781, -0.3238372802734375, -0.3140983581542969, -0.30435943603515625, -0.2946205139160156, -0.284881591796875, -0.2751426696777344, -0.26540374755859375, -0.2556648254394531, -0.2459259033203125, -0.23618698120117188, -0.22644805908203125, -0.21670913696289062, -0.20697021484375, -0.19723129272460938, -0.18749237060546875, -0.17775344848632812, -0.1680145263671875, -0.15827560424804688, -0.14853668212890625, -0.13879776000976562, -0.129058837890625, -0.11931991577148438, -0.10958099365234375, -0.09984207153320312, -0.0901031494140625, -0.08036422729492188, -0.07062530517578125, -0.060886383056640625, -0.0511474609375, -0.041408538818359375, -0.03166961669921875, -0.021930694580078125, -0.0121917724609375, -0.002452850341796875, 0.00728607177734375, 0.017024993896484375, 0.026763916015625, 0.036502838134765625, 0.04624176025390625, 0.055980682373046875, 0.0657196044921875, 0.07545852661132812, 0.08519744873046875, 0.09493637084960938, 0.10467529296875, 0.11441421508789062, 0.12415313720703125, 0.13389205932617188, 0.1436309814453125, 0.15336990356445312, 0.16310882568359375, 0.17284774780273438, 0.182586669921875, 0.19232559204101562, 0.20206451416015625, 0.21180343627929688, 0.2215423583984375, 0.23128128051757812, 0.24102020263671875, 0.2507591247558594, 0.260498046875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 13.0, 14.0, 31.0, 30.0, 57.0, 68.0, 84.0, 109.0, 120.0, 118.0, 91.0, 84.0, 69.0, 38.0, 26.0, 18.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1336669921875, -0.13052845001220703, -0.12738990783691406, -0.1242513656616211, -0.12111282348632812, -0.11797428131103516, -0.11483573913574219, -0.11169719696044922, -0.10855865478515625, -0.10542011260986328, -0.10228157043457031, -0.09914302825927734, -0.09600448608398438, -0.0928659439086914, -0.08972740173339844, -0.08658885955810547, -0.0834503173828125, -0.08031177520751953, -0.07717323303222656, -0.0740346908569336, -0.07089614868164062, -0.06775760650634766, -0.06461906433105469, -0.06148052215576172, -0.05834197998046875, -0.05520343780517578, -0.05206489562988281, -0.048926353454589844, -0.045787811279296875, -0.042649269104003906, -0.03951072692871094, -0.03637218475341797, -0.033233642578125, -0.03009510040283203, -0.026956558227539062, -0.023818016052246094, -0.020679473876953125, -0.017540931701660156, -0.014402389526367188, -0.011263847351074219, -0.00812530517578125, -0.004986763000488281, -0.0018482208251953125, 0.0012903213500976562, 0.004428863525390625, 0.007567405700683594, 0.010705947875976562, 0.013844490051269531, 0.0169830322265625, 0.02012157440185547, 0.023260116577148438, 0.026398658752441406, 0.029537200927734375, 0.032675743103027344, 0.03581428527832031, 0.03895282745361328, 0.04209136962890625, 0.04522991180419922, 0.04836845397949219, 0.051506996154785156, 0.054645538330078125, 0.057784080505371094, 0.06092262268066406, 0.06406116485595703, 0.06719970703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 14.0, 22.0, 34.0, 95.0, 214.0, 602.0, 1711.0, 5988.0, 27590.0, 323436.0, 3732014.0, 84512.0, 13112.0, 3256.0, 1082.0, 324.0, 131.0, 75.0, 34.0, 17.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357177734375, -0.3483085632324219, -0.33943939208984375, -0.3305702209472656, -0.3217010498046875, -0.3128318786621094, -0.30396270751953125, -0.2950935363769531, -0.286224365234375, -0.2773551940917969, -0.26848602294921875, -0.2596168518066406, -0.2507476806640625, -0.24187850952148438, -0.23300933837890625, -0.22414016723632812, -0.21527099609375, -0.20640182495117188, -0.19753265380859375, -0.18866348266601562, -0.1797943115234375, -0.17092514038085938, -0.16205596923828125, -0.15318679809570312, -0.144317626953125, -0.13544845581054688, -0.12657928466796875, -0.11771011352539062, -0.1088409423828125, -0.09997177124023438, -0.09110260009765625, -0.08223342895507812, -0.0733642578125, -0.06449508666992188, -0.05562591552734375, -0.046756744384765625, -0.0378875732421875, -0.029018402099609375, -0.02014923095703125, -0.011280059814453125, -0.002410888671875, 0.006458282470703125, 0.01532745361328125, 0.024196624755859375, 0.0330657958984375, 0.041934967041015625, 0.05080413818359375, 0.059673309326171875, 0.06854248046875, 0.07741165161132812, 0.08628082275390625, 0.09514999389648438, 0.1040191650390625, 0.11288833618164062, 0.12175750732421875, 0.13062667846679688, 0.139495849609375, 0.14836502075195312, 0.15723419189453125, 0.16610336303710938, 0.1749725341796875, 0.18384170532226562, 0.19271087646484375, 0.20158004760742188, 0.21044921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 4.0, 8.0, 11.0, 10.0, 15.0, 10.0, 32.0, 51.0, 66.0, 155.0, 259.0, 1628.0, 1122.0, 294.0, 149.0, 85.0, 53.0, 35.0, 29.0, 13.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1058349609375, -0.10337209701538086, -0.10090923309326172, -0.09844636917114258, -0.09598350524902344, -0.0935206413269043, -0.09105777740478516, -0.08859491348266602, -0.08613204956054688, -0.08366918563842773, -0.0812063217163086, -0.07874345779418945, -0.07628059387207031, -0.07381772994995117, -0.07135486602783203, -0.06889200210571289, -0.06642913818359375, -0.06396627426147461, -0.06150341033935547, -0.05904054641723633, -0.05657768249511719, -0.05411481857299805, -0.051651954650878906, -0.049189090728759766, -0.046726226806640625, -0.044263362884521484, -0.041800498962402344, -0.0393376350402832, -0.03687477111816406, -0.03441190719604492, -0.03194904327392578, -0.02948617935180664, -0.0270233154296875, -0.02456045150756836, -0.02209758758544922, -0.019634723663330078, -0.017171859741210938, -0.014708995819091797, -0.012246131896972656, -0.009783267974853516, -0.007320404052734375, -0.004857540130615234, -0.0023946762084960938, 6.818771362304688e-05, 0.0025310516357421875, 0.004993915557861328, 0.007456779479980469, 0.00991964340209961, 0.01238250732421875, 0.01484537124633789, 0.01730823516845703, 0.019771099090576172, 0.022233963012695312, 0.024696826934814453, 0.027159690856933594, 0.029622554779052734, 0.032085418701171875, 0.034548282623291016, 0.037011146545410156, 0.0394740104675293, 0.04193687438964844, 0.04439973831176758, 0.04686260223388672, 0.04932546615600586, 0.051788330078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 12.0, 119.0, 575.0, 263.0, 31.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3651638627052307, -0.30975639820098877, -0.2543489336967468, -0.19894149899482727, -0.14353403449058533, -0.08812656998634338, -0.03271913528442383, 0.022688329219818115, 0.07809579372406006, 0.133503258228302, 0.18891070783138275, 0.2443181574344635, 0.29972562193870544, 0.3551330864429474, 0.41054052114486694, 0.4659479856491089, 0.5213554501533508, 0.5767629146575928, 0.6321703791618347, 0.6875778436660767, 0.7429852485656738, 0.7983927726745605, 0.8538001775741577, 0.9092076420783997, 0.9646151065826416, 1.0200225114822388, 1.0754300355911255, 1.1308374404907227, 1.1862449645996094, 1.2416523694992065, 1.2970597743988037, 1.3524672985076904, 1.4078748226165771, 1.4632822275161743, 1.518689751625061, 1.5740971565246582, 1.629504680633545, 1.684912085533142, 1.7403194904327393, 1.795727014541626, 1.8511345386505127, 1.9065419435501099, 1.9619494676589966, 2.0173568725585938, 2.0727643966674805, 2.128171920776367, 2.183579206466675, 2.2389867305755615, 2.294394016265869, 2.349801540374756, 2.4052088260650635, 2.46061635017395, 2.516023874282837, 2.5714313983917236, 2.6268386840820312, 2.682246208190918, 2.7376537322998047, 2.7930612564086914, 2.848468542098999, 2.9038760662078857, 2.9592835903167725, 3.014691114425659, 3.070098400115967, 3.1255059242248535, 3.1809134483337402]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 3.0, 3.0, 10.0, 16.0, 19.0, 27.0, 29.0, 27.0, 45.0, 45.0, 33.0, 46.0, 41.0, 54.0, 54.0, 51.0, 62.0, 49.0, 59.0, 50.0, 30.0, 41.0, 35.0, 33.0, 26.0, 18.0, 19.0, 16.0, 17.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.2763725519180298, -0.26861557364463806, -0.26085859537124634, -0.2531016170978546, -0.2453446388244629, -0.23758766055107117, -0.22983068227767944, -0.22207370400428772, -0.214316725730896, -0.20655974745750427, -0.19880276918411255, -0.19104579091072083, -0.1832888126373291, -0.17553183436393738, -0.16777485609054565, -0.16001787781715393, -0.1522608995437622, -0.14450392127037048, -0.13674694299697876, -0.12898996472358704, -0.12123298645019531, -0.11347600817680359, -0.10571902990341187, -0.09796205163002014, -0.09020507335662842, -0.0824480950832367, -0.07469111680984497, -0.06693413853645325, -0.05917716026306152, -0.0514201819896698, -0.043663203716278076, -0.03590622544288635, -0.02814924716949463, -0.020392268896102905, -0.012635290622711182, -0.004878312349319458, 0.0028786659240722656, 0.01063564419746399, 0.018392622470855713, 0.026149600744247437, 0.03390657901763916, 0.041663557291030884, 0.04942053556442261, 0.05717751383781433, 0.06493449211120605, 0.07269147038459778, 0.0804484486579895, 0.08820542693138123, 0.09596240520477295, 0.10371938347816467, 0.1114763617515564, 0.11923334002494812, 0.12699031829833984, 0.13474729657173157, 0.1425042748451233, 0.15026125311851501, 0.15801823139190674, 0.16577520966529846, 0.17353218793869019, 0.1812891662120819, 0.18904614448547363, 0.19680312275886536, 0.20456010103225708, 0.2123170793056488, 0.22007405757904053]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 10.0, 16.0, 24.0, 36.0, 42.0, 78.0, 117.0, 173.0, 299.0, 526.0, 1050.0, 2349.0, 6424.0, 24249.0, 117109.0, 457008.0, 340736.0, 73894.0, 16010.0, 4630.0, 1808.0, 834.0, 394.0, 264.0, 185.0, 99.0, 61.0, 39.0, 21.0, 17.0, 11.0, 10.0, 4.0, 4.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.18646812438964844, -0.17896652221679688, -0.1714649200439453, -0.16396331787109375, -0.1564617156982422, -0.14896011352539062, -0.14145851135253906, -0.1339569091796875, -0.12645530700683594, -0.11895370483398438, -0.11145210266113281, -0.10395050048828125, -0.09644889831542969, -0.08894729614257812, -0.08144569396972656, -0.073944091796875, -0.06644248962402344, -0.058940887451171875, -0.05143928527832031, -0.04393768310546875, -0.03643608093261719, -0.028934478759765625, -0.021432876586914062, -0.0139312744140625, -0.0064296722412109375, 0.001071929931640625, 0.008573532104492188, 0.01607513427734375, 0.023576736450195312, 0.031078338623046875, 0.03857994079589844, 0.04608154296875, 0.05358314514160156, 0.061084747314453125, 0.06858634948730469, 0.07608795166015625, 0.08358955383300781, 0.09109115600585938, 0.09859275817871094, 0.1060943603515625, 0.11359596252441406, 0.12109756469726562, 0.1285991668701172, 0.13610076904296875, 0.1436023712158203, 0.15110397338867188, 0.15860557556152344, 0.166107177734375, 0.17360877990722656, 0.18111038208007812, 0.1886119842529297, 0.19611358642578125, 0.2036151885986328, 0.21111679077148438, 0.21861839294433594, 0.2261199951171875, 0.23362159729003906, 0.24112319946289062, 0.2486248016357422, 0.25612640380859375, 0.2636280059814453, 0.2711296081542969, 0.27863121032714844, 0.2861328125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 12.0, 15.0, 20.0, 33.0, 43.0, 64.0, 76.0, 88.0, 119.0, 116.0, 103.0, 86.0, 70.0, 59.0, 36.0, 26.0, 14.0, 8.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13720703125, -0.13402748107910156, -0.13084793090820312, -0.1276683807373047, -0.12448883056640625, -0.12130928039550781, -0.11812973022460938, -0.11495018005371094, -0.1117706298828125, -0.10859107971191406, -0.10541152954101562, -0.10223197937011719, -0.09905242919921875, -0.09587287902832031, -0.09269332885742188, -0.08951377868652344, -0.086334228515625, -0.08315467834472656, -0.07997512817382812, -0.07679557800292969, -0.07361602783203125, -0.07043647766113281, -0.06725692749023438, -0.06407737731933594, -0.0608978271484375, -0.05771827697753906, -0.054538726806640625, -0.05135917663574219, -0.04817962646484375, -0.04500007629394531, -0.041820526123046875, -0.03864097595214844, -0.03546142578125, -0.03228187561035156, -0.029102325439453125, -0.025922775268554688, -0.02274322509765625, -0.019563674926757812, -0.016384124755859375, -0.013204574584960938, -0.0100250244140625, -0.0068454742431640625, -0.003665924072265625, -0.0004863739013671875, 0.00269317626953125, 0.0058727264404296875, 0.009052276611328125, 0.012231826782226562, 0.015411376953125, 0.018590927124023438, 0.021770477294921875, 0.024950027465820312, 0.02812957763671875, 0.03130912780761719, 0.034488677978515625, 0.03766822814941406, 0.0408477783203125, 0.04402732849121094, 0.047206878662109375, 0.05038642883300781, 0.05356597900390625, 0.05674552917480469, 0.059925079345703125, 0.06310462951660156, 0.0662841796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 9.0, 9.0, 14.0, 15.0, 25.0, 33.0, 39.0, 97.0, 103.0, 138.0, 196.0, 354.0, 526.0, 1032.0, 2360.0, 6957.0, 27202.0, 140523.0, 534480.0, 266486.0, 49814.0, 11381.0, 3482.0, 1404.0, 675.0, 407.0, 235.0, 153.0, 107.0, 89.0, 46.0, 34.0, 32.0, 22.0, 21.0, 10.0, 7.0, 9.0, 9.0, 5.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.211669921875, -0.2055683135986328, -0.19946670532226562, -0.19336509704589844, -0.18726348876953125, -0.18116188049316406, -0.17506027221679688, -0.1689586639404297, -0.1628570556640625, -0.1567554473876953, -0.15065383911132812, -0.14455223083496094, -0.13845062255859375, -0.13234901428222656, -0.12624740600585938, -0.12014579772949219, -0.114044189453125, -0.10794258117675781, -0.10184097290039062, -0.09573936462402344, -0.08963775634765625, -0.08353614807128906, -0.07743453979492188, -0.07133293151855469, -0.0652313232421875, -0.05912971496582031, -0.053028106689453125, -0.04692649841308594, -0.04082489013671875, -0.03472328186035156, -0.028621673583984375, -0.022520065307617188, -0.01641845703125, -0.010316848754882812, -0.004215240478515625, 0.0018863677978515625, 0.00798797607421875, 0.014089584350585938, 0.020191192626953125, 0.026292800903320312, 0.0323944091796875, 0.03849601745605469, 0.044597625732421875, 0.05069923400878906, 0.05680084228515625, 0.06290245056152344, 0.06900405883789062, 0.07510566711425781, 0.081207275390625, 0.08730888366699219, 0.09341049194335938, 0.09951210021972656, 0.10561370849609375, 0.11171531677246094, 0.11781692504882812, 0.12391853332519531, 0.1300201416015625, 0.1361217498779297, 0.14222335815429688, 0.14832496643066406, 0.15442657470703125, 0.16052818298339844, 0.16662979125976562, 0.1727313995361328, 0.1788330078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 17.0, 11.0, 21.0, 18.0, 19.0, 20.0, 26.0, 26.0, 40.0, 44.0, 35.0, 35.0, 38.0, 52.0, 46.0, 42.0, 43.0, 28.0, 51.0, 41.0, 29.0, 29.0, 36.0, 28.0, 22.0, 17.0, 22.0, 26.0, 14.0, 17.0, 8.0, 16.0, 6.0, 4.0, 7.0, 8.0, 8.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.178466796875, -0.1728191375732422, -0.16717147827148438, -0.16152381896972656, -0.15587615966796875, -0.15022850036621094, -0.14458084106445312, -0.1389331817626953, -0.1332855224609375, -0.1276378631591797, -0.12199020385742188, -0.11634254455566406, -0.11069488525390625, -0.10504722595214844, -0.09939956665039062, -0.09375190734863281, -0.088104248046875, -0.08245658874511719, -0.07680892944335938, -0.07116127014160156, -0.06551361083984375, -0.05986595153808594, -0.054218292236328125, -0.04857063293457031, -0.0429229736328125, -0.03727531433105469, -0.031627655029296875, -0.025979995727539062, -0.02033233642578125, -0.014684677124023438, -0.009037017822265625, -0.0033893585205078125, 0.00225830078125, 0.007905960083007812, 0.013553619384765625, 0.019201278686523438, 0.02484893798828125, 0.030496597290039062, 0.036144256591796875, 0.04179191589355469, 0.0474395751953125, 0.05308723449707031, 0.058734893798828125, 0.06438255310058594, 0.07003021240234375, 0.07567787170410156, 0.08132553100585938, 0.08697319030761719, 0.092620849609375, 0.09826850891113281, 0.10391616821289062, 0.10956382751464844, 0.11521148681640625, 0.12085914611816406, 0.12650680541992188, 0.1321544647216797, 0.1378021240234375, 0.1434497833251953, 0.14909744262695312, 0.15474510192871094, 0.16039276123046875, 0.16604042053222656, 0.17168807983398438, 0.1773357391357422, 0.1829833984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 15.0, 17.0, 29.0, 54.0, 100.0, 185.0, 366.0, 950.0, 3251.0, 21708.0, 577723.0, 422503.0, 17272.0, 2824.0, 847.0, 346.0, 143.0, 87.0, 51.0, 33.0, 17.0, 10.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1617431640625, -0.15595626831054688, -0.15016937255859375, -0.14438247680664062, -0.1385955810546875, -0.13280868530273438, -0.12702178955078125, -0.12123489379882812, -0.115447998046875, -0.10966110229492188, -0.10387420654296875, -0.09808731079101562, -0.0923004150390625, -0.08651351928710938, -0.08072662353515625, -0.07493972778320312, -0.06915283203125, -0.06336593627929688, -0.05757904052734375, -0.051792144775390625, -0.0460052490234375, -0.040218353271484375, -0.03443145751953125, -0.028644561767578125, -0.022857666015625, -0.017070770263671875, -0.01128387451171875, -0.005496978759765625, 0.0002899169921875, 0.006076812744140625, 0.01186370849609375, 0.017650604248046875, 0.0234375, 0.029224395751953125, 0.03501129150390625, 0.040798187255859375, 0.0465850830078125, 0.052371978759765625, 0.05815887451171875, 0.06394577026367188, 0.069732666015625, 0.07551956176757812, 0.08130645751953125, 0.08709335327148438, 0.0928802490234375, 0.09866714477539062, 0.10445404052734375, 0.11024093627929688, 0.11602783203125, 0.12181472778320312, 0.12760162353515625, 0.13338851928710938, 0.1391754150390625, 0.14496231079101562, 0.15074920654296875, 0.15653610229492188, 0.162322998046875, 0.16810989379882812, 0.17389678955078125, 0.17968368530273438, 0.1854705810546875, 0.19125747680664062, 0.19704437255859375, 0.20283126831054688, 0.2086181640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 11.0, 11.0, 7.0, 9.0, 21.0, 15.0, 24.0, 33.0, 39.0, 45.0, 71.0, 77.0, 91.0, 89.0, 70.0, 73.0, 71.0, 52.0, 42.0, 33.0, 31.0, 22.0, 16.0, 13.0, 5.0, 9.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.239776611328125e-05, -1.1976808309555054e-05, -1.1555850505828857e-05, -1.1134892702102661e-05, -1.0713934898376465e-05, -1.0292977094650269e-05, -9.872019290924072e-06, -9.451061487197876e-06, -9.03010368347168e-06, -8.609145879745483e-06, -8.188188076019287e-06, -7.76723027229309e-06, -7.3462724685668945e-06, -6.925314664840698e-06, -6.504356861114502e-06, -6.083399057388306e-06, -5.662441253662109e-06, -5.241483449935913e-06, -4.820525646209717e-06, -4.3995678424835205e-06, -3.978610038757324e-06, -3.557652235031128e-06, -3.1366944313049316e-06, -2.7157366275787354e-06, -2.294778823852539e-06, -1.8738210201263428e-06, -1.4528632164001465e-06, -1.0319054126739502e-06, -6.109476089477539e-07, -1.8998980522155762e-07, 2.3096799850463867e-07, 6.51925802230835e-07, 1.0728836059570312e-06, 1.4938414096832275e-06, 1.914799213409424e-06, 2.33575701713562e-06, 2.7567148208618164e-06, 3.1776726245880127e-06, 3.598630428314209e-06, 4.019588232040405e-06, 4.4405460357666016e-06, 4.861503839492798e-06, 5.282461643218994e-06, 5.7034194469451904e-06, 6.124377250671387e-06, 6.545335054397583e-06, 6.966292858123779e-06, 7.387250661849976e-06, 7.808208465576172e-06, 8.229166269302368e-06, 8.650124073028564e-06, 9.07108187675476e-06, 9.492039680480957e-06, 9.912997484207153e-06, 1.033395528793335e-05, 1.0754913091659546e-05, 1.1175870895385742e-05, 1.1596828699111938e-05, 1.2017786502838135e-05, 1.2438744306564331e-05, 1.2859702110290527e-05, 1.3280659914016724e-05, 1.370161771774292e-05, 1.4122575521469116e-05, 1.4543533325195312e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 14.0, 24.0, 32.0, 81.0, 186.0, 577.0, 2950.0, 90369.0, 931761.0, 20398.0, 1494.0, 363.0, 145.0, 66.0, 30.0, 23.0, 18.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4296875, -0.4202079772949219, -0.41072845458984375, -0.4012489318847656, -0.3917694091796875, -0.3822898864746094, -0.37281036376953125, -0.3633308410644531, -0.353851318359375, -0.3443717956542969, -0.33489227294921875, -0.3254127502441406, -0.3159332275390625, -0.3064537048339844, -0.29697418212890625, -0.2874946594238281, -0.27801513671875, -0.2685356140136719, -0.25905609130859375, -0.24957656860351562, -0.2400970458984375, -0.23061752319335938, -0.22113800048828125, -0.21165847778320312, -0.202178955078125, -0.19269943237304688, -0.18321990966796875, -0.17374038696289062, -0.1642608642578125, -0.15478134155273438, -0.14530181884765625, -0.13582229614257812, -0.1263427734375, -0.11686325073242188, -0.10738372802734375, -0.09790420532226562, -0.0884246826171875, -0.07894515991210938, -0.06946563720703125, -0.059986114501953125, -0.050506591796875, -0.041027069091796875, -0.03154754638671875, -0.022068023681640625, -0.0125885009765625, -0.003108978271484375, 0.00637054443359375, 0.015850067138671875, 0.02532958984375, 0.034809112548828125, 0.04428863525390625, 0.053768157958984375, 0.0632476806640625, 0.07272720336914062, 0.08220672607421875, 0.09168624877929688, 0.101165771484375, 0.11064529418945312, 0.12012481689453125, 0.12960433959960938, 0.1390838623046875, 0.14856338500976562, 0.15804290771484375, 0.16752243041992188, 0.177001953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 17.0, 19.0, 29.0, 65.0, 67.0, 110.0, 103.0, 119.0, 106.0, 104.0, 83.0, 53.0, 31.0, 37.0, 19.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.195556640625, -0.19073486328125, -0.1859130859375, -0.18109130859375, -0.17626953125, -0.17144775390625, -0.1666259765625, -0.16180419921875, -0.156982421875, -0.15216064453125, -0.1473388671875, -0.14251708984375, -0.1376953125, -0.13287353515625, -0.1280517578125, -0.12322998046875, -0.118408203125, -0.11358642578125, -0.1087646484375, -0.10394287109375, -0.09912109375, -0.09429931640625, -0.0894775390625, -0.08465576171875, -0.079833984375, -0.07501220703125, -0.0701904296875, -0.06536865234375, -0.060546875, -0.05572509765625, -0.0509033203125, -0.04608154296875, -0.041259765625, -0.03643798828125, -0.0316162109375, -0.02679443359375, -0.02197265625, -0.01715087890625, -0.0123291015625, -0.00750732421875, -0.002685546875, 0.00213623046875, 0.0069580078125, 0.01177978515625, 0.0166015625, 0.02142333984375, 0.0262451171875, 0.03106689453125, 0.035888671875, 0.04071044921875, 0.0455322265625, 0.05035400390625, 0.05517578125, 0.05999755859375, 0.0648193359375, 0.06964111328125, 0.074462890625, 0.07928466796875, 0.0841064453125, 0.08892822265625, 0.09375, 0.09857177734375, 0.1033935546875, 0.10821533203125, 0.113037109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 9.0, 16.0, 37.0, 92.0, 220.0, 298.0, 201.0, 81.0, 35.0, 11.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1949808597564697, -3.104597330093384, -3.014213800430298, -2.923830270767212, -2.833446741104126, -2.74306321144104, -2.652679443359375, -2.562295913696289, -2.471912384033203, -2.381528854370117, -2.2911453247070312, -2.2007617950439453, -2.1103782653808594, -2.0199947357177734, -1.929611086845398, -1.839227557182312, -1.7488441467285156, -1.6584606170654297, -1.5680770874023438, -1.4776935577392578, -1.3873100280761719, -1.296926498413086, -1.2065428495407104, -1.1161593198776245, -1.0257757902145386, -0.9353922605514526, -0.8450087308883667, -0.754625141620636, -0.66424161195755, -0.5738580822944641, -0.4834744930267334, -0.39309096336364746, -0.3027071952819824, -0.2123236507177353, -0.12194010615348816, -0.031556546688079834, 0.058826982975006104, 0.14921051263809204, 0.23959410190582275, 0.3299776315689087, 0.42036116123199463, 0.5107446908950806, 0.6011282205581665, 0.6915118098258972, 0.7818953394889832, 0.8722788691520691, 0.9626624584197998, 1.0530459880828857, 1.1434295177459717, 1.2338130474090576, 1.3241965770721436, 1.4145801067352295, 1.5049636363983154, 1.5953471660614014, 1.6857308149337769, 1.7761143445968628, 1.8664978742599487, 1.9568814039230347, 2.04726505279541, 2.137648582458496, 2.228032112121582, 2.318415641784668, 2.408799171447754, 2.49918270111084, 2.589566230773926]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 9.0, 2.0, 3.0, 3.0, 7.0, 10.0, 13.0, 11.0, 14.0, 16.0, 14.0, 19.0, 12.0, 29.0, 29.0, 30.0, 26.0, 42.0, 40.0, 27.0, 33.0, 40.0, 38.0, 45.0, 42.0, 35.0, 37.0, 39.0, 44.0, 35.0, 30.0, 35.0, 22.0, 15.0, 19.0, 22.0, 18.0, 20.0, 16.0, 13.0, 13.0, 5.0, 8.0, 5.0, 5.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8250587582588196, -0.7978923916816711, -0.7707259654998779, -0.7435595989227295, -0.716393232345581, -0.6892268657684326, -0.6620604395866394, -0.634894073009491, -0.6077276468276978, -0.5805612802505493, -0.5533948540687561, -0.5262284874916077, -0.49906212091445923, -0.4718957245349884, -0.4447293281555176, -0.41756296157836914, -0.3903965950012207, -0.3632301986217499, -0.33606383204460144, -0.3088974356651306, -0.2817310690879822, -0.25456467270851135, -0.22739827632904053, -0.2002318948507309, -0.17306551337242126, -0.14589913189411163, -0.1187327429652214, -0.09156635403633118, -0.06439997255802155, -0.037233591079711914, -0.010067194700241089, 0.017099186778068542, 0.044265568256378174, 0.0714319497346878, 0.09859833866357803, 0.12576472759246826, 0.1529311090707779, 0.18009749054908752, 0.20726388692855835, 0.23443026840686798, 0.2615966498851776, 0.28876304626464844, 0.3159294128417969, 0.3430958092212677, 0.3702622056007385, 0.39742857217788696, 0.4245949685573578, 0.4517613649368286, 0.47892773151397705, 0.5060940980911255, 0.5332605242729187, 0.5604268908500671, 0.5875932574272156, 0.6147596836090088, 0.6419260501861572, 0.6690924167633057, 0.6962587833404541, 0.7234251499176025, 0.7505915760993958, 0.7777579426765442, 0.8049243092536926, 0.8320907354354858, 0.8592571020126343, 0.8864234685897827, 0.9135898947715759]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 11.0, 17.0, 8.0, 16.0, 15.0, 24.0, 29.0, 31.0, 41.0, 42.0, 82.0, 115.0, 127.0, 220.0, 391.0, 745.0, 1737.0, 4936.0, 20630.0, 249129.0, 3831124.0, 68121.0, 10606.0, 3150.0, 1276.0, 583.0, 326.0, 201.0, 120.0, 104.0, 57.0, 66.0, 44.0, 24.0, 20.0, 26.0, 15.0, 10.0, 13.0, 5.0, 3.0, 5.0, 1.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.279052734375, -0.27040863037109375, -0.2617645263671875, -0.25312042236328125, -0.244476318359375, -0.23583221435546875, -0.2271881103515625, -0.21854400634765625, -0.20989990234375, -0.20125579833984375, -0.1926116943359375, -0.18396759033203125, -0.175323486328125, -0.16667938232421875, -0.1580352783203125, -0.14939117431640625, -0.1407470703125, -0.13210296630859375, -0.1234588623046875, -0.11481475830078125, -0.106170654296875, -0.09752655029296875, -0.0888824462890625, -0.08023834228515625, -0.07159423828125, -0.06295013427734375, -0.0543060302734375, -0.04566192626953125, -0.037017822265625, -0.02837371826171875, -0.0197296142578125, -0.01108551025390625, -0.00244140625, 0.00620269775390625, 0.0148468017578125, 0.02349090576171875, 0.032135009765625, 0.04077911376953125, 0.0494232177734375, 0.05806732177734375, 0.06671142578125, 0.07535552978515625, 0.0839996337890625, 0.09264373779296875, 0.101287841796875, 0.10993194580078125, 0.1185760498046875, 0.12722015380859375, 0.1358642578125, 0.14450836181640625, 0.1531524658203125, 0.16179656982421875, 0.170440673828125, 0.17908477783203125, 0.1877288818359375, 0.19637298583984375, 0.20501708984375, 0.21366119384765625, 0.2223052978515625, 0.23094940185546875, 0.239593505859375, 0.24823760986328125, 0.2568817138671875, 0.26552581787109375, 0.274169921875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 21.0, 18.0, 15.0, 34.0, 49.0, 75.0, 88.0, 98.0, 118.0, 122.0, 96.0, 82.0, 62.0, 39.0, 41.0, 21.0, 10.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.145751953125, -0.14233875274658203, -0.13892555236816406, -0.1355123519897461, -0.13209915161132812, -0.12868595123291016, -0.1252727508544922, -0.12185955047607422, -0.11844635009765625, -0.11503314971923828, -0.11161994934082031, -0.10820674896240234, -0.10479354858398438, -0.1013803482055664, -0.09796714782714844, -0.09455394744873047, -0.0911407470703125, -0.08772754669189453, -0.08431434631347656, -0.0809011459350586, -0.07748794555664062, -0.07407474517822266, -0.07066154479980469, -0.06724834442138672, -0.06383514404296875, -0.06042194366455078, -0.05700874328613281, -0.053595542907714844, -0.050182342529296875, -0.046769142150878906, -0.04335594177246094, -0.03994274139404297, -0.036529541015625, -0.03311634063720703, -0.029703140258789062, -0.026289939880371094, -0.022876739501953125, -0.019463539123535156, -0.016050338745117188, -0.012637138366699219, -0.00922393798828125, -0.005810737609863281, -0.0023975372314453125, 0.0010156631469726562, 0.004428863525390625, 0.007842063903808594, 0.011255264282226562, 0.014668464660644531, 0.0180816650390625, 0.02149486541748047, 0.024908065795898438, 0.028321266174316406, 0.031734466552734375, 0.035147666931152344, 0.03856086730957031, 0.04197406768798828, 0.04538726806640625, 0.04880046844482422, 0.05221366882324219, 0.055626869201660156, 0.059040069580078125, 0.062453269958496094, 0.06586647033691406, 0.06927967071533203, 0.07269287109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 11.0, 14.0, 27.0, 43.0, 58.0, 118.0, 212.0, 445.0, 929.0, 2066.0, 5600.0, 19807.0, 114376.0, 3658859.0, 341148.0, 36063.0, 9023.0, 3046.0, 1240.0, 565.0, 244.0, 141.0, 108.0, 54.0, 25.0, 25.0, 8.0, 8.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.301025390625, -0.2936286926269531, -0.28623199462890625, -0.2788352966308594, -0.2714385986328125, -0.2640419006347656, -0.25664520263671875, -0.24924850463867188, -0.241851806640625, -0.23445510864257812, -0.22705841064453125, -0.21966171264648438, -0.2122650146484375, -0.20486831665039062, -0.19747161865234375, -0.19007492065429688, -0.18267822265625, -0.17528152465820312, -0.16788482666015625, -0.16048812866210938, -0.1530914306640625, -0.14569473266601562, -0.13829803466796875, -0.13090133666992188, -0.123504638671875, -0.11610794067382812, -0.10871124267578125, -0.10131454467773438, -0.0939178466796875, -0.08652114868164062, -0.07912445068359375, -0.07172775268554688, -0.0643310546875, -0.056934356689453125, -0.04953765869140625, -0.042140960693359375, -0.0347442626953125, -0.027347564697265625, -0.01995086669921875, -0.012554168701171875, -0.005157470703125, 0.002239227294921875, 0.00963592529296875, 0.017032623291015625, 0.0244293212890625, 0.031826019287109375, 0.03922271728515625, 0.046619415283203125, 0.05401611328125, 0.061412811279296875, 0.06880950927734375, 0.07620620727539062, 0.0836029052734375, 0.09099960327148438, 0.09839630126953125, 0.10579299926757812, 0.113189697265625, 0.12058639526367188, 0.12798309326171875, 0.13537979125976562, 0.1427764892578125, 0.15017318725585938, 0.15756988525390625, 0.16496658325195312, 0.17236328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 9.0, 18.0, 24.0, 34.0, 67.0, 134.0, 353.0, 2137.0, 799.0, 234.0, 89.0, 55.0, 35.0, 22.0, 11.0, 13.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14533615112304688, -0.14138031005859375, -0.13742446899414062, -0.1334686279296875, -0.12951278686523438, -0.12555694580078125, -0.12160110473632812, -0.117645263671875, -0.11368942260742188, -0.10973358154296875, -0.10577774047851562, -0.1018218994140625, -0.09786605834960938, -0.09391021728515625, -0.08995437622070312, -0.08599853515625, -0.08204269409179688, -0.07808685302734375, -0.07413101196289062, -0.0701751708984375, -0.06621932983398438, -0.06226348876953125, -0.058307647705078125, -0.054351806640625, -0.050395965576171875, -0.04644012451171875, -0.042484283447265625, -0.0385284423828125, -0.034572601318359375, -0.03061676025390625, -0.026660919189453125, -0.022705078125, -0.018749237060546875, -0.01479339599609375, -0.010837554931640625, -0.0068817138671875, -0.002925872802734375, 0.00102996826171875, 0.004985809326171875, 0.008941650390625, 0.012897491455078125, 0.01685333251953125, 0.020809173583984375, 0.0247650146484375, 0.028720855712890625, 0.03267669677734375, 0.036632537841796875, 0.04058837890625, 0.044544219970703125, 0.04850006103515625, 0.052455902099609375, 0.0564117431640625, 0.060367584228515625, 0.06432342529296875, 0.06827926635742188, 0.072235107421875, 0.07619094848632812, 0.08014678955078125, 0.08410263061523438, 0.0880584716796875, 0.09201431274414062, 0.09597015380859375, 0.09992599487304688, 0.1038818359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 19.0, 47.0, 82.0, 128.0, 162.0, 166.0, 147.0, 104.0, 57.0, 27.0, 16.0, 13.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9284676909446716, -0.906885027885437, -0.8853023052215576, -0.8637195825576782, -0.8421369194984436, -0.820554256439209, -0.7989715337753296, -0.7773888111114502, -0.7558061480522156, -0.734223484992981, -0.7126407623291016, -0.6910580396652222, -0.6694753766059875, -0.6478927135467529, -0.6263099908828735, -0.6047272682189941, -0.5831446051597595, -0.5615619421005249, -0.5399792194366455, -0.5183964967727661, -0.4968138337135315, -0.4752311408519745, -0.4536484479904175, -0.4320657551288605, -0.41048306226730347, -0.38890036940574646, -0.36731767654418945, -0.34573498368263245, -0.32415229082107544, -0.30256959795951843, -0.2809869050979614, -0.2594042122364044, -0.2378215789794922, -0.21623888611793518, -0.19465619325637817, -0.17307350039482117, -0.15149080753326416, -0.12990811467170715, -0.10832542181015015, -0.08674272894859314, -0.06516003608703613, -0.043577343225479126, -0.02199465036392212, -0.0004119575023651123, 0.021170735359191895, 0.0427534282207489, 0.06433612108230591, 0.08591881394386292, 0.10750150680541992, 0.12908419966697693, 0.15066689252853394, 0.17224958539009094, 0.19383227825164795, 0.21541497111320496, 0.23699766397476196, 0.25858035683631897, 0.280163049697876, 0.301745742559433, 0.32332843542099, 0.344911128282547, 0.366493821144104, 0.388076514005661, 0.409659206867218, 0.431241899728775, 0.45282459259033203]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 14.0, 7.0, 8.0, 20.0, 19.0, 27.0, 29.0, 33.0, 52.0, 48.0, 59.0, 58.0, 54.0, 60.0, 56.0, 48.0, 52.0, 51.0, 45.0, 46.0, 51.0, 34.0, 31.0, 24.0, 15.0, 18.0, 8.0, 8.0, 7.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42062103748321533, -0.4094921350479126, -0.39836323261260986, -0.38723433017730713, -0.3761054575443268, -0.36497655510902405, -0.3538476526737213, -0.3427187502384186, -0.33158984780311584, -0.3204609453678131, -0.3093320429325104, -0.29820317029953003, -0.2870742678642273, -0.27594536542892456, -0.2648164629936218, -0.2536875605583191, -0.24255867302417755, -0.23142977058887482, -0.22030088305473328, -0.20917198061943054, -0.1980430781841278, -0.18691417574882507, -0.17578528821468353, -0.1646563857793808, -0.15352749824523926, -0.14239859580993652, -0.13126970827579498, -0.12014080584049225, -0.10901190340518951, -0.09788300842046738, -0.08675411343574524, -0.0756252110004425, -0.06449630856513977, -0.053367409855127335, -0.0422385111451149, -0.03110961616039276, -0.019980717450380325, -0.00885181874036789, 0.002277076244354248, 0.013405978679656982, 0.02453487366437912, 0.035663772374391556, 0.04679267108440399, 0.05792156606912613, 0.06905046105384827, 0.080179363489151, 0.09130825847387314, 0.10243716090917587, 0.11356605589389801, 0.12469495087862015, 0.13582384586334229, 0.14695274829864502, 0.15808165073394775, 0.1692105531692505, 0.18033944070339203, 0.19146834313869476, 0.2025972306728363, 0.21372613310813904, 0.22485502064228058, 0.2359839230775833, 0.24711282551288605, 0.2582417130470276, 0.2693706154823303, 0.28049951791763306, 0.2916284203529358]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 21.0, 21.0, 35.0, 39.0, 74.0, 141.0, 219.0, 401.0, 825.0, 1786.0, 4438.0, 13554.0, 57436.0, 304722.0, 506485.0, 121120.0, 24939.0, 7150.0, 2668.0, 1157.0, 539.0, 281.0, 158.0, 93.0, 68.0, 52.0, 24.0, 20.0, 15.0, 10.0, 7.0, 10.0, 6.0, 6.0, 3.0, 5.0, 1.0], "bins": [-0.26513671875, -0.25870513916015625, -0.2522735595703125, -0.24584197998046875, -0.239410400390625, -0.23297882080078125, -0.2265472412109375, -0.22011566162109375, -0.21368408203125, -0.20725250244140625, -0.2008209228515625, -0.19438934326171875, -0.187957763671875, -0.18152618408203125, -0.1750946044921875, -0.16866302490234375, -0.1622314453125, -0.15579986572265625, -0.1493682861328125, -0.14293670654296875, -0.136505126953125, -0.13007354736328125, -0.1236419677734375, -0.11721038818359375, -0.11077880859375, -0.10434722900390625, -0.0979156494140625, -0.09148406982421875, -0.085052490234375, -0.07862091064453125, -0.0721893310546875, -0.06575775146484375, -0.059326171875, -0.05289459228515625, -0.0464630126953125, -0.04003143310546875, -0.033599853515625, -0.02716827392578125, -0.0207366943359375, -0.01430511474609375, -0.00787353515625, -0.00144195556640625, 0.0049896240234375, 0.01142120361328125, 0.017852783203125, 0.02428436279296875, 0.0307159423828125, 0.03714752197265625, 0.0435791015625, 0.05001068115234375, 0.0564422607421875, 0.06287384033203125, 0.069305419921875, 0.07573699951171875, 0.0821685791015625, 0.08860015869140625, 0.09503173828125, 0.10146331787109375, 0.1078948974609375, 0.11432647705078125, 0.120758056640625, 0.12718963623046875, 0.1336212158203125, 0.14005279541015625, 0.146484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 26.0, 25.0, 42.0, 54.0, 90.0, 71.0, 100.0, 100.0, 108.0, 95.0, 72.0, 78.0, 41.0, 30.0, 16.0, 20.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1539306640625, -0.15040206909179688, -0.14687347412109375, -0.14334487915039062, -0.1398162841796875, -0.13628768920898438, -0.13275909423828125, -0.12923049926757812, -0.125701904296875, -0.12217330932617188, -0.11864471435546875, -0.11511611938476562, -0.1115875244140625, -0.10805892944335938, -0.10453033447265625, -0.10100173950195312, -0.09747314453125, -0.09394454956054688, -0.09041595458984375, -0.08688735961914062, -0.0833587646484375, -0.07983016967773438, -0.07630157470703125, -0.07277297973632812, -0.069244384765625, -0.06571578979492188, -0.06218719482421875, -0.058658599853515625, -0.0551300048828125, -0.051601409912109375, -0.04807281494140625, -0.044544219970703125, -0.041015625, -0.037487030029296875, -0.03395843505859375, -0.030429840087890625, -0.0269012451171875, -0.023372650146484375, -0.01984405517578125, -0.016315460205078125, -0.012786865234375, -0.009258270263671875, -0.00572967529296875, -0.002201080322265625, 0.0013275146484375, 0.004856109619140625, 0.00838470458984375, 0.011913299560546875, 0.01544189453125, 0.018970489501953125, 0.02249908447265625, 0.026027679443359375, 0.0295562744140625, 0.033084869384765625, 0.03661346435546875, 0.040142059326171875, 0.043670654296875, 0.047199249267578125, 0.05072784423828125, 0.054256439208984375, 0.0577850341796875, 0.061313629150390625, 0.06484222412109375, 0.06837081909179688, 0.0718994140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 16.0, 24.0, 23.0, 41.0, 37.0, 77.0, 96.0, 128.0, 195.0, 377.0, 651.0, 1526.0, 4036.0, 15100.0, 79249.0, 566458.0, 321923.0, 43635.0, 9544.0, 2775.0, 1128.0, 564.0, 302.0, 212.0, 114.0, 89.0, 66.0, 37.0, 26.0, 23.0, 21.0, 14.0, 4.0, 9.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.260009765625, -0.25313758850097656, -0.24626541137695312, -0.2393932342529297, -0.23252105712890625, -0.2256488800048828, -0.21877670288085938, -0.21190452575683594, -0.2050323486328125, -0.19816017150878906, -0.19128799438476562, -0.1844158172607422, -0.17754364013671875, -0.1706714630126953, -0.16379928588867188, -0.15692710876464844, -0.150054931640625, -0.14318275451660156, -0.13631057739257812, -0.1294384002685547, -0.12256622314453125, -0.11569404602050781, -0.10882186889648438, -0.10194969177246094, -0.0950775146484375, -0.08820533752441406, -0.08133316040039062, -0.07446098327636719, -0.06758880615234375, -0.06071662902832031, -0.053844451904296875, -0.04697227478027344, -0.04010009765625, -0.03322792053222656, -0.026355743408203125, -0.019483566284179688, -0.01261138916015625, -0.0057392120361328125, 0.001132965087890625, 0.008005142211914062, 0.0148773193359375, 0.021749496459960938, 0.028621673583984375, 0.03549385070800781, 0.04236602783203125, 0.04923820495605469, 0.056110382080078125, 0.06298255920410156, 0.069854736328125, 0.07672691345214844, 0.08359909057617188, 0.09047126770019531, 0.09734344482421875, 0.10421562194824219, 0.11108779907226562, 0.11795997619628906, 0.1248321533203125, 0.13170433044433594, 0.13857650756835938, 0.1454486846923828, 0.15232086181640625, 0.1591930389404297, 0.16606521606445312, 0.17293739318847656, 0.1798095703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 8.0, 19.0, 20.0, 24.0, 24.0, 27.0, 29.0, 44.0, 47.0, 49.0, 53.0, 67.0, 48.0, 52.0, 58.0, 66.0, 54.0, 68.0, 45.0, 41.0, 29.0, 33.0, 28.0, 18.0, 12.0, 9.0, 6.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330810546875, -0.321441650390625, -0.31207275390625, -0.302703857421875, -0.2933349609375, -0.283966064453125, -0.27459716796875, -0.265228271484375, -0.255859375, -0.246490478515625, -0.23712158203125, -0.227752685546875, -0.2183837890625, -0.209014892578125, -0.19964599609375, -0.190277099609375, -0.180908203125, -0.171539306640625, -0.16217041015625, -0.152801513671875, -0.1434326171875, -0.134063720703125, -0.12469482421875, -0.115325927734375, -0.10595703125, -0.096588134765625, -0.08721923828125, -0.077850341796875, -0.0684814453125, -0.059112548828125, -0.04974365234375, -0.040374755859375, -0.031005859375, -0.021636962890625, -0.01226806640625, -0.002899169921875, 0.0064697265625, 0.015838623046875, 0.02520751953125, 0.034576416015625, 0.0439453125, 0.053314208984375, 0.06268310546875, 0.072052001953125, 0.0814208984375, 0.090789794921875, 0.10015869140625, 0.109527587890625, 0.118896484375, 0.128265380859375, 0.13763427734375, 0.147003173828125, 0.1563720703125, 0.165740966796875, 0.17510986328125, 0.184478759765625, 0.19384765625, 0.203216552734375, 0.21258544921875, 0.221954345703125, 0.2313232421875, 0.240692138671875, 0.25006103515625, 0.259429931640625, 0.268798828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 9.0, 15.0, 16.0, 33.0, 47.0, 74.0, 125.0, 194.0, 349.0, 641.0, 1461.0, 3982.0, 16692.0, 158746.0, 749116.0, 98897.0, 12058.0, 3332.0, 1341.0, 588.0, 334.0, 171.0, 111.0, 75.0, 48.0, 18.0, 20.0, 9.0, 15.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.12407970428466797, -0.12047386169433594, -0.1168680191040039, -0.11326217651367188, -0.10965633392333984, -0.10605049133300781, -0.10244464874267578, -0.09883880615234375, -0.09523296356201172, -0.09162712097167969, -0.08802127838134766, -0.08441543579101562, -0.0808095932006836, -0.07720375061035156, -0.07359790802001953, -0.0699920654296875, -0.06638622283935547, -0.06278038024902344, -0.059174537658691406, -0.055568695068359375, -0.051962852478027344, -0.04835700988769531, -0.04475116729736328, -0.04114532470703125, -0.03753948211669922, -0.03393363952636719, -0.030327796936035156, -0.026721954345703125, -0.023116111755371094, -0.019510269165039062, -0.01590442657470703, -0.012298583984375, -0.008692741394042969, -0.0050868988037109375, -0.0014810562133789062, 0.002124786376953125, 0.005730628967285156, 0.009336471557617188, 0.012942314147949219, 0.01654815673828125, 0.02015399932861328, 0.023759841918945312, 0.027365684509277344, 0.030971527099609375, 0.034577369689941406, 0.03818321228027344, 0.04178905487060547, 0.0453948974609375, 0.04900074005126953, 0.05260658264160156, 0.056212425231933594, 0.059818267822265625, 0.06342411041259766, 0.06702995300292969, 0.07063579559326172, 0.07424163818359375, 0.07784748077392578, 0.08145332336425781, 0.08505916595458984, 0.08866500854492188, 0.0922708511352539, 0.09587669372558594, 0.09948253631591797, 0.10308837890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 4.0, 8.0, 11.0, 25.0, 31.0, 47.0, 78.0, 102.0, 144.0, 125.0, 138.0, 84.0, 70.0, 47.0, 29.0, 18.0, 9.0, 9.0, 8.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.615285873413086e-05, -1.5426427125930786e-05, -1.4699995517730713e-05, -1.397356390953064e-05, -1.3247132301330566e-05, -1.2520700693130493e-05, -1.179426908493042e-05, -1.1067837476730347e-05, -1.0341405868530273e-05, -9.6149742603302e-06, -8.888542652130127e-06, -8.162111043930054e-06, -7.4356794357299805e-06, -6.709247827529907e-06, -5.982816219329834e-06, -5.256384611129761e-06, -4.5299530029296875e-06, -3.8035213947296143e-06, -3.077089786529541e-06, -2.3506581783294678e-06, -1.6242265701293945e-06, -8.977949619293213e-07, -1.7136335372924805e-07, 5.550682544708252e-07, 1.2814998626708984e-06, 2.0079314708709717e-06, 2.734363079071045e-06, 3.460794687271118e-06, 4.187226295471191e-06, 4.913657903671265e-06, 5.640089511871338e-06, 6.366521120071411e-06, 7.092952728271484e-06, 7.819384336471558e-06, 8.545815944671631e-06, 9.272247552871704e-06, 9.998679161071777e-06, 1.072511076927185e-05, 1.1451542377471924e-05, 1.2177973985671997e-05, 1.290440559387207e-05, 1.3630837202072144e-05, 1.4357268810272217e-05, 1.508370041847229e-05, 1.5810132026672363e-05, 1.6536563634872437e-05, 1.726299524307251e-05, 1.7989426851272583e-05, 1.8715858459472656e-05, 1.944229006767273e-05, 2.0168721675872803e-05, 2.0895153284072876e-05, 2.162158489227295e-05, 2.2348016500473022e-05, 2.3074448108673096e-05, 2.380087971687317e-05, 2.4527311325073242e-05, 2.5253742933273315e-05, 2.598017454147339e-05, 2.6706606149673462e-05, 2.7433037757873535e-05, 2.815946936607361e-05, 2.888590097427368e-05, 2.9612332582473755e-05, 3.0338764190673828e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 7.0, 6.0, 10.0, 11.0, 16.0, 23.0, 37.0, 64.0, 80.0, 167.0, 322.0, 573.0, 1278.0, 3338.0, 12034.0, 70920.0, 581212.0, 329606.0, 36973.0, 7514.0, 2404.0, 901.0, 451.0, 229.0, 157.0, 81.0, 54.0, 30.0, 14.0, 8.0, 13.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0980224609375, -0.09473705291748047, -0.09145164489746094, -0.0881662368774414, -0.08488082885742188, -0.08159542083740234, -0.07831001281738281, -0.07502460479736328, -0.07173919677734375, -0.06845378875732422, -0.06516838073730469, -0.061882972717285156, -0.058597564697265625, -0.055312156677246094, -0.05202674865722656, -0.04874134063720703, -0.0454559326171875, -0.04217052459716797, -0.03888511657714844, -0.035599708557128906, -0.032314300537109375, -0.029028892517089844, -0.025743484497070312, -0.02245807647705078, -0.01917266845703125, -0.01588726043701172, -0.012601852416992188, -0.009316444396972656, -0.006031036376953125, -0.0027456283569335938, 0.0005397796630859375, 0.0038251876831054688, 0.007110595703125, 0.010396003723144531, 0.013681411743164062, 0.016966819763183594, 0.020252227783203125, 0.023537635803222656, 0.026823043823242188, 0.03010845184326172, 0.03339385986328125, 0.03667926788330078, 0.03996467590332031, 0.043250083923339844, 0.046535491943359375, 0.049820899963378906, 0.05310630798339844, 0.05639171600341797, 0.0596771240234375, 0.06296253204345703, 0.06624794006347656, 0.0695333480834961, 0.07281875610351562, 0.07610416412353516, 0.07938957214355469, 0.08267498016357422, 0.08596038818359375, 0.08924579620361328, 0.09253120422363281, 0.09581661224365234, 0.09910202026367188, 0.1023874282836914, 0.10567283630371094, 0.10895824432373047, 0.11224365234375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 8.0, 16.0, 12.0, 23.0, 40.0, 83.0, 99.0, 140.0, 158.0, 142.0, 87.0, 60.0, 47.0, 30.0, 19.0, 12.0, 8.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1220703125, -0.11790847778320312, -0.11374664306640625, -0.10958480834960938, -0.1054229736328125, -0.10126113891601562, -0.09709930419921875, -0.09293746948242188, -0.088775634765625, -0.08461380004882812, -0.08045196533203125, -0.07629013061523438, -0.0721282958984375, -0.06796646118164062, -0.06380462646484375, -0.059642791748046875, -0.05548095703125, -0.051319122314453125, -0.04715728759765625, -0.042995452880859375, -0.0388336181640625, -0.034671783447265625, -0.03050994873046875, -0.026348114013671875, -0.022186279296875, -0.018024444580078125, -0.01386260986328125, -0.009700775146484375, -0.0055389404296875, -0.001377105712890625, 0.00278472900390625, 0.006946563720703125, 0.0111083984375, 0.015270233154296875, 0.01943206787109375, 0.023593902587890625, 0.0277557373046875, 0.031917572021484375, 0.03607940673828125, 0.040241241455078125, 0.044403076171875, 0.048564910888671875, 0.05272674560546875, 0.056888580322265625, 0.0610504150390625, 0.06521224975585938, 0.06937408447265625, 0.07353591918945312, 0.07769775390625, 0.08185958862304688, 0.08602142333984375, 0.09018325805664062, 0.0943450927734375, 0.09850692749023438, 0.10266876220703125, 0.10683059692382812, 0.110992431640625, 0.11515426635742188, 0.11931610107421875, 0.12347793579101562, 0.1276397705078125, 0.13180160522460938, 0.13596343994140625, 0.14012527465820312, 0.144287109375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 26.0, 97.0, 282.0, 350.0, 173.0, 42.0, 21.0, 6.0, 4.0, 1.0, 1.0, 2.0], "bins": [-6.060938835144043, -5.951106548309326, -5.841274261474609, -5.731441974639893, -5.621609687805176, -5.511777400970459, -5.401945114135742, -5.292112827301025, -5.182280540466309, -5.072448253631592, -4.962615966796875, -4.852783679962158, -4.742951393127441, -4.633119106292725, -4.523286819458008, -4.413454532623291, -4.303622245788574, -4.193789958953857, -4.083957672119141, -3.974125385284424, -3.864293098449707, -3.7544608116149902, -3.6446285247802734, -3.5347962379455566, -3.4249634742736816, -3.315131187438965, -3.205298900604248, -3.0954666137695312, -2.9856343269348145, -2.8758020401000977, -2.765969753265381, -2.656137466430664, -2.546304941177368, -2.4364726543426514, -2.3266403675079346, -2.2168080806732178, -2.106975793838501, -1.9971435070037842, -1.8873111009597778, -1.777478814125061, -1.6676465272903442, -1.5578142404556274, -1.4479819536209106, -1.3381495475769043, -1.2283172607421875, -1.1184849739074707, -1.008652687072754, -0.8988204002380371, -0.7889881134033203, -0.6791558265686035, -0.5693235397338867, -0.45949119329452515, -0.34965890645980835, -0.23982661962509155, -0.12999427318572998, -0.020161986351013184, 0.08967030048370361, 0.1995026022195816, 0.3093349039554596, 0.4191672205924988, 0.5289995074272156, 0.6388317942619324, 0.748664140701294, 0.8584964275360107, 0.9683287143707275]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 8.0, 12.0, 14.0, 14.0, 16.0, 20.0, 23.0, 26.0, 22.0, 22.0, 28.0, 35.0, 33.0, 35.0, 39.0, 44.0, 43.0, 42.0, 42.0, 44.0, 40.0, 39.0, 36.0, 39.0, 30.0, 31.0, 36.0, 29.0, 19.0, 19.0, 13.0, 14.0, 8.0, 5.0, 15.0, 12.0, 6.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0], "bins": [-1.18015718460083, -1.147339105606079, -1.1145210266113281, -1.0817028284072876, -1.0488847494125366, -1.0160666704177856, -0.9832485318183899, -0.9504303932189941, -0.9176123142242432, -0.8847942352294922, -0.8519760966300964, -0.8191579580307007, -0.7863398790359497, -0.7535218000411987, -0.720703661441803, -0.6878855228424072, -0.6550674438476562, -0.6222493648529053, -0.5894312262535095, -0.5566130876541138, -0.5237950086593628, -0.49097689986228943, -0.45815879106521606, -0.4253406822681427, -0.39252257347106934, -0.35970446467399597, -0.3268863558769226, -0.29406824707984924, -0.2612501382827759, -0.22843202948570251, -0.19561392068862915, -0.1627958118915558, -0.12997770309448242, -0.09715959429740906, -0.0643414855003357, -0.03152337670326233, 0.0012947320938110352, 0.0341128408908844, 0.06693094968795776, 0.09974905848503113, 0.1325671672821045, 0.16538527607917786, 0.19820338487625122, 0.23102149367332458, 0.26383960247039795, 0.2966577112674713, 0.3294758200645447, 0.36229392886161804, 0.3951120376586914, 0.42793014645576477, 0.46074825525283813, 0.4935663640499115, 0.5263844728469849, 0.5592025518417358, 0.5920206904411316, 0.6248388290405273, 0.6576569080352783, 0.6904749870300293, 0.723293125629425, 0.7561112642288208, 0.7889293432235718, 0.8217474222183228, 0.8545655608177185, 0.8873836994171143, 0.9202017784118652]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 11.0, 6.0, 18.0, 18.0, 20.0, 30.0, 36.0, 57.0, 50.0, 82.0, 125.0, 189.0, 221.0, 400.0, 692.0, 1367.0, 3117.0, 10315.0, 73424.0, 4068269.0, 25481.0, 5708.0, 2040.0, 982.0, 512.0, 334.0, 214.0, 141.0, 97.0, 83.0, 69.0, 27.0, 35.0, 26.0, 24.0, 9.0, 17.0, 9.0, 9.0, 9.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.255126953125, -0.247894287109375, -0.24066162109375, -0.233428955078125, -0.2261962890625, -0.218963623046875, -0.21173095703125, -0.204498291015625, -0.197265625, -0.190032958984375, -0.18280029296875, -0.175567626953125, -0.1683349609375, -0.161102294921875, -0.15386962890625, -0.146636962890625, -0.139404296875, -0.132171630859375, -0.12493896484375, -0.117706298828125, -0.1104736328125, -0.103240966796875, -0.09600830078125, -0.088775634765625, -0.08154296875, -0.074310302734375, -0.06707763671875, -0.059844970703125, -0.0526123046875, -0.045379638671875, -0.03814697265625, -0.030914306640625, -0.023681640625, -0.016448974609375, -0.00921630859375, -0.001983642578125, 0.0052490234375, 0.012481689453125, 0.01971435546875, 0.026947021484375, 0.0341796875, 0.041412353515625, 0.04864501953125, 0.055877685546875, 0.0631103515625, 0.070343017578125, 0.07757568359375, 0.084808349609375, 0.092041015625, 0.099273681640625, 0.10650634765625, 0.113739013671875, 0.1209716796875, 0.128204345703125, 0.13543701171875, 0.142669677734375, 0.14990234375, 0.157135009765625, 0.16436767578125, 0.171600341796875, 0.1788330078125, 0.186065673828125, 0.19329833984375, 0.200531005859375, 0.207763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 13.0, 31.0, 36.0, 53.0, 67.0, 85.0, 99.0, 114.0, 95.0, 107.0, 73.0, 63.0, 51.0, 37.0, 31.0, 13.0, 12.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15776634216308594, -0.15391159057617188, -0.1500568389892578, -0.14620208740234375, -0.1423473358154297, -0.13849258422851562, -0.13463783264160156, -0.1307830810546875, -0.12692832946777344, -0.12307357788085938, -0.11921882629394531, -0.11536407470703125, -0.11150932312011719, -0.10765457153320312, -0.10379981994628906, -0.099945068359375, -0.09609031677246094, -0.09223556518554688, -0.08838081359863281, -0.08452606201171875, -0.08067131042480469, -0.07681655883789062, -0.07296180725097656, -0.0691070556640625, -0.06525230407714844, -0.061397552490234375, -0.05754280090332031, -0.05368804931640625, -0.04983329772949219, -0.045978546142578125, -0.04212379455566406, -0.03826904296875, -0.03441429138183594, -0.030559539794921875, -0.026704788208007812, -0.02285003662109375, -0.018995285034179688, -0.015140533447265625, -0.011285781860351562, -0.0074310302734375, -0.0035762786865234375, 0.000278472900390625, 0.0041332244873046875, 0.00798797607421875, 0.011842727661132812, 0.015697479248046875, 0.019552230834960938, 0.023406982421875, 0.027261734008789062, 0.031116485595703125, 0.03497123718261719, 0.03882598876953125, 0.04268074035644531, 0.046535491943359375, 0.05039024353027344, 0.0542449951171875, 0.05809974670410156, 0.061954498291015625, 0.06580924987792969, 0.06966400146484375, 0.07351875305175781, 0.07737350463867188, 0.08122825622558594, 0.0850830078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 12.0, 21.0, 18.0, 23.0, 53.0, 88.0, 90.0, 115.0, 181.0, 323.0, 408.0, 725.0, 1237.0, 2416.0, 5267.0, 18292.0, 192441.0, 3932992.0, 26311.0, 6717.0, 2823.0, 1416.0, 772.0, 501.0, 312.0, 227.0, 135.0, 106.0, 63.0, 45.0, 29.0, 34.0, 21.0, 14.0, 11.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2200927734375, -0.21344566345214844, -0.20679855346679688, -0.2001514434814453, -0.19350433349609375, -0.1868572235107422, -0.18021011352539062, -0.17356300354003906, -0.1669158935546875, -0.16026878356933594, -0.15362167358398438, -0.1469745635986328, -0.14032745361328125, -0.1336803436279297, -0.12703323364257812, -0.12038612365722656, -0.113739013671875, -0.10709190368652344, -0.10044479370117188, -0.09379768371582031, -0.08715057373046875, -0.08050346374511719, -0.07385635375976562, -0.06720924377441406, -0.0605621337890625, -0.05391502380371094, -0.047267913818359375, -0.04062080383300781, -0.03397369384765625, -0.027326583862304688, -0.020679473876953125, -0.014032363891601562, -0.00738525390625, -0.0007381439208984375, 0.005908966064453125, 0.012556076049804688, 0.01920318603515625, 0.025850296020507812, 0.032497406005859375, 0.03914451599121094, 0.0457916259765625, 0.05243873596191406, 0.059085845947265625, 0.06573295593261719, 0.07238006591796875, 0.07902717590332031, 0.08567428588867188, 0.09232139587402344, 0.098968505859375, 0.10561561584472656, 0.11226272583007812, 0.11890983581542969, 0.12555694580078125, 0.1322040557861328, 0.13885116577148438, 0.14549827575683594, 0.1521453857421875, 0.15879249572753906, 0.16543960571289062, 0.1720867156982422, 0.17873382568359375, 0.1853809356689453, 0.19202804565429688, 0.19867515563964844, 0.205322265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 10.0, 21.0, 37.0, 94.0, 3654.0, 153.0, 48.0, 25.0, 11.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0621337890625, -0.060044288635253906, -0.05795478820800781, -0.05586528778076172, -0.053775787353515625, -0.05168628692626953, -0.04959678649902344, -0.047507286071777344, -0.04541778564453125, -0.043328285217285156, -0.04123878479003906, -0.03914928436279297, -0.037059783935546875, -0.03497028350830078, -0.03288078308105469, -0.030791282653808594, -0.0287017822265625, -0.026612281799316406, -0.024522781372070312, -0.02243328094482422, -0.020343780517578125, -0.01825428009033203, -0.016164779663085938, -0.014075279235839844, -0.01198577880859375, -0.009896278381347656, -0.0078067779541015625, -0.005717277526855469, -0.003627777099609375, -0.0015382766723632812, 0.0005512237548828125, 0.0026407241821289062, 0.004730224609375, 0.006819725036621094, 0.008909225463867188, 0.010998725891113281, 0.013088226318359375, 0.015177726745605469, 0.017267227172851562, 0.019356727600097656, 0.02144622802734375, 0.023535728454589844, 0.025625228881835938, 0.02771472930908203, 0.029804229736328125, 0.03189373016357422, 0.03398323059082031, 0.036072731018066406, 0.0381622314453125, 0.040251731872558594, 0.04234123229980469, 0.04443073272705078, 0.046520233154296875, 0.04860973358154297, 0.05069923400878906, 0.052788734436035156, 0.05487823486328125, 0.056967735290527344, 0.05905723571777344, 0.06114673614501953, 0.06323623657226562, 0.06532573699951172, 0.06741523742675781, 0.0695047378540039, 0.07159423828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 14.0, 28.0, 114.0, 213.0, 268.0, 218.0, 97.0, 35.0, 13.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.614298939704895, -0.6028125286102295, -0.591326117515564, -0.5798397660255432, -0.5683533549308777, -0.5568669438362122, -0.5453805327415466, -0.5338941216468811, -0.5224077701568604, -0.5109213590621948, -0.4994349777698517, -0.48794856667518616, -0.476462185382843, -0.4649757742881775, -0.45348936319351196, -0.44200295209884644, -0.4305165410041809, -0.4190301299095154, -0.40754374861717224, -0.3960573375225067, -0.3845709562301636, -0.37308454513549805, -0.3615981340408325, -0.350111722946167, -0.33862534165382385, -0.3271389305591583, -0.3156525492668152, -0.30416613817214966, -0.29267972707748413, -0.281193345785141, -0.26970693469047546, -0.2582205533981323, -0.246734157204628, -0.23524776101112366, -0.22376134991645813, -0.2122749537229538, -0.20078855752944946, -0.18930216133594513, -0.1778157651424408, -0.16632935404777527, -0.15484295785427094, -0.1433565616607666, -0.13187015056610107, -0.12038375437259674, -0.10889735817909241, -0.09741096198558807, -0.08592455834150314, -0.07443815469741821, -0.06295175850391388, -0.05146535858511925, -0.039978958666324615, -0.028492558747529984, -0.01700615882873535, -0.00551975890994072, 0.005966641008853912, 0.017453044652938843, 0.028939440846443176, 0.04042584076523781, 0.05191224068403244, 0.06339864432811737, 0.0748850405216217, 0.08637143671512604, 0.09785784035921097, 0.1093442440032959, 0.12083064019680023]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 6.0, 11.0, 10.0, 14.0, 14.0, 15.0, 17.0, 21.0, 18.0, 29.0, 29.0, 33.0, 32.0, 31.0, 34.0, 38.0, 43.0, 35.0, 37.0, 38.0, 42.0, 39.0, 36.0, 32.0, 28.0, 32.0, 36.0, 31.0, 24.0, 22.0, 18.0, 14.0, 20.0, 7.0, 13.0, 16.0, 6.0, 6.0, 10.0, 8.0, 6.0, 9.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.06738036870956421, -0.06517694145441055, -0.0629735141992569, -0.06077009439468384, -0.05856666713953018, -0.056363239884376526, -0.05415981635451317, -0.05195639282464981, -0.049752965569496155, -0.0475495383143425, -0.04534611478447914, -0.043142691254615784, -0.04093926399946213, -0.03873583674430847, -0.036532413214445114, -0.03432898968458176, -0.0321255624294281, -0.029922137036919594, -0.027718711644411087, -0.02551528625190258, -0.023311860859394073, -0.021108435466885567, -0.01890501007437706, -0.016701584681868553, -0.014498159289360046, -0.01229473389685154, -0.010091308504343033, -0.007887883111834526, -0.005684457719326019, -0.0034810323268175125, -0.0012776069343090057, 0.000925818458199501, 0.003129243850708008, 0.005332669243216515, 0.007536094635725021, 0.009739520028233528, 0.011942945420742035, 0.014146370813250542, 0.01634979620575905, 0.018553221598267555, 0.020756646990776062, 0.02296007238328457, 0.025163497775793076, 0.027366923168301582, 0.02957034856081009, 0.031773775815963745, 0.0339771993458271, 0.03618062287569046, 0.038384050130844116, 0.04058747738599777, 0.04279090091586113, 0.04499432444572449, 0.04719775170087814, 0.0494011789560318, 0.05160460248589516, 0.053808026015758514, 0.05601145327091217, 0.058214880526065826, 0.060418304055929184, 0.06262172758579254, 0.0648251548409462, 0.06702858209609985, 0.06923200190067291, 0.07143542915582657, 0.07363885641098022]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 14.0, 18.0, 20.0, 49.0, 60.0, 90.0, 136.0, 212.0, 376.0, 661.0, 1413.0, 3364.0, 9620.0, 31387.0, 118320.0, 405863.0, 345678.0, 92584.0, 25317.0, 7769.0, 2986.0, 1177.0, 541.0, 331.0, 188.0, 122.0, 96.0, 40.0, 37.0, 27.0, 14.0, 7.0, 11.0, 4.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.14922523498535156, -0.14439773559570312, -0.1395702362060547, -0.13474273681640625, -0.1299152374267578, -0.12508773803710938, -0.12026023864746094, -0.1154327392578125, -0.11060523986816406, -0.10577774047851562, -0.10095024108886719, -0.09612274169921875, -0.09129524230957031, -0.08646774291992188, -0.08164024353027344, -0.076812744140625, -0.07198524475097656, -0.06715774536132812, -0.06233024597167969, -0.05750274658203125, -0.05267524719238281, -0.047847747802734375, -0.04302024841308594, -0.0381927490234375, -0.03336524963378906, -0.028537750244140625, -0.023710250854492188, -0.01888275146484375, -0.014055252075195312, -0.009227752685546875, -0.0044002532958984375, 0.00042724609375, 0.0052547454833984375, 0.010082244873046875, 0.014909744262695312, 0.01973724365234375, 0.024564743041992188, 0.029392242431640625, 0.03421974182128906, 0.0390472412109375, 0.04387474060058594, 0.048702239990234375, 0.05352973937988281, 0.05835723876953125, 0.06318473815917969, 0.06801223754882812, 0.07283973693847656, 0.077667236328125, 0.08249473571777344, 0.08732223510742188, 0.09214973449707031, 0.09697723388671875, 0.10180473327636719, 0.10663223266601562, 0.11145973205566406, 0.1162872314453125, 0.12111473083496094, 0.12594223022460938, 0.1307697296142578, 0.13559722900390625, 0.1404247283935547, 0.14525222778320312, 0.15007972717285156, 0.1549072265625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 19.0, 20.0, 36.0, 44.0, 54.0, 75.0, 93.0, 104.0, 91.0, 100.0, 96.0, 72.0, 57.0, 41.0, 38.0, 22.0, 14.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1644287109375, -0.16056060791015625, -0.1566925048828125, -0.15282440185546875, -0.148956298828125, -0.14508819580078125, -0.1412200927734375, -0.13735198974609375, -0.13348388671875, -0.12961578369140625, -0.1257476806640625, -0.12187957763671875, -0.118011474609375, -0.11414337158203125, -0.1102752685546875, -0.10640716552734375, -0.1025390625, -0.09867095947265625, -0.0948028564453125, -0.09093475341796875, -0.087066650390625, -0.08319854736328125, -0.0793304443359375, -0.07546234130859375, -0.07159423828125, -0.06772613525390625, -0.0638580322265625, -0.05998992919921875, -0.056121826171875, -0.05225372314453125, -0.0483856201171875, -0.04451751708984375, -0.0406494140625, -0.03678131103515625, -0.0329132080078125, -0.02904510498046875, -0.025177001953125, -0.02130889892578125, -0.0174407958984375, -0.01357269287109375, -0.00970458984375, -0.00583648681640625, -0.0019683837890625, 0.00189971923828125, 0.005767822265625, 0.00963592529296875, 0.0135040283203125, 0.01737213134765625, 0.021240234375, 0.02510833740234375, 0.0289764404296875, 0.03284454345703125, 0.036712646484375, 0.04058074951171875, 0.0444488525390625, 0.04831695556640625, 0.05218505859375, 0.05605316162109375, 0.0599212646484375, 0.06378936767578125, 0.067657470703125, 0.07152557373046875, 0.0753936767578125, 0.07926177978515625, 0.0831298828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 4.0, 10.0, 10.0, 11.0, 14.0, 18.0, 22.0, 26.0, 56.0, 59.0, 69.0, 112.0, 164.0, 279.0, 455.0, 987.0, 2736.0, 11829.0, 82645.0, 682067.0, 233587.0, 25499.0, 4801.0, 1453.0, 608.0, 312.0, 194.0, 136.0, 82.0, 77.0, 63.0, 42.0, 28.0, 20.0, 18.0, 18.0, 5.0, 7.0, 6.0, 2.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.259033203125, -0.2515716552734375, -0.244110107421875, -0.2366485595703125, -0.22918701171875, -0.2217254638671875, -0.214263916015625, -0.2068023681640625, -0.1993408203125, -0.1918792724609375, -0.184417724609375, -0.1769561767578125, -0.16949462890625, -0.1620330810546875, -0.154571533203125, -0.1471099853515625, -0.1396484375, -0.1321868896484375, -0.124725341796875, -0.1172637939453125, -0.10980224609375, -0.1023406982421875, -0.094879150390625, -0.0874176025390625, -0.0799560546875, -0.0724945068359375, -0.065032958984375, -0.0575714111328125, -0.05010986328125, -0.0426483154296875, -0.035186767578125, -0.0277252197265625, -0.020263671875, -0.0128021240234375, -0.005340576171875, 0.0021209716796875, 0.00958251953125, 0.0170440673828125, 0.024505615234375, 0.0319671630859375, 0.0394287109375, 0.0468902587890625, 0.054351806640625, 0.0618133544921875, 0.06927490234375, 0.0767364501953125, 0.084197998046875, 0.0916595458984375, 0.09912109375, 0.1065826416015625, 0.114044189453125, 0.1215057373046875, 0.12896728515625, 0.1364288330078125, 0.143890380859375, 0.1513519287109375, 0.1588134765625, 0.1662750244140625, 0.173736572265625, 0.1811981201171875, 0.18865966796875, 0.1961212158203125, 0.203582763671875, 0.2110443115234375, 0.218505859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 13.0, 11.0, 10.0, 15.0, 17.0, 17.0, 7.0, 27.0, 19.0, 46.0, 33.0, 46.0, 33.0, 51.0, 52.0, 51.0, 44.0, 30.0, 40.0, 45.0, 48.0, 36.0, 34.0, 42.0, 34.0, 28.0, 18.0, 17.0, 29.0, 20.0, 14.0, 14.0, 11.0, 11.0, 11.0, 6.0, 9.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2266845703125, -0.21920204162597656, -0.21171951293945312, -0.2042369842529297, -0.19675445556640625, -0.1892719268798828, -0.18178939819335938, -0.17430686950683594, -0.1668243408203125, -0.15934181213378906, -0.15185928344726562, -0.1443767547607422, -0.13689422607421875, -0.1294116973876953, -0.12192916870117188, -0.11444664001464844, -0.106964111328125, -0.09948158264160156, -0.09199905395507812, -0.08451652526855469, -0.07703399658203125, -0.06955146789550781, -0.062068939208984375, -0.05458641052246094, -0.0471038818359375, -0.03962135314941406, -0.032138824462890625, -0.024656295776367188, -0.01717376708984375, -0.009691238403320312, -0.002208709716796875, 0.0052738189697265625, 0.01275634765625, 0.020238876342773438, 0.027721405029296875, 0.03520393371582031, 0.04268646240234375, 0.05016899108886719, 0.057651519775390625, 0.06513404846191406, 0.0726165771484375, 0.08009910583496094, 0.08758163452148438, 0.09506416320800781, 0.10254669189453125, 0.11002922058105469, 0.11751174926757812, 0.12499427795410156, 0.132476806640625, 0.13995933532714844, 0.14744186401367188, 0.1549243927001953, 0.16240692138671875, 0.1698894500732422, 0.17737197875976562, 0.18485450744628906, 0.1923370361328125, 0.19981956481933594, 0.20730209350585938, 0.2147846221923828, 0.22226715087890625, 0.2297496795654297, 0.23723220825195312, 0.24471473693847656, 0.252197265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 20.0, 25.0, 45.0, 58.0, 111.0, 221.0, 565.0, 1868.0, 9437.0, 77650.0, 722955.0, 211299.0, 19386.0, 3331.0, 893.0, 315.0, 157.0, 72.0, 45.0, 27.0, 22.0, 8.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.11431884765625, -0.11150932312011719, -0.10869979858398438, -0.10589027404785156, -0.10308074951171875, -0.10027122497558594, -0.09746170043945312, -0.09465217590332031, -0.0918426513671875, -0.08903312683105469, -0.08622360229492188, -0.08341407775878906, -0.08060455322265625, -0.07779502868652344, -0.07498550415039062, -0.07217597961425781, -0.069366455078125, -0.06655693054199219, -0.06374740600585938, -0.06093788146972656, -0.05812835693359375, -0.05531883239746094, -0.052509307861328125, -0.04969978332519531, -0.0468902587890625, -0.04408073425292969, -0.041271209716796875, -0.03846168518066406, -0.03565216064453125, -0.03284263610839844, -0.030033111572265625, -0.027223587036132812, -0.0244140625, -0.021604537963867188, -0.018795013427734375, -0.015985488891601562, -0.01317596435546875, -0.010366439819335938, -0.007556915283203125, -0.0047473907470703125, -0.0019378662109375, 0.0008716583251953125, 0.003681182861328125, 0.0064907073974609375, 0.00930023193359375, 0.012109756469726562, 0.014919281005859375, 0.017728805541992188, 0.020538330078125, 0.023347854614257812, 0.026157379150390625, 0.028966903686523438, 0.03177642822265625, 0.03458595275878906, 0.037395477294921875, 0.04020500183105469, 0.0430145263671875, 0.04582405090332031, 0.048633575439453125, 0.05144309997558594, 0.05425262451171875, 0.05706214904785156, 0.059871673583984375, 0.06268119812011719, 0.06549072265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 9.0, 6.0, 9.0, 15.0, 10.0, 20.0, 12.0, 44.0, 23.0, 44.0, 40.0, 67.0, 82.0, 91.0, 70.0, 75.0, 75.0, 61.0, 56.0, 45.0, 38.0, 19.0, 24.0, 15.0, 14.0, 6.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1026859283447266e-05, -1.0697171092033386e-05, -1.0367482900619507e-05, -1.0037794709205627e-05, -9.708106517791748e-06, -9.378418326377869e-06, -9.04873013496399e-06, -8.71904194355011e-06, -8.38935375213623e-06, -8.059665560722351e-06, -7.729977369308472e-06, -7.400289177894592e-06, -7.070600986480713e-06, -6.7409127950668335e-06, -6.411224603652954e-06, -6.081536412239075e-06, -5.751848220825195e-06, -5.422160029411316e-06, -5.0924718379974365e-06, -4.762783646583557e-06, -4.433095455169678e-06, -4.103407263755798e-06, -3.773719072341919e-06, -3.4440308809280396e-06, -3.11434268951416e-06, -2.7846544981002808e-06, -2.4549663066864014e-06, -2.125278115272522e-06, -1.7955899238586426e-06, -1.4659017324447632e-06, -1.1362135410308838e-06, -8.065253496170044e-07, -4.76837158203125e-07, -1.471489667892456e-07, 1.825392246246338e-07, 5.122274160385132e-07, 8.419156074523926e-07, 1.171603798866272e-06, 1.5012919902801514e-06, 1.8309801816940308e-06, 2.16066837310791e-06, 2.4903565645217896e-06, 2.820044755935669e-06, 3.1497329473495483e-06, 3.4794211387634277e-06, 3.809109330177307e-06, 4.1387975215911865e-06, 4.468485713005066e-06, 4.798173904418945e-06, 5.127862095832825e-06, 5.457550287246704e-06, 5.7872384786605835e-06, 6.116926670074463e-06, 6.446614861488342e-06, 6.776303052902222e-06, 7.105991244316101e-06, 7.4356794357299805e-06, 7.76536762714386e-06, 8.09505581855774e-06, 8.424744009971619e-06, 8.754432201385498e-06, 9.084120392799377e-06, 9.413808584213257e-06, 9.743496775627136e-06, 1.0073184967041016e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 20.0, 26.0, 50.0, 83.0, 164.0, 330.0, 833.0, 2275.0, 8157.0, 47219.0, 477671.0, 454930.0, 45295.0, 7780.0, 2221.0, 762.0, 355.0, 122.0, 86.0, 53.0, 35.0, 24.0, 10.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.094970703125, -0.0923318862915039, -0.08969306945800781, -0.08705425262451172, -0.08441543579101562, -0.08177661895751953, -0.07913780212402344, -0.07649898529052734, -0.07386016845703125, -0.07122135162353516, -0.06858253479003906, -0.06594371795654297, -0.06330490112304688, -0.06066608428955078, -0.05802726745605469, -0.055388450622558594, -0.0527496337890625, -0.050110816955566406, -0.04747200012207031, -0.04483318328857422, -0.042194366455078125, -0.03955554962158203, -0.03691673278808594, -0.034277915954589844, -0.03163909912109375, -0.029000282287597656, -0.026361465454101562, -0.02372264862060547, -0.021083831787109375, -0.01844501495361328, -0.015806198120117188, -0.013167381286621094, -0.010528564453125, -0.007889747619628906, -0.0052509307861328125, -0.0026121139526367188, 2.6702880859375e-05, 0.0026655197143554688, 0.0053043365478515625, 0.007943153381347656, 0.01058197021484375, 0.013220787048339844, 0.015859603881835938, 0.01849842071533203, 0.021137237548828125, 0.02377605438232422, 0.026414871215820312, 0.029053688049316406, 0.0316925048828125, 0.034331321716308594, 0.03697013854980469, 0.03960895538330078, 0.042247772216796875, 0.04488658905029297, 0.04752540588378906, 0.050164222717285156, 0.05280303955078125, 0.055441856384277344, 0.05808067321777344, 0.06071949005126953, 0.06335830688476562, 0.06599712371826172, 0.06863594055175781, 0.0712747573852539, 0.07391357421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 9.0, 6.0, 10.0, 17.0, 19.0, 41.0, 59.0, 94.0, 88.0, 116.0, 103.0, 121.0, 80.0, 81.0, 45.0, 36.0, 17.0, 13.0, 20.0, 6.0, 8.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09087085723876953, -0.08786964416503906, -0.0848684310913086, -0.08186721801757812, -0.07886600494384766, -0.07586479187011719, -0.07286357879638672, -0.06986236572265625, -0.06686115264892578, -0.06385993957519531, -0.060858726501464844, -0.057857513427734375, -0.054856300354003906, -0.05185508728027344, -0.04885387420654297, -0.0458526611328125, -0.04285144805908203, -0.03985023498535156, -0.036849021911621094, -0.033847808837890625, -0.030846595764160156, -0.027845382690429688, -0.02484416961669922, -0.02184295654296875, -0.01884174346923828, -0.015840530395507812, -0.012839317321777344, -0.009838104248046875, -0.006836891174316406, -0.0038356781005859375, -0.0008344650268554688, 0.002166748046875, 0.005167961120605469, 0.008169174194335938, 0.011170387268066406, 0.014171600341796875, 0.017172813415527344, 0.020174026489257812, 0.02317523956298828, 0.02617645263671875, 0.02917766571044922, 0.03217887878417969, 0.035180091857910156, 0.038181304931640625, 0.041182518005371094, 0.04418373107910156, 0.04718494415283203, 0.0501861572265625, 0.05318737030029297, 0.05618858337402344, 0.059189796447753906, 0.062191009521484375, 0.06519222259521484, 0.06819343566894531, 0.07119464874267578, 0.07419586181640625, 0.07719707489013672, 0.08019828796386719, 0.08319950103759766, 0.08620071411132812, 0.0892019271850586, 0.09220314025878906, 0.09520435333251953, 0.09820556640625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 9.0, 23.0, 62.0, 154.0, 244.0, 253.0, 157.0, 79.0, 25.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.045063018798828, -3.965975284576416, -3.886887788772583, -3.807800054550171, -3.728712558746338, -3.649624824523926, -3.5705370903015137, -3.4914493560791016, -3.4123618602752686, -3.3332741260528564, -3.2541866302490234, -3.1750988960266113, -3.096011161804199, -3.016923666000366, -2.937835931777954, -2.858748435974121, -2.779660701751709, -2.700572967529297, -2.621485471725464, -2.5423977375030518, -2.4633102416992188, -2.3842225074768066, -2.3051347732543945, -2.2260470390319824, -2.1469595432281494, -2.0678718090057373, -1.9887843132019043, -1.9096965789794922, -1.8306089639663696, -1.751521348953247, -1.672433614730835, -1.5933459997177124, -1.5142581462860107, -1.4351705312728882, -1.3560829162597656, -1.2769951820373535, -1.197907567024231, -1.1188199520111084, -1.0397322177886963, -0.9606446027755737, -0.8815569877624512, -0.8024693727493286, -0.7233816981315613, -0.644294023513794, -0.5652064085006714, -0.48611876368522644, -0.4070311188697815, -0.32794344425201416, -0.2488558292388916, -0.16976818442344666, -0.09068053960800171, -0.011592894792556763, 0.06749475002288818, 0.14658239483833313, 0.22567003965377808, 0.3047577142715454, 0.38384532928466797, 0.4629329741001129, 0.5420206189155579, 0.6211082935333252, 0.7001959085464478, 0.7792835235595703, 0.8583711981773376, 0.937458872795105, 1.0165464878082275]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 12.0, 9.0, 19.0, 9.0, 13.0, 13.0, 14.0, 18.0, 20.0, 27.0, 41.0, 40.0, 44.0, 35.0, 54.0, 43.0, 61.0, 48.0, 50.0, 61.0, 44.0, 45.0, 26.0, 41.0, 28.0, 31.0, 22.0, 19.0, 14.0, 18.0, 16.0, 9.0, 13.0, 12.0, 6.0, 5.0, 8.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1798052787780762, -1.1435506343841553, -1.107296109199524, -1.071041464805603, -1.0347869396209717, -0.9985323548316956, -0.9622777700424194, -0.9260231256484985, -0.8897686004638672, -0.8535140156745911, -0.8172594308853149, -0.7810048460960388, -0.7447502613067627, -0.7084956765174866, -0.6722410917282104, -0.6359864473342896, -0.5997318625450134, -0.5634772777557373, -0.5272226929664612, -0.49096810817718506, -0.45471352338790894, -0.4184589385986328, -0.3822043240070343, -0.3459497392177582, -0.30969515442848206, -0.27344056963920593, -0.2371859848499298, -0.2009313851594925, -0.16467680037021637, -0.12842221558094025, -0.09216761589050293, -0.05591303110122681, -0.019658446311950684, 0.016596142202615738, 0.05285073071718216, 0.08910532295703888, 0.125359907746315, 0.16161449253559113, 0.19786909222602844, 0.23412367701530457, 0.2703782618045807, 0.3066328465938568, 0.34288743138313293, 0.37914204597473145, 0.41539663076400757, 0.4516512155532837, 0.4879058003425598, 0.5241603851318359, 0.5604149699211121, 0.5966695547103882, 0.6329241394996643, 0.6691787242889404, 0.7054333090782166, 0.7416878938674927, 0.7779425382614136, 0.8141970634460449, 0.8504517078399658, 0.8867062926292419, 0.9229608774185181, 0.9592154622077942, 0.9954700469970703, 1.0317246913909912, 1.0679792165756226, 1.1042338609695435, 1.1404883861541748]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 6.0, 6.0, 11.0, 14.0, 26.0, 22.0, 30.0, 56.0, 83.0, 102.0, 173.0, 317.0, 784.0, 1770.0, 6245.0, 46257.0, 4106105.0, 25028.0, 4349.0, 1500.0, 599.0, 293.0, 186.0, 85.0, 53.0, 44.0, 34.0, 23.0, 12.0, 22.0, 12.0, 9.0, 9.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.242431640625, -0.23516845703125, -0.2279052734375, -0.22064208984375, -0.21337890625, -0.20611572265625, -0.1988525390625, -0.19158935546875, -0.184326171875, -0.17706298828125, -0.1697998046875, -0.16253662109375, -0.1552734375, -0.14801025390625, -0.1407470703125, -0.13348388671875, -0.126220703125, -0.11895751953125, -0.1116943359375, -0.10443115234375, -0.09716796875, -0.08990478515625, -0.0826416015625, -0.07537841796875, -0.068115234375, -0.06085205078125, -0.0535888671875, -0.04632568359375, -0.0390625, -0.03179931640625, -0.0245361328125, -0.01727294921875, -0.010009765625, -0.00274658203125, 0.0045166015625, 0.01177978515625, 0.01904296875, 0.02630615234375, 0.0335693359375, 0.04083251953125, 0.048095703125, 0.05535888671875, 0.0626220703125, 0.06988525390625, 0.0771484375, 0.08441162109375, 0.0916748046875, 0.09893798828125, 0.106201171875, 0.11346435546875, 0.1207275390625, 0.12799072265625, 0.13525390625, 0.14251708984375, 0.1497802734375, 0.15704345703125, 0.164306640625, 0.17156982421875, 0.1788330078125, 0.18609619140625, 0.193359375, 0.20062255859375, 0.2078857421875, 0.21514892578125, 0.222412109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 13.0, 16.0, 21.0, 36.0, 56.0, 75.0, 74.0, 97.0, 106.0, 104.0, 87.0, 90.0, 72.0, 54.0, 35.0, 25.0, 16.0, 12.0, 5.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1596822738647461, -0.1557903289794922, -0.15189838409423828, -0.14800643920898438, -0.14411449432373047, -0.14022254943847656, -0.13633060455322266, -0.13243865966796875, -0.12854671478271484, -0.12465476989746094, -0.12076282501220703, -0.11687088012695312, -0.11297893524169922, -0.10908699035644531, -0.1051950454711914, -0.1013031005859375, -0.0974111557006836, -0.09351921081542969, -0.08962726593017578, -0.08573532104492188, -0.08184337615966797, -0.07795143127441406, -0.07405948638916016, -0.07016754150390625, -0.06627559661865234, -0.06238365173339844, -0.05849170684814453, -0.054599761962890625, -0.05070781707763672, -0.04681587219238281, -0.042923927307128906, -0.039031982421875, -0.035140037536621094, -0.031248092651367188, -0.02735614776611328, -0.023464202880859375, -0.01957225799560547, -0.015680313110351562, -0.011788368225097656, -0.00789642333984375, -0.004004478454589844, -0.0001125335693359375, 0.0037794113159179688, 0.007671356201171875, 0.011563301086425781, 0.015455245971679688, 0.019347190856933594, 0.0232391357421875, 0.027131080627441406, 0.031023025512695312, 0.03491497039794922, 0.038806915283203125, 0.04269886016845703, 0.04659080505371094, 0.050482749938964844, 0.05437469482421875, 0.058266639709472656, 0.06215858459472656, 0.06605052947998047, 0.06994247436523438, 0.07383441925048828, 0.07772636413574219, 0.0816183090209961, 0.08551025390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 11.0, 10.0, 18.0, 14.0, 31.0, 47.0, 58.0, 81.0, 130.0, 210.0, 332.0, 548.0, 904.0, 1700.0, 3368.0, 8228.0, 26520.0, 3763859.0, 348352.0, 24741.0, 7744.0, 3268.0, 1661.0, 876.0, 575.0, 354.0, 213.0, 137.0, 76.0, 63.0, 43.0, 28.0, 19.0, 15.0, 9.0, 7.0, 7.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15715789794921875, -0.1520843505859375, -0.14701080322265625, -0.141937255859375, -0.13686370849609375, -0.1317901611328125, -0.12671661376953125, -0.12164306640625, -0.11656951904296875, -0.1114959716796875, -0.10642242431640625, -0.101348876953125, -0.09627532958984375, -0.0912017822265625, -0.08612823486328125, -0.0810546875, -0.07598114013671875, -0.0709075927734375, -0.06583404541015625, -0.060760498046875, -0.05568695068359375, -0.0506134033203125, -0.04553985595703125, -0.04046630859375, -0.03539276123046875, -0.0303192138671875, -0.02524566650390625, -0.020172119140625, -0.01509857177734375, -0.0100250244140625, -0.00495147705078125, 0.0001220703125, 0.00519561767578125, 0.0102691650390625, 0.01534271240234375, 0.020416259765625, 0.02548980712890625, 0.0305633544921875, 0.03563690185546875, 0.04071044921875, 0.04578399658203125, 0.0508575439453125, 0.05593109130859375, 0.061004638671875, 0.06607818603515625, 0.0711517333984375, 0.07622528076171875, 0.081298828125, 0.08637237548828125, 0.0914459228515625, 0.09651947021484375, 0.101593017578125, 0.10666656494140625, 0.1117401123046875, 0.11681365966796875, 0.12188720703125, 0.12696075439453125, 0.1320343017578125, 0.13710784912109375, 0.142181396484375, 0.14725494384765625, 0.1523284912109375, 0.15740203857421875, 0.1624755859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 8.0, 6.0, 5.0, 13.0, 17.0, 28.0, 64.0, 245.0, 3511.0, 75.0, 38.0, 18.0, 13.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05877685546875, -0.057274818420410156, -0.05577278137207031, -0.05427074432373047, -0.052768707275390625, -0.05126667022705078, -0.04976463317871094, -0.048262596130371094, -0.04676055908203125, -0.045258522033691406, -0.04375648498535156, -0.04225444793701172, -0.040752410888671875, -0.03925037384033203, -0.03774833679199219, -0.036246299743652344, -0.0347442626953125, -0.033242225646972656, -0.03174018859863281, -0.03023815155029297, -0.028736114501953125, -0.02723407745361328, -0.025732040405273438, -0.024230003356933594, -0.02272796630859375, -0.021225929260253906, -0.019723892211914062, -0.01822185516357422, -0.016719818115234375, -0.015217781066894531, -0.013715744018554688, -0.012213706970214844, -0.010711669921875, -0.009209632873535156, -0.0077075958251953125, -0.006205558776855469, -0.004703521728515625, -0.0032014846801757812, -0.0016994476318359375, -0.00019741058349609375, 0.00130462646484375, 0.0028066635131835938, 0.0043087005615234375, 0.005810737609863281, 0.007312774658203125, 0.008814811706542969, 0.010316848754882812, 0.011818885803222656, 0.0133209228515625, 0.014822959899902344, 0.016324996948242188, 0.01782703399658203, 0.019329071044921875, 0.02083110809326172, 0.022333145141601562, 0.023835182189941406, 0.02533721923828125, 0.026839256286621094, 0.028341293334960938, 0.02984333038330078, 0.031345367431640625, 0.03284740447998047, 0.03434944152832031, 0.035851478576660156, 0.037353515625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 17.0, 69.0, 250.0, 367.0, 225.0, 67.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17257609963417053, -0.1576010137796402, -0.14262592792510986, -0.12765082716941833, -0.1126757487654686, -0.09770066291093826, -0.08272556960582733, -0.067750483751297, -0.05277539789676666, -0.03780031204223633, -0.022825222462415695, -0.007850132882595062, 0.007124952971935272, 0.022100038826465607, 0.03707513213157654, 0.05205021798610687, 0.06702530384063721, 0.08200038969516754, 0.09697547554969788, 0.11195056885480881, 0.12692564725875854, 0.14190074801445007, 0.1568758338689804, 0.17185091972351074, 0.18682600557804108, 0.2018010914325714, 0.21677617728710175, 0.23175126314163208, 0.2467263638973236, 0.26170143485069275, 0.2766765356063843, 0.2916516065597534, 0.30662673711776733, 0.32160183787345886, 0.336576908826828, 0.35155200958251953, 0.36652708053588867, 0.3815021812915802, 0.39647728204727173, 0.41145235300064087, 0.42642742395401, 0.44140252470970154, 0.4563775956630707, 0.4713526964187622, 0.48632776737213135, 0.5013028383255005, 0.5162779688835144, 0.5312530398368835, 0.5462281703948975, 0.5612032413482666, 0.5761783719062805, 0.5911534428596497, 0.6061285138130188, 0.6211035847663879, 0.6360787153244019, 0.651053786277771, 0.6660288572311401, 0.6810039281845093, 0.6959790587425232, 0.7109541296958923, 0.7259292006492615, 0.7409042716026306, 0.7558794021606445, 0.7708544731140137, 0.7858295440673828]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 5.0, 3.0, 5.0, 16.0, 12.0, 15.0, 14.0, 22.0, 25.0, 34.0, 26.0, 34.0, 29.0, 29.0, 51.0, 31.0, 45.0, 38.0, 45.0, 50.0, 37.0, 53.0, 46.0, 37.0, 32.0, 38.0, 27.0, 32.0, 19.0, 18.0, 20.0, 14.0, 14.0, 13.0, 15.0, 13.0, 7.0, 7.0, 5.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0809706449508667, -0.07838603854179382, -0.07580143213272095, -0.07321682572364807, -0.0706322193145752, -0.06804761290550232, -0.06546300649642944, -0.06287840008735657, -0.06029379367828369, -0.057709187269210815, -0.05512458086013794, -0.052539974451065063, -0.04995536804199219, -0.04737076163291931, -0.044786155223846436, -0.04220154881477356, -0.039616942405700684, -0.03703233599662781, -0.03444772958755493, -0.031863123178482056, -0.02927851676940918, -0.026693910360336304, -0.024109303951263428, -0.021524697542190552, -0.018940091133117676, -0.0163554847240448, -0.013770878314971924, -0.011186271905899048, -0.008601665496826172, -0.006017059087753296, -0.00343245267868042, -0.0008478462696075439, 0.001736760139465332, 0.004321366548538208, 0.006905972957611084, 0.00949057936668396, 0.012075185775756836, 0.014659792184829712, 0.017244398593902588, 0.019829005002975464, 0.02241361141204834, 0.024998217821121216, 0.027582824230194092, 0.030167430639266968, 0.032752037048339844, 0.03533664345741272, 0.037921249866485596, 0.04050585627555847, 0.04309046268463135, 0.045675069093704224, 0.0482596755027771, 0.050844281911849976, 0.05342888832092285, 0.05601349472999573, 0.058598101139068604, 0.06118270754814148, 0.06376731395721436, 0.06635192036628723, 0.06893652677536011, 0.07152113318443298, 0.07410573959350586, 0.07669034600257874, 0.07927495241165161, 0.08185955882072449, 0.08444416522979736]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 6.0, 6.0, 10.0, 21.0, 29.0, 41.0, 70.0, 89.0, 158.0, 234.0, 474.0, 930.0, 2179.0, 5911.0, 20184.0, 80988.0, 323173.0, 440457.0, 128629.0, 30973.0, 8533.0, 2897.0, 1222.0, 558.0, 280.0, 160.0, 122.0, 67.0, 41.0, 32.0, 25.0, 20.0, 12.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15966796875, -0.15470314025878906, -0.14973831176757812, -0.1447734832763672, -0.13980865478515625, -0.1348438262939453, -0.12987899780273438, -0.12491416931152344, -0.1199493408203125, -0.11498451232910156, -0.11001968383789062, -0.10505485534667969, -0.10009002685546875, -0.09512519836425781, -0.09016036987304688, -0.08519554138183594, -0.080230712890625, -0.07526588439941406, -0.07030105590820312, -0.06533622741699219, -0.06037139892578125, -0.05540657043457031, -0.050441741943359375, -0.04547691345214844, -0.0405120849609375, -0.03554725646972656, -0.030582427978515625, -0.025617599487304688, -0.02065277099609375, -0.015687942504882812, -0.010723114013671875, -0.0057582855224609375, -0.00079345703125, 0.0041713714599609375, 0.009136199951171875, 0.014101028442382812, 0.01906585693359375, 0.024030685424804688, 0.028995513916015625, 0.03396034240722656, 0.0389251708984375, 0.04388999938964844, 0.048854827880859375, 0.05381965637207031, 0.05878448486328125, 0.06374931335449219, 0.06871414184570312, 0.07367897033691406, 0.078643798828125, 0.08360862731933594, 0.08857345581054688, 0.09353828430175781, 0.09850311279296875, 0.10346794128417969, 0.10843276977539062, 0.11339759826660156, 0.1183624267578125, 0.12332725524902344, 0.12829208374023438, 0.1332569122314453, 0.13822174072265625, 0.1431865692138672, 0.14815139770507812, 0.15311622619628906, 0.1580810546875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 10.0, 11.0, 16.0, 28.0, 42.0, 59.0, 81.0, 87.0, 94.0, 89.0, 104.0, 102.0, 72.0, 59.0, 52.0, 36.0, 23.0, 15.0, 13.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.16132831573486328, -0.15737342834472656, -0.15341854095458984, -0.14946365356445312, -0.1455087661743164, -0.1415538787841797, -0.13759899139404297, -0.13364410400390625, -0.12968921661376953, -0.1257343292236328, -0.1217794418334961, -0.11782455444335938, -0.11386966705322266, -0.10991477966308594, -0.10595989227294922, -0.1020050048828125, -0.09805011749267578, -0.09409523010253906, -0.09014034271240234, -0.08618545532226562, -0.0822305679321289, -0.07827568054199219, -0.07432079315185547, -0.07036590576171875, -0.06641101837158203, -0.06245613098144531, -0.058501243591308594, -0.054546356201171875, -0.050591468811035156, -0.04663658142089844, -0.04268169403076172, -0.038726806640625, -0.03477191925048828, -0.030817031860351562, -0.026862144470214844, -0.022907257080078125, -0.018952369689941406, -0.014997482299804688, -0.011042594909667969, -0.00708770751953125, -0.0031328201293945312, 0.0008220672607421875, 0.004776954650878906, 0.008731842041015625, 0.012686729431152344, 0.016641616821289062, 0.02059650421142578, 0.0245513916015625, 0.02850627899169922, 0.03246116638183594, 0.036416053771972656, 0.040370941162109375, 0.044325828552246094, 0.04828071594238281, 0.05223560333251953, 0.05619049072265625, 0.06014537811279297, 0.06410026550292969, 0.0680551528930664, 0.07201004028320312, 0.07596492767333984, 0.07991981506347656, 0.08387470245361328, 0.08782958984375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 8.0, 10.0, 4.0, 6.0, 8.0, 11.0, 17.0, 14.0, 28.0, 40.0, 69.0, 107.0, 156.0, 229.0, 391.0, 814.0, 1991.0, 8153.0, 78805.0, 793463.0, 147327.0, 12114.0, 2616.0, 936.0, 441.0, 236.0, 152.0, 102.0, 68.0, 45.0, 40.0, 27.0, 26.0, 22.0, 12.0, 6.0, 13.0, 8.0, 10.0, 8.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.27392578125, -0.2660102844238281, -0.25809478759765625, -0.2501792907714844, -0.2422637939453125, -0.23434829711914062, -0.22643280029296875, -0.21851730346679688, -0.210601806640625, -0.20268630981445312, -0.19477081298828125, -0.18685531616210938, -0.1789398193359375, -0.17102432250976562, -0.16310882568359375, -0.15519332885742188, -0.14727783203125, -0.13936233520507812, -0.13144683837890625, -0.12353134155273438, -0.1156158447265625, -0.10770034790039062, -0.09978485107421875, -0.09186935424804688, -0.083953857421875, -0.07603836059570312, -0.06812286376953125, -0.060207366943359375, -0.0522918701171875, -0.044376373291015625, -0.03646087646484375, -0.028545379638671875, -0.0206298828125, -0.012714385986328125, -0.00479888916015625, 0.003116607666015625, 0.0110321044921875, 0.018947601318359375, 0.02686309814453125, 0.034778594970703125, 0.042694091796875, 0.050609588623046875, 0.05852508544921875, 0.06644058227539062, 0.0743560791015625, 0.08227157592773438, 0.09018707275390625, 0.09810256958007812, 0.10601806640625, 0.11393356323242188, 0.12184906005859375, 0.12976455688476562, 0.1376800537109375, 0.14559555053710938, 0.15351104736328125, 0.16142654418945312, 0.169342041015625, 0.17725753784179688, 0.18517303466796875, 0.19308853149414062, 0.2010040283203125, 0.20891952514648438, 0.21683502197265625, 0.22475051879882812, 0.232666015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 6.0, 12.0, 8.0, 14.0, 10.0, 21.0, 17.0, 15.0, 22.0, 25.0, 22.0, 32.0, 27.0, 36.0, 34.0, 48.0, 36.0, 42.0, 35.0, 51.0, 45.0, 45.0, 42.0, 34.0, 34.0, 37.0, 31.0, 24.0, 31.0, 24.0, 18.0, 16.0, 21.0, 19.0, 13.0, 6.0, 7.0, 5.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173095703125, -0.16638565063476562, -0.15967559814453125, -0.15296554565429688, -0.1462554931640625, -0.13954544067382812, -0.13283538818359375, -0.12612533569335938, -0.119415283203125, -0.11270523071289062, -0.10599517822265625, -0.09928512573242188, -0.0925750732421875, -0.08586502075195312, -0.07915496826171875, -0.07244491577148438, -0.06573486328125, -0.059024810791015625, -0.05231475830078125, -0.045604705810546875, -0.0388946533203125, -0.032184600830078125, -0.02547454833984375, -0.018764495849609375, -0.012054443359375, -0.005344390869140625, 0.00136566162109375, 0.008075714111328125, 0.0147857666015625, 0.021495819091796875, 0.02820587158203125, 0.034915924072265625, 0.0416259765625, 0.048336029052734375, 0.05504608154296875, 0.061756134033203125, 0.0684661865234375, 0.07517623901367188, 0.08188629150390625, 0.08859634399414062, 0.095306396484375, 0.10201644897460938, 0.10872650146484375, 0.11543655395507812, 0.1221466064453125, 0.12885665893554688, 0.13556671142578125, 0.14227676391601562, 0.14898681640625, 0.15569686889648438, 0.16240692138671875, 0.16911697387695312, 0.1758270263671875, 0.18253707885742188, 0.18924713134765625, 0.19595718383789062, 0.202667236328125, 0.20937728881835938, 0.21608734130859375, 0.22279739379882812, 0.2295074462890625, 0.23621749877929688, 0.24292755126953125, 0.24963760375976562, 0.25634765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 11.0, 17.0, 26.0, 52.0, 50.0, 111.0, 207.0, 509.0, 1683.0, 9860.0, 271935.0, 740859.0, 19417.0, 2489.0, 664.0, 291.0, 147.0, 78.0, 37.0, 24.0, 20.0, 13.0, 12.0, 6.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10260009765625, -0.09834957122802734, -0.09409904479980469, -0.08984851837158203, -0.08559799194335938, -0.08134746551513672, -0.07709693908691406, -0.0728464126586914, -0.06859588623046875, -0.0643453598022461, -0.06009483337402344, -0.05584430694580078, -0.051593780517578125, -0.04734325408935547, -0.04309272766113281, -0.038842201232910156, -0.0345916748046875, -0.030341148376464844, -0.026090621948242188, -0.02184009552001953, -0.017589569091796875, -0.013339042663574219, -0.009088516235351562, -0.004837989807128906, -0.00058746337890625, 0.0036630630493164062, 0.007913589477539062, 0.012164115905761719, 0.016414642333984375, 0.02066516876220703, 0.024915695190429688, 0.029166221618652344, 0.033416748046875, 0.037667274475097656, 0.04191780090332031, 0.04616832733154297, 0.050418853759765625, 0.05466938018798828, 0.05891990661621094, 0.0631704330444336, 0.06742095947265625, 0.0716714859008789, 0.07592201232910156, 0.08017253875732422, 0.08442306518554688, 0.08867359161376953, 0.09292411804199219, 0.09717464447021484, 0.1014251708984375, 0.10567569732666016, 0.10992622375488281, 0.11417675018310547, 0.11842727661132812, 0.12267780303955078, 0.12692832946777344, 0.1311788558959961, 0.13542938232421875, 0.1396799087524414, 0.14393043518066406, 0.14818096160888672, 0.15243148803710938, 0.15668201446533203, 0.1609325408935547, 0.16518306732177734, 0.16943359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 7.0, 19.0, 11.0, 18.0, 19.0, 30.0, 33.0, 54.0, 58.0, 65.0, 80.0, 87.0, 87.0, 76.0, 78.0, 52.0, 47.0, 37.0, 37.0, 34.0, 29.0, 11.0, 8.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.059906005859375e-06, -8.7004154920578e-06, -8.340924978256226e-06, -7.981434464454651e-06, -7.621943950653076e-06, -7.2624534368515015e-06, -6.902962923049927e-06, -6.543472409248352e-06, -6.183981895446777e-06, -5.824491381645203e-06, -5.465000867843628e-06, -5.105510354042053e-06, -4.7460198402404785e-06, -4.386529326438904e-06, -4.027038812637329e-06, -3.6675482988357544e-06, -3.3080577850341797e-06, -2.948567271232605e-06, -2.5890767574310303e-06, -2.2295862436294556e-06, -1.8700957298278809e-06, -1.5106052160263062e-06, -1.1511147022247314e-06, -7.916241884231567e-07, -4.3213367462158203e-07, -7.264316082000732e-08, 2.868473529815674e-07, 6.463378667831421e-07, 1.0058283805847168e-06, 1.3653188943862915e-06, 1.7248094081878662e-06, 2.084299921989441e-06, 2.4437904357910156e-06, 2.8032809495925903e-06, 3.162771463394165e-06, 3.5222619771957397e-06, 3.8817524909973145e-06, 4.241243004798889e-06, 4.600733518600464e-06, 4.9602240324020386e-06, 5.319714546203613e-06, 5.679205060005188e-06, 6.038695573806763e-06, 6.398186087608337e-06, 6.757676601409912e-06, 7.117167115211487e-06, 7.4766576290130615e-06, 7.836148142814636e-06, 8.195638656616211e-06, 8.555129170417786e-06, 8.91461968421936e-06, 9.274110198020935e-06, 9.63360071182251e-06, 9.993091225624084e-06, 1.035258173942566e-05, 1.0712072253227234e-05, 1.1071562767028809e-05, 1.1431053280830383e-05, 1.1790543794631958e-05, 1.2150034308433533e-05, 1.2509524822235107e-05, 1.2869015336036682e-05, 1.3228505849838257e-05, 1.3587996363639832e-05, 1.3947486877441406e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 13.0, 7.0, 23.0, 34.0, 66.0, 102.0, 241.0, 602.0, 2384.0, 29524.0, 954672.0, 56383.0, 3302.0, 668.0, 250.0, 116.0, 62.0, 46.0, 22.0, 11.0, 10.0, 7.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177490234375, -0.1712799072265625, -0.165069580078125, -0.1588592529296875, -0.15264892578125, -0.1464385986328125, -0.140228271484375, -0.1340179443359375, -0.1278076171875, -0.1215972900390625, -0.115386962890625, -0.1091766357421875, -0.10296630859375, -0.0967559814453125, -0.090545654296875, -0.0843353271484375, -0.078125, -0.0719146728515625, -0.065704345703125, -0.0594940185546875, -0.05328369140625, -0.0470733642578125, -0.040863037109375, -0.0346527099609375, -0.0284423828125, -0.0222320556640625, -0.016021728515625, -0.0098114013671875, -0.00360107421875, 0.0026092529296875, 0.008819580078125, 0.0150299072265625, 0.021240234375, 0.0274505615234375, 0.033660888671875, 0.0398712158203125, 0.04608154296875, 0.0522918701171875, 0.058502197265625, 0.0647125244140625, 0.0709228515625, 0.0771331787109375, 0.083343505859375, 0.0895538330078125, 0.09576416015625, 0.1019744873046875, 0.108184814453125, 0.1143951416015625, 0.12060546875, 0.1268157958984375, 0.133026123046875, 0.1392364501953125, 0.14544677734375, 0.1516571044921875, 0.157867431640625, 0.1640777587890625, 0.1702880859375, 0.1764984130859375, 0.182708740234375, 0.1889190673828125, 0.19512939453125, 0.2013397216796875, 0.207550048828125, 0.2137603759765625, 0.219970703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 13.0, 27.0, 47.0, 88.0, 129.0, 168.0, 172.0, 140.0, 84.0, 48.0, 26.0, 23.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07586669921875, -0.07139873504638672, -0.06693077087402344, -0.062462806701660156, -0.057994842529296875, -0.053526878356933594, -0.04905891418457031, -0.04459095001220703, -0.04012298583984375, -0.03565502166748047, -0.031187057495117188, -0.026719093322753906, -0.022251129150390625, -0.017783164978027344, -0.013315200805664062, -0.008847236633300781, -0.0043792724609375, 8.869171142578125e-05, 0.0045566558837890625, 0.009024620056152344, 0.013492584228515625, 0.017960548400878906, 0.022428512573242188, 0.02689647674560547, 0.03136444091796875, 0.03583240509033203, 0.04030036926269531, 0.044768333435058594, 0.049236297607421875, 0.053704261779785156, 0.05817222595214844, 0.06264019012451172, 0.067108154296875, 0.07157611846923828, 0.07604408264160156, 0.08051204681396484, 0.08498001098632812, 0.0894479751586914, 0.09391593933105469, 0.09838390350341797, 0.10285186767578125, 0.10731983184814453, 0.11178779602050781, 0.1162557601928711, 0.12072372436523438, 0.12519168853759766, 0.12965965270996094, 0.13412761688232422, 0.1385955810546875, 0.14306354522705078, 0.14753150939941406, 0.15199947357177734, 0.15646743774414062, 0.1609354019165039, 0.1654033660888672, 0.16987133026123047, 0.17433929443359375, 0.17880725860595703, 0.1832752227783203, 0.1877431869506836, 0.19221115112304688, 0.19667911529541016, 0.20114707946777344, 0.20561504364013672, 0.2100830078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 32.0, 123.0, 281.0, 363.0, 149.0, 37.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3114885091781616, -1.2109380960464478, -1.1103878021240234, -1.0098373889923096, -0.9092869758605957, -0.8087366223335266, -0.7081862688064575, -0.6076358556747437, -0.5070855021476746, -0.4065351188182831, -0.3059847354888916, -0.2054343819618225, -0.10488399863243103, -0.004333615303039551, 0.09621673822402954, 0.1967671513557434, 0.2973175048828125, 0.397867888212204, 0.49841827154159546, 0.5989686250686646, 0.6995190382003784, 0.8000693917274475, 0.9006197452545166, 1.0011701583862305, 1.1017205715179443, 1.2022709846496582, 1.3028212785720825, 1.4033716917037964, 1.5039221048355103, 1.6044723987579346, 1.7050228118896484, 1.8055732250213623, 1.906123399734497, 2.006673812866211, 2.107224225997925, 2.2077746391296387, 2.3083248138427734, 2.4088752269744873, 2.509425640106201, 2.609976053237915, 2.710526466369629, 2.8110768795013428, 2.9116272926330566, 3.0121774673461914, 3.1127278804779053, 3.213278293609619, 3.313828706741333, 3.414379119873047, 3.5149292945861816, 3.6154797077178955, 3.7160301208496094, 3.816580295562744, 3.917130708694458, 4.017681121826172, 4.118231773376465, 4.2187819480896, 4.319332599639893, 4.419882774353027, 4.52043342590332, 4.620983600616455, 4.721534252166748, 4.822084426879883, 4.922635078430176, 5.0231852531433105, 5.123735427856445]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 1.0, 5.0, 3.0, 6.0, 10.0, 14.0, 11.0, 10.0, 17.0, 20.0, 19.0, 24.0, 37.0, 42.0, 36.0, 46.0, 57.0, 63.0, 69.0, 61.0, 50.0, 63.0, 51.0, 41.0, 39.0, 33.0, 38.0, 27.0, 20.0, 16.0, 19.0, 15.0, 11.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.407359004020691, -1.3676804304122925, -1.328001856803894, -1.2883232831954956, -1.2486447095870972, -1.2089661359786987, -1.1692875623703003, -1.1296089887619019, -1.0899304151535034, -1.050251841545105, -1.0105732679367065, -0.9708946943283081, -0.9312161207199097, -0.8915375471115112, -0.8518589735031128, -0.8121803998947144, -0.7725018262863159, -0.7328232526779175, -0.693144679069519, -0.6534661054611206, -0.6137875318527222, -0.5741089582443237, -0.5344303846359253, -0.49475181102752686, -0.4550732374191284, -0.41539466381073, -0.37571609020233154, -0.3360375165939331, -0.29635894298553467, -0.25668036937713623, -0.2170017957687378, -0.17732322216033936, -0.13764476776123047, -0.09796619415283203, -0.058287620544433594, -0.018609046936035156, 0.02106952667236328, 0.06074810028076172, 0.10042667388916016, 0.1401052474975586, 0.17978382110595703, 0.21946239471435547, 0.2591409683227539, 0.29881954193115234, 0.3384981155395508, 0.3781766891479492, 0.41785526275634766, 0.4575338363647461, 0.49721240997314453, 0.536890983581543, 0.5765695571899414, 0.6162481307983398, 0.6559267044067383, 0.6956052780151367, 0.7352838516235352, 0.7749624252319336, 0.814640998840332, 0.8543195724487305, 0.8939981460571289, 0.9336767196655273, 0.9733552932739258, 1.0130338668823242, 1.0527124404907227, 1.092391014099121, 1.1320695877075195]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 14.0, 7.0, 15.0, 30.0, 51.0, 87.0, 140.0, 362.0, 1060.0, 5150.0, 4107461.0, 74789.0, 3654.0, 857.0, 300.0, 134.0, 58.0, 38.0, 33.0, 22.0, 14.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54296875, -0.5296974182128906, -0.5164260864257812, -0.5031547546386719, -0.4898834228515625, -0.4766120910644531, -0.46334075927734375, -0.4500694274902344, -0.436798095703125, -0.4235267639160156, -0.41025543212890625, -0.3969841003417969, -0.3837127685546875, -0.3704414367675781, -0.35717010498046875, -0.3438987731933594, -0.33062744140625, -0.3173561096191406, -0.30408477783203125, -0.2908134460449219, -0.2775421142578125, -0.2642707824707031, -0.25099945068359375, -0.23772811889648438, -0.224456787109375, -0.21118545532226562, -0.19791412353515625, -0.18464279174804688, -0.1713714599609375, -0.15810012817382812, -0.14482879638671875, -0.13155746459960938, -0.1182861328125, -0.10501480102539062, -0.09174346923828125, -0.07847213745117188, -0.0652008056640625, -0.051929473876953125, -0.03865814208984375, -0.025386810302734375, -0.012115478515625, 0.001155853271484375, 0.01442718505859375, 0.027698516845703125, 0.0409698486328125, 0.054241180419921875, 0.06751251220703125, 0.08078384399414062, 0.09405517578125, 0.10732650756835938, 0.12059783935546875, 0.13386917114257812, 0.1471405029296875, 0.16041183471679688, 0.17368316650390625, 0.18695449829101562, 0.200225830078125, 0.21349716186523438, 0.22676849365234375, 0.24003982543945312, 0.2533111572265625, 0.2665824890136719, 0.27985382080078125, 0.2931251525878906, 0.306396484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 10.0, 21.0, 22.0, 39.0, 64.0, 70.0, 99.0, 89.0, 94.0, 108.0, 99.0, 73.0, 60.0, 52.0, 35.0, 21.0, 15.0, 12.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.16132068634033203, -0.15735816955566406, -0.1533956527709961, -0.14943313598632812, -0.14547061920166016, -0.1415081024169922, -0.13754558563232422, -0.13358306884765625, -0.12962055206298828, -0.1256580352783203, -0.12169551849365234, -0.11773300170898438, -0.1137704849243164, -0.10980796813964844, -0.10584545135498047, -0.1018829345703125, -0.09792041778564453, -0.09395790100097656, -0.0899953842163086, -0.08603286743164062, -0.08207035064697266, -0.07810783386230469, -0.07414531707763672, -0.07018280029296875, -0.06622028350830078, -0.06225776672363281, -0.058295249938964844, -0.054332733154296875, -0.050370216369628906, -0.04640769958496094, -0.04244518280029297, -0.038482666015625, -0.03452014923095703, -0.030557632446289062, -0.026595115661621094, -0.022632598876953125, -0.018670082092285156, -0.014707565307617188, -0.010745048522949219, -0.00678253173828125, -0.0028200149536132812, 0.0011425018310546875, 0.005105018615722656, 0.009067535400390625, 0.013030052185058594, 0.016992568969726562, 0.02095508575439453, 0.0249176025390625, 0.02888011932373047, 0.03284263610839844, 0.036805152893066406, 0.040767669677734375, 0.044730186462402344, 0.04869270324707031, 0.05265522003173828, 0.05661773681640625, 0.06058025360107422, 0.06454277038574219, 0.06850528717041016, 0.07246780395507812, 0.0764303207397461, 0.08039283752441406, 0.08435535430908203, 0.08831787109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 5.0, 7.0, 4.0, 5.0, 8.0, 12.0, 15.0, 17.0, 18.0, 32.0, 29.0, 51.0, 52.0, 92.0, 97.0, 167.0, 263.0, 446.0, 931.0, 2092.0, 6132.0, 41799.0, 4117411.0, 17285.0, 3974.0, 1468.0, 724.0, 367.0, 226.0, 150.0, 103.0, 81.0, 70.0, 26.0, 33.0, 28.0, 27.0, 7.0, 8.0, 5.0, 11.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3422660827636719, -0.33199310302734375, -0.3217201232910156, -0.3114471435546875, -0.3011741638183594, -0.29090118408203125, -0.2806282043457031, -0.270355224609375, -0.2600822448730469, -0.24980926513671875, -0.23953628540039062, -0.2292633056640625, -0.21899032592773438, -0.20871734619140625, -0.19844436645507812, -0.18817138671875, -0.17789840698242188, -0.16762542724609375, -0.15735244750976562, -0.1470794677734375, -0.13680648803710938, -0.12653350830078125, -0.11626052856445312, -0.105987548828125, -0.09571456909179688, -0.08544158935546875, -0.07516860961914062, -0.0648956298828125, -0.054622650146484375, -0.04434967041015625, -0.034076690673828125, -0.0238037109375, -0.013530731201171875, -0.00325775146484375, 0.007015228271484375, 0.0172882080078125, 0.027561187744140625, 0.03783416748046875, 0.048107147216796875, 0.058380126953125, 0.06865310668945312, 0.07892608642578125, 0.08919906616210938, 0.0994720458984375, 0.10974502563476562, 0.12001800537109375, 0.13029098510742188, 0.14056396484375, 0.15083694458007812, 0.16110992431640625, 0.17138290405273438, 0.1816558837890625, 0.19192886352539062, 0.20220184326171875, 0.21247482299804688, 0.222747802734375, 0.23302078247070312, 0.24329376220703125, 0.2535667419433594, 0.2638397216796875, 0.2741127014160156, 0.28438568115234375, 0.2946586608886719, 0.304931640625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 16.0, 37.0, 3729.0, 205.0, 37.0, 18.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.0878591537475586, -0.08502006530761719, -0.08218097686767578, -0.07934188842773438, -0.07650279998779297, -0.07366371154785156, -0.07082462310791016, -0.06798553466796875, -0.06514644622802734, -0.06230735778808594, -0.05946826934814453, -0.056629180908203125, -0.05379009246826172, -0.05095100402832031, -0.048111915588378906, -0.0452728271484375, -0.042433738708496094, -0.03959465026855469, -0.03675556182861328, -0.033916473388671875, -0.03107738494873047, -0.028238296508789062, -0.025399208068847656, -0.02256011962890625, -0.019721031188964844, -0.016881942749023438, -0.014042854309082031, -0.011203765869140625, -0.008364677429199219, -0.0055255889892578125, -0.0026865005493164062, 0.000152587890625, 0.0029916763305664062, 0.0058307647705078125, 0.008669853210449219, 0.011508941650390625, 0.014348030090332031, 0.017187118530273438, 0.020026206970214844, 0.02286529541015625, 0.025704383850097656, 0.028543472290039062, 0.03138256072998047, 0.034221649169921875, 0.03706073760986328, 0.03989982604980469, 0.042738914489746094, 0.0455780029296875, 0.048417091369628906, 0.05125617980957031, 0.05409526824951172, 0.056934356689453125, 0.05977344512939453, 0.06261253356933594, 0.06545162200927734, 0.06829071044921875, 0.07112979888916016, 0.07396888732910156, 0.07680797576904297, 0.07964706420898438, 0.08248615264892578, 0.08532524108886719, 0.0881643295288086, 0.09100341796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 23.0, 36.0, 99.0, 222.0, 299.0, 179.0, 81.0, 38.0, 14.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4417669177055359, -0.4273221790790558, -0.4128774404525757, -0.3984326720237732, -0.3839879333972931, -0.369543194770813, -0.3550984263420105, -0.3406536877155304, -0.3262089490890503, -0.3117642104625702, -0.2973194718360901, -0.2828747034072876, -0.2684299647808075, -0.2539852261543274, -0.2395404726266861, -0.2250957190990448, -0.2106509804725647, -0.1962062418460846, -0.1817614883184433, -0.167316734790802, -0.1528719961643219, -0.1384272575378418, -0.1239825040102005, -0.1095377579331398, -0.0950930118560791, -0.0806482657790184, -0.0662035197019577, -0.051758773624897, -0.037314027547836304, -0.022869281470775604, -0.008424535393714905, 0.006020210683345795, 0.020464956760406494, 0.034909702837467194, 0.04935444891452789, 0.06379919499158859, 0.07824394106864929, 0.09268868714570999, 0.10713343322277069, 0.12157817929983139, 0.1360229253768921, 0.1504676640033722, 0.1649124175310135, 0.17935717105865479, 0.1938019096851349, 0.208246648311615, 0.2226914018392563, 0.23713615536689758, 0.2515808939933777, 0.2660256326198578, 0.2804703712463379, 0.2949151396751404, 0.3093598783016205, 0.3238046169281006, 0.3382493853569031, 0.3526941239833832, 0.3671388626098633, 0.3815836012363434, 0.3960283398628235, 0.410473108291626, 0.4249178469181061, 0.4393625855445862, 0.45380735397338867, 0.4682520925998688, 0.4826968312263489]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 12.0, 8.0, 9.0, 11.0, 13.0, 13.0, 18.0, 29.0, 18.0, 20.0, 25.0, 40.0, 49.0, 39.0, 36.0, 36.0, 42.0, 44.0, 39.0, 51.0, 48.0, 39.0, 42.0, 41.0, 40.0, 34.0, 26.0, 22.0, 17.0, 22.0, 18.0, 19.0, 18.0, 10.0, 8.0, 9.0, 10.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 5.0, 0.0, 3.0], "bins": [-0.11567831039428711, -0.11235958337783813, -0.10904086381196976, -0.10572214424610138, -0.1024034172296524, -0.09908469021320343, -0.09576597064733505, -0.09244725108146667, -0.0891285240650177, -0.08580979704856873, -0.08249107748270035, -0.07917235791683197, -0.075853630900383, -0.07253490388393402, -0.06921618431806564, -0.06589746475219727, -0.06257873773574829, -0.059260014444589615, -0.05594129115343094, -0.05262256786227226, -0.049303844571113586, -0.04598512127995491, -0.042666397988796234, -0.03934767469763756, -0.03602895140647888, -0.032710228115320206, -0.02939150482416153, -0.026072781533002853, -0.022754058241844177, -0.0194353349506855, -0.016116611659526825, -0.012797888368368149, -0.009479165077209473, -0.0061604417860507965, -0.0028417184948921204, 0.0004770047962665558, 0.003795728087425232, 0.007114451378583908, 0.010433174669742584, 0.01375189796090126, 0.017070621252059937, 0.020389344543218613, 0.02370806783437729, 0.027026791125535965, 0.03034551441669464, 0.03366423770785332, 0.03698296099901199, 0.04030168429017067, 0.043620407581329346, 0.04693913087248802, 0.0502578541636467, 0.053576577454805374, 0.05689530074596405, 0.060214024037122726, 0.0635327473282814, 0.06685146689414978, 0.07017019391059875, 0.07348892092704773, 0.07680764049291611, 0.08012636005878448, 0.08344508707523346, 0.08676381409168243, 0.09008253365755081, 0.09340125322341919, 0.09671998023986816]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 6.0, 10.0, 11.0, 21.0, 30.0, 34.0, 66.0, 136.0, 257.0, 576.0, 1293.0, 3644.0, 15393.0, 179164.0, 754777.0, 78890.0, 9673.0, 2686.0, 988.0, 414.0, 212.0, 107.0, 72.0, 27.0, 22.0, 9.0, 11.0, 8.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.27918243408203125, -0.2702789306640625, -0.26137542724609375, -0.252471923828125, -0.24356842041015625, -0.2346649169921875, -0.22576141357421875, -0.21685791015625, -0.20795440673828125, -0.1990509033203125, -0.19014739990234375, -0.181243896484375, -0.17234039306640625, -0.1634368896484375, -0.15453338623046875, -0.1456298828125, -0.13672637939453125, -0.1278228759765625, -0.11891937255859375, -0.110015869140625, -0.10111236572265625, -0.0922088623046875, -0.08330535888671875, -0.07440185546875, -0.06549835205078125, -0.0565948486328125, -0.04769134521484375, -0.038787841796875, -0.02988433837890625, -0.0209808349609375, -0.01207733154296875, -0.003173828125, 0.00572967529296875, 0.0146331787109375, 0.02353668212890625, 0.032440185546875, 0.04134368896484375, 0.0502471923828125, 0.05915069580078125, 0.06805419921875, 0.07695770263671875, 0.0858612060546875, 0.09476470947265625, 0.103668212890625, 0.11257171630859375, 0.1214752197265625, 0.13037872314453125, 0.1392822265625, 0.14818572998046875, 0.1570892333984375, 0.16599273681640625, 0.174896240234375, 0.18379974365234375, 0.1927032470703125, 0.20160675048828125, 0.21051025390625, 0.21941375732421875, 0.2283172607421875, 0.23722076416015625, 0.246124267578125, 0.25502777099609375, 0.2639312744140625, 0.27283477783203125, 0.28173828125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 12.0, 10.0, 21.0, 40.0, 70.0, 51.0, 78.0, 91.0, 103.0, 92.0, 99.0, 68.0, 76.0, 47.0, 44.0, 27.0, 24.0, 17.0, 10.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.16112613677978516, -0.1572132110595703, -0.15330028533935547, -0.14938735961914062, -0.14547443389892578, -0.14156150817871094, -0.1376485824584961, -0.13373565673828125, -0.1298227310180664, -0.12590980529785156, -0.12199687957763672, -0.11808395385742188, -0.11417102813720703, -0.11025810241699219, -0.10634517669677734, -0.1024322509765625, -0.09851932525634766, -0.09460639953613281, -0.09069347381591797, -0.08678054809570312, -0.08286762237548828, -0.07895469665527344, -0.0750417709350586, -0.07112884521484375, -0.0672159194946289, -0.06330299377441406, -0.05939006805419922, -0.055477142333984375, -0.05156421661376953, -0.04765129089355469, -0.043738365173339844, -0.039825439453125, -0.035912513732910156, -0.03199958801269531, -0.02808666229248047, -0.024173736572265625, -0.02026081085205078, -0.016347885131835938, -0.012434959411621094, -0.00852203369140625, -0.004609107971191406, -0.0006961822509765625, 0.0032167434692382812, 0.007129669189453125, 0.011042594909667969, 0.014955520629882812, 0.018868446350097656, 0.0227813720703125, 0.026694297790527344, 0.030607223510742188, 0.03452014923095703, 0.038433074951171875, 0.04234600067138672, 0.04625892639160156, 0.050171852111816406, 0.05408477783203125, 0.057997703552246094, 0.06191062927246094, 0.06582355499267578, 0.06973648071289062, 0.07364940643310547, 0.07756233215332031, 0.08147525787353516, 0.08538818359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 6.0, 3.0, 9.0, 17.0, 21.0, 12.0, 22.0, 28.0, 42.0, 47.0, 70.0, 114.0, 160.0, 345.0, 673.0, 1730.0, 8281.0, 156980.0, 835852.0, 37797.0, 3992.0, 1116.0, 493.0, 236.0, 137.0, 85.0, 55.0, 57.0, 34.0, 30.0, 22.0, 18.0, 16.0, 11.0, 8.0, 7.0, 5.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.287841796875, -0.27919769287109375, -0.2705535888671875, -0.26190948486328125, -0.253265380859375, -0.24462127685546875, -0.2359771728515625, -0.22733306884765625, -0.21868896484375, -0.21004486083984375, -0.2014007568359375, -0.19275665283203125, -0.184112548828125, -0.17546844482421875, -0.1668243408203125, -0.15818023681640625, -0.1495361328125, -0.14089202880859375, -0.1322479248046875, -0.12360382080078125, -0.114959716796875, -0.10631561279296875, -0.0976715087890625, -0.08902740478515625, -0.08038330078125, -0.07173919677734375, -0.0630950927734375, -0.05445098876953125, -0.045806884765625, -0.03716278076171875, -0.0285186767578125, -0.01987457275390625, -0.01123046875, -0.00258636474609375, 0.0060577392578125, 0.01470184326171875, 0.023345947265625, 0.03199005126953125, 0.0406341552734375, 0.04927825927734375, 0.05792236328125, 0.06656646728515625, 0.0752105712890625, 0.08385467529296875, 0.092498779296875, 0.10114288330078125, 0.1097869873046875, 0.11843109130859375, 0.1270751953125, 0.13571929931640625, 0.1443634033203125, 0.15300750732421875, 0.161651611328125, 0.17029571533203125, 0.1789398193359375, 0.18758392333984375, 0.19622802734375, 0.20487213134765625, 0.2135162353515625, 0.22216033935546875, 0.230804443359375, 0.23944854736328125, 0.2480926513671875, 0.25673675537109375, 0.265380859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 13.0, 5.0, 7.0, 11.0, 11.0, 13.0, 17.0, 13.0, 25.0, 28.0, 31.0, 30.0, 32.0, 32.0, 45.0, 52.0, 38.0, 40.0, 46.0, 59.0, 44.0, 47.0, 46.0, 39.0, 32.0, 27.0, 26.0, 31.0, 23.0, 31.0, 24.0, 10.0, 18.0, 13.0, 12.0, 7.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2171630859375, -0.20943260192871094, -0.20170211791992188, -0.1939716339111328, -0.18624114990234375, -0.1785106658935547, -0.17078018188476562, -0.16304969787597656, -0.1553192138671875, -0.14758872985839844, -0.13985824584960938, -0.1321277618408203, -0.12439727783203125, -0.11666679382324219, -0.10893630981445312, -0.10120582580566406, -0.093475341796875, -0.08574485778808594, -0.07801437377929688, -0.07028388977050781, -0.06255340576171875, -0.05482292175292969, -0.047092437744140625, -0.03936195373535156, -0.0316314697265625, -0.023900985717773438, -0.016170501708984375, -0.008440017700195312, -0.00070953369140625, 0.0070209503173828125, 0.014751434326171875, 0.022481918334960938, 0.03021240234375, 0.03794288635253906, 0.045673370361328125, 0.05340385437011719, 0.06113433837890625, 0.06886482238769531, 0.07659530639648438, 0.08432579040527344, 0.0920562744140625, 0.09978675842285156, 0.10751724243164062, 0.11524772644042969, 0.12297821044921875, 0.1307086944580078, 0.13843917846679688, 0.14616966247558594, 0.153900146484375, 0.16163063049316406, 0.16936111450195312, 0.1770915985107422, 0.18482208251953125, 0.1925525665283203, 0.20028305053710938, 0.20801353454589844, 0.2157440185546875, 0.22347450256347656, 0.23120498657226562, 0.2389354705810547, 0.24666595458984375, 0.2543964385986328, 0.2621269226074219, 0.26985740661621094, 0.277587890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 3.0, 6.0, 7.0, 14.0, 12.0, 14.0, 26.0, 33.0, 59.0, 78.0, 151.0, 214.0, 426.0, 965.0, 2975.0, 14308.0, 161630.0, 795858.0, 60416.0, 7734.0, 1992.0, 709.0, 352.0, 184.0, 122.0, 63.0, 49.0, 35.0, 23.0, 20.0, 13.0, 12.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09136962890625, -0.08878326416015625, -0.0861968994140625, -0.08361053466796875, -0.081024169921875, -0.07843780517578125, -0.0758514404296875, -0.07326507568359375, -0.0706787109375, -0.06809234619140625, -0.0655059814453125, -0.06291961669921875, -0.060333251953125, -0.05774688720703125, -0.0551605224609375, -0.05257415771484375, -0.04998779296875, -0.04740142822265625, -0.0448150634765625, -0.04222869873046875, -0.039642333984375, -0.03705596923828125, -0.0344696044921875, -0.03188323974609375, -0.029296875, -0.02671051025390625, -0.0241241455078125, -0.02153778076171875, -0.018951416015625, -0.01636505126953125, -0.0137786865234375, -0.01119232177734375, -0.00860595703125, -0.00601959228515625, -0.0034332275390625, -0.00084686279296875, 0.001739501953125, 0.00432586669921875, 0.0069122314453125, 0.00949859619140625, 0.0120849609375, 0.01467132568359375, 0.0172576904296875, 0.01984405517578125, 0.022430419921875, 0.02501678466796875, 0.0276031494140625, 0.03018951416015625, 0.03277587890625, 0.03536224365234375, 0.0379486083984375, 0.04053497314453125, 0.043121337890625, 0.04570770263671875, 0.0482940673828125, 0.05088043212890625, 0.053466796875, 0.05605316162109375, 0.0586395263671875, 0.06122589111328125, 0.063812255859375, 0.06639862060546875, 0.0689849853515625, 0.07157135009765625, 0.07415771484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 10.0, 7.0, 11.0, 11.0, 14.0, 17.0, 23.0, 34.0, 37.0, 40.0, 45.0, 89.0, 92.0, 98.0, 78.0, 78.0, 63.0, 53.0, 45.0, 33.0, 16.0, 33.0, 21.0, 9.0, 13.0, 6.0, 8.0, 8.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0967254638671875e-05, -1.0611489415168762e-05, -1.025572419166565e-05, -9.899958968162537e-06, -9.544193744659424e-06, -9.188428521156311e-06, -8.832663297653198e-06, -8.476898074150085e-06, -8.121132850646973e-06, -7.76536762714386e-06, -7.409602403640747e-06, -7.053837180137634e-06, -6.6980719566345215e-06, -6.342306733131409e-06, -5.986541509628296e-06, -5.630776286125183e-06, -5.27501106262207e-06, -4.9192458391189575e-06, -4.563480615615845e-06, -4.207715392112732e-06, -3.851950168609619e-06, -3.4961849451065063e-06, -3.1404197216033936e-06, -2.7846544981002808e-06, -2.428889274597168e-06, -2.073124051094055e-06, -1.7173588275909424e-06, -1.3615936040878296e-06, -1.0058283805847168e-06, -6.50063157081604e-07, -2.942979335784912e-07, 6.146728992462158e-08, 4.172325134277344e-07, 7.729977369308472e-07, 1.12876296043396e-06, 1.4845281839370728e-06, 1.8402934074401855e-06, 2.1960586309432983e-06, 2.551823854446411e-06, 2.907589077949524e-06, 3.2633543014526367e-06, 3.6191195249557495e-06, 3.974884748458862e-06, 4.330649971961975e-06, 4.686415195465088e-06, 5.042180418968201e-06, 5.3979456424713135e-06, 5.753710865974426e-06, 6.109476089477539e-06, 6.465241312980652e-06, 6.821006536483765e-06, 7.1767717599868774e-06, 7.53253698348999e-06, 7.888302206993103e-06, 8.244067430496216e-06, 8.599832653999329e-06, 8.955597877502441e-06, 9.311363101005554e-06, 9.667128324508667e-06, 1.002289354801178e-05, 1.0378658771514893e-05, 1.0734423995018005e-05, 1.1090189218521118e-05, 1.1445954442024231e-05, 1.1801719665527344e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 13.0, 9.0, 18.0, 26.0, 45.0, 85.0, 139.0, 256.0, 537.0, 1355.0, 4253.0, 23064.0, 391437.0, 590077.0, 29478.0, 5042.0, 1465.0, 563.0, 285.0, 142.0, 97.0, 54.0, 41.0, 19.0, 14.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.10024166107177734, -0.09690666198730469, -0.09357166290283203, -0.09023666381835938, -0.08690166473388672, -0.08356666564941406, -0.0802316665649414, -0.07689666748046875, -0.0735616683959961, -0.07022666931152344, -0.06689167022705078, -0.06355667114257812, -0.06022167205810547, -0.05688667297363281, -0.053551673889160156, -0.0502166748046875, -0.046881675720214844, -0.04354667663574219, -0.04021167755126953, -0.036876678466796875, -0.03354167938232422, -0.030206680297851562, -0.026871681213378906, -0.02353668212890625, -0.020201683044433594, -0.016866683959960938, -0.013531684875488281, -0.010196685791015625, -0.006861686706542969, -0.0035266876220703125, -0.00019168853759765625, 0.003143310546875, 0.006478309631347656, 0.009813308715820312, 0.013148307800292969, 0.016483306884765625, 0.01981830596923828, 0.023153305053710938, 0.026488304138183594, 0.02982330322265625, 0.033158302307128906, 0.03649330139160156, 0.03982830047607422, 0.043163299560546875, 0.04649829864501953, 0.04983329772949219, 0.053168296813964844, 0.0565032958984375, 0.059838294982910156, 0.06317329406738281, 0.06650829315185547, 0.06984329223632812, 0.07317829132080078, 0.07651329040527344, 0.0798482894897461, 0.08318328857421875, 0.0865182876586914, 0.08985328674316406, 0.09318828582763672, 0.09652328491210938, 0.09985828399658203, 0.10319328308105469, 0.10652828216552734, 0.10986328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 8.0, 8.0, 18.0, 23.0, 31.0, 43.0, 61.0, 104.0, 144.0, 145.0, 141.0, 100.0, 66.0, 36.0, 22.0, 17.0, 12.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09576416015625, -0.09200382232666016, -0.08824348449707031, -0.08448314666748047, -0.08072280883789062, -0.07696247100830078, -0.07320213317871094, -0.0694417953491211, -0.06568145751953125, -0.061921119689941406, -0.05816078186035156, -0.05440044403076172, -0.050640106201171875, -0.04687976837158203, -0.04311943054199219, -0.039359092712402344, -0.0355987548828125, -0.031838417053222656, -0.028078079223632812, -0.02431774139404297, -0.020557403564453125, -0.01679706573486328, -0.013036727905273438, -0.009276390075683594, -0.00551605224609375, -0.0017557144165039062, 0.0020046234130859375, 0.005764961242675781, 0.009525299072265625, 0.013285636901855469, 0.017045974731445312, 0.020806312561035156, 0.024566650390625, 0.028326988220214844, 0.03208732604980469, 0.03584766387939453, 0.039608001708984375, 0.04336833953857422, 0.04712867736816406, 0.050889015197753906, 0.05464935302734375, 0.058409690856933594, 0.06217002868652344, 0.06593036651611328, 0.06969070434570312, 0.07345104217529297, 0.07721138000488281, 0.08097171783447266, 0.0847320556640625, 0.08849239349365234, 0.09225273132324219, 0.09601306915283203, 0.09977340698242188, 0.10353374481201172, 0.10729408264160156, 0.1110544204711914, 0.11481475830078125, 0.1185750961303711, 0.12233543395996094, 0.12609577178955078, 0.12985610961914062, 0.13361644744873047, 0.1373767852783203, 0.14113712310791016, 0.1448974609375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 3.0, 11.0, 17.0, 27.0, 50.0, 59.0, 96.0, 116.0, 132.0, 147.0, 114.0, 87.0, 55.0, 33.0, 23.0, 14.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.5127534866333008, -1.4784622192382812, -1.4441709518432617, -1.4098796844482422, -1.3755885362625122, -1.3412972688674927, -1.3070060014724731, -1.2727147340774536, -1.238423466682434, -1.2041321992874146, -1.169840931892395, -1.135549783706665, -1.1012585163116455, -1.066967248916626, -1.0326759815216064, -0.9983847141265869, -0.9640935063362122, -0.9298022389411926, -0.8955110311508179, -0.8612197637557983, -0.8269284963607788, -0.7926372289657593, -0.7583460211753845, -0.724054753780365, -0.6897635459899902, -0.6554722785949707, -0.621181070804596, -0.5868898034095764, -0.5525985360145569, -0.5183073282241821, -0.4840160608291626, -0.44972479343414307, -0.41543352603912354, -0.3811422884464264, -0.34685102105140686, -0.3125597834587097, -0.2782685160636902, -0.24397727847099304, -0.2096860408782959, -0.17539478838443756, -0.14110353589057922, -0.10681228339672089, -0.07252103835344315, -0.038229793310165405, -0.003938540816307068, 0.03035271167755127, 0.06464394927024841, 0.09893520176410675, 0.1332264542579651, 0.16751770675182343, 0.20180895924568176, 0.2361001968383789, 0.27039146423339844, 0.3046827018260956, 0.3389739394187927, 0.37326520681381226, 0.4075564444065094, 0.44184768199920654, 0.4761389493942261, 0.5104302167892456, 0.5447214245796204, 0.5790126919746399, 0.6133038997650146, 0.6475951671600342, 0.6818864345550537]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 5.0, 10.0, 19.0, 11.0, 12.0, 29.0, 21.0, 21.0, 34.0, 37.0, 41.0, 39.0, 43.0, 50.0, 54.0, 50.0, 43.0, 55.0, 47.0, 51.0, 41.0, 47.0, 29.0, 21.0, 30.0, 23.0, 22.0, 16.0, 19.0, 15.0, 9.0, 9.0, 10.0, 9.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2254700660705566, -1.1885262727737427, -1.1515825986862183, -1.1146388053894043, -1.0776951313018799, -1.040751338005066, -1.003807544708252, -0.9668638110160828, -0.9299200773239136, -0.8929763436317444, -0.8560326099395752, -0.8190888166427612, -0.782145082950592, -0.7452013492584229, -0.7082575559616089, -0.6713138222694397, -0.6343700885772705, -0.5974263548851013, -0.5604826211929321, -0.5235388278961182, -0.486595094203949, -0.4496513605117798, -0.4127075970172882, -0.37576383352279663, -0.33882009983062744, -0.30187636613845825, -0.2649326026439667, -0.2279888540506363, -0.1910451054573059, -0.15410135686397552, -0.11715760827064514, -0.08021384477615356, -0.043270111083984375, -0.006326362490653992, 0.03061738610267639, 0.06756113469600677, 0.10450488328933716, 0.14144863188266754, 0.17839238047599792, 0.2153361439704895, 0.2522798776626587, 0.2892236113548279, 0.32616737484931946, 0.36311113834381104, 0.4000548720359802, 0.4369986057281494, 0.473942369222641, 0.5108861327171326, 0.5478298664093018, 0.584773600101471, 0.6217173337936401, 0.6586611270904541, 0.6956048607826233, 0.7325485944747925, 0.7694923877716064, 0.8064361214637756, 0.8433798551559448, 0.880323588848114, 0.9172673225402832, 0.9542111158370972, 0.9911548495292664, 1.0280985832214355, 1.0650423765182495, 1.1019861698150635, 1.138929843902588]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 6.0, 15.0, 14.0, 33.0, 34.0, 70.0, 120.0, 268.0, 907.0, 6374.0, 4127621.0, 55401.0, 2485.0, 510.0, 161.0, 101.0, 70.0, 33.0, 23.0, 17.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.626953125, -0.6123046875, -0.59765625, -0.5830078125, -0.568359375, -0.5537109375, -0.5390625, -0.5244140625, -0.509765625, -0.4951171875, -0.48046875, -0.4658203125, -0.451171875, -0.4365234375, -0.421875, -0.4072265625, -0.392578125, -0.3779296875, -0.36328125, -0.3486328125, -0.333984375, -0.3193359375, -0.3046875, -0.2900390625, -0.275390625, -0.2607421875, -0.24609375, -0.2314453125, -0.216796875, -0.2021484375, -0.1875, -0.1728515625, -0.158203125, -0.1435546875, -0.12890625, -0.1142578125, -0.099609375, -0.0849609375, -0.0703125, -0.0556640625, -0.041015625, -0.0263671875, -0.01171875, 0.0029296875, 0.017578125, 0.0322265625, 0.046875, 0.0615234375, 0.076171875, 0.0908203125, 0.10546875, 0.1201171875, 0.134765625, 0.1494140625, 0.1640625, 0.1787109375, 0.193359375, 0.2080078125, 0.22265625, 0.2373046875, 0.251953125, 0.2666015625, 0.28125, 0.2958984375, 0.310546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 0.0, 8.0, 7.0, 14.0, 13.0, 16.0, 41.0, 52.0, 73.0, 74.0, 89.0, 108.0, 91.0, 119.0, 62.0, 69.0, 54.0, 37.0, 26.0, 21.0, 13.0, 10.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165771484375, -0.16182804107666016, -0.1578845977783203, -0.15394115447998047, -0.14999771118164062, -0.14605426788330078, -0.14211082458496094, -0.1381673812866211, -0.13422393798828125, -0.1302804946899414, -0.12633705139160156, -0.12239360809326172, -0.11845016479492188, -0.11450672149658203, -0.11056327819824219, -0.10661983489990234, -0.1026763916015625, -0.09873294830322266, -0.09478950500488281, -0.09084606170654297, -0.08690261840820312, -0.08295917510986328, -0.07901573181152344, -0.0750722885131836, -0.07112884521484375, -0.0671854019165039, -0.06324195861816406, -0.05929851531982422, -0.055355072021484375, -0.05141162872314453, -0.04746818542480469, -0.043524742126464844, -0.039581298828125, -0.035637855529785156, -0.03169441223144531, -0.02775096893310547, -0.023807525634765625, -0.01986408233642578, -0.015920639038085938, -0.011977195739746094, -0.00803375244140625, -0.004090309143066406, -0.0001468658447265625, 0.0037965774536132812, 0.007740020751953125, 0.011683464050292969, 0.015626907348632812, 0.019570350646972656, 0.0235137939453125, 0.027457237243652344, 0.03140068054199219, 0.03534412384033203, 0.039287567138671875, 0.04323101043701172, 0.04717445373535156, 0.051117897033691406, 0.05506134033203125, 0.059004783630371094, 0.06294822692871094, 0.06689167022705078, 0.07083511352539062, 0.07477855682373047, 0.07872200012207031, 0.08266544342041016, 0.08660888671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 13.0, 10.0, 10.0, 17.0, 27.0, 33.0, 43.0, 64.0, 115.0, 144.0, 235.0, 287.0, 474.0, 744.0, 1208.0, 2161.0, 4249.0, 10493.0, 36255.0, 3933369.0, 167955.0, 21095.0, 7327.0, 3320.0, 1705.0, 1027.0, 620.0, 430.0, 269.0, 173.0, 111.0, 88.0, 59.0, 55.0, 21.0, 16.0, 26.0, 13.0, 5.0, 8.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1578369140625, -0.1525440216064453, -0.14725112915039062, -0.14195823669433594, -0.13666534423828125, -0.13137245178222656, -0.12607955932617188, -0.12078666687011719, -0.1154937744140625, -0.11020088195800781, -0.10490798950195312, -0.09961509704589844, -0.09432220458984375, -0.08902931213378906, -0.08373641967773438, -0.07844352722167969, -0.073150634765625, -0.06785774230957031, -0.06256484985351562, -0.05727195739746094, -0.05197906494140625, -0.04668617248535156, -0.041393280029296875, -0.03610038757324219, -0.0308074951171875, -0.025514602661132812, -0.020221710205078125, -0.014928817749023438, -0.00963592529296875, -0.0043430328369140625, 0.000949859619140625, 0.0062427520751953125, 0.01153564453125, 0.016828536987304688, 0.022121429443359375, 0.027414321899414062, 0.03270721435546875, 0.03800010681152344, 0.043292999267578125, 0.04858589172363281, 0.0538787841796875, 0.05917167663574219, 0.06446456909179688, 0.06975746154785156, 0.07505035400390625, 0.08034324645996094, 0.08563613891601562, 0.09092903137207031, 0.096221923828125, 0.10151481628417969, 0.10680770874023438, 0.11210060119628906, 0.11739349365234375, 0.12268638610839844, 0.12797927856445312, 0.1332721710205078, 0.1385650634765625, 0.1438579559326172, 0.14915084838867188, 0.15444374084472656, 0.15973663330078125, 0.16502952575683594, 0.17032241821289062, 0.1756153106689453, 0.180908203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 11.0, 9.0, 31.0, 49.0, 217.0, 3540.0, 106.0, 43.0, 16.0, 9.0, 12.0, 4.0, 7.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10321044921875, -0.09969043731689453, -0.09617042541503906, -0.0926504135131836, -0.08913040161132812, -0.08561038970947266, -0.08209037780761719, -0.07857036590576172, -0.07505035400390625, -0.07153034210205078, -0.06801033020019531, -0.06449031829833984, -0.060970306396484375, -0.057450294494628906, -0.05393028259277344, -0.05041027069091797, -0.0468902587890625, -0.04337024688720703, -0.03985023498535156, -0.036330223083496094, -0.032810211181640625, -0.029290199279785156, -0.025770187377929688, -0.02225017547607422, -0.01873016357421875, -0.015210151672363281, -0.011690139770507812, -0.008170127868652344, -0.004650115966796875, -0.0011301040649414062, 0.0023899078369140625, 0.005909919738769531, 0.009429931640625, 0.012949943542480469, 0.016469955444335938, 0.019989967346191406, 0.023509979248046875, 0.027029991149902344, 0.030550003051757812, 0.03407001495361328, 0.03759002685546875, 0.04111003875732422, 0.04463005065917969, 0.048150062561035156, 0.051670074462890625, 0.055190086364746094, 0.05871009826660156, 0.06223011016845703, 0.0657501220703125, 0.06927013397216797, 0.07279014587402344, 0.0763101577758789, 0.07983016967773438, 0.08335018157958984, 0.08687019348144531, 0.09039020538330078, 0.09391021728515625, 0.09743022918701172, 0.10095024108886719, 0.10447025299072266, 0.10799026489257812, 0.1115102767944336, 0.11503028869628906, 0.11855030059814453, 0.1220703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 13.0, 45.0, 96.0, 198.0, 272.0, 198.0, 89.0, 52.0, 17.0, 6.0, 8.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20950669050216675, -0.18953141570091248, -0.169556125998497, -0.14958083629608154, -0.12960556149482727, -0.1096302792429924, -0.08965499699115753, -0.06967970728874207, -0.04970443248748779, -0.029729150235652924, -0.009753867983818054, 0.010221414268016815, 0.030196696519851685, 0.050171978771686554, 0.07014726102352142, 0.09012255072593689, 0.11009782552719116, 0.13007310032844543, 0.1500483900308609, 0.17002367973327637, 0.18999895453453064, 0.2099742293357849, 0.22994951903820038, 0.24992480874061584, 0.2699000835418701, 0.2898753583431244, 0.30985063314437866, 0.3298259377479553, 0.3498012125492096, 0.36977648735046387, 0.3897517919540405, 0.4097270667552948, 0.4297022819519043, 0.44967755675315857, 0.46965283155441284, 0.4896281361579895, 0.5096033811569214, 0.529578685760498, 0.5495539903640747, 0.5695292949676514, 0.5895045399665833, 0.6094798445701599, 0.6294550895690918, 0.6494303941726685, 0.6694056987762451, 0.689380943775177, 0.7093562483787537, 0.7293314933776855, 0.7493067979812622, 0.7692821025848389, 0.7892573475837708, 0.8092326521873474, 0.8292078971862793, 0.849183201789856, 0.8691585063934326, 0.8891338109970093, 0.9091090559959412, 0.9290843605995178, 0.9490596055984497, 0.9690349102020264, 0.989010214805603, 1.0089855194091797, 1.0289607048034668, 1.0489360094070435, 1.0689113140106201]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 3.0, 6.0, 7.0, 12.0, 14.0, 26.0, 23.0, 14.0, 22.0, 21.0, 30.0, 32.0, 32.0, 38.0, 53.0, 42.0, 48.0, 53.0, 66.0, 40.0, 28.0, 40.0, 41.0, 31.0, 38.0, 27.0, 24.0, 31.0, 29.0, 15.0, 21.0, 16.0, 13.0, 14.0, 7.0, 9.0, 5.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.17073500156402588, -0.165257066488266, -0.1597791314125061, -0.15430119633674622, -0.14882326126098633, -0.14334532618522644, -0.13786739110946655, -0.13238945603370667, -0.12691152095794678, -0.12143358588218689, -0.115955650806427, -0.11047771573066711, -0.10499978065490723, -0.09952184557914734, -0.09404391795396805, -0.08856598287820816, -0.08308805525302887, -0.07761012017726898, -0.0721321851015091, -0.0666542500257492, -0.06117631867527962, -0.05569838359951973, -0.05022045224905014, -0.04474251717329025, -0.039264582097530365, -0.03378664702177048, -0.02830871380865574, -0.022830780595541, -0.017352845519781113, -0.011874910444021225, -0.006396979093551636, -0.000919044017791748, 0.00455889105796814, 0.010036825202405453, 0.015514759346842766, 0.020992692559957504, 0.026470627635717392, 0.03194856271147728, 0.03742649406194687, 0.04290442913770676, 0.048382364213466644, 0.05386029928922653, 0.05933823436498642, 0.06481616199016571, 0.0702940970659256, 0.07577203214168549, 0.08124996721744537, 0.08672790229320526, 0.09220583736896515, 0.09768377244472504, 0.10316170752048492, 0.10863964259624481, 0.1141175776720047, 0.11959551274776459, 0.12507343292236328, 0.13055136799812317, 0.13602930307388306, 0.14150723814964294, 0.14698517322540283, 0.15246310830116272, 0.1579410433769226, 0.1634189784526825, 0.16889691352844238, 0.17437484860420227, 0.17985278367996216]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 5.0, 6.0, 7.0, 11.0, 29.0, 31.0, 46.0, 63.0, 94.0, 186.0, 325.0, 573.0, 1418.0, 3438.0, 9551.0, 33076.0, 133182.0, 433182.0, 319346.0, 81078.0, 21446.0, 6829.0, 2445.0, 971.0, 481.0, 288.0, 156.0, 84.0, 55.0, 52.0, 24.0, 19.0, 13.0, 8.0, 9.0, 3.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1671142578125, -0.16217422485351562, -0.15723419189453125, -0.15229415893554688, -0.1473541259765625, -0.14241409301757812, -0.13747406005859375, -0.13253402709960938, -0.127593994140625, -0.12265396118164062, -0.11771392822265625, -0.11277389526367188, -0.1078338623046875, -0.10289382934570312, -0.09795379638671875, -0.09301376342773438, -0.08807373046875, -0.08313369750976562, -0.07819366455078125, -0.07325363159179688, -0.0683135986328125, -0.06337356567382812, -0.05843353271484375, -0.053493499755859375, -0.048553466796875, -0.043613433837890625, -0.03867340087890625, -0.033733367919921875, -0.0287933349609375, -0.023853302001953125, -0.01891326904296875, -0.013973236083984375, -0.009033203125, -0.004093170166015625, 0.00084686279296875, 0.005786895751953125, 0.0107269287109375, 0.015666961669921875, 0.02060699462890625, 0.025547027587890625, 0.030487060546875, 0.035427093505859375, 0.04036712646484375, 0.045307159423828125, 0.0502471923828125, 0.055187225341796875, 0.06012725830078125, 0.06506729125976562, 0.07000732421875, 0.07494735717773438, 0.07988739013671875, 0.08482742309570312, 0.0897674560546875, 0.09470748901367188, 0.09964752197265625, 0.10458755493164062, 0.109527587890625, 0.11446762084960938, 0.11940765380859375, 0.12434768676757812, 0.1292877197265625, 0.13422775268554688, 0.13916778564453125, 0.14410781860351562, 0.1490478515625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 16.0, 20.0, 30.0, 42.0, 59.0, 86.0, 84.0, 98.0, 89.0, 101.0, 85.0, 61.0, 65.0, 39.0, 39.0, 32.0, 12.0, 17.0, 1.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.1652088165283203, -0.16122817993164062, -0.15724754333496094, -0.15326690673828125, -0.14928627014160156, -0.14530563354492188, -0.1413249969482422, -0.1373443603515625, -0.1333637237548828, -0.12938308715820312, -0.12540245056152344, -0.12142181396484375, -0.11744117736816406, -0.11346054077148438, -0.10947990417480469, -0.105499267578125, -0.10151863098144531, -0.09753799438476562, -0.09355735778808594, -0.08957672119140625, -0.08559608459472656, -0.08161544799804688, -0.07763481140136719, -0.0736541748046875, -0.06967353820800781, -0.06569290161132812, -0.06171226501464844, -0.05773162841796875, -0.05375099182128906, -0.049770355224609375, -0.04578971862792969, -0.04180908203125, -0.03782844543457031, -0.033847808837890625, -0.029867172241210938, -0.02588653564453125, -0.021905899047851562, -0.017925262451171875, -0.013944625854492188, -0.0099639892578125, -0.0059833526611328125, -0.002002716064453125, 0.0019779205322265625, 0.00595855712890625, 0.009939193725585938, 0.013919830322265625, 0.017900466918945312, 0.021881103515625, 0.025861740112304688, 0.029842376708984375, 0.03382301330566406, 0.03780364990234375, 0.04178428649902344, 0.045764923095703125, 0.04974555969238281, 0.0537261962890625, 0.05770683288574219, 0.061687469482421875, 0.06566810607910156, 0.06964874267578125, 0.07362937927246094, 0.07761001586914062, 0.08159065246582031, 0.0855712890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 6.0, 8.0, 15.0, 29.0, 29.0, 41.0, 58.0, 90.0, 185.0, 338.0, 744.0, 2129.0, 9577.0, 107011.0, 820276.0, 95526.0, 8923.0, 2004.0, 728.0, 342.0, 176.0, 102.0, 59.0, 34.0, 36.0, 11.0, 20.0, 11.0, 9.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30029296875, -0.2915840148925781, -0.28287506103515625, -0.2741661071777344, -0.2654571533203125, -0.2567481994628906, -0.24803924560546875, -0.23933029174804688, -0.230621337890625, -0.22191238403320312, -0.21320343017578125, -0.20449447631835938, -0.1957855224609375, -0.18707656860351562, -0.17836761474609375, -0.16965866088867188, -0.16094970703125, -0.15224075317382812, -0.14353179931640625, -0.13482284545898438, -0.1261138916015625, -0.11740493774414062, -0.10869598388671875, -0.09998703002929688, -0.091278076171875, -0.08256912231445312, -0.07386016845703125, -0.06515121459960938, -0.0564422607421875, -0.047733306884765625, -0.03902435302734375, -0.030315399169921875, -0.0216064453125, -0.012897491455078125, -0.00418853759765625, 0.004520416259765625, 0.0132293701171875, 0.021938323974609375, 0.03064727783203125, 0.039356231689453125, 0.048065185546875, 0.056774139404296875, 0.06548309326171875, 0.07419204711914062, 0.0829010009765625, 0.09160995483398438, 0.10031890869140625, 0.10902786254882812, 0.11773681640625, 0.12644577026367188, 0.13515472412109375, 0.14386367797851562, 0.1525726318359375, 0.16128158569335938, 0.16999053955078125, 0.17869949340820312, 0.187408447265625, 0.19611740112304688, 0.20482635498046875, 0.21353530883789062, 0.2222442626953125, 0.23095321655273438, 0.23966217041015625, 0.24837112426757812, 0.257080078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 7.0, 7.0, 5.0, 11.0, 12.0, 5.0, 17.0, 19.0, 18.0, 23.0, 19.0, 27.0, 33.0, 34.0, 29.0, 30.0, 55.0, 48.0, 51.0, 48.0, 55.0, 47.0, 55.0, 47.0, 41.0, 36.0, 36.0, 22.0, 25.0, 20.0, 22.0, 22.0, 11.0, 11.0, 14.0, 9.0, 10.0, 10.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2474365234375, -0.2397174835205078, -0.23199844360351562, -0.22427940368652344, -0.21656036376953125, -0.20884132385253906, -0.20112228393554688, -0.1934032440185547, -0.1856842041015625, -0.1779651641845703, -0.17024612426757812, -0.16252708435058594, -0.15480804443359375, -0.14708900451660156, -0.13936996459960938, -0.1316509246826172, -0.123931884765625, -0.11621284484863281, -0.10849380493164062, -0.10077476501464844, -0.09305572509765625, -0.08533668518066406, -0.07761764526367188, -0.06989860534667969, -0.0621795654296875, -0.05446052551269531, -0.046741485595703125, -0.03902244567871094, -0.03130340576171875, -0.023584365844726562, -0.015865325927734375, -0.008146286010742188, -0.00042724609375, 0.0072917938232421875, 0.015010833740234375, 0.022729873657226562, 0.03044891357421875, 0.03816795349121094, 0.045886993408203125, 0.05360603332519531, 0.0613250732421875, 0.06904411315917969, 0.07676315307617188, 0.08448219299316406, 0.09220123291015625, 0.09992027282714844, 0.10763931274414062, 0.11535835266113281, 0.123077392578125, 0.1307964324951172, 0.13851547241210938, 0.14623451232910156, 0.15395355224609375, 0.16167259216308594, 0.16939163208007812, 0.1771106719970703, 0.1848297119140625, 0.1925487518310547, 0.20026779174804688, 0.20798683166503906, 0.21570587158203125, 0.22342491149902344, 0.23114395141601562, 0.2388629913330078, 0.24658203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 10.0, 6.0, 14.0, 19.0, 27.0, 49.0, 57.0, 102.0, 132.0, 293.0, 531.0, 1085.0, 2972.0, 12566.0, 113641.0, 795137.0, 104756.0, 11979.0, 2882.0, 1066.0, 494.0, 270.0, 144.0, 109.0, 67.0, 41.0, 38.0, 12.0, 14.0, 5.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08123779296875, -0.0788116455078125, -0.076385498046875, -0.0739593505859375, -0.071533203125, -0.0691070556640625, -0.066680908203125, -0.0642547607421875, -0.06182861328125, -0.0594024658203125, -0.056976318359375, -0.0545501708984375, -0.0521240234375, -0.0496978759765625, -0.047271728515625, -0.0448455810546875, -0.04241943359375, -0.0399932861328125, -0.037567138671875, -0.0351409912109375, -0.03271484375, -0.0302886962890625, -0.027862548828125, -0.0254364013671875, -0.02301025390625, -0.0205841064453125, -0.018157958984375, -0.0157318115234375, -0.0133056640625, -0.0108795166015625, -0.008453369140625, -0.0060272216796875, -0.00360107421875, -0.0011749267578125, 0.001251220703125, 0.0036773681640625, 0.006103515625, 0.0085296630859375, 0.010955810546875, 0.0133819580078125, 0.01580810546875, 0.0182342529296875, 0.020660400390625, 0.0230865478515625, 0.0255126953125, 0.0279388427734375, 0.030364990234375, 0.0327911376953125, 0.03521728515625, 0.0376434326171875, 0.040069580078125, 0.0424957275390625, 0.044921875, 0.0473480224609375, 0.049774169921875, 0.0522003173828125, 0.05462646484375, 0.0570526123046875, 0.059478759765625, 0.0619049072265625, 0.0643310546875, 0.0667572021484375, 0.069183349609375, 0.0716094970703125, 0.07403564453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 14.0, 18.0, 27.0, 49.0, 92.0, 153.0, 176.0, 162.0, 115.0, 74.0, 42.0, 19.0, 19.0, 13.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3768672943115234e-05, -1.304037868976593e-05, -1.2312084436416626e-05, -1.1583790183067322e-05, -1.0855495929718018e-05, -1.0127201676368713e-05, -9.39890742301941e-06, -8.670613169670105e-06, -7.9423189163208e-06, -7.214024662971497e-06, -6.485730409622192e-06, -5.757436156272888e-06, -5.029141902923584e-06, -4.30084764957428e-06, -3.5725533962249756e-06, -2.8442591428756714e-06, -2.115964889526367e-06, -1.387670636177063e-06, -6.593763828277588e-07, 6.891787052154541e-08, 7.972121238708496e-07, 1.5255063772201538e-06, 2.253800630569458e-06, 2.982094883918762e-06, 3.7103891372680664e-06, 4.438683390617371e-06, 5.166977643966675e-06, 5.895271897315979e-06, 6.623566150665283e-06, 7.351860404014587e-06, 8.080154657363892e-06, 8.808448910713196e-06, 9.5367431640625e-06, 1.0265037417411804e-05, 1.0993331670761108e-05, 1.1721625924110413e-05, 1.2449920177459717e-05, 1.3178214430809021e-05, 1.3906508684158325e-05, 1.463480293750763e-05, 1.5363097190856934e-05, 1.6091391444206238e-05, 1.6819685697555542e-05, 1.7547979950904846e-05, 1.827627420425415e-05, 1.9004568457603455e-05, 1.973286271095276e-05, 2.0461156964302063e-05, 2.1189451217651367e-05, 2.191774547100067e-05, 2.2646039724349976e-05, 2.337433397769928e-05, 2.4102628231048584e-05, 2.4830922484397888e-05, 2.5559216737747192e-05, 2.6287510991096497e-05, 2.70158052444458e-05, 2.7744099497795105e-05, 2.847239375114441e-05, 2.9200688004493713e-05, 2.9928982257843018e-05, 3.065727651119232e-05, 3.1385570764541626e-05, 3.211386501789093e-05, 3.2842159271240234e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 8.0, 6.0, 19.0, 27.0, 50.0, 66.0, 113.0, 222.0, 460.0, 1182.0, 3380.0, 15181.0, 144624.0, 781800.0, 85811.0, 10995.0, 2742.0, 990.0, 402.0, 179.0, 102.0, 62.0, 46.0, 22.0, 15.0, 13.0, 8.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08770751953125, -0.08500099182128906, -0.08229446411132812, -0.07958793640136719, -0.07688140869140625, -0.07417488098144531, -0.07146835327148438, -0.06876182556152344, -0.0660552978515625, -0.06334877014160156, -0.060642242431640625, -0.05793571472167969, -0.05522918701171875, -0.05252265930175781, -0.049816131591796875, -0.04710960388183594, -0.044403076171875, -0.04169654846191406, -0.038990020751953125, -0.03628349304199219, -0.03357696533203125, -0.030870437622070312, -0.028163909912109375, -0.025457382202148438, -0.0227508544921875, -0.020044326782226562, -0.017337799072265625, -0.014631271362304688, -0.01192474365234375, -0.009218215942382812, -0.006511688232421875, -0.0038051605224609375, -0.0010986328125, 0.0016078948974609375, 0.004314422607421875, 0.0070209503173828125, 0.00972747802734375, 0.012434005737304688, 0.015140533447265625, 0.017847061157226562, 0.0205535888671875, 0.023260116577148438, 0.025966644287109375, 0.028673171997070312, 0.03137969970703125, 0.03408622741699219, 0.036792755126953125, 0.03949928283691406, 0.042205810546875, 0.04491233825683594, 0.047618865966796875, 0.05032539367675781, 0.05303192138671875, 0.05573844909667969, 0.058444976806640625, 0.06115150451660156, 0.0638580322265625, 0.06656455993652344, 0.06927108764648438, 0.07197761535644531, 0.07468414306640625, 0.07739067077636719, 0.08009719848632812, 0.08280372619628906, 0.08551025390625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 12.0, 5.0, 12.0, 7.0, 12.0, 13.0, 36.0, 41.0, 39.0, 54.0, 68.0, 77.0, 74.0, 97.0, 74.0, 63.0, 61.0, 48.0, 42.0, 47.0, 29.0, 20.0, 16.0, 13.0, 11.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06787109375, -0.06555747985839844, -0.06324386596679688, -0.06093025207519531, -0.05861663818359375, -0.05630302429199219, -0.053989410400390625, -0.05167579650878906, -0.0493621826171875, -0.04704856872558594, -0.044734954833984375, -0.04242134094238281, -0.04010772705078125, -0.03779411315917969, -0.035480499267578125, -0.03316688537597656, -0.030853271484375, -0.028539657592773438, -0.026226043701171875, -0.023912429809570312, -0.02159881591796875, -0.019285202026367188, -0.016971588134765625, -0.014657974243164062, -0.0123443603515625, -0.010030746459960938, -0.007717132568359375, -0.0054035186767578125, -0.00308990478515625, -0.0007762908935546875, 0.001537322998046875, 0.0038509368896484375, 0.00616455078125, 0.008478164672851562, 0.010791778564453125, 0.013105392456054688, 0.01541900634765625, 0.017732620239257812, 0.020046234130859375, 0.022359848022460938, 0.0246734619140625, 0.026987075805664062, 0.029300689697265625, 0.03161430358886719, 0.03392791748046875, 0.03624153137207031, 0.038555145263671875, 0.04086875915527344, 0.043182373046875, 0.04549598693847656, 0.047809600830078125, 0.05012321472167969, 0.05243682861328125, 0.05475044250488281, 0.057064056396484375, 0.05937767028808594, 0.0616912841796875, 0.06400489807128906, 0.06631851196289062, 0.06863212585449219, 0.07094573974609375, 0.07325935363769531, 0.07557296752929688, 0.07788658142089844, 0.0802001953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 38.0, 94.0, 209.0, 292.0, 221.0, 89.0, 30.0, 15.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6636955738067627, -3.5793709754943848, -3.495046377182007, -3.410721778869629, -3.326397180557251, -3.242072582244873, -3.157748222351074, -3.0734236240386963, -2.9890990257263184, -2.9047744274139404, -2.8204498291015625, -2.7361252307891846, -2.6518006324768066, -2.567476272583008, -2.483151435852051, -2.398827075958252, -2.314502239227295, -2.230177640914917, -2.145853042602539, -2.061528444290161, -1.9772039651870728, -1.8928793668746948, -1.808554768562317, -1.7242302894592285, -1.6399056911468506, -1.5555810928344727, -1.4712564945220947, -1.3869318962097168, -1.3026074171066284, -1.2182828187942505, -1.1339582204818726, -1.0496337413787842, -0.9653091430664062, -0.8809845447540283, -0.7966600060462952, -0.7123354077339172, -0.6280108690261841, -0.5436862707138062, -0.4593616724014282, -0.37503713369369507, -0.29071253538131714, -0.2063879668712616, -0.12206338346004486, -0.037738800048828125, 0.04658576846122742, 0.13091033697128296, 0.2152349352836609, 0.29955947399139404, 0.383884072303772, 0.4682086408138275, 0.5525332093238831, 0.636857807636261, 0.7211823463439941, 0.8055069446563721, 0.88983154296875, 0.9741560816764832, 1.0584807395935059, 1.1428053379058838, 1.2271299362182617, 1.3114545345306396, 1.395779013633728, 1.480103611946106, 1.5644282102584839, 1.6487526893615723, 1.7330772876739502]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 16.0, 9.0, 16.0, 9.0, 14.0, 24.0, 20.0, 31.0, 27.0, 31.0, 42.0, 39.0, 56.0, 48.0, 54.0, 53.0, 40.0, 56.0, 45.0, 48.0, 43.0, 41.0, 47.0, 30.0, 26.0, 26.0, 20.0, 21.0, 12.0, 10.0, 8.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154894471168518, -1.1187984943389893, -1.0827025175094604, -1.0466065406799316, -1.0105106830596924, -0.9744146466255188, -0.9383187294006348, -0.902222752571106, -0.8661267757415771, -0.8300307989120483, -0.7939348220825195, -0.7578389048576355, -0.7217429280281067, -0.6856469511985779, -0.6495510339736938, -0.613455057144165, -0.5773590803146362, -0.5412631034851074, -0.5051671266555786, -0.4690712094306946, -0.43297523260116577, -0.39687925577163696, -0.36078330874443054, -0.3246873617172241, -0.2885913848876953, -0.2524954080581665, -0.21639946103096008, -0.18030349910259247, -0.14420753717422485, -0.10811157524585724, -0.07201561331748962, -0.0359196662902832, 0.00017642974853515625, 0.03627239167690277, 0.07236835360527039, 0.108464315533638, 0.14456027746200562, 0.18065623939037323, 0.21675220131874084, 0.25284814834594727, 0.2889441251754761, 0.3250401020050049, 0.3611360490322113, 0.3972319960594177, 0.43332797288894653, 0.46942394971847534, 0.5055198669433594, 0.5416158437728882, 0.577711820602417, 0.6138077974319458, 0.6499037742614746, 0.6859996914863586, 0.7220956683158875, 0.7581916451454163, 0.7942875623703003, 0.8303835391998291, 0.8664795160293579, 0.9025754928588867, 0.9386714696884155, 0.9747673869132996, 1.0108633041381836, 1.0469592809677124, 1.0830552577972412, 1.11915123462677, 1.1552472114562988]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 12.0, 7.0, 18.0, 33.0, 68.0, 87.0, 211.0, 548.0, 2138.0, 15911.0, 608859.0, 3528022.0, 33517.0, 3656.0, 748.0, 245.0, 86.0, 48.0, 29.0, 25.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.32637786865234375, -0.3168182373046875, -0.30725860595703125, -0.297698974609375, -0.28813934326171875, -0.2785797119140625, -0.26902008056640625, -0.25946044921875, -0.24990081787109375, -0.2403411865234375, -0.23078155517578125, -0.221221923828125, -0.21166229248046875, -0.2021026611328125, -0.19254302978515625, -0.1829833984375, -0.17342376708984375, -0.1638641357421875, -0.15430450439453125, -0.144744873046875, -0.13518524169921875, -0.1256256103515625, -0.11606597900390625, -0.10650634765625, -0.09694671630859375, -0.0873870849609375, -0.07782745361328125, -0.068267822265625, -0.05870819091796875, -0.0491485595703125, -0.03958892822265625, -0.030029296875, -0.02046966552734375, -0.0109100341796875, -0.00135040283203125, 0.008209228515625, 0.01776885986328125, 0.0273284912109375, 0.03688812255859375, 0.04644775390625, 0.05600738525390625, 0.0655670166015625, 0.07512664794921875, 0.084686279296875, 0.09424591064453125, 0.1038055419921875, 0.11336517333984375, 0.1229248046875, 0.13248443603515625, 0.1420440673828125, 0.15160369873046875, 0.161163330078125, 0.17072296142578125, 0.1802825927734375, 0.18984222412109375, 0.19940185546875, 0.20896148681640625, 0.2185211181640625, 0.22808074951171875, 0.237640380859375, 0.24720001220703125, 0.2567596435546875, 0.26631927490234375, 0.27587890625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 11.0, 12.0, 18.0, 37.0, 36.0, 59.0, 63.0, 76.0, 98.0, 96.0, 100.0, 91.0, 82.0, 66.0, 37.0, 34.0, 41.0, 21.0, 12.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.1614522933959961, -0.1574993133544922, -0.15354633331298828, -0.14959335327148438, -0.14564037322998047, -0.14168739318847656, -0.13773441314697266, -0.13378143310546875, -0.12982845306396484, -0.12587547302246094, -0.12192249298095703, -0.11796951293945312, -0.11401653289794922, -0.11006355285644531, -0.1061105728149414, -0.1021575927734375, -0.0982046127319336, -0.09425163269042969, -0.09029865264892578, -0.08634567260742188, -0.08239269256591797, -0.07843971252441406, -0.07448673248291016, -0.07053375244140625, -0.06658077239990234, -0.06262779235839844, -0.05867481231689453, -0.054721832275390625, -0.05076885223388672, -0.04681587219238281, -0.042862892150878906, -0.038909912109375, -0.034956932067871094, -0.031003952026367188, -0.02705097198486328, -0.023097991943359375, -0.01914501190185547, -0.015192031860351562, -0.011239051818847656, -0.00728607177734375, -0.0033330917358398438, 0.0006198883056640625, 0.004572868347167969, 0.008525848388671875, 0.012478828430175781, 0.016431808471679688, 0.020384788513183594, 0.0243377685546875, 0.028290748596191406, 0.03224372863769531, 0.03619670867919922, 0.040149688720703125, 0.04410266876220703, 0.04805564880371094, 0.052008628845214844, 0.05596160888671875, 0.059914588928222656, 0.06386756896972656, 0.06782054901123047, 0.07177352905273438, 0.07572650909423828, 0.07967948913574219, 0.0836324691772461, 0.08758544921875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 3.0, 8.0, 13.0, 8.0, 10.0, 18.0, 26.0, 40.0, 62.0, 182.0, 397.0, 1221.0, 5417.0, 31357.0, 870378.0, 3228675.0, 47004.0, 6894.0, 1610.0, 513.0, 197.0, 105.0, 38.0, 22.0, 16.0, 17.0, 10.0, 7.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.2861328125, -0.277740478515625, -0.26934814453125, -0.260955810546875, -0.2525634765625, -0.244171142578125, -0.23577880859375, -0.227386474609375, -0.218994140625, -0.210601806640625, -0.20220947265625, -0.193817138671875, -0.1854248046875, -0.177032470703125, -0.16864013671875, -0.160247802734375, -0.15185546875, -0.143463134765625, -0.13507080078125, -0.126678466796875, -0.1182861328125, -0.109893798828125, -0.10150146484375, -0.093109130859375, -0.084716796875, -0.076324462890625, -0.06793212890625, -0.059539794921875, -0.0511474609375, -0.042755126953125, -0.03436279296875, -0.025970458984375, -0.017578125, -0.009185791015625, -0.00079345703125, 0.007598876953125, 0.0159912109375, 0.024383544921875, 0.03277587890625, 0.041168212890625, 0.049560546875, 0.057952880859375, 0.06634521484375, 0.074737548828125, 0.0831298828125, 0.091522216796875, 0.09991455078125, 0.108306884765625, 0.11669921875, 0.125091552734375, 0.13348388671875, 0.141876220703125, 0.1502685546875, 0.158660888671875, 0.16705322265625, 0.175445556640625, 0.183837890625, 0.192230224609375, 0.20062255859375, 0.209014892578125, 0.2174072265625, 0.225799560546875, 0.23419189453125, 0.242584228515625, 0.2509765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 6.0, 8.0, 1.0, 8.0, 11.0, 14.0, 19.0, 20.0, 54.0, 67.0, 79.0, 237.0, 757.0, 1562.0, 647.0, 252.0, 132.0, 55.0, 39.0, 39.0, 16.0, 19.0, 6.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.1753826141357422, -0.16851425170898438, -0.16164588928222656, -0.15477752685546875, -0.14790916442871094, -0.14104080200195312, -0.1341724395751953, -0.1273040771484375, -0.12043571472167969, -0.11356735229492188, -0.10669898986816406, -0.09983062744140625, -0.09296226501464844, -0.08609390258789062, -0.07922554016113281, -0.072357177734375, -0.06548881530761719, -0.058620452880859375, -0.05175209045410156, -0.04488372802734375, -0.03801536560058594, -0.031147003173828125, -0.024278640747070312, -0.0174102783203125, -0.010541915893554688, -0.003673553466796875, 0.0031948089599609375, 0.01006317138671875, 0.016931533813476562, 0.023799896240234375, 0.030668258666992188, 0.03753662109375, 0.04440498352050781, 0.051273345947265625, 0.05814170837402344, 0.06501007080078125, 0.07187843322753906, 0.07874679565429688, 0.08561515808105469, 0.0924835205078125, 0.09935188293457031, 0.10622024536132812, 0.11308860778808594, 0.11995697021484375, 0.12682533264160156, 0.13369369506835938, 0.1405620574951172, 0.147430419921875, 0.1542987823486328, 0.16116714477539062, 0.16803550720214844, 0.17490386962890625, 0.18177223205566406, 0.18864059448242188, 0.1955089569091797, 0.2023773193359375, 0.2092456817626953, 0.21611404418945312, 0.22298240661621094, 0.22985076904296875, 0.23671913146972656, 0.24358749389648438, 0.2504558563232422, 0.25732421875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 6.0, 13.0, 22.0, 41.0, 78.0, 120.0, 152.0, 152.0, 131.0, 98.0, 54.0, 36.0, 26.0, 9.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.063185453414917, -1.025383710861206, -0.9875818490982056, -0.9497801065444946, -0.9119783043861389, -0.8741765022277832, -0.8363747000694275, -0.7985728979110718, -0.7607711553573608, -0.7229693531990051, -0.6851675510406494, -0.6473658084869385, -0.6095640063285828, -0.571762204170227, -0.5339604020118713, -0.496158629655838, -0.4583567976951599, -0.4205549955368042, -0.3827532231807709, -0.34495142102241516, -0.30714964866638184, -0.2693478465080261, -0.2315460443496704, -0.19374427199363708, -0.15594246983528137, -0.11814068257808685, -0.08033888787031174, -0.04253709316253662, -0.004735305905342102, 0.03306648135185242, 0.07086828351020813, 0.10867005586624146, 0.14647185802459717, 0.1842736452817917, 0.2220754325389862, 0.2598772346973419, 0.29767900705337524, 0.33548080921173096, 0.37328261137008667, 0.41108438372612, 0.4488861858844757, 0.4866879880428314, 0.5244897603988647, 0.5622915625572205, 0.6000933647155762, 0.6378951072692871, 0.6756969690322876, 0.7134987115859985, 0.7513005137443542, 0.78910231590271, 0.8269041180610657, 0.8647059202194214, 0.9025076627731323, 0.940309464931488, 0.9781112670898438, 1.0159130096435547, 1.0537148714065552, 1.0915166139602661, 1.1293184757232666, 1.1671202182769775, 1.204922080039978, 1.242723822593689, 1.2805256843566895, 1.3183274269104004, 1.3561291694641113]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 17.0, 6.0, 15.0, 20.0, 17.0, 14.0, 18.0, 23.0, 25.0, 29.0, 34.0, 31.0, 48.0, 35.0, 42.0, 47.0, 30.0, 48.0, 44.0, 40.0, 44.0, 33.0, 44.0, 40.0, 25.0, 39.0, 26.0, 28.0, 23.0, 11.0, 18.0, 23.0, 11.0, 4.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6841775178909302, -0.662675142288208, -0.6411727666854858, -0.6196704506874084, -0.5981680750846863, -0.5766656994819641, -0.5551633834838867, -0.5336610078811646, -0.5121586322784424, -0.4906562566757202, -0.46915391087532043, -0.44765156507492065, -0.4261491894721985, -0.4046468138694763, -0.38314446806907654, -0.36164212226867676, -0.3401397466659546, -0.3186373710632324, -0.29713502526283264, -0.27563267946243286, -0.2541303038597107, -0.23262794315814972, -0.21112558245658875, -0.18962322175502777, -0.1681208610534668, -0.14661850035190582, -0.12511613965034485, -0.10361377894878387, -0.0821114182472229, -0.060609057545661926, -0.03910669684410095, -0.017604336142539978, 0.003898024559020996, 0.02540038526058197, 0.046902745962142944, 0.06840510666370392, 0.08990746736526489, 0.11140982806682587, 0.13291218876838684, 0.15441454946994781, 0.1759169101715088, 0.19741927087306976, 0.21892163157463074, 0.2404239922761917, 0.2619263529777527, 0.28342872858047485, 0.30493107438087463, 0.3264334201812744, 0.3479357957839966, 0.36943817138671875, 0.39094051718711853, 0.4124428629875183, 0.4339452385902405, 0.45544761419296265, 0.4769499599933624, 0.4984523057937622, 0.5199546813964844, 0.5414570569992065, 0.5629594326019287, 0.5844617486000061, 0.6059641242027283, 0.6274664998054504, 0.6489688158035278, 0.67047119140625, 0.6919735670089722]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 8.0, 5.0, 12.0, 17.0, 29.0, 32.0, 44.0, 83.0, 113.0, 177.0, 323.0, 632.0, 1337.0, 3321.0, 9322.0, 31562.0, 118549.0, 361985.0, 357876.0, 116682.0, 31046.0, 9279.0, 3244.0, 1339.0, 664.0, 313.0, 200.0, 109.0, 90.0, 48.0, 39.0, 28.0, 15.0, 5.0, 9.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1514892578125, -0.1464385986328125, -0.141387939453125, -0.1363372802734375, -0.13128662109375, -0.1262359619140625, -0.121185302734375, -0.1161346435546875, -0.111083984375, -0.1060333251953125, -0.100982666015625, -0.0959320068359375, -0.09088134765625, -0.0858306884765625, -0.080780029296875, -0.0757293701171875, -0.0706787109375, -0.0656280517578125, -0.060577392578125, -0.0555267333984375, -0.05047607421875, -0.0454254150390625, -0.040374755859375, -0.0353240966796875, -0.0302734375, -0.0252227783203125, -0.020172119140625, -0.0151214599609375, -0.01007080078125, -0.0050201416015625, 3.0517578125e-05, 0.0050811767578125, 0.0101318359375, 0.0151824951171875, 0.020233154296875, 0.0252838134765625, 0.03033447265625, 0.0353851318359375, 0.040435791015625, 0.0454864501953125, 0.050537109375, 0.0555877685546875, 0.060638427734375, 0.0656890869140625, 0.07073974609375, 0.0757904052734375, 0.080841064453125, 0.0858917236328125, 0.0909423828125, 0.0959930419921875, 0.101043701171875, 0.1060943603515625, 0.11114501953125, 0.1161956787109375, 0.121246337890625, 0.1262969970703125, 0.13134765625, 0.1363983154296875, 0.141448974609375, 0.1464996337890625, 0.15155029296875, 0.1566009521484375, 0.161651611328125, 0.1667022705078125, 0.1717529296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 10.0, 13.0, 33.0, 32.0, 46.0, 44.0, 77.0, 84.0, 102.0, 97.0, 100.0, 98.0, 67.0, 53.0, 56.0, 33.0, 25.0, 8.0, 9.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17236328125, -0.16820335388183594, -0.16404342651367188, -0.1598834991455078, -0.15572357177734375, -0.1515636444091797, -0.14740371704101562, -0.14324378967285156, -0.1390838623046875, -0.13492393493652344, -0.13076400756835938, -0.1266040802001953, -0.12244415283203125, -0.11828422546386719, -0.11412429809570312, -0.10996437072753906, -0.105804443359375, -0.10164451599121094, -0.09748458862304688, -0.09332466125488281, -0.08916473388671875, -0.08500480651855469, -0.08084487915039062, -0.07668495178222656, -0.0725250244140625, -0.06836509704589844, -0.06420516967773438, -0.06004524230957031, -0.05588531494140625, -0.05172538757324219, -0.047565460205078125, -0.04340553283691406, -0.03924560546875, -0.03508567810058594, -0.030925750732421875, -0.026765823364257812, -0.02260589599609375, -0.018445968627929688, -0.014286041259765625, -0.010126113891601562, -0.0059661865234375, -0.0018062591552734375, 0.002353668212890625, 0.0065135955810546875, 0.01067352294921875, 0.014833450317382812, 0.018993377685546875, 0.023153305053710938, 0.027313232421875, 0.03147315979003906, 0.035633087158203125, 0.03979301452636719, 0.04395294189453125, 0.04811286926269531, 0.052272796630859375, 0.05643272399902344, 0.0605926513671875, 0.06475257873535156, 0.06891250610351562, 0.07307243347167969, 0.07723236083984375, 0.08139228820800781, 0.08555221557617188, 0.08971214294433594, 0.0938720703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 14.0, 23.0, 26.0, 45.0, 75.0, 149.0, 281.0, 545.0, 1270.0, 3770.0, 23694.0, 591559.0, 403141.0, 18400.0, 3299.0, 1165.0, 553.0, 233.0, 110.0, 73.0, 31.0, 24.0, 21.0, 15.0, 6.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.462158203125, -0.4513969421386719, -0.44063568115234375, -0.4298744201660156, -0.4191131591796875, -0.4083518981933594, -0.39759063720703125, -0.3868293762207031, -0.376068115234375, -0.3653068542480469, -0.35454559326171875, -0.3437843322753906, -0.3330230712890625, -0.3222618103027344, -0.31150054931640625, -0.3007392883300781, -0.28997802734375, -0.2792167663574219, -0.26845550537109375, -0.2576942443847656, -0.2469329833984375, -0.23617172241210938, -0.22541046142578125, -0.21464920043945312, -0.203887939453125, -0.19312667846679688, -0.18236541748046875, -0.17160415649414062, -0.1608428955078125, -0.15008163452148438, -0.13932037353515625, -0.12855911254882812, -0.1177978515625, -0.10703659057617188, -0.09627532958984375, -0.08551406860351562, -0.0747528076171875, -0.06399154663085938, -0.05323028564453125, -0.042469024658203125, -0.031707763671875, -0.020946502685546875, -0.01018524169921875, 0.000576019287109375, 0.0113372802734375, 0.022098541259765625, 0.03285980224609375, 0.043621063232421875, 0.05438232421875, 0.06514358520507812, 0.07590484619140625, 0.08666610717773438, 0.0974273681640625, 0.10818862915039062, 0.11894989013671875, 0.12971115112304688, 0.140472412109375, 0.15123367309570312, 0.16199493408203125, 0.17275619506835938, 0.1835174560546875, 0.19427871704101562, 0.20503997802734375, 0.21580123901367188, 0.2265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 7.0, 12.0, 14.0, 14.0, 22.0, 21.0, 27.0, 33.0, 45.0, 47.0, 35.0, 53.0, 41.0, 67.0, 41.0, 60.0, 51.0, 61.0, 54.0, 32.0, 41.0, 36.0, 36.0, 37.0, 22.0, 20.0, 15.0, 15.0, 9.0, 10.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.418212890625, -0.4077796936035156, -0.39734649658203125, -0.3869132995605469, -0.3764801025390625, -0.3660469055175781, -0.35561370849609375, -0.3451805114746094, -0.334747314453125, -0.3243141174316406, -0.31388092041015625, -0.3034477233886719, -0.2930145263671875, -0.2825813293457031, -0.27214813232421875, -0.2617149353027344, -0.25128173828125, -0.24084854125976562, -0.23041534423828125, -0.21998214721679688, -0.2095489501953125, -0.19911575317382812, -0.18868255615234375, -0.17824935913085938, -0.167816162109375, -0.15738296508789062, -0.14694976806640625, -0.13651657104492188, -0.1260833740234375, -0.11565017700195312, -0.10521697998046875, -0.09478378295898438, -0.0843505859375, -0.07391738891601562, -0.06348419189453125, -0.053050994873046875, -0.0426177978515625, -0.032184600830078125, -0.02175140380859375, -0.011318206787109375, -0.000885009765625, 0.009548187255859375, 0.01998138427734375, 0.030414581298828125, 0.0408477783203125, 0.051280975341796875, 0.06171417236328125, 0.07214736938476562, 0.08258056640625, 0.09301376342773438, 0.10344696044921875, 0.11388015747070312, 0.1243133544921875, 0.13474655151367188, 0.14517974853515625, 0.15561294555664062, 0.166046142578125, 0.17647933959960938, 0.18691253662109375, 0.19734573364257812, 0.2077789306640625, 0.21821212768554688, 0.22864532470703125, 0.23907852172851562, 0.24951171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 11.0, 14.0, 19.0, 28.0, 37.0, 59.0, 89.0, 159.0, 310.0, 555.0, 1190.0, 3263.0, 12085.0, 113041.0, 792231.0, 108151.0, 11649.0, 3116.0, 1202.0, 554.0, 279.0, 168.0, 100.0, 71.0, 34.0, 33.0, 23.0, 15.0, 15.0, 5.0, 3.0, 5.0, 3.0, 6.0, 3.0, 5.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.08426189422607422, -0.08130455017089844, -0.07834720611572266, -0.07538986206054688, -0.0724325180053711, -0.06947517395019531, -0.06651782989501953, -0.06356048583984375, -0.06060314178466797, -0.05764579772949219, -0.054688453674316406, -0.051731109619140625, -0.048773765563964844, -0.04581642150878906, -0.04285907745361328, -0.0399017333984375, -0.03694438934326172, -0.03398704528808594, -0.031029701232910156, -0.028072357177734375, -0.025115013122558594, -0.022157669067382812, -0.01920032501220703, -0.01624298095703125, -0.013285636901855469, -0.010328292846679688, -0.007370948791503906, -0.004413604736328125, -0.0014562606811523438, 0.0015010833740234375, 0.004458427429199219, 0.007415771484375, 0.010373115539550781, 0.013330459594726562, 0.016287803649902344, 0.019245147705078125, 0.022202491760253906, 0.025159835815429688, 0.02811717987060547, 0.03107452392578125, 0.03403186798095703, 0.03698921203613281, 0.039946556091308594, 0.042903900146484375, 0.045861244201660156, 0.04881858825683594, 0.05177593231201172, 0.0547332763671875, 0.05769062042236328, 0.06064796447753906, 0.06360530853271484, 0.06656265258789062, 0.0695199966430664, 0.07247734069824219, 0.07543468475341797, 0.07839202880859375, 0.08134937286376953, 0.08430671691894531, 0.0872640609741211, 0.09022140502929688, 0.09317874908447266, 0.09613609313964844, 0.09909343719482422, 0.10205078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 8.0, 7.0, 6.0, 17.0, 24.0, 37.0, 34.0, 53.0, 81.0, 95.0, 118.0, 98.0, 109.0, 86.0, 63.0, 56.0, 42.0, 24.0, 9.0, 13.0, 6.0, 3.0, 5.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4318695068359375e-05, -2.364814281463623e-05, -2.2977590560913086e-05, -2.230703830718994e-05, -2.1636486053466797e-05, -2.0965933799743652e-05, -2.0295381546020508e-05, -1.9624829292297363e-05, -1.895427703857422e-05, -1.8283724784851074e-05, -1.761317253112793e-05, -1.6942620277404785e-05, -1.627206802368164e-05, -1.5601515769958496e-05, -1.4930963516235352e-05, -1.4260411262512207e-05, -1.3589859008789062e-05, -1.2919306755065918e-05, -1.2248754501342773e-05, -1.1578202247619629e-05, -1.0907649993896484e-05, -1.023709774017334e-05, -9.566545486450195e-06, -8.89599323272705e-06, -8.225440979003906e-06, -7.554888725280762e-06, -6.884336471557617e-06, -6.213784217834473e-06, -5.543231964111328e-06, -4.872679710388184e-06, -4.202127456665039e-06, -3.5315752029418945e-06, -2.86102294921875e-06, -2.1904706954956055e-06, -1.519918441772461e-06, -8.493661880493164e-07, -1.7881393432617188e-07, 4.917383193969727e-07, 1.1622905731201172e-06, 1.8328428268432617e-06, 2.5033950805664062e-06, 3.1739473342895508e-06, 3.844499588012695e-06, 4.51505184173584e-06, 5.185604095458984e-06, 5.856156349182129e-06, 6.5267086029052734e-06, 7.197260856628418e-06, 7.867813110351562e-06, 8.538365364074707e-06, 9.208917617797852e-06, 9.879469871520996e-06, 1.055002212524414e-05, 1.1220574378967285e-05, 1.189112663269043e-05, 1.2561678886413574e-05, 1.3232231140136719e-05, 1.3902783393859863e-05, 1.4573335647583008e-05, 1.5243887901306152e-05, 1.5914440155029297e-05, 1.658499240875244e-05, 1.7255544662475586e-05, 1.792609691619873e-05, 1.8596649169921875e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 10.0, 7.0, 11.0, 12.0, 14.0, 24.0, 45.0, 59.0, 85.0, 135.0, 282.0, 475.0, 1122.0, 2948.0, 10262.0, 55659.0, 534582.0, 385348.0, 44075.0, 8542.0, 2675.0, 1101.0, 492.0, 248.0, 134.0, 66.0, 41.0, 31.0, 13.0, 24.0, 9.0, 7.0, 3.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05926513671875, -0.05668163299560547, -0.05409812927246094, -0.051514625549316406, -0.048931121826171875, -0.046347618103027344, -0.04376411437988281, -0.04118061065673828, -0.03859710693359375, -0.03601360321044922, -0.03343009948730469, -0.030846595764160156, -0.028263092041015625, -0.025679588317871094, -0.023096084594726562, -0.02051258087158203, -0.0179290771484375, -0.015345573425292969, -0.012762069702148438, -0.010178565979003906, -0.007595062255859375, -0.005011558532714844, -0.0024280548095703125, 0.00015544891357421875, 0.00273895263671875, 0.005322456359863281, 0.007905960083007812, 0.010489463806152344, 0.013072967529296875, 0.015656471252441406, 0.018239974975585938, 0.02082347869873047, 0.023406982421875, 0.02599048614501953, 0.028573989868164062, 0.031157493591308594, 0.033740997314453125, 0.036324501037597656, 0.03890800476074219, 0.04149150848388672, 0.04407501220703125, 0.04665851593017578, 0.04924201965332031, 0.051825523376464844, 0.054409027099609375, 0.056992530822753906, 0.05957603454589844, 0.06215953826904297, 0.0647430419921875, 0.06732654571533203, 0.06991004943847656, 0.0724935531616211, 0.07507705688476562, 0.07766056060791016, 0.08024406433105469, 0.08282756805419922, 0.08541107177734375, 0.08799457550048828, 0.09057807922363281, 0.09316158294677734, 0.09574508666992188, 0.0983285903930664, 0.10091209411621094, 0.10349559783935547, 0.1060791015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [7.0, 4.0, 4.0, 3.0, 7.0, 7.0, 8.0, 12.0, 16.0, 10.0, 18.0, 17.0, 28.0, 36.0, 36.0, 47.0, 69.0, 79.0, 66.0, 59.0, 78.0, 67.0, 66.0, 47.0, 40.0, 43.0, 33.0, 38.0, 17.0, 16.0, 12.0, 3.0, 8.0, 4.0, 2.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04827880859375, -0.045783042907714844, -0.04328727722167969, -0.04079151153564453, -0.038295745849609375, -0.03579998016357422, -0.03330421447753906, -0.030808448791503906, -0.02831268310546875, -0.025816917419433594, -0.023321151733398438, -0.02082538604736328, -0.018329620361328125, -0.01583385467529297, -0.013338088989257812, -0.010842323303222656, -0.0083465576171875, -0.005850791931152344, -0.0033550262451171875, -0.0008592605590820312, 0.001636505126953125, 0.004132270812988281, 0.0066280364990234375, 0.009123802185058594, 0.01161956787109375, 0.014115333557128906, 0.016611099243164062, 0.01910686492919922, 0.021602630615234375, 0.02409839630126953, 0.026594161987304688, 0.029089927673339844, 0.031585693359375, 0.034081459045410156, 0.03657722473144531, 0.03907299041748047, 0.041568756103515625, 0.04406452178955078, 0.04656028747558594, 0.049056053161621094, 0.05155181884765625, 0.054047584533691406, 0.05654335021972656, 0.05903911590576172, 0.061534881591796875, 0.06403064727783203, 0.06652641296386719, 0.06902217864990234, 0.0715179443359375, 0.07401371002197266, 0.07650947570800781, 0.07900524139404297, 0.08150100708007812, 0.08399677276611328, 0.08649253845214844, 0.0889883041381836, 0.09148406982421875, 0.0939798355102539, 0.09647560119628906, 0.09897136688232422, 0.10146713256835938, 0.10396289825439453, 0.10645866394042969, 0.10895442962646484, 0.1114501953125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 11.0, 66.0, 175.0, 396.0, 239.0, 84.0, 21.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.593566656112671, -3.4835944175720215, -3.373621940612793, -3.2636497020721436, -3.153677463531494, -3.0437052249908447, -2.9337329864501953, -2.823760509490967, -2.7137882709503174, -2.603816032409668, -2.4938435554504395, -2.38387131690979, -2.2738990783691406, -2.163926839828491, -2.053954601287842, -1.9439821243286133, -1.8340098857879639, -1.7240376472473145, -1.6140652894973755, -1.5040929317474365, -1.394120693206787, -1.2841484546661377, -1.1741760969161987, -1.0642037391662598, -0.9542315006256104, -0.8442592024803162, -0.734286904335022, -0.6243146061897278, -0.5143423080444336, -0.4043700098991394, -0.2943977117538452, -0.18442541360855103, -0.07445311546325684, 0.035519182682037354, 0.14549148082733154, 0.25546377897262573, 0.3654360771179199, 0.4754083752632141, 0.5853806734085083, 0.6953529715538025, 0.8053252696990967, 0.9152975678443909, 1.025269865989685, 1.135242223739624, 1.2452144622802734, 1.3551867008209229, 1.4651590585708618, 1.5751314163208008, 1.6851036548614502, 1.7950758934020996, 1.9050482511520386, 2.0150206089019775, 2.124992847442627, 2.2349650859832764, 2.344937324523926, 2.4549098014831543, 2.5648820400238037, 2.674854278564453, 2.7848267555236816, 2.894798994064331, 3.0047712326049805, 3.11474347114563, 3.2247157096862793, 3.334688186645508, 3.4446604251861572]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 8.0, 9.0, 10.0, 18.0, 21.0, 18.0, 22.0, 28.0, 39.0, 50.0, 48.0, 59.0, 59.0, 84.0, 75.0, 75.0, 66.0, 74.0, 47.0, 42.0, 36.0, 27.0, 24.0, 19.0, 12.0, 16.0, 5.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9950193166732788, -1.9455151557922363, -1.8960109949111938, -1.8465068340301514, -1.7970026731491089, -1.7474985122680664, -1.6979942321777344, -1.648490071296692, -1.5989859104156494, -1.549481749534607, -1.4999775886535645, -1.450473427772522, -1.4009692668914795, -1.3514649868011475, -1.3019609451293945, -1.2524566650390625, -1.2029526233673096, -1.153448462486267, -1.1039443016052246, -1.0544401407241821, -1.0049359798431396, -0.9554317593574524, -0.9059275984764099, -0.8564233779907227, -0.8069192171096802, -0.7574150562286377, -0.7079108953475952, -0.6584067344665527, -0.6089025139808655, -0.559398353099823, -0.5098941922187805, -0.46039000153541565, -0.4108858108520508, -0.3613816499710083, -0.31187745928764343, -0.26237329840660095, -0.21286912262439728, -0.1633649468421936, -0.11386078596115112, -0.06435659527778625, -0.014852434396743774, 0.0346517376601696, 0.08415590971708298, 0.13366007804870605, 0.18316425383090973, 0.2326684296131134, 0.2821725904941559, 0.33167678117752075, 0.38118094205856323, 0.4306851029396057, 0.4801892936229706, 0.5296934843063354, 0.5791976451873779, 0.6287018060684204, 0.6782059669494629, 0.7277101278305054, 0.7772142887115479, 0.8267184495925903, 0.8762226104736328, 0.9257267713546753, 0.9752309918403625, 1.0247352123260498, 1.0742392539978027, 1.1237435340881348, 1.1732476949691772]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 22.0, 28.0, 22.0, 66.0, 97.0, 120.0, 212.0, 309.0, 1306.0, 4189874.0, 1335.0, 297.0, 194.0, 120.0, 78.0, 56.0, 36.0, 25.0, 20.0, 14.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.308074951171875, -1.25677490234375, -1.205474853515625, -1.1541748046875, -1.102874755859375, -1.05157470703125, -1.000274658203125, -0.948974609375, -0.897674560546875, -0.84637451171875, -0.795074462890625, -0.7437744140625, -0.692474365234375, -0.64117431640625, -0.589874267578125, -0.53857421875, -0.487274169921875, -0.43597412109375, -0.384674072265625, -0.3333740234375, -0.282073974609375, -0.23077392578125, -0.179473876953125, -0.128173828125, -0.076873779296875, -0.02557373046875, 0.025726318359375, 0.0770263671875, 0.128326416015625, 0.17962646484375, 0.230926513671875, 0.2822265625, 0.333526611328125, 0.38482666015625, 0.436126708984375, 0.4874267578125, 0.538726806640625, 0.59002685546875, 0.641326904296875, 0.692626953125, 0.743927001953125, 0.79522705078125, 0.846527099609375, 0.8978271484375, 0.949127197265625, 1.00042724609375, 1.051727294921875, 1.10302734375, 1.154327392578125, 1.20562744140625, 1.256927490234375, 1.3082275390625, 1.359527587890625, 1.41082763671875, 1.462127685546875, 1.513427734375, 1.564727783203125, 1.61602783203125, 1.667327880859375, 1.7186279296875, 1.769927978515625, 1.82122802734375, 1.872528076171875, 1.923828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 4.0, 17.0, 16.0, 44.0, 57.0, 86.0, 119.0, 125.0, 157.0, 133.0, 85.0, 73.0, 43.0, 17.0, 14.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.27978515625, -0.2739572525024414, -0.2681293487548828, -0.2623014450073242, -0.2564735412597656, -0.25064563751220703, -0.24481773376464844, -0.23898983001708984, -0.23316192626953125, -0.22733402252197266, -0.22150611877441406, -0.21567821502685547, -0.20985031127929688, -0.20402240753173828, -0.1981945037841797, -0.1923666000366211, -0.1865386962890625, -0.1807107925415039, -0.1748828887939453, -0.16905498504638672, -0.16322708129882812, -0.15739917755126953, -0.15157127380371094, -0.14574337005615234, -0.13991546630859375, -0.13408756256103516, -0.12825965881347656, -0.12243175506591797, -0.11660385131835938, -0.11077594757080078, -0.10494804382324219, -0.0991201400756836, -0.093292236328125, -0.0874643325805664, -0.08163642883300781, -0.07580852508544922, -0.06998062133789062, -0.06415271759033203, -0.05832481384277344, -0.052496910095214844, -0.04666900634765625, -0.040841102600097656, -0.03501319885253906, -0.02918529510498047, -0.023357391357421875, -0.01752948760986328, -0.011701583862304688, -0.005873680114746094, -4.57763671875e-05, 0.005782127380371094, 0.011610031127929688, 0.01743793487548828, 0.023265838623046875, 0.02909374237060547, 0.03492164611816406, 0.040749549865722656, 0.04657745361328125, 0.052405357360839844, 0.05823326110839844, 0.06406116485595703, 0.06988906860351562, 0.07571697235107422, 0.08154487609863281, 0.0873727798461914, 0.09320068359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 13.0, 10.0, 20.0, 36.0, 54.0, 94.0, 140.0, 325.0, 537.0, 1072.0, 2146.0, 4431.0, 10036.0, 27537.0, 95634.0, 727219.0, 2972508.0, 267253.0, 54207.0, 17633.0, 7028.0, 3209.0, 1502.0, 714.0, 398.0, 187.0, 116.0, 66.0, 34.0, 24.0, 24.0, 16.0, 10.0, 8.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1207275390625, -0.1169900894165039, -0.11325263977050781, -0.10951519012451172, -0.10577774047851562, -0.10204029083251953, -0.09830284118652344, -0.09456539154052734, -0.09082794189453125, -0.08709049224853516, -0.08335304260253906, -0.07961559295654297, -0.07587814331054688, -0.07214069366455078, -0.06840324401855469, -0.0646657943725586, -0.0609283447265625, -0.057190895080566406, -0.05345344543457031, -0.04971599578857422, -0.045978546142578125, -0.04224109649658203, -0.03850364685058594, -0.034766197204589844, -0.03102874755859375, -0.027291297912597656, -0.023553848266601562, -0.01981639862060547, -0.016078948974609375, -0.012341499328613281, -0.008604049682617188, -0.004866600036621094, -0.001129150390625, 0.0026082992553710938, 0.0063457489013671875, 0.010083198547363281, 0.013820648193359375, 0.01755809783935547, 0.021295547485351562, 0.025032997131347656, 0.02877044677734375, 0.032507896423339844, 0.03624534606933594, 0.03998279571533203, 0.043720245361328125, 0.04745769500732422, 0.05119514465332031, 0.054932594299316406, 0.0586700439453125, 0.062407493591308594, 0.06614494323730469, 0.06988239288330078, 0.07361984252929688, 0.07735729217529297, 0.08109474182128906, 0.08483219146728516, 0.08856964111328125, 0.09230709075927734, 0.09604454040527344, 0.09978199005126953, 0.10351943969726562, 0.10725688934326172, 0.11099433898925781, 0.1147317886352539, 0.11846923828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 5.0, 9.0, 14.0, 15.0, 29.0, 30.0, 38.0, 69.0, 106.0, 172.0, 320.0, 616.0, 1007.0, 737.0, 382.0, 187.0, 95.0, 85.0, 33.0, 33.0, 21.0, 16.0, 8.0, 8.0, 9.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.186279296875, -0.18120193481445312, -0.17612457275390625, -0.17104721069335938, -0.1659698486328125, -0.16089248657226562, -0.15581512451171875, -0.15073776245117188, -0.145660400390625, -0.14058303833007812, -0.13550567626953125, -0.13042831420898438, -0.1253509521484375, -0.12027359008789062, -0.11519622802734375, -0.11011886596679688, -0.10504150390625, -0.09996414184570312, -0.09488677978515625, -0.08980941772460938, -0.0847320556640625, -0.07965469360351562, -0.07457733154296875, -0.06949996948242188, -0.064422607421875, -0.059345245361328125, -0.05426788330078125, -0.049190521240234375, -0.0441131591796875, -0.039035797119140625, -0.03395843505859375, -0.028881072998046875, -0.0238037109375, -0.018726348876953125, -0.01364898681640625, -0.008571624755859375, -0.0034942626953125, 0.001583099365234375, 0.00666046142578125, 0.011737823486328125, 0.016815185546875, 0.021892547607421875, 0.02696990966796875, 0.032047271728515625, 0.0371246337890625, 0.042201995849609375, 0.04727935791015625, 0.052356719970703125, 0.05743408203125, 0.06251144409179688, 0.06758880615234375, 0.07266616821289062, 0.0777435302734375, 0.08282089233398438, 0.08789825439453125, 0.09297561645507812, 0.098052978515625, 0.10313034057617188, 0.10820770263671875, 0.11328506469726562, 0.1183624267578125, 0.12343978881835938, 0.12851715087890625, 0.13359451293945312, 0.138671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 9.0, 16.0, 28.0, 85.0, 221.0, 271.0, 215.0, 88.0, 37.0, 16.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8368782997131348, -2.770357131958008, -2.703835964202881, -2.637314796447754, -2.570793628692627, -2.504272222518921, -2.437751054763794, -2.371229887008667, -2.30470871925354, -2.238187551498413, -2.171666383743286, -2.105145215988159, -2.038623809814453, -1.9721027612686157, -1.9055814743041992, -1.8390603065490723, -1.7725391387939453, -1.7060179710388184, -1.6394968032836914, -1.572975516319275, -1.506454348564148, -1.439933180809021, -1.3734118938446045, -1.3068907260894775, -1.2403695583343506, -1.1738483905792236, -1.1073272228240967, -1.0408059358596802, -0.9742847681045532, -0.9077636003494263, -0.8412423729896545, -0.7747211456298828, -0.7081997394561768, -0.6416785717010498, -0.5751573443412781, -0.5086361169815063, -0.4421149492263794, -0.37559375166893005, -0.3090725541114807, -0.24255135655403137, -0.17603015899658203, -0.10950896143913269, -0.04298776388168335, 0.02353343367576599, 0.09005463123321533, 0.15657582879066467, 0.223097026348114, 0.28961822390556335, 0.3561394214630127, 0.42266061902046204, 0.4891818165779114, 0.5557030439376831, 0.6222242116928101, 0.688745379447937, 0.7552666068077087, 0.8217878341674805, 0.8883090019226074, 0.9548301696777344, 1.0213513374328613, 1.0878726243972778, 1.1543937921524048, 1.2209149599075317, 1.2874362468719482, 1.3539574146270752, 1.4204785823822021]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 6.0, 6.0, 21.0, 15.0, 26.0, 27.0, 32.0, 43.0, 78.0, 63.0, 76.0, 72.0, 79.0, 92.0, 80.0, 88.0, 51.0, 48.0, 31.0, 26.0, 19.0, 14.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9754476547241211, -0.9402709603309631, -0.9050942659378052, -0.8699175715446472, -0.8347408771514893, -0.7995641231536865, -0.7643874287605286, -0.7292107343673706, -0.6940340399742126, -0.6588573455810547, -0.6236806511878967, -0.5885039567947388, -0.553327202796936, -0.5181505680084229, -0.4829738140106201, -0.44779711961746216, -0.4126204252243042, -0.37744373083114624, -0.3422670364379883, -0.30709031224250793, -0.27191361784935, -0.23673692345619202, -0.20156021416187286, -0.1663835048675537, -0.13120681047439575, -0.0960301086306572, -0.06085340678691864, -0.025676704943180084, 0.009499996900558472, 0.04467669129371643, 0.07985340058803558, 0.11503010988235474, 0.15020692348480225, 0.1853836178779602, 0.22056032717227936, 0.2557370364665985, 0.29091373085975647, 0.32609042525291443, 0.3612671494483948, 0.39644384384155273, 0.4316205382347107, 0.46679723262786865, 0.5019739270210266, 0.5371506214141846, 0.5723273754119873, 0.6075040102005005, 0.6426807641983032, 0.6778574585914612, 0.7130341529846191, 0.7482108473777771, 0.7833875417709351, 0.818564236164093, 0.853740930557251, 0.8889176845550537, 0.9240943789482117, 0.9592710733413696, 0.9944477677345276, 1.0296244621276855, 1.0648012161254883, 1.0999778509140015, 1.1351546049118042, 1.1703312397003174, 1.2055079936981201, 1.2406847476959229, 1.275861382484436]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 4.0, 10.0, 15.0, 25.0, 54.0, 67.0, 137.0, 261.0, 573.0, 1326.0, 4255.0, 17129.0, 85625.0, 419361.0, 412413.0, 84024.0, 16617.0, 4156.0, 1416.0, 519.0, 286.0, 119.0, 54.0, 38.0, 22.0, 18.0, 8.0, 4.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2144775390625, -0.2068157196044922, -0.19915390014648438, -0.19149208068847656, -0.18383026123046875, -0.17616844177246094, -0.16850662231445312, -0.1608448028564453, -0.1531829833984375, -0.1455211639404297, -0.13785934448242188, -0.13019752502441406, -0.12253570556640625, -0.11487388610839844, -0.10721206665039062, -0.09955024719238281, -0.091888427734375, -0.08422660827636719, -0.07656478881835938, -0.06890296936035156, -0.06124114990234375, -0.05357933044433594, -0.045917510986328125, -0.03825569152832031, -0.0305938720703125, -0.022932052612304688, -0.015270233154296875, -0.0076084136962890625, 5.340576171875e-05, 0.0077152252197265625, 0.015377044677734375, 0.023038864135742188, 0.03070068359375, 0.03836250305175781, 0.046024322509765625, 0.05368614196777344, 0.06134796142578125, 0.06900978088378906, 0.07667160034179688, 0.08433341979980469, 0.0919952392578125, 0.09965705871582031, 0.10731887817382812, 0.11498069763183594, 0.12264251708984375, 0.13030433654785156, 0.13796615600585938, 0.1456279754638672, 0.153289794921875, 0.1609516143798828, 0.16861343383789062, 0.17627525329589844, 0.18393707275390625, 0.19159889221191406, 0.19926071166992188, 0.2069225311279297, 0.2145843505859375, 0.2222461700439453, 0.22990798950195312, 0.23756980895996094, 0.24523162841796875, 0.25289344787597656, 0.2605552673339844, 0.2682170867919922, 0.27587890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 8.0, 11.0, 17.0, 18.0, 29.0, 44.0, 55.0, 86.0, 90.0, 95.0, 110.0, 114.0, 77.0, 62.0, 55.0, 44.0, 34.0, 19.0, 18.0, 6.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1788330078125, -0.17451000213623047, -0.17018699645996094, -0.1658639907836914, -0.16154098510742188, -0.15721797943115234, -0.1528949737548828, -0.14857196807861328, -0.14424896240234375, -0.13992595672607422, -0.1356029510498047, -0.13127994537353516, -0.12695693969726562, -0.1226339340209961, -0.11831092834472656, -0.11398792266845703, -0.1096649169921875, -0.10534191131591797, -0.10101890563964844, -0.0966958999633789, -0.09237289428710938, -0.08804988861083984, -0.08372688293457031, -0.07940387725830078, -0.07508087158203125, -0.07075786590576172, -0.06643486022949219, -0.062111854553222656, -0.057788848876953125, -0.053465843200683594, -0.04914283752441406, -0.04481983184814453, -0.040496826171875, -0.03617382049560547, -0.03185081481933594, -0.027527809143066406, -0.023204803466796875, -0.018881797790527344, -0.014558792114257812, -0.010235786437988281, -0.00591278076171875, -0.0015897750854492188, 0.0027332305908203125, 0.007056236267089844, 0.011379241943359375, 0.015702247619628906, 0.020025253295898438, 0.02434825897216797, 0.0286712646484375, 0.03299427032470703, 0.03731727600097656, 0.041640281677246094, 0.045963287353515625, 0.050286293029785156, 0.05460929870605469, 0.05893230438232422, 0.06325531005859375, 0.06757831573486328, 0.07190132141113281, 0.07622432708740234, 0.08054733276367188, 0.0848703384399414, 0.08919334411621094, 0.09351634979248047, 0.09783935546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 5.0, 13.0, 18.0, 22.0, 29.0, 60.0, 92.0, 196.0, 381.0, 898.0, 2604.0, 11167.0, 86220.0, 678023.0, 236403.0, 25379.0, 4544.0, 1379.0, 526.0, 241.0, 135.0, 80.0, 47.0, 24.0, 21.0, 13.0, 2.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2734375, -0.263916015625, -0.25439453125, -0.244873046875, -0.2353515625, -0.225830078125, -0.21630859375, -0.206787109375, -0.197265625, -0.187744140625, -0.17822265625, -0.168701171875, -0.1591796875, -0.149658203125, -0.14013671875, -0.130615234375, -0.12109375, -0.111572265625, -0.10205078125, -0.092529296875, -0.0830078125, -0.073486328125, -0.06396484375, -0.054443359375, -0.044921875, -0.035400390625, -0.02587890625, -0.016357421875, -0.0068359375, 0.002685546875, 0.01220703125, 0.021728515625, 0.03125, 0.040771484375, 0.05029296875, 0.059814453125, 0.0693359375, 0.078857421875, 0.08837890625, 0.097900390625, 0.107421875, 0.116943359375, 0.12646484375, 0.135986328125, 0.1455078125, 0.155029296875, 0.16455078125, 0.174072265625, 0.18359375, 0.193115234375, 0.20263671875, 0.212158203125, 0.2216796875, 0.231201171875, 0.24072265625, 0.250244140625, 0.259765625, 0.269287109375, 0.27880859375, 0.288330078125, 0.2978515625, 0.307373046875, 0.31689453125, 0.326416015625, 0.3359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 7.0, 16.0, 14.0, 20.0, 20.0, 18.0, 26.0, 23.0, 29.0, 43.0, 41.0, 30.0, 41.0, 63.0, 50.0, 37.0, 38.0, 46.0, 58.0, 41.0, 39.0, 39.0, 31.0, 29.0, 33.0, 27.0, 24.0, 13.0, 21.0, 8.0, 14.0, 9.0, 6.0, 5.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2386474609375, -0.2305583953857422, -0.22246932983398438, -0.21438026428222656, -0.20629119873046875, -0.19820213317871094, -0.19011306762695312, -0.1820240020751953, -0.1739349365234375, -0.1658458709716797, -0.15775680541992188, -0.14966773986816406, -0.14157867431640625, -0.13348960876464844, -0.12540054321289062, -0.11731147766113281, -0.109222412109375, -0.10113334655761719, -0.09304428100585938, -0.08495521545410156, -0.07686614990234375, -0.06877708435058594, -0.060688018798828125, -0.05259895324707031, -0.0445098876953125, -0.03642082214355469, -0.028331756591796875, -0.020242691040039062, -0.01215362548828125, -0.0040645599365234375, 0.004024505615234375, 0.012113571166992188, 0.02020263671875, 0.028291702270507812, 0.036380767822265625, 0.04446983337402344, 0.05255889892578125, 0.06064796447753906, 0.06873703002929688, 0.07682609558105469, 0.0849151611328125, 0.09300422668457031, 0.10109329223632812, 0.10918235778808594, 0.11727142333984375, 0.12536048889160156, 0.13344955444335938, 0.1415386199951172, 0.149627685546875, 0.1577167510986328, 0.16580581665039062, 0.17389488220214844, 0.18198394775390625, 0.19007301330566406, 0.19816207885742188, 0.2062511444091797, 0.2143402099609375, 0.2224292755126953, 0.23051834106445312, 0.23860740661621094, 0.24669647216796875, 0.25478553771972656, 0.2628746032714844, 0.2709636688232422, 0.279052734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 7.0, 7.0, 13.0, 23.0, 37.0, 50.0, 105.0, 161.0, 365.0, 859.0, 2376.0, 11624.0, 210565.0, 785298.0, 30564.0, 4174.0, 1239.0, 518.0, 249.0, 109.0, 67.0, 42.0, 22.0, 13.0, 12.0, 8.0, 2.0, 3.0, 8.0, 4.0, 0.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1788330078125, -0.17249298095703125, -0.1661529541015625, -0.15981292724609375, -0.153472900390625, -0.14713287353515625, -0.1407928466796875, -0.13445281982421875, -0.12811279296875, -0.12177276611328125, -0.1154327392578125, -0.10909271240234375, -0.102752685546875, -0.09641265869140625, -0.0900726318359375, -0.08373260498046875, -0.077392578125, -0.07105255126953125, -0.0647125244140625, -0.05837249755859375, -0.052032470703125, -0.04569244384765625, -0.0393524169921875, -0.03301239013671875, -0.02667236328125, -0.02033233642578125, -0.0139923095703125, -0.00765228271484375, -0.001312255859375, 0.00502777099609375, 0.0113677978515625, 0.01770782470703125, 0.0240478515625, 0.03038787841796875, 0.0367279052734375, 0.04306793212890625, 0.049407958984375, 0.05574798583984375, 0.0620880126953125, 0.06842803955078125, 0.07476806640625, 0.08110809326171875, 0.0874481201171875, 0.09378814697265625, 0.100128173828125, 0.10646820068359375, 0.1128082275390625, 0.11914825439453125, 0.12548828125, 0.13182830810546875, 0.1381683349609375, 0.14450836181640625, 0.150848388671875, 0.15718841552734375, 0.1635284423828125, 0.16986846923828125, 0.17620849609375, 0.18254852294921875, 0.1888885498046875, 0.19522857666015625, 0.201568603515625, 0.20790863037109375, 0.2142486572265625, 0.22058868408203125, 0.2269287109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 6.0, 8.0, 14.0, 19.0, 30.0, 40.0, 52.0, 53.0, 57.0, 89.0, 102.0, 102.0, 93.0, 65.0, 55.0, 43.0, 43.0, 30.0, 18.0, 20.0, 10.0, 5.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6927719116210938e-05, -1.6223639249801636e-05, -1.5519559383392334e-05, -1.4815479516983032e-05, -1.411139965057373e-05, -1.3407319784164429e-05, -1.2703239917755127e-05, -1.1999160051345825e-05, -1.1295080184936523e-05, -1.0591000318527222e-05, -9.88692045211792e-06, -9.182840585708618e-06, -8.478760719299316e-06, -7.774680852890015e-06, -7.070600986480713e-06, -6.366521120071411e-06, -5.662441253662109e-06, -4.958361387252808e-06, -4.254281520843506e-06, -3.550201654434204e-06, -2.8461217880249023e-06, -2.1420419216156006e-06, -1.4379620552062988e-06, -7.338821887969971e-07, -2.9802322387695312e-08, 6.742775440216064e-07, 1.3783574104309082e-06, 2.08243727684021e-06, 2.7865171432495117e-06, 3.4905970096588135e-06, 4.194676876068115e-06, 4.898756742477417e-06, 5.602836608886719e-06, 6.3069164752960205e-06, 7.010996341705322e-06, 7.715076208114624e-06, 8.419156074523926e-06, 9.123235940933228e-06, 9.82731580734253e-06, 1.0531395673751831e-05, 1.1235475540161133e-05, 1.1939555406570435e-05, 1.2643635272979736e-05, 1.3347715139389038e-05, 1.405179500579834e-05, 1.4755874872207642e-05, 1.5459954738616943e-05, 1.6164034605026245e-05, 1.6868114471435547e-05, 1.757219433784485e-05, 1.827627420425415e-05, 1.8980354070663452e-05, 1.9684433937072754e-05, 2.0388513803482056e-05, 2.1092593669891357e-05, 2.179667353630066e-05, 2.250075340270996e-05, 2.3204833269119263e-05, 2.3908913135528564e-05, 2.4612993001937866e-05, 2.5317072868347168e-05, 2.602115273475647e-05, 2.672523260116577e-05, 2.7429312467575073e-05, 2.8133392333984375e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 9.0, 16.0, 20.0, 25.0, 38.0, 60.0, 87.0, 142.0, 265.0, 496.0, 1200.0, 3025.0, 10391.0, 60795.0, 639901.0, 291050.0, 30433.0, 6539.0, 2131.0, 917.0, 419.0, 226.0, 125.0, 87.0, 40.0, 34.0, 24.0, 19.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.1116495132446289, -0.10763740539550781, -0.10362529754638672, -0.09961318969726562, -0.09560108184814453, -0.09158897399902344, -0.08757686614990234, -0.08356475830078125, -0.07955265045166016, -0.07554054260253906, -0.07152843475341797, -0.06751632690429688, -0.06350421905517578, -0.05949211120605469, -0.055480003356933594, -0.0514678955078125, -0.047455787658691406, -0.04344367980957031, -0.03943157196044922, -0.035419464111328125, -0.03140735626220703, -0.027395248413085938, -0.023383140563964844, -0.01937103271484375, -0.015358924865722656, -0.011346817016601562, -0.007334709167480469, -0.003322601318359375, 0.0006895065307617188, 0.0047016143798828125, 0.008713722229003906, 0.012725830078125, 0.016737937927246094, 0.020750045776367188, 0.02476215362548828, 0.028774261474609375, 0.03278636932373047, 0.03679847717285156, 0.040810585021972656, 0.04482269287109375, 0.048834800720214844, 0.05284690856933594, 0.05685901641845703, 0.060871124267578125, 0.06488323211669922, 0.06889533996582031, 0.0729074478149414, 0.0769195556640625, 0.0809316635131836, 0.08494377136230469, 0.08895587921142578, 0.09296798706054688, 0.09698009490966797, 0.10099220275878906, 0.10500431060791016, 0.10901641845703125, 0.11302852630615234, 0.11704063415527344, 0.12105274200439453, 0.12506484985351562, 0.12907695770263672, 0.1330890655517578, 0.1371011734008789, 0.14111328125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 9.0, 16.0, 10.0, 13.0, 10.0, 16.0, 17.0, 30.0, 27.0, 26.0, 37.0, 57.0, 48.0, 49.0, 57.0, 64.0, 68.0, 69.0, 58.0, 37.0, 43.0, 49.0, 27.0, 25.0, 30.0, 25.0, 12.0, 16.0, 13.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0908203125, -0.0880727767944336, -0.08532524108886719, -0.08257770538330078, -0.07983016967773438, -0.07708263397216797, -0.07433509826660156, -0.07158756256103516, -0.06884002685546875, -0.06609249114990234, -0.06334495544433594, -0.06059741973876953, -0.057849884033203125, -0.05510234832763672, -0.05235481262207031, -0.049607276916503906, -0.0468597412109375, -0.044112205505371094, -0.04136466979980469, -0.03861713409423828, -0.035869598388671875, -0.03312206268310547, -0.030374526977539062, -0.027626991271972656, -0.02487945556640625, -0.022131919860839844, -0.019384384155273438, -0.01663684844970703, -0.013889312744140625, -0.011141777038574219, -0.008394241333007812, -0.005646705627441406, -0.002899169921875, -0.00015163421630859375, 0.0025959014892578125, 0.005343437194824219, 0.008090972900390625, 0.010838508605957031, 0.013586044311523438, 0.016333580017089844, 0.01908111572265625, 0.021828651428222656, 0.024576187133789062, 0.02732372283935547, 0.030071258544921875, 0.03281879425048828, 0.03556632995605469, 0.038313865661621094, 0.0410614013671875, 0.043808937072753906, 0.04655647277832031, 0.04930400848388672, 0.052051544189453125, 0.05479907989501953, 0.05754661560058594, 0.060294151306152344, 0.06304168701171875, 0.06578922271728516, 0.06853675842285156, 0.07128429412841797, 0.07403182983398438, 0.07677936553955078, 0.07952690124511719, 0.0822744369506836, 0.08502197265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 18.0, 75.0, 223.0, 397.0, 195.0, 68.0, 11.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.003175735473633, -1.872571349143982, -1.741966962814331, -1.6113626956939697, -1.4807581901550293, -1.350153923034668, -1.219549536705017, -1.0889451503753662, -0.9583407640457153, -0.8277363777160645, -0.6971319913864136, -0.5665276646614075, -0.4359232783317566, -0.3053188920021057, -0.1747145652770996, -0.04411017894744873, 0.08649420738220215, 0.21709857881069183, 0.3477029502391815, 0.47830730676651, 0.6089116930961609, 0.7395160794258118, 0.8701204061508179, 1.0007247924804688, 1.1313291788101196, 1.2619335651397705, 1.3925379514694214, 1.5231423377990723, 1.6537466049194336, 1.784351110458374, 1.9149553775787354, 2.045559883117676, 2.176164150238037, 2.3067684173583984, 2.437372922897339, 2.5679771900177, 2.6985816955566406, 2.829185962677002, 2.9597902297973633, 3.0903947353363037, 3.220999240875244, 3.3516035079956055, 3.482208013534546, 3.6128122806549072, 3.7434167861938477, 3.874021053314209, 4.00462532043457, 4.13523006439209, 4.265833854675293, 4.396438121795654, 4.527042388916016, 4.657647132873535, 4.7882513999938965, 4.918855667114258, 5.049459934234619, 5.1800642013549805, 5.3106689453125, 5.441273212432861, 5.571877479553223, 5.702482223510742, 5.8330864906311035, 5.963690757751465, 6.094295024871826, 6.2248992919921875, 6.355504035949707]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 9.0, 9.0, 5.0, 8.0, 11.0, 16.0, 11.0, 19.0, 19.0, 15.0, 27.0, 40.0, 38.0, 49.0, 50.0, 55.0, 63.0, 61.0, 61.0, 59.0, 58.0, 50.0, 31.0, 31.0, 35.0, 31.0, 17.0, 15.0, 16.0, 15.0, 17.0, 12.0, 9.0, 8.0, 7.0, 5.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0825799703598022, -1.045342206954956, -1.0081044435501099, -0.9708666205406189, -0.9336287975311279, -0.8963910341262817, -0.8591532707214355, -0.8219155073165894, -0.7846776843070984, -0.7474399209022522, -0.7102020978927612, -0.672964334487915, -0.6357265710830688, -0.5984887480735779, -0.5612509846687317, -0.5240131616592407, -0.48677539825439453, -0.44953760504722595, -0.4122998118400574, -0.3750620484352112, -0.3378242552280426, -0.300586462020874, -0.26334869861602783, -0.22611090540885925, -0.18887311220169067, -0.1516353189945221, -0.11439754068851471, -0.07715975493192673, -0.039921969175338745, -0.002684175968170166, 0.03455360233783722, 0.0717913806438446, 0.10902929306030273, 0.1462670862674713, 0.1835048645734787, 0.22074264287948608, 0.25798043608665466, 0.29521822929382324, 0.33245599269866943, 0.369693785905838, 0.4069315791130066, 0.44416937232017517, 0.48140716552734375, 0.5186449289321899, 0.5558826923370361, 0.5931205153465271, 0.6303582787513733, 0.6675961017608643, 0.7048338651657104, 0.7420716285705566, 0.7793094515800476, 0.8165472149848938, 0.8537850379943848, 0.891022801399231, 0.9282605648040771, 0.9654983282089233, 1.0027360916137695, 1.0399738550186157, 1.077211618423462, 1.1144495010375977, 1.1516872644424438, 1.18892502784729, 1.2261627912521362, 1.2634005546569824, 1.3006384372711182]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 7.0, 10.0, 12.0, 20.0, 28.0, 34.0, 50.0, 93.0, 128.0, 289.0, 645.0, 2277.0, 11144.0, 111732.0, 3311213.0, 716548.0, 32495.0, 5265.0, 1362.0, 438.0, 182.0, 113.0, 57.0, 45.0, 27.0, 19.0, 9.0, 15.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18701171875, -0.18050765991210938, -0.17400360107421875, -0.16749954223632812, -0.1609954833984375, -0.15449142456054688, -0.14798736572265625, -0.14148330688476562, -0.134979248046875, -0.12847518920898438, -0.12197113037109375, -0.11546707153320312, -0.1089630126953125, -0.10245895385742188, -0.09595489501953125, -0.08945083618164062, -0.08294677734375, -0.07644271850585938, -0.06993865966796875, -0.06343460083007812, -0.0569305419921875, -0.050426483154296875, -0.04392242431640625, -0.037418365478515625, -0.030914306640625, -0.024410247802734375, -0.01790618896484375, -0.011402130126953125, -0.0048980712890625, 0.001605987548828125, 0.00811004638671875, 0.014614105224609375, 0.0211181640625, 0.027622222900390625, 0.03412628173828125, 0.040630340576171875, 0.0471343994140625, 0.053638458251953125, 0.06014251708984375, 0.06664657592773438, 0.073150634765625, 0.07965469360351562, 0.08615875244140625, 0.09266281127929688, 0.0991668701171875, 0.10567092895507812, 0.11217498779296875, 0.11867904663085938, 0.12518310546875, 0.13168716430664062, 0.13819122314453125, 0.14469528198242188, 0.1511993408203125, 0.15770339965820312, 0.16420745849609375, 0.17071151733398438, 0.177215576171875, 0.18371963500976562, 0.19022369384765625, 0.19672775268554688, 0.2032318115234375, 0.20973587036132812, 0.21623992919921875, 0.22274398803710938, 0.229248046875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 10.0, 16.0, 26.0, 36.0, 41.0, 63.0, 85.0, 90.0, 93.0, 100.0, 93.0, 78.0, 70.0, 55.0, 46.0, 31.0, 27.0, 16.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.1743450164794922, -0.17022323608398438, -0.16610145568847656, -0.16197967529296875, -0.15785789489746094, -0.15373611450195312, -0.1496143341064453, -0.1454925537109375, -0.1413707733154297, -0.13724899291992188, -0.13312721252441406, -0.12900543212890625, -0.12488365173339844, -0.12076187133789062, -0.11664009094238281, -0.112518310546875, -0.10839653015136719, -0.10427474975585938, -0.10015296936035156, -0.09603118896484375, -0.09190940856933594, -0.08778762817382812, -0.08366584777832031, -0.0795440673828125, -0.07542228698730469, -0.07130050659179688, -0.06717872619628906, -0.06305694580078125, -0.05893516540527344, -0.054813385009765625, -0.05069160461425781, -0.04656982421875, -0.04244804382324219, -0.038326263427734375, -0.03420448303222656, -0.03008270263671875, -0.025960922241210938, -0.021839141845703125, -0.017717361450195312, -0.0135955810546875, -0.009473800659179688, -0.005352020263671875, -0.0012302398681640625, 0.00289154052734375, 0.0070133209228515625, 0.011135101318359375, 0.015256881713867188, 0.019378662109375, 0.023500442504882812, 0.027622222900390625, 0.03174400329589844, 0.03586578369140625, 0.03998756408691406, 0.044109344482421875, 0.04823112487792969, 0.0523529052734375, 0.05647468566894531, 0.060596466064453125, 0.06471824645996094, 0.06884002685546875, 0.07296180725097656, 0.07708358764648438, 0.08120536804199219, 0.0853271484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 14.0, 22.0, 27.0, 41.0, 58.0, 76.0, 127.0, 225.0, 457.0, 995.0, 3089.0, 12892.0, 80314.0, 1879993.0, 2110179.0, 85965.0, 13918.0, 3486.0, 1227.0, 467.0, 266.0, 131.0, 87.0, 58.0, 36.0, 32.0, 21.0, 17.0, 8.0, 5.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2041015625, -0.19730186462402344, -0.19050216674804688, -0.1837024688720703, -0.17690277099609375, -0.1701030731201172, -0.16330337524414062, -0.15650367736816406, -0.1497039794921875, -0.14290428161621094, -0.13610458374023438, -0.1293048858642578, -0.12250518798828125, -0.11570549011230469, -0.10890579223632812, -0.10210609436035156, -0.095306396484375, -0.08850669860839844, -0.08170700073242188, -0.07490730285644531, -0.06810760498046875, -0.06130790710449219, -0.054508209228515625, -0.04770851135253906, -0.0409088134765625, -0.03410911560058594, -0.027309417724609375, -0.020509719848632812, -0.01371002197265625, -0.0069103240966796875, -0.000110626220703125, 0.0066890716552734375, 0.01348876953125, 0.020288467407226562, 0.027088165283203125, 0.03388786315917969, 0.04068756103515625, 0.04748725891113281, 0.054286956787109375, 0.06108665466308594, 0.0678863525390625, 0.07468605041503906, 0.08148574829101562, 0.08828544616699219, 0.09508514404296875, 0.10188484191894531, 0.10868453979492188, 0.11548423767089844, 0.122283935546875, 0.12908363342285156, 0.13588333129882812, 0.1426830291748047, 0.14948272705078125, 0.1562824249267578, 0.16308212280273438, 0.16988182067871094, 0.1766815185546875, 0.18348121643066406, 0.19028091430664062, 0.1970806121826172, 0.20388031005859375, 0.2106800079345703, 0.21747970581054688, 0.22427940368652344, 0.2310791015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 2.0, 5.0, 9.0, 13.0, 26.0, 22.0, 30.0, 47.0, 74.0, 113.0, 152.0, 253.0, 458.0, 725.0, 790.0, 536.0, 263.0, 155.0, 110.0, 68.0, 58.0, 37.0, 27.0, 23.0, 18.0, 11.0, 12.0, 7.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1812744140625, -0.17527008056640625, -0.1692657470703125, -0.16326141357421875, -0.157257080078125, -0.15125274658203125, -0.1452484130859375, -0.13924407958984375, -0.13323974609375, -0.12723541259765625, -0.1212310791015625, -0.11522674560546875, -0.109222412109375, -0.10321807861328125, -0.0972137451171875, -0.09120941162109375, -0.085205078125, -0.07920074462890625, -0.0731964111328125, -0.06719207763671875, -0.061187744140625, -0.05518341064453125, -0.0491790771484375, -0.04317474365234375, -0.03717041015625, -0.03116607666015625, -0.0251617431640625, -0.01915740966796875, -0.013153076171875, -0.00714874267578125, -0.0011444091796875, 0.00485992431640625, 0.0108642578125, 0.01686859130859375, 0.0228729248046875, 0.02887725830078125, 0.034881591796875, 0.04088592529296875, 0.0468902587890625, 0.05289459228515625, 0.05889892578125, 0.06490325927734375, 0.0709075927734375, 0.07691192626953125, 0.082916259765625, 0.08892059326171875, 0.0949249267578125, 0.10092926025390625, 0.10693359375, 0.11293792724609375, 0.1189422607421875, 0.12494659423828125, 0.130950927734375, 0.13695526123046875, 0.1429595947265625, 0.14896392822265625, 0.15496826171875, 0.16097259521484375, 0.1669769287109375, 0.17298126220703125, 0.178985595703125, 0.18498992919921875, 0.1909942626953125, 0.19699859619140625, 0.2030029296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 7.0, 21.0, 45.0, 112.0, 223.0, 267.0, 171.0, 85.0, 31.0, 10.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6735081672668457, -3.5817699432373047, -3.4900317192077637, -3.3982934951782227, -3.3065550327301025, -3.2148168087005615, -3.1230785846710205, -3.0313403606414795, -2.9396018981933594, -2.8478636741638184, -2.7561254501342773, -2.6643872261047363, -2.572648763656616, -2.480910539627075, -2.389172315597534, -2.297434091567993, -2.205695867538452, -2.113957643508911, -2.02221941947937, -1.9304810762405396, -1.838742733001709, -1.747004508972168, -1.655266284942627, -1.563528060913086, -1.4717897176742554, -1.3800514936447144, -1.2883131504058838, -1.1965749263763428, -1.1048367023468018, -1.0130983591079712, -0.9213601350784302, -0.8296218514442444, -0.7378835678100586, -0.6461452841758728, -0.554407000541687, -0.462668776512146, -0.3709304928779602, -0.2791922092437744, -0.1874539852142334, -0.09571570158004761, -0.003977417945861816, 0.08776085078716278, 0.17949911952018738, 0.2712373733520508, 0.3629756569862366, 0.45471394062042236, 0.5464521646499634, 0.6381904482841492, 0.729928731918335, 0.8216670155525208, 0.9134052991867065, 1.0051435232162476, 1.0968818664550781, 1.1886200904846191, 1.2803583145141602, 1.3720965385437012, 1.4638348817825317, 1.5555731058120728, 1.6473114490509033, 1.7390496730804443, 1.8307878971099854, 1.922526240348816, 2.0142645835876465, 2.1060028076171875, 2.1977410316467285]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 13.0, 13.0, 18.0, 11.0, 24.0, 23.0, 19.0, 39.0, 26.0, 43.0, 39.0, 46.0, 29.0, 53.0, 52.0, 49.0, 42.0, 58.0, 42.0, 42.0, 35.0, 36.0, 44.0, 28.0, 25.0, 21.0, 26.0, 18.0, 16.0, 10.0, 7.0, 9.0, 2.0, 8.0, 5.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8484213948249817, -0.8197226524353027, -0.7910239696502686, -0.7623252272605896, -0.7336265444755554, -0.7049278020858765, -0.6762291193008423, -0.6475303769111633, -0.6188316345214844, -0.5901328921318054, -0.5614342093467712, -0.5327354669570923, -0.5040367841720581, -0.47533804178237915, -0.4466393291950226, -0.417940616607666, -0.38924193382263184, -0.36054322123527527, -0.3318445086479187, -0.30314576625823975, -0.27444708347320557, -0.2457483559846878, -0.21704962849617004, -0.18835091590881348, -0.1596522033214569, -0.13095349073410034, -0.10225477069616318, -0.07355605065822601, -0.044857338070869446, -0.01615862548351288, 0.012540102005004883, 0.04123881459236145, 0.06993758678436279, 0.09863629937171936, 0.12733501195907593, 0.1560337394475937, 0.18473245203495026, 0.21343116462230682, 0.24212989211082458, 0.27082860469818115, 0.2995273172855377, 0.3282260298728943, 0.35692474246025085, 0.3856234550476074, 0.4143221974372864, 0.44302088022232056, 0.4717196226119995, 0.5004183053970337, 0.5291170477867126, 0.5578157901763916, 0.5865144729614258, 0.6152132153511047, 0.6439118981361389, 0.6726106405258179, 0.701309323310852, 0.730008065700531, 0.75870680809021, 0.7874055504798889, 0.8161042332649231, 0.844802975654602, 0.8735016584396362, 0.9022004008293152, 0.9308991432189941, 0.9595978260040283, 0.9882965087890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 4.0, 6.0, 8.0, 9.0, 12.0, 22.0, 33.0, 58.0, 76.0, 116.0, 212.0, 410.0, 929.0, 2261.0, 6013.0, 18683.0, 62331.0, 205171.0, 396028.0, 243500.0, 77659.0, 22903.0, 7299.0, 2645.0, 1061.0, 473.0, 274.0, 137.0, 66.0, 47.0, 24.0, 23.0, 16.0, 11.0, 12.0, 8.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1844482421875, -0.17911529541015625, -0.1737823486328125, -0.16844940185546875, -0.163116455078125, -0.15778350830078125, -0.1524505615234375, -0.14711761474609375, -0.14178466796875, -0.13645172119140625, -0.1311187744140625, -0.12578582763671875, -0.120452880859375, -0.11511993408203125, -0.1097869873046875, -0.10445404052734375, -0.09912109375, -0.09378814697265625, -0.0884552001953125, -0.08312225341796875, -0.077789306640625, -0.07245635986328125, -0.0671234130859375, -0.06179046630859375, -0.05645751953125, -0.05112457275390625, -0.0457916259765625, -0.04045867919921875, -0.035125732421875, -0.02979278564453125, -0.0244598388671875, -0.01912689208984375, -0.0137939453125, -0.00846099853515625, -0.0031280517578125, 0.00220489501953125, 0.007537841796875, 0.01287078857421875, 0.0182037353515625, 0.02353668212890625, 0.02886962890625, 0.03420257568359375, 0.0395355224609375, 0.04486846923828125, 0.050201416015625, 0.05553436279296875, 0.0608673095703125, 0.06620025634765625, 0.071533203125, 0.07686614990234375, 0.0821990966796875, 0.08753204345703125, 0.092864990234375, 0.09819793701171875, 0.1035308837890625, 0.10886383056640625, 0.11419677734375, 0.11952972412109375, 0.1248626708984375, 0.13019561767578125, 0.135528564453125, 0.14086151123046875, 0.1461944580078125, 0.15152740478515625, 0.1568603515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 14.0, 33.0, 33.0, 52.0, 51.0, 79.0, 88.0, 88.0, 103.0, 83.0, 96.0, 77.0, 60.0, 46.0, 31.0, 22.0, 14.0, 8.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1824951171875, -0.1782827377319336, -0.1740703582763672, -0.16985797882080078, -0.16564559936523438, -0.16143321990966797, -0.15722084045410156, -0.15300846099853516, -0.14879608154296875, -0.14458370208740234, -0.14037132263183594, -0.13615894317626953, -0.13194656372070312, -0.12773418426513672, -0.12352180480957031, -0.1193094253540039, -0.1150970458984375, -0.1108846664428711, -0.10667228698730469, -0.10245990753173828, -0.09824752807617188, -0.09403514862060547, -0.08982276916503906, -0.08561038970947266, -0.08139801025390625, -0.07718563079833984, -0.07297325134277344, -0.06876087188720703, -0.06454849243164062, -0.06033611297607422, -0.05612373352050781, -0.051911354064941406, -0.047698974609375, -0.043486595153808594, -0.03927421569824219, -0.03506183624267578, -0.030849456787109375, -0.02663707733154297, -0.022424697875976562, -0.018212318420410156, -0.01399993896484375, -0.009787559509277344, -0.0055751800537109375, -0.0013628005981445312, 0.002849578857421875, 0.007061958312988281, 0.011274337768554688, 0.015486717224121094, 0.0196990966796875, 0.023911476135253906, 0.028123855590820312, 0.03233623504638672, 0.036548614501953125, 0.04076099395751953, 0.04497337341308594, 0.049185752868652344, 0.05339813232421875, 0.057610511779785156, 0.06182289123535156, 0.06603527069091797, 0.07024765014648438, 0.07446002960205078, 0.07867240905761719, 0.0828847885131836, 0.08709716796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 9.0, 9.0, 5.0, 14.0, 25.0, 21.0, 39.0, 57.0, 82.0, 113.0, 149.0, 233.0, 336.0, 447.0, 754.0, 1324.0, 2633.0, 7025.0, 25397.0, 132903.0, 620750.0, 203268.0, 36321.0, 9171.0, 3274.0, 1566.0, 905.0, 513.0, 349.0, 266.0, 145.0, 132.0, 93.0, 59.0, 41.0, 29.0, 30.0, 18.0, 12.0, 11.0, 4.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.2491455078125, -0.24126625061035156, -0.23338699340820312, -0.2255077362060547, -0.21762847900390625, -0.2097492218017578, -0.20186996459960938, -0.19399070739746094, -0.1861114501953125, -0.17823219299316406, -0.17035293579101562, -0.1624736785888672, -0.15459442138671875, -0.1467151641845703, -0.13883590698242188, -0.13095664978027344, -0.123077392578125, -0.11519813537597656, -0.10731887817382812, -0.09943962097167969, -0.09156036376953125, -0.08368110656738281, -0.07580184936523438, -0.06792259216308594, -0.0600433349609375, -0.05216407775878906, -0.044284820556640625, -0.03640556335449219, -0.02852630615234375, -0.020647048950195312, -0.012767791748046875, -0.0048885345458984375, 0.00299072265625, 0.010869979858398438, 0.018749237060546875, 0.026628494262695312, 0.03450775146484375, 0.04238700866699219, 0.050266265869140625, 0.05814552307128906, 0.0660247802734375, 0.07390403747558594, 0.08178329467773438, 0.08966255187988281, 0.09754180908203125, 0.10542106628417969, 0.11330032348632812, 0.12117958068847656, 0.129058837890625, 0.13693809509277344, 0.14481735229492188, 0.1526966094970703, 0.16057586669921875, 0.1684551239013672, 0.17633438110351562, 0.18421363830566406, 0.1920928955078125, 0.19997215270996094, 0.20785140991210938, 0.2157306671142578, 0.22360992431640625, 0.2314891815185547, 0.23936843872070312, 0.24724769592285156, 0.255126953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 3.0, 2.0, 7.0, 6.0, 8.0, 14.0, 13.0, 20.0, 28.0, 26.0, 36.0, 31.0, 40.0, 52.0, 40.0, 53.0, 46.0, 48.0, 49.0, 51.0, 42.0, 46.0, 32.0, 38.0, 51.0, 32.0, 32.0, 25.0, 19.0, 13.0, 22.0, 14.0, 12.0, 10.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.349365234375, -0.33860015869140625, -0.3278350830078125, -0.31707000732421875, -0.306304931640625, -0.29553985595703125, -0.2847747802734375, -0.27400970458984375, -0.26324462890625, -0.25247955322265625, -0.2417144775390625, -0.23094940185546875, -0.220184326171875, -0.20941925048828125, -0.1986541748046875, -0.18788909912109375, -0.1771240234375, -0.16635894775390625, -0.1555938720703125, -0.14482879638671875, -0.134063720703125, -0.12329864501953125, -0.1125335693359375, -0.10176849365234375, -0.09100341796875, -0.08023834228515625, -0.0694732666015625, -0.05870819091796875, -0.047943115234375, -0.03717803955078125, -0.0264129638671875, -0.01564788818359375, -0.0048828125, 0.00588226318359375, 0.0166473388671875, 0.02741241455078125, 0.038177490234375, 0.04894256591796875, 0.0597076416015625, 0.07047271728515625, 0.08123779296875, 0.09200286865234375, 0.1027679443359375, 0.11353302001953125, 0.124298095703125, 0.13506317138671875, 0.1458282470703125, 0.15659332275390625, 0.1673583984375, 0.17812347412109375, 0.1888885498046875, 0.19965362548828125, 0.210418701171875, 0.22118377685546875, 0.2319488525390625, 0.24271392822265625, 0.25347900390625, 0.26424407958984375, 0.2750091552734375, 0.28577423095703125, 0.296539306640625, 0.30730438232421875, 0.3180694580078125, 0.32883453369140625, 0.339599609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 12.0, 22.0, 31.0, 59.0, 126.0, 282.0, 682.0, 2138.0, 8045.0, 50390.0, 823736.0, 143505.0, 14351.0, 3385.0, 1074.0, 384.0, 162.0, 71.0, 30.0, 22.0, 16.0, 15.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20751953125, -0.2017040252685547, -0.19588851928710938, -0.19007301330566406, -0.18425750732421875, -0.17844200134277344, -0.17262649536132812, -0.1668109893798828, -0.1609954833984375, -0.1551799774169922, -0.14936447143554688, -0.14354896545410156, -0.13773345947265625, -0.13191795349121094, -0.12610244750976562, -0.12028694152832031, -0.114471435546875, -0.10865592956542969, -0.10284042358398438, -0.09702491760253906, -0.09120941162109375, -0.08539390563964844, -0.07957839965820312, -0.07376289367675781, -0.0679473876953125, -0.06213188171386719, -0.056316375732421875, -0.05050086975097656, -0.04468536376953125, -0.03886985778808594, -0.033054351806640625, -0.027238845825195312, -0.02142333984375, -0.015607833862304688, -0.009792327880859375, -0.0039768218994140625, 0.00183868408203125, 0.0076541900634765625, 0.013469696044921875, 0.019285202026367188, 0.0251007080078125, 0.030916213989257812, 0.036731719970703125, 0.04254722595214844, 0.04836273193359375, 0.05417823791503906, 0.059993743896484375, 0.06580924987792969, 0.071624755859375, 0.07744026184082031, 0.08325576782226562, 0.08907127380371094, 0.09488677978515625, 0.10070228576660156, 0.10651779174804688, 0.11233329772949219, 0.1181488037109375, 0.12396430969238281, 0.12977981567382812, 0.13559532165527344, 0.14141082763671875, 0.14722633361816406, 0.15304183959960938, 0.1588573455810547, 0.1646728515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 14.0, 15.0, 15.0, 28.0, 37.0, 63.0, 72.0, 132.0, 148.0, 117.0, 116.0, 72.0, 41.0, 25.0, 21.0, 14.0, 12.0, 10.0, 6.0, 5.0, 4.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.916025161743164e-05, -3.7962570786476135e-05, -3.676488995552063e-05, -3.5567209124565125e-05, -3.436952829360962e-05, -3.3171847462654114e-05, -3.197416663169861e-05, -3.07764858007431e-05, -2.9578804969787598e-05, -2.8381124138832092e-05, -2.7183443307876587e-05, -2.598576247692108e-05, -2.4788081645965576e-05, -2.359040081501007e-05, -2.2392719984054565e-05, -2.119503915309906e-05, -1.9997358322143555e-05, -1.879967749118805e-05, -1.7601996660232544e-05, -1.640431582927704e-05, -1.5206634998321533e-05, -1.4008954167366028e-05, -1.2811273336410522e-05, -1.1613592505455017e-05, -1.0415911674499512e-05, -9.218230843544006e-06, -8.020550012588501e-06, -6.822869181632996e-06, -5.62518835067749e-06, -4.427507519721985e-06, -3.2298266887664795e-06, -2.032145857810974e-06, -8.344650268554688e-07, 3.632158041000366e-07, 1.560896635055542e-06, 2.7585774660110474e-06, 3.956258296966553e-06, 5.153939127922058e-06, 6.3516199588775635e-06, 7.549300789833069e-06, 8.746981620788574e-06, 9.94466245174408e-06, 1.1142343282699585e-05, 1.234002411365509e-05, 1.3537704944610596e-05, 1.4735385775566101e-05, 1.5933066606521606e-05, 1.7130747437477112e-05, 1.8328428268432617e-05, 1.9526109099388123e-05, 2.0723789930343628e-05, 2.1921470761299133e-05, 2.311915159225464e-05, 2.4316832423210144e-05, 2.551451325416565e-05, 2.6712194085121155e-05, 2.790987491607666e-05, 2.9107555747032166e-05, 3.030523657798767e-05, 3.1502917408943176e-05, 3.270059823989868e-05, 3.389827907085419e-05, 3.509595990180969e-05, 3.62936407327652e-05, 3.74913215637207e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 8.0, 9.0, 12.0, 16.0, 17.0, 29.0, 26.0, 57.0, 73.0, 105.0, 168.0, 272.0, 550.0, 1105.0, 2382.0, 6281.0, 19984.0, 103834.0, 707261.0, 165803.0, 26775.0, 7990.0, 2965.0, 1251.0, 641.0, 342.0, 193.0, 125.0, 81.0, 58.0, 34.0, 30.0, 19.0, 15.0, 6.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.104736328125, -0.10131454467773438, -0.09789276123046875, -0.09447097778320312, -0.0910491943359375, -0.08762741088867188, -0.08420562744140625, -0.08078384399414062, -0.077362060546875, -0.07394027709960938, -0.07051849365234375, -0.06709671020507812, -0.0636749267578125, -0.060253143310546875, -0.05683135986328125, -0.053409576416015625, -0.04998779296875, -0.046566009521484375, -0.04314422607421875, -0.039722442626953125, -0.0363006591796875, -0.032878875732421875, -0.02945709228515625, -0.026035308837890625, -0.022613525390625, -0.019191741943359375, -0.01576995849609375, -0.012348175048828125, -0.0089263916015625, -0.005504608154296875, -0.00208282470703125, 0.001338958740234375, 0.0047607421875, 0.008182525634765625, 0.01160430908203125, 0.015026092529296875, 0.0184478759765625, 0.021869659423828125, 0.02529144287109375, 0.028713226318359375, 0.032135009765625, 0.035556793212890625, 0.03897857666015625, 0.042400360107421875, 0.0458221435546875, 0.049243927001953125, 0.05266571044921875, 0.056087493896484375, 0.05950927734375, 0.06293106079101562, 0.06635284423828125, 0.06977462768554688, 0.0731964111328125, 0.07661819458007812, 0.08003997802734375, 0.08346176147460938, 0.086883544921875, 0.09030532836914062, 0.09372711181640625, 0.09714889526367188, 0.1005706787109375, 0.10399246215820312, 0.10741424560546875, 0.11083602905273438, 0.1142578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 8.0, 5.0, 12.0, 19.0, 25.0, 34.0, 42.0, 40.0, 66.0, 79.0, 87.0, 85.0, 88.0, 97.0, 67.0, 59.0, 42.0, 40.0, 27.0, 12.0, 8.0, 10.0, 11.0, 10.0, 3.0, 3.0, 1.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15790462493896484, -0.1538219451904297, -0.14973926544189453, -0.14565658569335938, -0.14157390594482422, -0.13749122619628906, -0.1334085464477539, -0.12932586669921875, -0.1252431869506836, -0.12116050720214844, -0.11707782745361328, -0.11299514770507812, -0.10891246795654297, -0.10482978820800781, -0.10074710845947266, -0.0966644287109375, -0.09258174896240234, -0.08849906921386719, -0.08441638946533203, -0.08033370971679688, -0.07625102996826172, -0.07216835021972656, -0.0680856704711914, -0.06400299072265625, -0.059920310974121094, -0.05583763122558594, -0.05175495147705078, -0.047672271728515625, -0.04358959197998047, -0.03950691223144531, -0.035424232482910156, -0.031341552734375, -0.027258872985839844, -0.023176193237304688, -0.01909351348876953, -0.015010833740234375, -0.010928153991699219, -0.0068454742431640625, -0.0027627944946289062, 0.00131988525390625, 0.005402565002441406, 0.009485244750976562, 0.013567924499511719, 0.017650604248046875, 0.02173328399658203, 0.025815963745117188, 0.029898643493652344, 0.0339813232421875, 0.038064002990722656, 0.04214668273925781, 0.04622936248779297, 0.050312042236328125, 0.05439472198486328, 0.05847740173339844, 0.0625600814819336, 0.06664276123046875, 0.0707254409790039, 0.07480812072753906, 0.07889080047607422, 0.08297348022460938, 0.08705615997314453, 0.09113883972167969, 0.09522151947021484, 0.09930419921875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 31.0, 79.0, 140.0, 279.0, 242.0, 123.0, 53.0, 20.0, 8.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.524156093597412, -3.416891098022461, -3.3096261024475098, -3.2023611068725586, -3.0950958728790283, -2.987830877304077, -2.880565881729126, -2.773300886154175, -2.6660358905792236, -2.5587708950042725, -2.4515058994293213, -2.344240665435791, -2.23697566986084, -2.1297106742858887, -2.0224456787109375, -1.9151806831359863, -1.8079155683517456, -1.7006505727767944, -1.5933854579925537, -1.4861204624176025, -1.3788554668426514, -1.2715904712677002, -1.1643253564834595, -1.0570603609085083, -0.9497953057289124, -0.8425302505493164, -0.7352652549743652, -0.6280001997947693, -0.5207351446151733, -0.41347014904022217, -0.3062050938606262, -0.19894009828567505, -0.0916750431060791, 0.015589989721775055, 0.12285502254962921, 0.23012006282806396, 0.3373850882053375, 0.4446501135826111, 0.551915168762207, 0.6591801643371582, 0.7664452195167542, 0.8737102746963501, 0.9809752702713013, 1.088240385055542, 1.1955053806304932, 1.3027703762054443, 1.4100353717803955, 1.5173003673553467, 1.6245654821395874, 1.7318304777145386, 1.8390955924987793, 1.9463605880737305, 2.0536255836486816, 2.160890579223633, 2.268155574798584, 2.375420570373535, 2.4826858043670654, 2.5899507999420166, 2.6972157955169678, 2.804481029510498, 2.911746025085449, 3.0190110206604004, 3.1262760162353516, 3.2335410118103027, 3.340806007385254]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 6.0, 4.0, 11.0, 12.0, 9.0, 15.0, 20.0, 17.0, 25.0, 18.0, 32.0, 27.0, 32.0, 33.0, 48.0, 44.0, 51.0, 62.0, 60.0, 74.0, 46.0, 52.0, 29.0, 33.0, 31.0, 30.0, 30.0, 30.0, 25.0, 17.0, 12.0, 12.0, 8.0, 7.0, 8.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.4257782697677612, -1.3842524290084839, -1.3427265882492065, -1.3012006282806396, -1.2596747875213623, -1.218148946762085, -1.1766231060028076, -1.1350972652435303, -1.093571424484253, -1.0520455837249756, -1.0105197429656982, -0.9689938426017761, -0.927467942237854, -0.8859421014785767, -0.8444162607192993, -0.802890419960022, -0.7613644599914551, -0.7198386192321777, -0.6783127188682556, -0.6367868781089783, -0.5952609777450562, -0.5537351369857788, -0.5122092962265015, -0.47068342566490173, -0.429157555103302, -0.38763168454170227, -0.34610581398010254, -0.3045799732208252, -0.26305410265922546, -0.22152823209762573, -0.1800023764371872, -0.13847652077674866, -0.09695076942443848, -0.05542490631341934, -0.013899043202400208, 0.027626819908618927, 0.06915268301963806, 0.11067855358123779, 0.15220440924167633, 0.19373026490211487, 0.2352561354637146, 0.27678200602531433, 0.31830787658691406, 0.3598337173461914, 0.40135958790779114, 0.44288545846939087, 0.4844112992286682, 0.5259371995925903, 0.5674630403518677, 0.608988881111145, 0.6505147814750671, 0.6920406222343445, 0.7335665225982666, 0.775092363357544, 0.8166182041168213, 0.8581440448760986, 0.8996699452400208, 0.9411957859992981, 0.9827216863632202, 1.0242475271224976, 1.065773367881775, 1.1072993278503418, 1.1488251686096191, 1.1903510093688965, 1.2318768501281738]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 7.0, 2.0, 5.0, 8.0, 7.0, 6.0, 11.0, 17.0, 23.0, 31.0, 55.0, 95.0, 151.0, 233.0, 506.0, 1085.0, 2520.0, 6350.0, 18789.0, 73624.0, 465869.0, 2568991.0, 898217.0, 116079.0, 26588.0, 8753.0, 3433.0, 1366.0, 630.0, 326.0, 183.0, 117.0, 75.0, 46.0, 23.0, 18.0, 11.0, 9.0, 14.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1177978515625, -0.11429691314697266, -0.11079597473144531, -0.10729503631591797, -0.10379409790039062, -0.10029315948486328, -0.09679222106933594, -0.0932912826538086, -0.08979034423828125, -0.0862894058227539, -0.08278846740722656, -0.07928752899169922, -0.07578659057617188, -0.07228565216064453, -0.06878471374511719, -0.06528377532958984, -0.0617828369140625, -0.058281898498535156, -0.05478096008300781, -0.05128002166748047, -0.047779083251953125, -0.04427814483642578, -0.04077720642089844, -0.037276268005371094, -0.03377532958984375, -0.030274391174316406, -0.026773452758789062, -0.02327251434326172, -0.019771575927734375, -0.01627063751220703, -0.012769699096679688, -0.009268760681152344, -0.005767822265625, -0.0022668838500976562, 0.0012340545654296875, 0.004734992980957031, 0.008235931396484375, 0.011736869812011719, 0.015237808227539062, 0.018738746643066406, 0.02223968505859375, 0.025740623474121094, 0.029241561889648438, 0.03274250030517578, 0.036243438720703125, 0.03974437713623047, 0.04324531555175781, 0.046746253967285156, 0.0502471923828125, 0.053748130798339844, 0.05724906921386719, 0.06075000762939453, 0.06425094604492188, 0.06775188446044922, 0.07125282287597656, 0.0747537612915039, 0.07825469970703125, 0.0817556381225586, 0.08525657653808594, 0.08875751495361328, 0.09225845336914062, 0.09575939178466797, 0.09926033020019531, 0.10276126861572266, 0.10626220703125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 3.0, 13.0, 27.0, 29.0, 51.0, 52.0, 70.0, 91.0, 96.0, 115.0, 106.0, 89.0, 81.0, 63.0, 38.0, 28.0, 17.0, 11.0, 7.0, 7.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17578125, -0.1709728240966797, -0.16616439819335938, -0.16135597229003906, -0.15654754638671875, -0.15173912048339844, -0.14693069458007812, -0.1421222686767578, -0.1373138427734375, -0.1325054168701172, -0.12769699096679688, -0.12288856506347656, -0.11808013916015625, -0.11327171325683594, -0.10846328735351562, -0.10365486145019531, -0.098846435546875, -0.09403800964355469, -0.08922958374023438, -0.08442115783691406, -0.07961273193359375, -0.07480430603027344, -0.06999588012695312, -0.06518745422363281, -0.0603790283203125, -0.05557060241699219, -0.050762176513671875, -0.04595375061035156, -0.04114532470703125, -0.03633689880371094, -0.031528472900390625, -0.026720046997070312, -0.02191162109375, -0.017103195190429688, -0.012294769287109375, -0.0074863433837890625, -0.00267791748046875, 0.0021305084228515625, 0.006938934326171875, 0.011747360229492188, 0.0165557861328125, 0.021364212036132812, 0.026172637939453125, 0.030981063842773438, 0.03578948974609375, 0.04059791564941406, 0.045406341552734375, 0.05021476745605469, 0.055023193359375, 0.05983161926269531, 0.06464004516601562, 0.06944847106933594, 0.07425689697265625, 0.07906532287597656, 0.08387374877929688, 0.08868217468261719, 0.0934906005859375, 0.09829902648925781, 0.10310745239257812, 0.10791587829589844, 0.11272430419921875, 0.11753273010253906, 0.12234115600585938, 0.1271495819091797, 0.1319580078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 7.0, 14.0, 17.0, 27.0, 34.0, 36.0, 54.0, 76.0, 104.0, 164.0, 365.0, 954.0, 7315.0, 350305.0, 3805114.0, 26791.0, 1605.0, 491.0, 254.0, 161.0, 106.0, 81.0, 47.0, 41.0, 34.0, 17.0, 19.0, 9.0, 9.0, 7.0, 2.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.474853515625, -0.45964813232421875, -0.4444427490234375, -0.42923736572265625, -0.414031982421875, -0.39882659912109375, -0.3836212158203125, -0.36841583251953125, -0.35321044921875, -0.33800506591796875, -0.3227996826171875, -0.30759429931640625, -0.292388916015625, -0.27718353271484375, -0.2619781494140625, -0.24677276611328125, -0.2315673828125, -0.21636199951171875, -0.2011566162109375, -0.18595123291015625, -0.170745849609375, -0.15554046630859375, -0.1403350830078125, -0.12512969970703125, -0.10992431640625, -0.09471893310546875, -0.0795135498046875, -0.06430816650390625, -0.049102783203125, -0.03389739990234375, -0.0186920166015625, -0.00348663330078125, 0.01171875, 0.02692413330078125, 0.0421295166015625, 0.05733489990234375, 0.072540283203125, 0.08774566650390625, 0.1029510498046875, 0.11815643310546875, 0.13336181640625, 0.14856719970703125, 0.1637725830078125, 0.17897796630859375, 0.194183349609375, 0.20938873291015625, 0.2245941162109375, 0.23979949951171875, 0.2550048828125, 0.27021026611328125, 0.2854156494140625, 0.30062103271484375, 0.315826416015625, 0.33103179931640625, 0.3462371826171875, 0.36144256591796875, 0.37664794921875, 0.39185333251953125, 0.4070587158203125, 0.42226409912109375, 0.437469482421875, 0.45267486572265625, 0.4678802490234375, 0.48308563232421875, 0.498291015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 5.0, 6.0, 12.0, 5.0, 10.0, 12.0, 14.0, 18.0, 38.0, 35.0, 45.0, 58.0, 101.0, 145.0, 237.0, 390.0, 598.0, 774.0, 595.0, 375.0, 220.0, 129.0, 80.0, 42.0, 34.0, 25.0, 16.0, 19.0, 16.0, 7.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1947021484375, -0.18830490112304688, -0.18190765380859375, -0.17551040649414062, -0.1691131591796875, -0.16271591186523438, -0.15631866455078125, -0.14992141723632812, -0.143524169921875, -0.13712692260742188, -0.13072967529296875, -0.12433242797851562, -0.1179351806640625, -0.11153793334960938, -0.10514068603515625, -0.09874343872070312, -0.09234619140625, -0.08594894409179688, -0.07955169677734375, -0.07315444946289062, -0.0667572021484375, -0.060359954833984375, -0.05396270751953125, -0.047565460205078125, -0.041168212890625, -0.034770965576171875, -0.02837371826171875, -0.021976470947265625, -0.0155792236328125, -0.009181976318359375, -0.00278472900390625, 0.003612518310546875, 0.010009765625, 0.016407012939453125, 0.02280426025390625, 0.029201507568359375, 0.0355987548828125, 0.041996002197265625, 0.04839324951171875, 0.054790496826171875, 0.061187744140625, 0.06758499145507812, 0.07398223876953125, 0.08037948608398438, 0.0867767333984375, 0.09317398071289062, 0.09957122802734375, 0.10596847534179688, 0.11236572265625, 0.11876296997070312, 0.12516021728515625, 0.13155746459960938, 0.1379547119140625, 0.14435195922851562, 0.15074920654296875, 0.15714645385742188, 0.163543701171875, 0.16994094848632812, 0.17633819580078125, 0.18273544311523438, 0.1891326904296875, 0.19552993774414062, 0.20192718505859375, 0.20832443237304688, 0.2147216796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 12.0, 29.0, 78.0, 182.0, 297.0, 225.0, 100.0, 39.0, 13.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.924928188323975, -4.800938129425049, -4.676948070526123, -4.552957534790039, -4.428967475891113, -4.3049774169921875, -4.180987358093262, -4.056997299194336, -3.93300724029541, -3.8090171813964844, -3.6850268840789795, -3.5610368251800537, -3.437046766281128, -3.313056468963623, -3.1890664100646973, -3.0650763511657715, -2.9410860538482666, -2.817095994949341, -2.693105697631836, -2.56911563873291, -2.4451255798339844, -2.3211355209350586, -2.1971452236175537, -2.073155164718628, -1.9491649866104126, -1.8251748085021973, -1.7011847496032715, -1.5771945714950562, -1.4532043933868408, -1.329214334487915, -1.2052241563796997, -1.0812339782714844, -0.9572439193725586, -0.833253800868988, -0.7092636823654175, -0.5852735042572021, -0.4612833857536316, -0.33729326725006104, -0.2133030891418457, -0.08931297063827515, 0.03467714786529541, 0.15866728127002716, 0.2826574146747589, 0.40664756298065186, 0.5306376814842224, 0.654627799987793, 0.7786179780960083, 0.9026080965995789, 1.0265982151031494, 1.1505883932113647, 1.2745784521102905, 1.3985686302185059, 1.5225586891174316, 1.646548867225647, 1.7705390453338623, 1.894529104232788, 2.018519401550293, 2.1425094604492188, 2.2664997577667236, 2.3904898166656494, 2.514479875564575, 2.63847017288208, 2.762460231781006, 2.8864502906799316, 3.0104403495788574]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 10.0, 13.0, 17.0, 20.0, 15.0, 26.0, 33.0, 40.0, 46.0, 38.0, 51.0, 46.0, 61.0, 55.0, 66.0, 47.0, 46.0, 68.0, 47.0, 34.0, 32.0, 31.0, 29.0, 18.0, 19.0, 19.0, 16.0, 11.0, 6.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-1.344069004058838, -1.3080029487609863, -1.2719368934631348, -1.2358708381652832, -1.1998047828674316, -1.16373872756958, -1.1276726722717285, -1.0916064977645874, -1.0555404424667358, -1.0194743871688843, -0.9834083318710327, -0.9473422765731812, -0.9112761616706848, -0.8752101063728333, -0.8391440510749817, -0.8030779361724854, -0.7670119404792786, -0.730945885181427, -0.6948798298835754, -0.6588137149810791, -0.6227476596832275, -0.586681604385376, -0.5506155490875244, -0.5145494937896729, -0.4784834086894989, -0.44241735339164734, -0.4063512682914734, -0.3702852129936218, -0.33421915769577026, -0.2981530725955963, -0.26208701729774475, -0.2260209321975708, -0.18995487689971924, -0.15388880670070648, -0.11782274395227432, -0.08175668120384216, -0.04569061100482941, -0.00962454080581665, 0.026441514492034912, 0.06250759959220886, 0.09857365489006042, 0.13463972508907318, 0.17070579528808594, 0.2067718505859375, 0.24283792078495026, 0.278903990983963, 0.3149700462818146, 0.3510361313819885, 0.3871021866798401, 0.42316824197769165, 0.4592343270778656, 0.49530038237571716, 0.5313664674758911, 0.5674325227737427, 0.6034985780715942, 0.6395646333694458, 0.6756306886672974, 0.7116967439651489, 0.7477627992630005, 0.783828854560852, 0.8198949694633484, 0.8559610247612, 0.8920270800590515, 0.9280931949615479, 0.9641592502593994]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 5.0, 10.0, 9.0, 13.0, 23.0, 43.0, 79.0, 127.0, 193.0, 329.0, 561.0, 991.0, 1914.0, 3767.0, 7739.0, 17134.0, 38960.0, 91942.0, 208037.0, 314517.0, 202353.0, 89167.0, 38343.0, 16714.0, 7673.0, 3658.0, 1883.0, 998.0, 567.0, 325.0, 176.0, 111.0, 67.0, 41.0, 26.0, 24.0, 11.0, 7.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1583251953125, -0.1535968780517578, -0.14886856079101562, -0.14414024353027344, -0.13941192626953125, -0.13468360900878906, -0.12995529174804688, -0.1252269744873047, -0.1204986572265625, -0.11577033996582031, -0.11104202270507812, -0.10631370544433594, -0.10158538818359375, -0.09685707092285156, -0.09212875366210938, -0.08740043640136719, -0.082672119140625, -0.07794380187988281, -0.07321548461914062, -0.06848716735839844, -0.06375885009765625, -0.05903053283691406, -0.054302215576171875, -0.04957389831542969, -0.0448455810546875, -0.04011726379394531, -0.035388946533203125, -0.030660629272460938, -0.02593231201171875, -0.021203994750976562, -0.016475677490234375, -0.011747360229492188, -0.00701904296875, -0.0022907257080078125, 0.002437591552734375, 0.0071659088134765625, 0.01189422607421875, 0.016622543334960938, 0.021350860595703125, 0.026079177856445312, 0.0308074951171875, 0.03553581237792969, 0.040264129638671875, 0.04499244689941406, 0.04972076416015625, 0.05444908142089844, 0.059177398681640625, 0.06390571594238281, 0.068634033203125, 0.07336235046386719, 0.07809066772460938, 0.08281898498535156, 0.08754730224609375, 0.09227561950683594, 0.09700393676757812, 0.10173225402832031, 0.1064605712890625, 0.11118888854980469, 0.11591720581054688, 0.12064552307128906, 0.12537384033203125, 0.13010215759277344, 0.13483047485351562, 0.1395587921142578, 0.144287109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 8.0, 11.0, 12.0, 29.0, 35.0, 35.0, 45.0, 64.0, 58.0, 61.0, 73.0, 81.0, 85.0, 92.0, 64.0, 63.0, 44.0, 44.0, 26.0, 23.0, 19.0, 11.0, 10.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1756591796875, -0.17171287536621094, -0.16776657104492188, -0.1638202667236328, -0.15987396240234375, -0.1559276580810547, -0.15198135375976562, -0.14803504943847656, -0.1440887451171875, -0.14014244079589844, -0.13619613647460938, -0.1322498321533203, -0.12830352783203125, -0.12435722351074219, -0.12041091918945312, -0.11646461486816406, -0.112518310546875, -0.10857200622558594, -0.10462570190429688, -0.10067939758300781, -0.09673309326171875, -0.09278678894042969, -0.08884048461914062, -0.08489418029785156, -0.0809478759765625, -0.07700157165527344, -0.07305526733398438, -0.06910896301269531, -0.06516265869140625, -0.06121635437011719, -0.057270050048828125, -0.05332374572753906, -0.04937744140625, -0.04543113708496094, -0.041484832763671875, -0.03753852844238281, -0.03359222412109375, -0.029645919799804688, -0.025699615478515625, -0.021753311157226562, -0.0178070068359375, -0.013860702514648438, -0.009914398193359375, -0.0059680938720703125, -0.00202178955078125, 0.0019245147705078125, 0.005870819091796875, 0.009817123413085938, 0.013763427734375, 0.017709732055664062, 0.021656036376953125, 0.025602340698242188, 0.02954864501953125, 0.03349494934082031, 0.037441253662109375, 0.04138755798339844, 0.0453338623046875, 0.04928016662597656, 0.053226470947265625, 0.05717277526855469, 0.06111907958984375, 0.06506538391113281, 0.06901168823242188, 0.07295799255371094, 0.076904296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 10.0, 15.0, 21.0, 32.0, 35.0, 62.0, 75.0, 81.0, 142.0, 228.0, 301.0, 480.0, 665.0, 1173.0, 2067.0, 4199.0, 10803.0, 35712.0, 150266.0, 594309.0, 182443.0, 42591.0, 12481.0, 4761.0, 2227.0, 1153.0, 702.0, 461.0, 306.0, 187.0, 153.0, 107.0, 90.0, 44.0, 30.0, 26.0, 25.0, 21.0, 15.0, 7.0, 13.0, 4.0, 9.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24843215942382812, -0.24002838134765625, -0.23162460327148438, -0.2232208251953125, -0.21481704711914062, -0.20641326904296875, -0.19800949096679688, -0.189605712890625, -0.18120193481445312, -0.17279815673828125, -0.16439437866210938, -0.1559906005859375, -0.14758682250976562, -0.13918304443359375, -0.13077926635742188, -0.12237548828125, -0.11397171020507812, -0.10556793212890625, -0.09716415405273438, -0.0887603759765625, -0.08035659790039062, -0.07195281982421875, -0.06354904174804688, -0.055145263671875, -0.046741485595703125, -0.03833770751953125, -0.029933929443359375, -0.0215301513671875, -0.013126373291015625, -0.00472259521484375, 0.003681182861328125, 0.0120849609375, 0.020488739013671875, 0.02889251708984375, 0.037296295166015625, 0.0457000732421875, 0.054103851318359375, 0.06250762939453125, 0.07091140747070312, 0.079315185546875, 0.08771896362304688, 0.09612274169921875, 0.10452651977539062, 0.1129302978515625, 0.12133407592773438, 0.12973785400390625, 0.13814163208007812, 0.14654541015625, 0.15494918823242188, 0.16335296630859375, 0.17175674438476562, 0.1801605224609375, 0.18856430053710938, 0.19696807861328125, 0.20537185668945312, 0.213775634765625, 0.22217941284179688, 0.23058319091796875, 0.23898696899414062, 0.2473907470703125, 0.2557945251464844, 0.26419830322265625, 0.2726020812988281, 0.281005859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 11.0, 11.0, 14.0, 17.0, 18.0, 23.0, 25.0, 28.0, 26.0, 53.0, 44.0, 37.0, 55.0, 55.0, 55.0, 60.0, 51.0, 52.0, 47.0, 33.0, 40.0, 40.0, 33.0, 33.0, 26.0, 14.0, 17.0, 15.0, 13.0, 14.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.321533203125, -0.3105316162109375, -0.299530029296875, -0.2885284423828125, -0.27752685546875, -0.2665252685546875, -0.255523681640625, -0.2445220947265625, -0.2335205078125, -0.2225189208984375, -0.211517333984375, -0.2005157470703125, -0.18951416015625, -0.1785125732421875, -0.167510986328125, -0.1565093994140625, -0.1455078125, -0.1345062255859375, -0.123504638671875, -0.1125030517578125, -0.10150146484375, -0.0904998779296875, -0.079498291015625, -0.0684967041015625, -0.0574951171875, -0.0464935302734375, -0.035491943359375, -0.0244903564453125, -0.01348876953125, -0.0024871826171875, 0.008514404296875, 0.0195159912109375, 0.030517578125, 0.0415191650390625, 0.052520751953125, 0.0635223388671875, 0.07452392578125, 0.0855255126953125, 0.096527099609375, 0.1075286865234375, 0.1185302734375, 0.1295318603515625, 0.140533447265625, 0.1515350341796875, 0.16253662109375, 0.1735382080078125, 0.184539794921875, 0.1955413818359375, 0.20654296875, 0.2175445556640625, 0.228546142578125, 0.2395477294921875, 0.25054931640625, 0.2615509033203125, 0.272552490234375, 0.2835540771484375, 0.2945556640625, 0.3055572509765625, 0.316558837890625, 0.3275604248046875, 0.33856201171875, 0.3495635986328125, 0.360565185546875, 0.3715667724609375, 0.382568359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 9.0, 24.0, 32.0, 36.0, 85.0, 130.0, 204.0, 368.0, 725.0, 1331.0, 2749.0, 6198.0, 17723.0, 88036.0, 731863.0, 158743.0, 25562.0, 7872.0, 3311.0, 1660.0, 871.0, 424.0, 243.0, 156.0, 68.0, 39.0, 34.0, 17.0, 11.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.18919944763183594, -0.18357467651367188, -0.1779499053955078, -0.17232513427734375, -0.1667003631591797, -0.16107559204101562, -0.15545082092285156, -0.1498260498046875, -0.14420127868652344, -0.13857650756835938, -0.1329517364501953, -0.12732696533203125, -0.12170219421386719, -0.11607742309570312, -0.11045265197753906, -0.104827880859375, -0.09920310974121094, -0.09357833862304688, -0.08795356750488281, -0.08232879638671875, -0.07670402526855469, -0.07107925415039062, -0.06545448303222656, -0.0598297119140625, -0.05420494079589844, -0.048580169677734375, -0.04295539855957031, -0.03733062744140625, -0.03170585632324219, -0.026081085205078125, -0.020456314086914062, -0.01483154296875, -0.009206771850585938, -0.003582000732421875, 0.0020427703857421875, 0.00766754150390625, 0.013292312622070312, 0.018917083740234375, 0.024541854858398438, 0.0301666259765625, 0.03579139709472656, 0.041416168212890625, 0.04704093933105469, 0.05266571044921875, 0.05829048156738281, 0.06391525268554688, 0.06954002380371094, 0.075164794921875, 0.08078956604003906, 0.08641433715820312, 0.09203910827636719, 0.09766387939453125, 0.10328865051269531, 0.10891342163085938, 0.11453819274902344, 0.1201629638671875, 0.12578773498535156, 0.13141250610351562, 0.1370372772216797, 0.14266204833984375, 0.1482868194580078, 0.15391159057617188, 0.15953636169433594, 0.1651611328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 1.0, 7.0, 6.0, 6.0, 10.0, 12.0, 27.0, 34.0, 41.0, 97.0, 151.0, 196.0, 145.0, 102.0, 58.0, 34.0, 20.0, 14.0, 11.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.338689804077148e-05, -8.103623986244202e-05, -7.868558168411255e-05, -7.633492350578308e-05, -7.398426532745361e-05, -7.163360714912415e-05, -6.928294897079468e-05, -6.693229079246521e-05, -6.458163261413574e-05, -6.223097443580627e-05, -5.988031625747681e-05, -5.752965807914734e-05, -5.517899990081787e-05, -5.28283417224884e-05, -5.0477683544158936e-05, -4.812702536582947e-05, -4.57763671875e-05, -4.342570900917053e-05, -4.1075050830841064e-05, -3.87243926525116e-05, -3.637373447418213e-05, -3.402307629585266e-05, -3.167241811752319e-05, -2.9321759939193726e-05, -2.6971101760864258e-05, -2.462044358253479e-05, -2.2269785404205322e-05, -1.9919127225875854e-05, -1.7568469047546387e-05, -1.5217810869216919e-05, -1.2867152690887451e-05, -1.0516494512557983e-05, -8.165836334228516e-06, -5.815178155899048e-06, -3.46451997756958e-06, -1.1138617992401123e-06, 1.2367963790893555e-06, 3.5874545574188232e-06, 5.938112735748291e-06, 8.288770914077759e-06, 1.0639429092407227e-05, 1.2990087270736694e-05, 1.5340745449066162e-05, 1.769140362739563e-05, 2.0042061805725098e-05, 2.2392719984054565e-05, 2.4743378162384033e-05, 2.70940363407135e-05, 2.944469451904297e-05, 3.1795352697372437e-05, 3.4146010875701904e-05, 3.649666905403137e-05, 3.884732723236084e-05, 4.119798541069031e-05, 4.3548643589019775e-05, 4.589930176734924e-05, 4.824995994567871e-05, 5.060061812400818e-05, 5.2951276302337646e-05, 5.5301934480667114e-05, 5.765259265899658e-05, 6.000325083732605e-05, 6.235390901565552e-05, 6.470456719398499e-05, 6.705522537231445e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 13.0, 10.0, 17.0, 22.0, 33.0, 38.0, 73.0, 117.0, 200.0, 366.0, 672.0, 1435.0, 3573.0, 9848.0, 37850.0, 315027.0, 608519.0, 50922.0, 11980.0, 4258.0, 1753.0, 851.0, 404.0, 223.0, 119.0, 68.0, 54.0, 31.0, 22.0, 13.0, 9.0, 5.0, 6.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1597900390625, -0.154296875, -0.1488037109375, -0.143310546875, -0.1378173828125, -0.13232421875, -0.1268310546875, -0.121337890625, -0.1158447265625, -0.1103515625, -0.1048583984375, -0.099365234375, -0.0938720703125, -0.08837890625, -0.0828857421875, -0.077392578125, -0.0718994140625, -0.06640625, -0.0609130859375, -0.055419921875, -0.0499267578125, -0.04443359375, -0.0389404296875, -0.033447265625, -0.0279541015625, -0.0224609375, -0.0169677734375, -0.011474609375, -0.0059814453125, -0.00048828125, 0.0050048828125, 0.010498046875, 0.0159912109375, 0.021484375, 0.0269775390625, 0.032470703125, 0.0379638671875, 0.04345703125, 0.0489501953125, 0.054443359375, 0.0599365234375, 0.0654296875, 0.0709228515625, 0.076416015625, 0.0819091796875, 0.08740234375, 0.0928955078125, 0.098388671875, 0.1038818359375, 0.109375, 0.1148681640625, 0.120361328125, 0.1258544921875, 0.13134765625, 0.1368408203125, 0.142333984375, 0.1478271484375, 0.1533203125, 0.1588134765625, 0.164306640625, 0.1697998046875, 0.17529296875, 0.1807861328125, 0.186279296875, 0.1917724609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 5.0, 4.0, 3.0, 5.0, 11.0, 15.0, 16.0, 29.0, 24.0, 42.0, 57.0, 71.0, 74.0, 87.0, 89.0, 76.0, 73.0, 53.0, 51.0, 44.0, 38.0, 21.0, 30.0, 12.0, 14.0, 12.0, 9.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1263427734375, -0.12218666076660156, -0.11803054809570312, -0.11387443542480469, -0.10971832275390625, -0.10556221008300781, -0.10140609741210938, -0.09724998474121094, -0.0930938720703125, -0.08893775939941406, -0.08478164672851562, -0.08062553405761719, -0.07646942138671875, -0.07231330871582031, -0.06815719604492188, -0.06400108337402344, -0.059844970703125, -0.05568885803222656, -0.051532745361328125, -0.04737663269042969, -0.04322052001953125, -0.03906440734863281, -0.034908294677734375, -0.030752182006835938, -0.0265960693359375, -0.022439956665039062, -0.018283843994140625, -0.014127731323242188, -0.00997161865234375, -0.0058155059814453125, -0.001659393310546875, 0.0024967193603515625, 0.00665283203125, 0.010808944702148438, 0.014965057373046875, 0.019121170043945312, 0.02327728271484375, 0.027433395385742188, 0.031589508056640625, 0.03574562072753906, 0.0399017333984375, 0.04405784606933594, 0.048213958740234375, 0.05237007141113281, 0.05652618408203125, 0.06068229675292969, 0.06483840942382812, 0.06899452209472656, 0.073150634765625, 0.07730674743652344, 0.08146286010742188, 0.08561897277832031, 0.08977508544921875, 0.09393119812011719, 0.09808731079101562, 0.10224342346191406, 0.1063995361328125, 0.11055564880371094, 0.11471176147460938, 0.11886787414550781, 0.12302398681640625, 0.1271800994873047, 0.13133621215820312, 0.13549232482910156, 0.1396484375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 14.0, 10.0, 32.0, 85.0, 152.0, 295.0, 218.0, 115.0, 37.0, 17.0, 14.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4472243785858154, -2.309879779815674, -2.1725351810455322, -2.0351905822753906, -1.8978461027145386, -1.760501503944397, -1.623157024383545, -1.4858124256134033, -1.3484678268432617, -1.2111232280731201, -1.0737786293029785, -0.9364341497421265, -0.7990895509719849, -0.6617449522018433, -0.5244004130363464, -0.3870558738708496, -0.249711275100708, -0.1123667061328888, 0.02497786283493042, 0.16232243180274963, 0.29966700077056885, 0.43701159954071045, 0.5743561387062073, 0.7117006778717041, 0.8490452766418457, 0.9863898754119873, 1.123734474182129, 1.261078953742981, 1.3984235525131226, 1.5357681512832642, 1.6731126308441162, 1.8104572296142578, 1.9478015899658203, 2.085146188735962, 2.2224907875061035, 2.359835386276245, 2.4971799850463867, 2.634524345397949, 2.771868944168091, 2.9092135429382324, 3.046558141708374, 3.1839027404785156, 3.3212473392486572, 3.458591938018799, 3.5959362983703613, 3.733281135559082, 3.8706254959106445, 4.007969856262207, 4.145314693450928, 4.28265905380249, 4.420003890991211, 4.557348251342773, 4.694693088531494, 4.832037448883057, 4.969382286071777, 5.10672664642334, 5.244071006774902, 5.381415367126465, 5.5187602043151855, 5.656104564666748, 5.793449401855469, 5.930793762207031, 6.068138599395752, 6.2054829597473145, 6.342827796936035]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 5.0, 4.0, 16.0, 11.0, 24.0, 20.0, 22.0, 15.0, 37.0, 27.0, 29.0, 36.0, 43.0, 68.0, 70.0, 83.0, 88.0, 65.0, 34.0, 45.0, 42.0, 23.0, 19.0, 28.0, 25.0, 24.0, 19.0, 8.0, 11.0, 10.0, 6.0, 3.0, 5.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6975972652435303, -1.6501396894454956, -1.602682113647461, -1.5552245378494263, -1.5077669620513916, -1.4603092670440674, -1.4128518104553223, -1.365394115447998, -1.3179365396499634, -1.2704789638519287, -1.223021388053894, -1.1755638122558594, -1.1281062364578247, -1.08064866065979, -1.0331909656524658, -0.9857333898544312, -0.9382758736610413, -0.8908182978630066, -0.8433607220649719, -0.7959030866622925, -0.7484455108642578, -0.7009879350662231, -0.6535303592681885, -0.6060727834701538, -0.5586152076721191, -0.5111576318740845, -0.4637000262737274, -0.41624245047569275, -0.3687848448753357, -0.321327269077301, -0.27386969327926636, -0.2264120876789093, -0.17895448207855225, -0.13149689137935638, -0.08403930813074112, -0.036581724882125854, 0.010875865817070007, 0.05833345651626587, 0.10579103231430054, 0.1532486379146576, 0.20070621371269226, 0.24816380441188812, 0.295621395111084, 0.34307897090911865, 0.3905365467071533, 0.4379941523075104, 0.48545172810554504, 0.5329093337059021, 0.5803669095039368, 0.6278244853019714, 0.6752820611000061, 0.7227396965026855, 0.7701972723007202, 0.8176548480987549, 0.8651124238967896, 0.9125699996948242, 0.9600275754928589, 1.0074851512908936, 1.0549427270889282, 1.102400302886963, 1.1498578786849976, 1.1973154544830322, 1.2447731494903564, 1.2922307252883911, 1.3396883010864258]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 10.0, 10.0, 13.0, 22.0, 20.0, 24.0, 40.0, 49.0, 85.0, 133.0, 193.0, 340.0, 582.0, 1351.0, 3430.0, 10560.0, 48214.0, 505625.0, 3137786.0, 424914.0, 44130.0, 10590.0, 3353.0, 1274.0, 591.0, 329.0, 176.0, 131.0, 87.0, 63.0, 42.0, 26.0, 14.0, 21.0, 14.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1571044921875, -0.15158653259277344, -0.14606857299804688, -0.1405506134033203, -0.13503265380859375, -0.1295146942138672, -0.12399673461914062, -0.11847877502441406, -0.1129608154296875, -0.10744285583496094, -0.10192489624023438, -0.09640693664550781, -0.09088897705078125, -0.08537101745605469, -0.07985305786132812, -0.07433509826660156, -0.068817138671875, -0.06329917907714844, -0.057781219482421875, -0.05226325988769531, -0.04674530029296875, -0.04122734069824219, -0.035709381103515625, -0.030191421508789062, -0.0246734619140625, -0.019155502319335938, -0.013637542724609375, -0.008119583129882812, -0.00260162353515625, 0.0029163360595703125, 0.008434295654296875, 0.013952255249023438, 0.01947021484375, 0.024988174438476562, 0.030506134033203125, 0.03602409362792969, 0.04154205322265625, 0.04706001281738281, 0.052577972412109375, 0.05809593200683594, 0.0636138916015625, 0.06913185119628906, 0.07464981079101562, 0.08016777038574219, 0.08568572998046875, 0.09120368957519531, 0.09672164916992188, 0.10223960876464844, 0.107757568359375, 0.11327552795410156, 0.11879348754882812, 0.12431144714355469, 0.12982940673828125, 0.1353473663330078, 0.14086532592773438, 0.14638328552246094, 0.1519012451171875, 0.15741920471191406, 0.16293716430664062, 0.1684551239013672, 0.17397308349609375, 0.1794910430908203, 0.18500900268554688, 0.19052696228027344, 0.196044921875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 16.0, 20.0, 29.0, 43.0, 48.0, 57.0, 69.0, 76.0, 90.0, 78.0, 88.0, 68.0, 81.0, 55.0, 40.0, 35.0, 27.0, 24.0, 20.0, 13.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.16915035247802734, -0.1650829315185547, -0.16101551055908203, -0.15694808959960938, -0.15288066864013672, -0.14881324768066406, -0.1447458267211914, -0.14067840576171875, -0.1366109848022461, -0.13254356384277344, -0.12847614288330078, -0.12440872192382812, -0.12034130096435547, -0.11627388000488281, -0.11220645904541016, -0.1081390380859375, -0.10407161712646484, -0.10000419616699219, -0.09593677520751953, -0.09186935424804688, -0.08780193328857422, -0.08373451232910156, -0.0796670913696289, -0.07559967041015625, -0.0715322494506836, -0.06746482849121094, -0.06339740753173828, -0.059329986572265625, -0.05526256561279297, -0.05119514465332031, -0.047127723693847656, -0.043060302734375, -0.038992881774902344, -0.03492546081542969, -0.03085803985595703, -0.026790618896484375, -0.02272319793701172, -0.018655776977539062, -0.014588356018066406, -0.01052093505859375, -0.006453514099121094, -0.0023860931396484375, 0.0016813278198242188, 0.005748748779296875, 0.009816169738769531, 0.013883590698242188, 0.017951011657714844, 0.0220184326171875, 0.026085853576660156, 0.030153274536132812, 0.03422069549560547, 0.038288116455078125, 0.04235553741455078, 0.04642295837402344, 0.050490379333496094, 0.05455780029296875, 0.058625221252441406, 0.06269264221191406, 0.06676006317138672, 0.07082748413085938, 0.07489490509033203, 0.07896232604980469, 0.08302974700927734, 0.08709716796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 15.0, 6.0, 12.0, 20.0, 24.0, 26.0, 38.0, 63.0, 77.0, 82.0, 151.0, 214.0, 376.0, 763.0, 2743.0, 74205.0, 4063586.0, 47533.0, 2512.0, 741.0, 392.0, 225.0, 124.0, 96.0, 80.0, 42.0, 33.0, 25.0, 20.0, 21.0, 9.0, 5.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6765518188476562, -0.6563262939453125, -0.6361007690429688, -0.615875244140625, -0.5956497192382812, -0.5754241943359375, -0.5551986694335938, -0.53497314453125, -0.5147476196289062, -0.4945220947265625, -0.47429656982421875, -0.454071044921875, -0.43384552001953125, -0.4136199951171875, -0.39339447021484375, -0.3731689453125, -0.35294342041015625, -0.3327178955078125, -0.31249237060546875, -0.292266845703125, -0.27204132080078125, -0.2518157958984375, -0.23159027099609375, -0.21136474609375, -0.19113922119140625, -0.1709136962890625, -0.15068817138671875, -0.130462646484375, -0.11023712158203125, -0.0900115966796875, -0.06978607177734375, -0.049560546875, -0.02933502197265625, -0.0091094970703125, 0.01111602783203125, 0.031341552734375, 0.05156707763671875, 0.0717926025390625, 0.09201812744140625, 0.11224365234375, 0.13246917724609375, 0.1526947021484375, 0.17292022705078125, 0.193145751953125, 0.21337127685546875, 0.2335968017578125, 0.25382232666015625, 0.2740478515625, 0.29427337646484375, 0.3144989013671875, 0.33472442626953125, 0.354949951171875, 0.37517547607421875, 0.3954010009765625, 0.41562652587890625, 0.43585205078125, 0.45607757568359375, 0.4763031005859375, 0.49652862548828125, 0.516754150390625, 0.5369796752929688, 0.5572052001953125, 0.5774307250976562, 0.59765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 14.0, 19.0, 34.0, 42.0, 87.0, 152.0, 274.0, 522.0, 903.0, 898.0, 504.0, 256.0, 145.0, 64.0, 44.0, 30.0, 25.0, 12.0, 12.0, 6.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.389404296875, -0.3801155090332031, -0.37082672119140625, -0.3615379333496094, -0.3522491455078125, -0.3429603576660156, -0.33367156982421875, -0.3243827819824219, -0.315093994140625, -0.3058052062988281, -0.29651641845703125, -0.2872276306152344, -0.2779388427734375, -0.2686500549316406, -0.25936126708984375, -0.2500724792480469, -0.24078369140625, -0.23149490356445312, -0.22220611572265625, -0.21291732788085938, -0.2036285400390625, -0.19433975219726562, -0.18505096435546875, -0.17576217651367188, -0.166473388671875, -0.15718460083007812, -0.14789581298828125, -0.13860702514648438, -0.1293182373046875, -0.12002944946289062, -0.11074066162109375, -0.10145187377929688, -0.0921630859375, -0.08287429809570312, -0.07358551025390625, -0.06429672241210938, -0.0550079345703125, -0.045719146728515625, -0.03643035888671875, -0.027141571044921875, -0.017852783203125, -0.008563995361328125, 0.00072479248046875, 0.010013580322265625, 0.0193023681640625, 0.028591156005859375, 0.03787994384765625, 0.047168731689453125, 0.05645751953125, 0.06574630737304688, 0.07503509521484375, 0.08432388305664062, 0.0936126708984375, 0.10290145874023438, 0.11219024658203125, 0.12147903442382812, 0.130767822265625, 0.14005661010742188, 0.14934539794921875, 0.15863418579101562, 0.1679229736328125, 0.17721176147460938, 0.18650054931640625, 0.19578933715820312, 0.205078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 8.0, 10.0, 21.0, 54.0, 120.0, 206.0, 244.0, 155.0, 91.0, 36.0, 18.0, 14.0, 9.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.344862461090088, -4.228235721588135, -4.11160945892334, -3.9949827194213867, -3.8783559799194336, -3.7617294788360596, -3.6451029777526855, -3.5284762382507324, -3.4118494987487793, -3.2952229976654053, -3.178596258163452, -3.061969757080078, -2.945343017578125, -2.828716516494751, -2.712090015411377, -2.595463275909424, -2.47883677482605, -2.362210273742676, -2.2455835342407227, -2.1289570331573486, -2.0123302936553955, -1.8957037925720215, -1.779077172279358, -1.6624505519866943, -1.5458239316940308, -1.4291973114013672, -1.3125706911087036, -1.19594407081604, -1.079317569732666, -0.9626908898353577, -0.8460643291473389, -0.7294377088546753, -0.6128108501434326, -0.49618422985076904, -0.37955763936042786, -0.26293104887008667, -0.1463044285774231, -0.02967780828475952, 0.08694875240325928, 0.20357537269592285, 0.3202019929885864, 0.43682861328125, 0.5534552335739136, 0.6700817942619324, 0.786708414554596, 0.9033350348472595, 1.0199615955352783, 1.136588215827942, 1.2532148361206055, 1.369841456413269, 1.4864680767059326, 1.6030945777893066, 1.7197213172912598, 1.8363478183746338, 1.9529744386672974, 2.069601058959961, 2.186227798461914, 2.302854299545288, 2.419481039047241, 2.5361075401306152, 2.6527342796325684, 2.7693607807159424, 2.8859872817993164, 3.0026140213012695, 3.1192405223846436]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 7.0, 2.0, 2.0, 9.0, 14.0, 12.0, 12.0, 8.0, 12.0, 15.0, 27.0, 22.0, 27.0, 38.0, 51.0, 46.0, 48.0, 47.0, 36.0, 51.0, 32.0, 49.0, 47.0, 41.0, 35.0, 41.0, 32.0, 37.0, 33.0, 25.0, 29.0, 18.0, 9.0, 18.0, 14.0, 16.0, 7.0, 12.0, 10.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8209830522537231, -0.7906261682510376, -0.760269284248352, -0.7299124002456665, -0.6995554566383362, -0.6691985726356506, -0.6388416886329651, -0.6084848046302795, -0.578127920627594, -0.5477710366249084, -0.5174141526222229, -0.48705723881721497, -0.4567003548145294, -0.4263434410095215, -0.39598655700683594, -0.3656296730041504, -0.33527275919914246, -0.3049158751964569, -0.274558961391449, -0.24420207738876343, -0.21384519338607788, -0.18348829448223114, -0.1531313955783844, -0.12277451157569885, -0.09241761267185211, -0.06206072121858597, -0.031703826040029526, -0.0013469308614730835, 0.02900996059179306, 0.059366852045059204, 0.08972375094890594, 0.12008063495159149, 0.15043753385543823, 0.18079443275928497, 0.21115131676197052, 0.24150821566581726, 0.2718650996685028, 0.30222201347351074, 0.3325788974761963, 0.36293578147888184, 0.3932926654815674, 0.42364954948425293, 0.45400646328926086, 0.4843633472919464, 0.5147202610969543, 0.5450771450996399, 0.5754340291023254, 0.605790913105011, 0.6361478567123413, 0.6665047407150269, 0.6968616247177124, 0.727218508720398, 0.7575754523277283, 0.7879323363304138, 0.8182892203330994, 0.8486461043357849, 0.8790029883384705, 0.909359872341156, 0.9397167563438416, 0.9700736999511719, 1.0004305839538574, 1.030787467956543, 1.0611443519592285, 1.091501235961914, 1.1218581199645996]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 11.0, 9.0, 15.0, 16.0, 30.0, 41.0, 59.0, 87.0, 144.0, 237.0, 365.0, 626.0, 1090.0, 1961.0, 3845.0, 8193.0, 17820.0, 41988.0, 102357.0, 224001.0, 304088.0, 193282.0, 84432.0, 34394.0, 14931.0, 6936.0, 3397.0, 1749.0, 1010.0, 531.0, 327.0, 180.0, 141.0, 90.0, 52.0, 36.0, 22.0, 16.0, 19.0, 15.0, 4.0, 10.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1444091796875, -0.139495849609375, -0.13458251953125, -0.129669189453125, -0.124755859375, -0.119842529296875, -0.11492919921875, -0.110015869140625, -0.1051025390625, -0.100189208984375, -0.09527587890625, -0.090362548828125, -0.08544921875, -0.080535888671875, -0.07562255859375, -0.070709228515625, -0.0657958984375, -0.060882568359375, -0.05596923828125, -0.051055908203125, -0.046142578125, -0.041229248046875, -0.03631591796875, -0.031402587890625, -0.0264892578125, -0.021575927734375, -0.01666259765625, -0.011749267578125, -0.0068359375, -0.001922607421875, 0.00299072265625, 0.007904052734375, 0.0128173828125, 0.017730712890625, 0.02264404296875, 0.027557373046875, 0.032470703125, 0.037384033203125, 0.04229736328125, 0.047210693359375, 0.0521240234375, 0.057037353515625, 0.06195068359375, 0.066864013671875, 0.07177734375, 0.076690673828125, 0.08160400390625, 0.086517333984375, 0.0914306640625, 0.096343994140625, 0.10125732421875, 0.106170654296875, 0.111083984375, 0.115997314453125, 0.12091064453125, 0.125823974609375, 0.1307373046875, 0.135650634765625, 0.14056396484375, 0.145477294921875, 0.150390625, 0.155303955078125, 0.16021728515625, 0.165130615234375, 0.1700439453125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 12.0, 7.0, 6.0, 11.0, 36.0, 30.0, 29.0, 42.0, 51.0, 73.0, 67.0, 73.0, 60.0, 62.0, 66.0, 78.0, 59.0, 51.0, 48.0, 39.0, 25.0, 22.0, 23.0, 11.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16796875, -0.1639881134033203, -0.16000747680664062, -0.15602684020996094, -0.15204620361328125, -0.14806556701660156, -0.14408493041992188, -0.1401042938232422, -0.1361236572265625, -0.1321430206298828, -0.12816238403320312, -0.12418174743652344, -0.12020111083984375, -0.11622047424316406, -0.11223983764648438, -0.10825920104980469, -0.104278564453125, -0.10029792785644531, -0.09631729125976562, -0.09233665466308594, -0.08835601806640625, -0.08437538146972656, -0.08039474487304688, -0.07641410827636719, -0.0724334716796875, -0.06845283508300781, -0.06447219848632812, -0.06049156188964844, -0.05651092529296875, -0.05253028869628906, -0.048549652099609375, -0.04456901550292969, -0.04058837890625, -0.03660774230957031, -0.032627105712890625, -0.028646469116210938, -0.02466583251953125, -0.020685195922851562, -0.016704559326171875, -0.012723922729492188, -0.0087432861328125, -0.0047626495361328125, -0.000782012939453125, 0.0031986236572265625, 0.00717926025390625, 0.011159896850585938, 0.015140533447265625, 0.019121170043945312, 0.023101806640625, 0.027082443237304688, 0.031063079833984375, 0.03504371643066406, 0.03902435302734375, 0.04300498962402344, 0.046985626220703125, 0.05096626281738281, 0.0549468994140625, 0.05892753601074219, 0.06290817260742188, 0.06688880920410156, 0.07086944580078125, 0.07485008239746094, 0.07883071899414062, 0.08281135559082031, 0.0867919921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 9.0, 22.0, 35.0, 49.0, 83.0, 160.0, 329.0, 728.0, 1656.0, 5048.0, 24248.0, 248295.0, 693257.0, 61087.0, 9033.0, 2536.0, 984.0, 482.0, 220.0, 114.0, 67.0, 29.0, 26.0, 13.0, 12.0, 5.0, 5.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468994140625, -0.4539680480957031, -0.43894195556640625, -0.4239158630371094, -0.4088897705078125, -0.3938636779785156, -0.37883758544921875, -0.3638114929199219, -0.348785400390625, -0.3337593078613281, -0.31873321533203125, -0.3037071228027344, -0.2886810302734375, -0.2736549377441406, -0.25862884521484375, -0.24360275268554688, -0.22857666015625, -0.21355056762695312, -0.19852447509765625, -0.18349838256835938, -0.1684722900390625, -0.15344619750976562, -0.13842010498046875, -0.12339401245117188, -0.108367919921875, -0.09334182739257812, -0.07831573486328125, -0.06328964233398438, -0.0482635498046875, -0.033237457275390625, -0.01821136474609375, -0.003185272216796875, 0.0118408203125, 0.026866912841796875, 0.04189300537109375, 0.056919097900390625, 0.0719451904296875, 0.08697128295898438, 0.10199737548828125, 0.11702346801757812, 0.132049560546875, 0.14707565307617188, 0.16210174560546875, 0.17712783813476562, 0.1921539306640625, 0.20718002319335938, 0.22220611572265625, 0.23723220825195312, 0.25225830078125, 0.2672843933105469, 0.28231048583984375, 0.2973365783691406, 0.3123626708984375, 0.3273887634277344, 0.34241485595703125, 0.3574409484863281, 0.372467041015625, 0.3874931335449219, 0.40251922607421875, 0.4175453186035156, 0.4325714111328125, 0.4475975036621094, 0.46262359619140625, 0.4776496887207031, 0.49267578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 6.0, 16.0, 6.0, 10.0, 16.0, 15.0, 19.0, 34.0, 28.0, 43.0, 42.0, 52.0, 53.0, 63.0, 66.0, 62.0, 65.0, 47.0, 43.0, 50.0, 34.0, 40.0, 39.0, 30.0, 25.0, 30.0, 20.0, 8.0, 10.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.44189453125, -0.42951202392578125, -0.4171295166015625, -0.40474700927734375, -0.392364501953125, -0.37998199462890625, -0.3675994873046875, -0.35521697998046875, -0.34283447265625, -0.33045196533203125, -0.3180694580078125, -0.30568695068359375, -0.293304443359375, -0.28092193603515625, -0.2685394287109375, -0.25615692138671875, -0.2437744140625, -0.23139190673828125, -0.2190093994140625, -0.20662689208984375, -0.194244384765625, -0.18186187744140625, -0.1694793701171875, -0.15709686279296875, -0.14471435546875, -0.13233184814453125, -0.1199493408203125, -0.10756683349609375, -0.095184326171875, -0.08280181884765625, -0.0704193115234375, -0.05803680419921875, -0.045654296875, -0.03327178955078125, -0.0208892822265625, -0.00850677490234375, 0.003875732421875, 0.01625823974609375, 0.0286407470703125, 0.04102325439453125, 0.05340576171875, 0.06578826904296875, 0.0781707763671875, 0.09055328369140625, 0.102935791015625, 0.11531829833984375, 0.1277008056640625, 0.14008331298828125, 0.1524658203125, 0.16484832763671875, 0.1772308349609375, 0.18961334228515625, 0.201995849609375, 0.21437835693359375, 0.2267608642578125, 0.23914337158203125, 0.25152587890625, 0.26390838623046875, 0.2762908935546875, 0.28867340087890625, 0.301055908203125, 0.31343841552734375, 0.3258209228515625, 0.33820343017578125, 0.3505859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 3.0, 7.0, 4.0, 12.0, 12.0, 21.0, 21.0, 25.0, 35.0, 65.0, 68.0, 92.0, 149.0, 195.0, 311.0, 431.0, 709.0, 1088.0, 1799.0, 3080.0, 6012.0, 13623.0, 40269.0, 189140.0, 642558.0, 101035.0, 26136.0, 10176.0, 4666.0, 2520.0, 1573.0, 898.0, 571.0, 362.0, 241.0, 182.0, 132.0, 91.0, 80.0, 42.0, 32.0, 29.0, 16.0, 17.0, 8.0, 11.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1441650390625, -0.13907432556152344, -0.13398361206054688, -0.1288928985595703, -0.12380218505859375, -0.11871147155761719, -0.11362075805664062, -0.10853004455566406, -0.1034393310546875, -0.09834861755371094, -0.09325790405273438, -0.08816719055175781, -0.08307647705078125, -0.07798576354980469, -0.07289505004882812, -0.06780433654785156, -0.062713623046875, -0.05762290954589844, -0.052532196044921875, -0.04744148254394531, -0.04235076904296875, -0.03726005554199219, -0.032169342041015625, -0.027078628540039062, -0.0219879150390625, -0.016897201538085938, -0.011806488037109375, -0.0067157745361328125, -0.00162506103515625, 0.0034656524658203125, 0.008556365966796875, 0.013647079467773438, 0.01873779296875, 0.023828506469726562, 0.028919219970703125, 0.03400993347167969, 0.03910064697265625, 0.04419136047363281, 0.049282073974609375, 0.05437278747558594, 0.0594635009765625, 0.06455421447753906, 0.06964492797851562, 0.07473564147949219, 0.07982635498046875, 0.08491706848144531, 0.09000778198242188, 0.09509849548339844, 0.100189208984375, 0.10527992248535156, 0.11037063598632812, 0.11546134948730469, 0.12055206298828125, 0.1256427764892578, 0.13073348999023438, 0.13582420349121094, 0.1409149169921875, 0.14600563049316406, 0.15109634399414062, 0.1561870574951172, 0.16127777099609375, 0.1663684844970703, 0.17145919799804688, 0.17654991149902344, 0.181640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 18.0, 44.0, 146.0, 335.0, 265.0, 91.0, 36.0, 15.0, 13.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021409988403320312, -0.00020827725529670715, -0.00020245462656021118, -0.0001966319978237152, -0.00019080936908721924, -0.00018498674035072327, -0.0001791641116142273, -0.00017334148287773132, -0.00016751885414123535, -0.00016169622540473938, -0.0001558735966682434, -0.00015005096793174744, -0.00014422833919525146, -0.0001384057104587555, -0.00013258308172225952, -0.00012676045298576355, -0.00012093782424926758, -0.0001151151955127716, -0.00010929256677627563, -0.00010346993803977966, -9.764730930328369e-05, -9.182468056678772e-05, -8.600205183029175e-05, -8.017942309379578e-05, -7.43567943572998e-05, -6.853416562080383e-05, -6.271153688430786e-05, -5.688890814781189e-05, -5.106627941131592e-05, -4.5243650674819946e-05, -3.9421021938323975e-05, -3.3598393201828e-05, -2.777576446533203e-05, -2.195313572883606e-05, -1.6130506992340088e-05, -1.0307878255844116e-05, -4.4852495193481445e-06, 1.3373792171478271e-06, 7.160007953643799e-06, 1.298263669013977e-05, 1.8805265426635742e-05, 2.4627894163131714e-05, 3.0450522899627686e-05, 3.627315163612366e-05, 4.209578037261963e-05, 4.79184091091156e-05, 5.374103784561157e-05, 5.9563666582107544e-05, 6.538629531860352e-05, 7.120892405509949e-05, 7.703155279159546e-05, 8.285418152809143e-05, 8.86768102645874e-05, 9.449943900108337e-05, 0.00010032206773757935, 0.00010614469647407532, 0.00011196732521057129, 0.00011778995394706726, 0.00012361258268356323, 0.0001294352114200592, 0.00013525784015655518, 0.00014108046889305115, 0.00014690309762954712, 0.0001527257263660431, 0.00015854835510253906]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 8.0, 11.0, 6.0, 15.0, 22.0, 26.0, 39.0, 59.0, 122.0, 164.0, 256.0, 464.0, 834.0, 1634.0, 3416.0, 8229.0, 25583.0, 127602.0, 716812.0, 123192.0, 24842.0, 8060.0, 3349.0, 1664.0, 896.0, 469.0, 277.0, 170.0, 101.0, 53.0, 52.0, 35.0, 31.0, 12.0, 8.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20703125, -0.2008495330810547, -0.19466781616210938, -0.18848609924316406, -0.18230438232421875, -0.17612266540527344, -0.16994094848632812, -0.1637592315673828, -0.1575775146484375, -0.1513957977294922, -0.14521408081054688, -0.13903236389160156, -0.13285064697265625, -0.12666893005371094, -0.12048721313476562, -0.11430549621582031, -0.108123779296875, -0.10194206237792969, -0.09576034545898438, -0.08957862854003906, -0.08339691162109375, -0.07721519470214844, -0.07103347778320312, -0.06485176086425781, -0.0586700439453125, -0.05248832702636719, -0.046306610107421875, -0.04012489318847656, -0.03394317626953125, -0.027761459350585938, -0.021579742431640625, -0.015398025512695312, -0.00921630859375, -0.0030345916748046875, 0.003147125244140625, 0.009328842163085938, 0.01551055908203125, 0.021692276000976562, 0.027873992919921875, 0.03405570983886719, 0.0402374267578125, 0.04641914367675781, 0.052600860595703125, 0.05878257751464844, 0.06496429443359375, 0.07114601135253906, 0.07732772827148438, 0.08350944519042969, 0.089691162109375, 0.09587287902832031, 0.10205459594726562, 0.10823631286621094, 0.11441802978515625, 0.12059974670410156, 0.12678146362304688, 0.1329631805419922, 0.1391448974609375, 0.1453266143798828, 0.15150833129882812, 0.15769004821777344, 0.16387176513671875, 0.17005348205566406, 0.17623519897460938, 0.1824169158935547, 0.1885986328125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 11.0, 14.0, 27.0, 24.0, 38.0, 59.0, 81.0, 118.0, 137.0, 134.0, 113.0, 70.0, 47.0, 25.0, 16.0, 19.0, 8.0, 7.0, 8.0, 5.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.215576171875, -0.20904159545898438, -0.20250701904296875, -0.19597244262695312, -0.1894378662109375, -0.18290328979492188, -0.17636871337890625, -0.16983413696289062, -0.163299560546875, -0.15676498413085938, -0.15023040771484375, -0.14369583129882812, -0.1371612548828125, -0.13062667846679688, -0.12409210205078125, -0.11755752563476562, -0.11102294921875, -0.10448837280273438, -0.09795379638671875, -0.09141921997070312, -0.0848846435546875, -0.07835006713867188, -0.07181549072265625, -0.06528091430664062, -0.058746337890625, -0.052211761474609375, -0.04567718505859375, -0.039142608642578125, -0.0326080322265625, -0.026073455810546875, -0.01953887939453125, -0.013004302978515625, -0.0064697265625, 6.4849853515625e-05, 0.00659942626953125, 0.013134002685546875, 0.0196685791015625, 0.026203155517578125, 0.03273773193359375, 0.039272308349609375, 0.045806884765625, 0.052341461181640625, 0.05887603759765625, 0.06541061401367188, 0.0719451904296875, 0.07847976684570312, 0.08501434326171875, 0.09154891967773438, 0.09808349609375, 0.10461807250976562, 0.11115264892578125, 0.11768722534179688, 0.1242218017578125, 0.13075637817382812, 0.13729095458984375, 0.14382553100585938, 0.150360107421875, 0.15689468383789062, 0.16342926025390625, 0.16996383666992188, 0.1764984130859375, 0.18303298950195312, 0.18956756591796875, 0.19610214233398438, 0.20263671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 14.0, 28.0, 61.0, 137.0, 348.0, 206.0, 105.0, 46.0, 22.0, 15.0, 9.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609805107116699, -4.442532539367676, -4.275259494781494, -4.107986927032471, -3.940713882446289, -3.7734413146972656, -3.606168508529663, -3.4388957023620605, -3.271622896194458, -3.1043500900268555, -2.937077283859253, -2.7698044776916504, -2.602531909942627, -2.4352588653564453, -2.267986297607422, -2.1007134914398193, -1.9334406852722168, -1.7661678791046143, -1.5988950729370117, -1.4316223859786987, -1.2643495798110962, -1.0970767736434937, -0.9298040866851807, -0.7625312805175781, -0.5952584743499756, -0.42798569798469543, -0.2607129216194153, -0.09344017505645752, 0.07383263111114502, 0.24110543727874756, 0.40837812423706055, 0.5756509304046631, 0.7429237365722656, 0.9101965427398682, 1.0774693489074707, 1.2447420358657837, 1.4120148420333862, 1.5792876482009888, 1.7465603351593018, 1.9138331413269043, 2.081105947494507, 2.2483787536621094, 2.415651559829712, 2.5829243659973145, 2.750196933746338, 2.9174699783325195, 3.084742546081543, 3.2520153522491455, 3.419288158416748, 3.5865609645843506, 3.753833770751953, 3.9211063385009766, 4.088379383087158, 4.255651950836182, 4.422924995422363, 4.590197563171387, 4.75747013092041, 4.924742698669434, 5.092015743255615, 5.259288311004639, 5.42656135559082, 5.593833923339844, 5.761106491088867, 5.928379535675049, 6.0956525802612305]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 3.0, 5.0, 7.0, 4.0, 6.0, 5.0, 10.0, 4.0, 10.0, 8.0, 17.0, 18.0, 17.0, 26.0, 17.0, 16.0, 26.0, 20.0, 30.0, 38.0, 32.0, 32.0, 58.0, 76.0, 88.0, 55.0, 43.0, 31.0, 43.0, 24.0, 31.0, 25.0, 18.0, 25.0, 15.0, 17.0, 17.0, 12.0, 13.0, 13.0, 9.0, 9.0, 11.0, 6.0, 1.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130967617034912, -1.0895479917526245, -1.048128366470337, -1.0067087411880493, -0.9652891159057617, -0.9238694906234741, -0.8824498653411865, -0.8410302400588989, -0.7996106147766113, -0.7581909894943237, -0.7167713642120361, -0.6753517389297485, -0.6339321136474609, -0.5925124883651733, -0.5510928630828857, -0.5096732378005981, -0.4682536721229553, -0.4268340468406677, -0.3854144215583801, -0.34399479627609253, -0.30257517099380493, -0.26115554571151733, -0.21973595023155212, -0.17831632494926453, -0.13689669966697693, -0.09547707438468933, -0.05405745655298233, -0.01263783872127533, 0.028781786561012268, 0.07020141184329987, 0.11162102222442627, 0.15304064750671387, 0.19446027278900146, 0.23587989807128906, 0.27729952335357666, 0.31871914863586426, 0.36013877391815186, 0.40155839920043945, 0.44297799468040466, 0.48439761996269226, 0.5258172750473022, 0.5672369003295898, 0.6086565256118774, 0.650076150894165, 0.6914957761764526, 0.7329154014587402, 0.7743350267410278, 0.8157546520233154, 0.8571742177009583, 0.8985938429832458, 0.9400134682655334, 0.981433093547821, 1.0228526592254639, 1.0642722845077515, 1.105691909790039, 1.1471115350723267, 1.1885311603546143, 1.2299507856369019, 1.2713704109191895, 1.312790036201477, 1.3542096614837646, 1.3956292867660522, 1.4370489120483398, 1.4784685373306274, 1.519888162612915]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 15.0, 23.0, 43.0, 48.0, 80.0, 155.0, 278.0, 391.0, 682.0, 1215.0, 2346.0, 4767.0, 11178.0, 33087.0, 152355.0, 1406190.0, 2244647.0, 262469.0, 47018.0, 14912.0, 6017.0, 2787.0, 1483.0, 877.0, 482.0, 277.0, 151.0, 87.0, 62.0, 45.0, 34.0, 25.0, 17.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173828125, -0.16841888427734375, -0.1630096435546875, -0.15760040283203125, -0.152191162109375, -0.14678192138671875, -0.1413726806640625, -0.13596343994140625, -0.13055419921875, -0.12514495849609375, -0.1197357177734375, -0.11432647705078125, -0.108917236328125, -0.10350799560546875, -0.0980987548828125, -0.09268951416015625, -0.0872802734375, -0.08187103271484375, -0.0764617919921875, -0.07105255126953125, -0.065643310546875, -0.06023406982421875, -0.0548248291015625, -0.04941558837890625, -0.04400634765625, -0.03859710693359375, -0.0331878662109375, -0.02777862548828125, -0.022369384765625, -0.01696014404296875, -0.0115509033203125, -0.00614166259765625, -0.000732421875, 0.00467681884765625, 0.0100860595703125, 0.01549530029296875, 0.020904541015625, 0.02631378173828125, 0.0317230224609375, 0.03713226318359375, 0.04254150390625, 0.04795074462890625, 0.0533599853515625, 0.05876922607421875, 0.064178466796875, 0.06958770751953125, 0.0749969482421875, 0.08040618896484375, 0.0858154296875, 0.09122467041015625, 0.0966339111328125, 0.10204315185546875, 0.107452392578125, 0.11286163330078125, 0.1182708740234375, 0.12368011474609375, 0.12908935546875, 0.13449859619140625, 0.1399078369140625, 0.14531707763671875, 0.150726318359375, 0.15613555908203125, 0.1615447998046875, 0.16695404052734375, 0.17236328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 11.0, 7.0, 14.0, 24.0, 11.0, 27.0, 40.0, 42.0, 54.0, 53.0, 72.0, 71.0, 74.0, 57.0, 84.0, 60.0, 67.0, 50.0, 29.0, 27.0, 25.0, 28.0, 22.0, 13.0, 14.0, 10.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.15625, -0.15244579315185547, -0.14864158630371094, -0.1448373794555664, -0.14103317260742188, -0.13722896575927734, -0.1334247589111328, -0.12962055206298828, -0.12581634521484375, -0.12201213836669922, -0.11820793151855469, -0.11440372467041016, -0.11059951782226562, -0.1067953109741211, -0.10299110412597656, -0.09918689727783203, -0.0953826904296875, -0.09157848358154297, -0.08777427673339844, -0.0839700698852539, -0.08016586303710938, -0.07636165618896484, -0.07255744934082031, -0.06875324249267578, -0.06494903564453125, -0.06114482879638672, -0.05734062194824219, -0.053536415100097656, -0.049732208251953125, -0.045928001403808594, -0.04212379455566406, -0.03831958770751953, -0.034515380859375, -0.03071117401123047, -0.026906967163085938, -0.023102760314941406, -0.019298553466796875, -0.015494346618652344, -0.011690139770507812, -0.007885932922363281, -0.00408172607421875, -0.00027751922607421875, 0.0035266876220703125, 0.007330894470214844, 0.011135101318359375, 0.014939308166503906, 0.018743515014648438, 0.02254772186279297, 0.0263519287109375, 0.03015613555908203, 0.03396034240722656, 0.037764549255371094, 0.041568756103515625, 0.045372962951660156, 0.04917716979980469, 0.05298137664794922, 0.05678558349609375, 0.06058979034423828, 0.06439399719238281, 0.06819820404052734, 0.07200241088867188, 0.0758066177368164, 0.07961082458496094, 0.08341503143310547, 0.08721923828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 8.0, 17.0, 46.0, 119.0, 318.0, 1397.0, 121456.0, 4066349.0, 3699.0, 531.0, 201.0, 80.0, 36.0, 19.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.833984375, -1.7833099365234375, -1.732635498046875, -1.6819610595703125, -1.63128662109375, -1.5806121826171875, -1.529937744140625, -1.4792633056640625, -1.4285888671875, -1.3779144287109375, -1.327239990234375, -1.2765655517578125, -1.22589111328125, -1.1752166748046875, -1.124542236328125, -1.0738677978515625, -1.023193359375, -0.9725189208984375, -0.921844482421875, -0.8711700439453125, -0.82049560546875, -0.7698211669921875, -0.719146728515625, -0.6684722900390625, -0.6177978515625, -0.5671234130859375, -0.516448974609375, -0.4657745361328125, -0.41510009765625, -0.3644256591796875, -0.313751220703125, -0.2630767822265625, -0.21240234375, -0.1617279052734375, -0.111053466796875, -0.0603790283203125, -0.00970458984375, 0.0409698486328125, 0.091644287109375, 0.1423187255859375, 0.1929931640625, 0.2436676025390625, 0.294342041015625, 0.3450164794921875, 0.39569091796875, 0.4463653564453125, 0.497039794921875, 0.5477142333984375, 0.598388671875, 0.6490631103515625, 0.699737548828125, 0.7504119873046875, 0.80108642578125, 0.8517608642578125, 0.902435302734375, 0.9531097412109375, 1.0037841796875, 1.0544586181640625, 1.105133056640625, 1.1558074951171875, 1.20648193359375, 1.2571563720703125, 1.307830810546875, 1.3585052490234375, 1.4091796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 26.0, 66.0, 155.0, 506.0, 1868.0, 1039.0, 265.0, 103.0, 23.0, 14.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.607421875, -0.5806884765625, -0.553955078125, -0.5272216796875, -0.50048828125, -0.4737548828125, -0.447021484375, -0.4202880859375, -0.3935546875, -0.3668212890625, -0.340087890625, -0.3133544921875, -0.28662109375, -0.2598876953125, -0.233154296875, -0.2064208984375, -0.1796875, -0.1529541015625, -0.126220703125, -0.0994873046875, -0.07275390625, -0.0460205078125, -0.019287109375, 0.0074462890625, 0.0341796875, 0.0609130859375, 0.087646484375, 0.1143798828125, 0.14111328125, 0.1678466796875, 0.194580078125, 0.2213134765625, 0.248046875, 0.2747802734375, 0.301513671875, 0.3282470703125, 0.35498046875, 0.3817138671875, 0.408447265625, 0.4351806640625, 0.4619140625, 0.4886474609375, 0.515380859375, 0.5421142578125, 0.56884765625, 0.5955810546875, 0.622314453125, 0.6490478515625, 0.67578125, 0.7025146484375, 0.729248046875, 0.7559814453125, 0.78271484375, 0.8094482421875, 0.836181640625, 0.8629150390625, 0.8896484375, 0.9163818359375, 0.943115234375, 0.9698486328125, 0.99658203125, 1.0233154296875, 1.050048828125, 1.0767822265625, 1.103515625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 12.0, 29.0, 77.0, 141.0, 218.0, 214.0, 134.0, 92.0, 39.0, 21.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9099971055984497, -1.7824445962905884, -1.6548919677734375, -1.5273394584655762, -1.3997869491577148, -1.272234320640564, -1.1446818113327026, -1.0171291828155518, -0.8895766735076904, -0.7620241045951843, -0.6344715356826782, -0.5069190263748169, -0.3793664574623108, -0.2518138885498047, -0.12426137924194336, 0.003291189670562744, 0.13084375858306885, 0.25839632749557495, 0.38594886660575867, 0.5135014057159424, 0.6410539746284485, 0.7686065435409546, 0.8961590528488159, 1.0237116813659668, 1.1512641906738281, 1.2788166999816895, 1.4063693284988403, 1.5339218378067017, 1.6614744663238525, 1.7890269756317139, 1.9165794849395752, 2.0441319942474365, 2.171684741973877, 2.2992372512817383, 2.4267897605895996, 2.554342269897461, 2.6818950176239014, 2.8094475269317627, 2.937000036239624, 3.0645525455474854, 3.192105293273926, 3.319657802581787, 3.4472103118896484, 3.5747628211975098, 3.70231556892395, 3.8298680782318115, 3.957420587539673, 4.084973335266113, 4.212525367736816, 4.340077877044678, 4.467630386352539, 4.5951828956604, 4.722735404968262, 4.850288391113281, 4.977840423583984, 5.105393409729004, 5.232945919036865, 5.360498428344727, 5.488050937652588, 5.615603446960449, 5.7431559562683105, 5.870708465576172, 5.998261451721191, 6.125813961029053, 6.253366470336914]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 6.0, 6.0, 13.0, 13.0, 9.0, 23.0, 26.0, 29.0, 48.0, 34.0, 42.0, 39.0, 35.0, 44.0, 47.0, 35.0, 41.0, 49.0, 48.0, 44.0, 27.0, 33.0, 47.0, 34.0, 32.0, 26.0, 26.0, 20.0, 17.0, 13.0, 16.0, 8.0, 14.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.7115514278411865, -1.661831021308899, -1.6121106147766113, -1.5623900890350342, -1.5126696825027466, -1.462949275970459, -1.4132288694381714, -1.3635084629058838, -1.3137880563735962, -1.2640676498413086, -1.214347243309021, -1.1646268367767334, -1.1149063110351562, -1.0651859045028687, -1.015465497970581, -0.9657450914382935, -0.9160246253013611, -0.8663042187690735, -0.8165837526321411, -0.7668633460998535, -0.7171429395675659, -0.6674225330352783, -0.617702066898346, -0.5679816603660583, -0.518261194229126, -0.468540757894516, -0.4188203513622284, -0.3690999150276184, -0.3193795084953308, -0.2696590721607208, -0.21993863582611084, -0.17021822929382324, -0.12049782276153564, -0.07077740132808685, -0.021056972444057465, 0.028663456439971924, 0.07838387787342072, 0.1281042993068695, 0.1778247356414795, 0.2275451421737671, 0.2772655785083771, 0.32698601484298706, 0.37670642137527466, 0.42642685770988464, 0.47614729404449463, 0.5258677005767822, 0.5755881071090698, 0.6253085136413574, 0.6750289797782898, 0.7247493863105774, 0.7744698524475098, 0.8241902589797974, 0.873910665512085, 0.9236310720443726, 0.9733515381813049, 1.0230720043182373, 1.072792410850525, 1.1225128173828125, 1.1722332239151, 1.2219536304473877, 1.2716741561889648, 1.3213945627212524, 1.37111496925354, 1.4208353757858276, 1.4705557823181152]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 8.0, 5.0, 5.0, 13.0, 25.0, 20.0, 33.0, 48.0, 82.0, 104.0, 174.0, 304.0, 500.0, 786.0, 1310.0, 2275.0, 4084.0, 7506.0, 14047.0, 26849.0, 52715.0, 106349.0, 203697.0, 261962.0, 178759.0, 91561.0, 45316.0, 22893.0, 11974.0, 6388.0, 3633.0, 2049.0, 1154.0, 746.0, 427.0, 283.0, 171.0, 98.0, 69.0, 48.0, 20.0, 23.0, 15.0, 17.0, 6.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.137939453125, -0.1336803436279297, -0.12942123413085938, -0.12516212463378906, -0.12090301513671875, -0.11664390563964844, -0.11238479614257812, -0.10812568664550781, -0.1038665771484375, -0.09960746765136719, -0.09534835815429688, -0.09108924865722656, -0.08683013916015625, -0.08257102966308594, -0.07831192016601562, -0.07405281066894531, -0.069793701171875, -0.06553459167480469, -0.061275482177734375, -0.05701637268066406, -0.05275726318359375, -0.04849815368652344, -0.044239044189453125, -0.03997993469238281, -0.0357208251953125, -0.03146171569824219, -0.027202606201171875, -0.022943496704101562, -0.01868438720703125, -0.014425277709960938, -0.010166168212890625, -0.0059070587158203125, -0.00164794921875, 0.0026111602783203125, 0.006870269775390625, 0.011129379272460938, 0.01538848876953125, 0.019647598266601562, 0.023906707763671875, 0.028165817260742188, 0.0324249267578125, 0.03668403625488281, 0.040943145751953125, 0.04520225524902344, 0.04946136474609375, 0.05372047424316406, 0.057979583740234375, 0.06223869323730469, 0.066497802734375, 0.07075691223144531, 0.07501602172851562, 0.07927513122558594, 0.08353424072265625, 0.08779335021972656, 0.09205245971679688, 0.09631156921386719, 0.1005706787109375, 0.10482978820800781, 0.10908889770507812, 0.11334800720214844, 0.11760711669921875, 0.12186622619628906, 0.12612533569335938, 0.1303844451904297, 0.1346435546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 18.0, 26.0, 35.0, 21.0, 36.0, 45.0, 51.0, 46.0, 56.0, 57.0, 46.0, 49.0, 52.0, 49.0, 57.0, 44.0, 33.0, 46.0, 31.0, 34.0, 26.0, 22.0, 10.0, 13.0, 14.0, 8.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0], "bins": [-0.15673828125, -0.15281200408935547, -0.14888572692871094, -0.1449594497680664, -0.14103317260742188, -0.13710689544677734, -0.1331806182861328, -0.12925434112548828, -0.12532806396484375, -0.12140178680419922, -0.11747550964355469, -0.11354923248291016, -0.10962295532226562, -0.1056966781616211, -0.10177040100097656, -0.09784412384033203, -0.0939178466796875, -0.08999156951904297, -0.08606529235839844, -0.0821390151977539, -0.07821273803710938, -0.07428646087646484, -0.07036018371582031, -0.06643390655517578, -0.06250762939453125, -0.05858135223388672, -0.05465507507324219, -0.050728797912597656, -0.046802520751953125, -0.042876243591308594, -0.03894996643066406, -0.03502368927001953, -0.031097412109375, -0.02717113494873047, -0.023244857788085938, -0.019318580627441406, -0.015392303466796875, -0.011466026306152344, -0.0075397491455078125, -0.0036134719848632812, 0.00031280517578125, 0.004239082336425781, 0.008165359497070312, 0.012091636657714844, 0.016017913818359375, 0.019944190979003906, 0.023870468139648438, 0.02779674530029297, 0.0317230224609375, 0.03564929962158203, 0.03957557678222656, 0.043501853942871094, 0.047428131103515625, 0.051354408264160156, 0.05528068542480469, 0.05920696258544922, 0.06313323974609375, 0.06705951690673828, 0.07098579406738281, 0.07491207122802734, 0.07883834838867188, 0.0827646255493164, 0.08669090270996094, 0.09061717987060547, 0.09454345703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 8.0, 10.0, 15.0, 24.0, 36.0, 40.0, 57.0, 84.0, 128.0, 158.0, 240.0, 417.0, 790.0, 1540.0, 3717.0, 11406.0, 48511.0, 269841.0, 606985.0, 78389.0, 16882.0, 4872.0, 1980.0, 923.0, 500.0, 325.0, 199.0, 145.0, 98.0, 54.0, 50.0, 41.0, 14.0, 19.0, 11.0, 7.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3318748474121094, -0.32048797607421875, -0.3091011047363281, -0.2977142333984375, -0.2863273620605469, -0.27494049072265625, -0.2635536193847656, -0.252166748046875, -0.24077987670898438, -0.22939300537109375, -0.21800613403320312, -0.2066192626953125, -0.19523239135742188, -0.18384552001953125, -0.17245864868164062, -0.16107177734375, -0.14968490600585938, -0.13829803466796875, -0.12691116333007812, -0.1155242919921875, -0.10413742065429688, -0.09275054931640625, -0.08136367797851562, -0.069976806640625, -0.058589935302734375, -0.04720306396484375, -0.035816192626953125, -0.0244293212890625, -0.013042449951171875, -0.00165557861328125, 0.009731292724609375, 0.0211181640625, 0.032505035400390625, 0.04389190673828125, 0.055278778076171875, 0.0666656494140625, 0.07805252075195312, 0.08943939208984375, 0.10082626342773438, 0.112213134765625, 0.12360000610351562, 0.13498687744140625, 0.14637374877929688, 0.1577606201171875, 0.16914749145507812, 0.18053436279296875, 0.19192123413085938, 0.20330810546875, 0.21469497680664062, 0.22608184814453125, 0.23746871948242188, 0.2488555908203125, 0.2602424621582031, 0.27162933349609375, 0.2830162048339844, 0.294403076171875, 0.3057899475097656, 0.31717681884765625, 0.3285636901855469, 0.3399505615234375, 0.3513374328613281, 0.36272430419921875, 0.3741111755371094, 0.385498046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 2.0, 6.0, 5.0, 5.0, 4.0, 9.0, 11.0, 8.0, 18.0, 18.0, 19.0, 22.0, 41.0, 38.0, 35.0, 53.0, 60.0, 64.0, 51.0, 54.0, 61.0, 54.0, 46.0, 48.0, 38.0, 43.0, 29.0, 27.0, 32.0, 25.0, 13.0, 12.0, 11.0, 15.0, 11.0, 3.0, 4.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.48314666748046875, -0.4667816162109375, -0.45041656494140625, -0.434051513671875, -0.41768646240234375, -0.4013214111328125, -0.38495635986328125, -0.36859130859375, -0.35222625732421875, -0.3358612060546875, -0.31949615478515625, -0.303131103515625, -0.28676605224609375, -0.2704010009765625, -0.25403594970703125, -0.2376708984375, -0.22130584716796875, -0.2049407958984375, -0.18857574462890625, -0.172210693359375, -0.15584564208984375, -0.1394805908203125, -0.12311553955078125, -0.10675048828125, -0.09038543701171875, -0.0740203857421875, -0.05765533447265625, -0.041290283203125, -0.02492523193359375, -0.0085601806640625, 0.00780487060546875, 0.024169921875, 0.04053497314453125, 0.0569000244140625, 0.07326507568359375, 0.089630126953125, 0.10599517822265625, 0.1223602294921875, 0.13872528076171875, 0.15509033203125, 0.17145538330078125, 0.1878204345703125, 0.20418548583984375, 0.220550537109375, 0.23691558837890625, 0.2532806396484375, 0.26964569091796875, 0.2860107421875, 0.30237579345703125, 0.3187408447265625, 0.33510589599609375, 0.351470947265625, 0.36783599853515625, 0.3842010498046875, 0.40056610107421875, 0.41693115234375, 0.43329620361328125, 0.4496612548828125, 0.46602630615234375, 0.482391357421875, 0.49875640869140625, 0.5151214599609375, 0.5314865112304688, 0.5478515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 8.0, 16.0, 17.0, 33.0, 23.0, 47.0, 90.0, 116.0, 204.0, 311.0, 587.0, 1079.0, 2151.0, 4661.0, 11312.0, 31264.0, 105071.0, 641538.0, 176075.0, 46035.0, 15749.0, 6304.0, 2700.0, 1371.0, 756.0, 387.0, 236.0, 144.0, 92.0, 61.0, 32.0, 29.0, 13.0, 12.0, 5.0, 8.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09942626953125, -0.09555339813232422, -0.09168052673339844, -0.08780765533447266, -0.08393478393554688, -0.0800619125366211, -0.07618904113769531, -0.07231616973876953, -0.06844329833984375, -0.06457042694091797, -0.06069755554199219, -0.056824684143066406, -0.052951812744140625, -0.049078941345214844, -0.04520606994628906, -0.04133319854736328, -0.0374603271484375, -0.03358745574951172, -0.029714584350585938, -0.025841712951660156, -0.021968841552734375, -0.018095970153808594, -0.014223098754882812, -0.010350227355957031, -0.00647735595703125, -0.0026044845581054688, 0.0012683868408203125, 0.005141258239746094, 0.009014129638671875, 0.012887001037597656, 0.016759872436523438, 0.02063274383544922, 0.024505615234375, 0.02837848663330078, 0.03225135803222656, 0.036124229431152344, 0.039997100830078125, 0.043869972229003906, 0.04774284362792969, 0.05161571502685547, 0.05548858642578125, 0.05936145782470703, 0.06323432922363281, 0.0671072006225586, 0.07098007202148438, 0.07485294342041016, 0.07872581481933594, 0.08259868621826172, 0.0864715576171875, 0.09034442901611328, 0.09421730041503906, 0.09809017181396484, 0.10196304321289062, 0.1058359146118164, 0.10970878601074219, 0.11358165740966797, 0.11745452880859375, 0.12132740020751953, 0.1252002716064453, 0.1290731430053711, 0.13294601440429688, 0.13681888580322266, 0.14069175720214844, 0.14456462860107422, 0.1484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 12.0, 11.0, 18.0, 32.0, 43.0, 54.0, 92.0, 133.0, 179.0, 136.0, 89.0, 49.0, 37.0, 29.0, 23.0, 4.0, 10.0, 8.0, 9.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.45789909362793e-05, -8.189119398593903e-05, -7.920339703559875e-05, -7.651560008525848e-05, -7.382780313491821e-05, -7.114000618457794e-05, -6.845220923423767e-05, -6.57644122838974e-05, -6.307661533355713e-05, -6.038881838321686e-05, -5.770102143287659e-05, -5.5013224482536316e-05, -5.2325427532196045e-05, -4.9637630581855774e-05, -4.69498336315155e-05, -4.426203668117523e-05, -4.157423973083496e-05, -3.888644278049469e-05, -3.619864583015442e-05, -3.351084887981415e-05, -3.082305192947388e-05, -2.8135254979133606e-05, -2.5447458028793335e-05, -2.2759661078453064e-05, -2.0071864128112793e-05, -1.7384067177772522e-05, -1.4696270227432251e-05, -1.200847327709198e-05, -9.320676326751709e-06, -6.632879376411438e-06, -3.945082426071167e-06, -1.257285475730896e-06, 1.430511474609375e-06, 4.118308424949646e-06, 6.806105375289917e-06, 9.493902325630188e-06, 1.2181699275970459e-05, 1.486949622631073e-05, 1.7557293176651e-05, 2.0245090126991272e-05, 2.2932887077331543e-05, 2.5620684027671814e-05, 2.8308480978012085e-05, 3.0996277928352356e-05, 3.368407487869263e-05, 3.63718718290329e-05, 3.905966877937317e-05, 4.174746572971344e-05, 4.443526268005371e-05, 4.712305963039398e-05, 4.981085658073425e-05, 5.2498653531074524e-05, 5.5186450481414795e-05, 5.7874247431755066e-05, 6.056204438209534e-05, 6.324984133243561e-05, 6.593763828277588e-05, 6.862543523311615e-05, 7.131323218345642e-05, 7.400102913379669e-05, 7.668882608413696e-05, 7.937662303447723e-05, 8.20644199848175e-05, 8.475221693515778e-05, 8.744001388549805e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 12.0, 13.0, 17.0, 23.0, 39.0, 52.0, 97.0, 137.0, 235.0, 445.0, 921.0, 2081.0, 5406.0, 16958.0, 71063.0, 640680.0, 247664.0, 44051.0, 11648.0, 3825.0, 1518.0, 737.0, 392.0, 170.0, 122.0, 69.0, 52.0, 34.0, 18.0, 22.0, 10.0, 13.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.146484375, -0.14173507690429688, -0.13698577880859375, -0.13223648071289062, -0.1274871826171875, -0.12273788452148438, -0.11798858642578125, -0.11323928833007812, -0.108489990234375, -0.10374069213867188, -0.09899139404296875, -0.09424209594726562, -0.0894927978515625, -0.08474349975585938, -0.07999420166015625, -0.07524490356445312, -0.07049560546875, -0.06574630737304688, -0.06099700927734375, -0.056247711181640625, -0.0514984130859375, -0.046749114990234375, -0.04199981689453125, -0.037250518798828125, -0.032501220703125, -0.027751922607421875, -0.02300262451171875, -0.018253326416015625, -0.0135040283203125, -0.008754730224609375, -0.00400543212890625, 0.000743865966796875, 0.0054931640625, 0.010242462158203125, 0.01499176025390625, 0.019741058349609375, 0.0244903564453125, 0.029239654541015625, 0.03398895263671875, 0.038738250732421875, 0.043487548828125, 0.048236846923828125, 0.05298614501953125, 0.057735443115234375, 0.0624847412109375, 0.06723403930664062, 0.07198333740234375, 0.07673263549804688, 0.08148193359375, 0.08623123168945312, 0.09098052978515625, 0.09572982788085938, 0.1004791259765625, 0.10522842407226562, 0.10997772216796875, 0.11472702026367188, 0.119476318359375, 0.12422561645507812, 0.12897491455078125, 0.13372421264648438, 0.1384735107421875, 0.14322280883789062, 0.14797210693359375, 0.15272140502929688, 0.157470703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 8.0, 9.0, 9.0, 19.0, 24.0, 17.0, 26.0, 58.0, 59.0, 80.0, 79.0, 110.0, 104.0, 95.0, 62.0, 56.0, 52.0, 22.0, 23.0, 12.0, 11.0, 12.0, 9.0, 6.0, 3.0, 4.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1226806640625, -0.11839675903320312, -0.11411285400390625, -0.10982894897460938, -0.1055450439453125, -0.10126113891601562, -0.09697723388671875, -0.09269332885742188, -0.088409423828125, -0.08412551879882812, -0.07984161376953125, -0.07555770874023438, -0.0712738037109375, -0.06698989868164062, -0.06270599365234375, -0.058422088623046875, -0.05413818359375, -0.049854278564453125, -0.04557037353515625, -0.041286468505859375, -0.0370025634765625, -0.032718658447265625, -0.02843475341796875, -0.024150848388671875, -0.019866943359375, -0.015583038330078125, -0.01129913330078125, -0.007015228271484375, -0.0027313232421875, 0.001552581787109375, 0.00583648681640625, 0.010120391845703125, 0.014404296875, 0.018688201904296875, 0.02297210693359375, 0.027256011962890625, 0.0315399169921875, 0.035823822021484375, 0.04010772705078125, 0.044391632080078125, 0.048675537109375, 0.052959442138671875, 0.05724334716796875, 0.061527252197265625, 0.0658111572265625, 0.07009506225585938, 0.07437896728515625, 0.07866287231445312, 0.08294677734375, 0.08723068237304688, 0.09151458740234375, 0.09579849243164062, 0.1000823974609375, 0.10436630249023438, 0.10865020751953125, 0.11293411254882812, 0.117218017578125, 0.12150192260742188, 0.12578582763671875, 0.13006973266601562, 0.1343536376953125, 0.13863754272460938, 0.14292144775390625, 0.14720535278320312, 0.1514892578125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 8.0, 2.0, 6.0, 21.0, 20.0, 44.0, 62.0, 83.0, 125.0, 300.0, 125.0, 80.0, 48.0, 32.0, 21.0, 10.0, 11.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.261214256286621, -4.1652326583862305, -4.06925106048584, -3.973268985748291, -3.8772873878479004, -3.7813057899475098, -3.68532395362854, -3.5893421173095703, -3.4933605194091797, -3.397378921508789, -3.3013970851898193, -3.2054152488708496, -3.109433650970459, -3.0134520530700684, -2.9174702167510986, -2.821488380432129, -2.7255067825317383, -2.6295251846313477, -2.533543348312378, -2.437561511993408, -2.3415799140930176, -2.245598316192627, -2.1496164798736572, -2.0536346435546875, -1.9576530456542969, -1.8616713285446167, -1.7656896114349365, -1.6697078943252563, -1.5737261772155762, -1.477744460105896, -1.3817627429962158, -1.2857810258865356, -1.1897990703582764, -1.0938173532485962, -0.997835636138916, -0.9018539190292358, -0.8058722019195557, -0.7098904848098755, -0.6139087677001953, -0.5179270505905151, -0.42194533348083496, -0.3259636163711548, -0.2299818992614746, -0.13400018215179443, -0.03801846504211426, 0.05796325206756592, 0.1539449691772461, 0.24992668628692627, 0.34590840339660645, 0.4418901205062866, 0.5378718376159668, 0.633853554725647, 0.7298352718353271, 0.8258169889450073, 0.9217987060546875, 1.0177804231643677, 1.1137621402740479, 1.209743857383728, 1.3057255744934082, 1.4017072916030884, 1.4976890087127686, 1.5936707258224487, 1.689652442932129, 1.785634160041809, 1.8816158771514893]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 6.0, 6.0, 10.0, 11.0, 17.0, 17.0, 22.0, 24.0, 22.0, 24.0, 30.0, 25.0, 32.0, 39.0, 58.0, 95.0, 96.0, 105.0, 46.0, 43.0, 30.0, 25.0, 26.0, 27.0, 13.0, 19.0, 18.0, 19.0, 11.0, 18.0, 11.0, 9.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 8.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.2842304706573486, -2.2182564735412598, -2.152282476425171, -2.086308479309082, -2.0203347206115723, -1.9543606042861938, -1.8883867263793945, -1.8224127292633057, -1.7564387321472168, -1.690464735031128, -1.624490737915039, -1.5585168600082397, -1.4925428628921509, -1.426568865776062, -1.3605949878692627, -1.2946209907531738, -1.228646993637085, -1.162672996520996, -1.0966989994049072, -1.030725121498108, -0.964751124382019, -0.8987771272659302, -0.8328031897544861, -0.766829252243042, -0.7008552551269531, -0.6348812580108643, -0.5689073204994202, -0.5029333829879761, -0.4369593858718872, -0.3709854185581207, -0.30501145124435425, -0.23903748393058777, -0.1730632781982422, -0.10708931088447571, -0.04111534357070923, 0.02485862374305725, 0.09083259105682373, 0.1568065583705902, 0.2227805256843567, 0.28875449299812317, 0.35472846031188965, 0.42070242762565613, 0.4866763949394226, 0.5526503324508667, 0.6186243295669556, 0.6845983266830444, 0.7505722641944885, 0.8165462017059326, 0.8825201988220215, 0.9484941959381104, 1.0144681930541992, 1.0804420709609985, 1.1464160680770874, 1.2123900651931763, 1.2783639430999756, 1.3443379402160645, 1.4103119373321533, 1.4762859344482422, 1.542259931564331, 1.6082338094711304, 1.6742078065872192, 1.740181803703308, 1.8061556816101074, 1.8721296787261963, 1.9381036758422852]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 11.0, 3.0, 11.0, 11.0, 18.0, 29.0, 41.0, 75.0, 89.0, 145.0, 202.0, 306.0, 554.0, 824.0, 1520.0, 2628.0, 5030.0, 10984.0, 28683.0, 96673.0, 448660.0, 1837911.0, 1370636.0, 282888.0, 65565.0, 21990.0, 8956.0, 4292.0, 2291.0, 1294.0, 720.0, 406.0, 269.0, 167.0, 126.0, 90.0, 76.0, 32.0, 23.0, 17.0, 13.0, 5.0, 12.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.156982421875, -0.1524791717529297, -0.14797592163085938, -0.14347267150878906, -0.13896942138671875, -0.13446617126464844, -0.12996292114257812, -0.1254596710205078, -0.1209564208984375, -0.11645317077636719, -0.11194992065429688, -0.10744667053222656, -0.10294342041015625, -0.09844017028808594, -0.09393692016601562, -0.08943367004394531, -0.084930419921875, -0.08042716979980469, -0.07592391967773438, -0.07142066955566406, -0.06691741943359375, -0.06241416931152344, -0.057910919189453125, -0.05340766906738281, -0.0489044189453125, -0.04440116882324219, -0.039897918701171875, -0.03539466857910156, -0.03089141845703125, -0.026388168334960938, -0.021884918212890625, -0.017381668090820312, -0.01287841796875, -0.008375167846679688, -0.003871917724609375, 0.0006313323974609375, 0.00513458251953125, 0.009637832641601562, 0.014141082763671875, 0.018644332885742188, 0.0231475830078125, 0.027650833129882812, 0.032154083251953125, 0.03665733337402344, 0.04116058349609375, 0.04566383361816406, 0.050167083740234375, 0.05467033386230469, 0.059173583984375, 0.06367683410644531, 0.06818008422851562, 0.07268333435058594, 0.07718658447265625, 0.08168983459472656, 0.08619308471679688, 0.09069633483886719, 0.0951995849609375, 0.09970283508300781, 0.10420608520507812, 0.10870933532714844, 0.11321258544921875, 0.11771583557128906, 0.12221908569335938, 0.1267223358154297, 0.1312255859375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 12.0, 14.0, 14.0, 23.0, 17.0, 24.0, 34.0, 30.0, 55.0, 46.0, 60.0, 47.0, 62.0, 55.0, 52.0, 56.0, 55.0, 54.0, 45.0, 36.0, 37.0, 39.0, 27.0, 23.0, 19.0, 18.0, 16.0, 8.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.14941692352294922, -0.14514732360839844, -0.14087772369384766, -0.13660812377929688, -0.1323385238647461, -0.1280689239501953, -0.12379932403564453, -0.11952972412109375, -0.11526012420654297, -0.11099052429199219, -0.1067209243774414, -0.10245132446289062, -0.09818172454833984, -0.09391212463378906, -0.08964252471923828, -0.0853729248046875, -0.08110332489013672, -0.07683372497558594, -0.07256412506103516, -0.06829452514648438, -0.0640249252319336, -0.05975532531738281, -0.05548572540283203, -0.05121612548828125, -0.04694652557373047, -0.04267692565917969, -0.038407325744628906, -0.034137725830078125, -0.029868125915527344, -0.025598526000976562, -0.02132892608642578, -0.017059326171875, -0.012789726257324219, -0.008520126342773438, -0.004250526428222656, 1.9073486328125e-05, 0.004288673400878906, 0.008558273315429688, 0.012827873229980469, 0.01709747314453125, 0.02136707305908203, 0.025636672973632812, 0.029906272888183594, 0.034175872802734375, 0.038445472717285156, 0.04271507263183594, 0.04698467254638672, 0.0512542724609375, 0.05552387237548828, 0.05979347229003906, 0.06406307220458984, 0.06833267211914062, 0.0726022720336914, 0.07687187194824219, 0.08114147186279297, 0.08541107177734375, 0.08968067169189453, 0.09395027160644531, 0.0982198715209961, 0.10248947143554688, 0.10675907135009766, 0.11102867126464844, 0.11529827117919922, 0.11956787109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 12.0, 13.0, 18.0, 33.0, 49.0, 58.0, 124.0, 164.0, 320.0, 574.0, 1457.0, 4696.0, 33498.0, 2135051.0, 1977460.0, 33213.0, 4718.0, 1453.0, 591.0, 300.0, 184.0, 104.0, 65.0, 34.0, 34.0, 13.0, 9.0, 10.0, 4.0, 7.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4010162353515625, -0.383575439453125, -0.3661346435546875, -0.34869384765625, -0.3312530517578125, -0.313812255859375, -0.2963714599609375, -0.2789306640625, -0.2614898681640625, -0.244049072265625, -0.2266082763671875, -0.20916748046875, -0.1917266845703125, -0.174285888671875, -0.1568450927734375, -0.139404296875, -0.1219635009765625, -0.104522705078125, -0.0870819091796875, -0.06964111328125, -0.0522003173828125, -0.034759521484375, -0.0173187255859375, 0.0001220703125, 0.0175628662109375, 0.035003662109375, 0.0524444580078125, 0.06988525390625, 0.0873260498046875, 0.104766845703125, 0.1222076416015625, 0.1396484375, 0.1570892333984375, 0.174530029296875, 0.1919708251953125, 0.20941162109375, 0.2268524169921875, 0.244293212890625, 0.2617340087890625, 0.2791748046875, 0.2966156005859375, 0.314056396484375, 0.3314971923828125, 0.34893798828125, 0.3663787841796875, 0.383819580078125, 0.4012603759765625, 0.418701171875, 0.4361419677734375, 0.453582763671875, 0.4710235595703125, 0.48846435546875, 0.5059051513671875, 0.523345947265625, 0.5407867431640625, 0.5582275390625, 0.5756683349609375, 0.593109130859375, 0.6105499267578125, 0.62799072265625, 0.6454315185546875, 0.662872314453125, 0.6803131103515625, 0.69775390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 14.0, 12.0, 19.0, 23.0, 51.0, 59.0, 103.0, 187.0, 281.0, 496.0, 789.0, 795.0, 484.0, 300.0, 166.0, 83.0, 66.0, 46.0, 22.0, 23.0, 18.0, 6.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.421661376953125, -0.40924072265625, -0.396820068359375, -0.3843994140625, -0.371978759765625, -0.35955810546875, -0.347137451171875, -0.334716796875, -0.322296142578125, -0.30987548828125, -0.297454833984375, -0.2850341796875, -0.272613525390625, -0.26019287109375, -0.247772216796875, -0.2353515625, -0.222930908203125, -0.21051025390625, -0.198089599609375, -0.1856689453125, -0.173248291015625, -0.16082763671875, -0.148406982421875, -0.135986328125, -0.123565673828125, -0.11114501953125, -0.098724365234375, -0.0863037109375, -0.073883056640625, -0.06146240234375, -0.049041748046875, -0.03662109375, -0.024200439453125, -0.01177978515625, 0.000640869140625, 0.0130615234375, 0.025482177734375, 0.03790283203125, 0.050323486328125, 0.062744140625, 0.075164794921875, 0.08758544921875, 0.100006103515625, 0.1124267578125, 0.124847412109375, 0.13726806640625, 0.149688720703125, 0.162109375, 0.174530029296875, 0.18695068359375, 0.199371337890625, 0.2117919921875, 0.224212646484375, 0.23663330078125, 0.249053955078125, 0.261474609375, 0.273895263671875, 0.28631591796875, 0.298736572265625, 0.3111572265625, 0.323577880859375, 0.33599853515625, 0.348419189453125, 0.36083984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 10.0, 9.0, 12.0, 29.0, 77.0, 166.0, 241.0, 201.0, 141.0, 59.0, 34.0, 12.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.509602069854736, -4.3633623123168945, -4.2171220779418945, -4.070882320404053, -3.924642562866211, -3.778402805328369, -3.6321628093719482, -3.4859228134155273, -3.3396830558776855, -3.1934432983398438, -3.047203302383423, -2.900963306427002, -2.75472354888916, -2.6084837913513184, -2.4622437953948975, -2.3160037994384766, -2.1697640419006348, -2.023524284362793, -1.877284288406372, -1.7310444116592407, -1.5848045349121094, -1.438564658164978, -1.2923247814178467, -1.1460849046707153, -0.999845027923584, -0.8536051511764526, -0.7073652744293213, -0.5611253976821899, -0.4148855209350586, -0.26864564418792725, -0.1224057674407959, 0.02383410930633545, 0.1700735092163086, 0.31631338596343994, 0.4625532627105713, 0.6087931394577026, 0.755033016204834, 0.9012728929519653, 1.0475127696990967, 1.193752646446228, 1.3399925231933594, 1.4862323999404907, 1.632472276687622, 1.7787121534347534, 1.9249520301818848, 2.0711917877197266, 2.2174317836761475, 2.3636717796325684, 2.50991153717041, 2.656151294708252, 2.802391290664673, 2.9486312866210938, 3.0948710441589355, 3.2411108016967773, 3.3873507976531982, 3.533590793609619, 3.679830551147461, 3.8260703086853027, 3.9723103046417236, 4.1185503005981445, 4.264790058135986, 4.411029815673828, 4.557270050048828, 4.70350980758667, 4.849749565124512]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 7.0, 4.0, 6.0, 10.0, 18.0, 19.0, 17.0, 15.0, 23.0, 27.0, 23.0, 31.0, 27.0, 37.0, 43.0, 48.0, 45.0, 75.0, 51.0, 69.0, 41.0, 32.0, 38.0, 42.0, 31.0, 27.0, 27.0, 19.0, 23.0, 19.0, 17.0, 14.0, 10.0, 9.0, 14.0, 5.0, 5.0, 7.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.5919300317764282, -1.5455338954925537, -1.4991376399993896, -1.4527413845062256, -1.406345248222351, -1.3599491119384766, -1.3135528564453125, -1.2671566009521484, -1.220760464668274, -1.1743643283843994, -1.1279680728912354, -1.0815718173980713, -1.0351756811141968, -0.9887794852256775, -0.9423832893371582, -0.8959870934486389, -0.8495908975601196, -0.8031947016716003, -0.756798505783081, -0.7104023098945618, -0.6640061140060425, -0.6176099181175232, -0.5712137222290039, -0.5248175263404846, -0.47842133045196533, -0.43202513456344604, -0.38562893867492676, -0.33923274278640747, -0.2928365468978882, -0.2464403510093689, -0.2000441551208496, -0.15364795923233032, -0.10725176334381104, -0.06085556745529175, -0.014459371566772461, 0.031936824321746826, 0.07833302021026611, 0.1247292160987854, 0.1711254119873047, 0.21752160787582397, 0.26391780376434326, 0.31031399965286255, 0.35671019554138184, 0.4031063914299011, 0.4495025873184204, 0.4958987832069397, 0.542294979095459, 0.5886911749839783, 0.6350873708724976, 0.6814835667610168, 0.7278797626495361, 0.7742759585380554, 0.8206721544265747, 0.867068350315094, 0.9134645462036133, 0.9598607420921326, 1.0062569379806519, 1.0526530742645264, 1.0990493297576904, 1.1454455852508545, 1.191841721534729, 1.2382378578186035, 1.2846341133117676, 1.3310303688049316, 1.3774265050888062]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 13.0, 12.0, 15.0, 31.0, 37.0, 69.0, 83.0, 161.0, 248.0, 391.0, 629.0, 973.0, 1810.0, 3019.0, 5063.0, 9126.0, 17733.0, 34733.0, 71345.0, 150547.0, 272668.0, 239963.0, 120962.0, 57365.0, 28286.0, 14618.0, 7828.0, 4404.0, 2478.0, 1541.0, 936.0, 535.0, 359.0, 217.0, 115.0, 86.0, 54.0, 31.0, 19.0, 17.0, 8.0, 10.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.182861328125, -0.17776107788085938, -0.17266082763671875, -0.16756057739257812, -0.1624603271484375, -0.15736007690429688, -0.15225982666015625, -0.14715957641601562, -0.142059326171875, -0.13695907592773438, -0.13185882568359375, -0.12675857543945312, -0.1216583251953125, -0.11655807495117188, -0.11145782470703125, -0.10635757446289062, -0.10125732421875, -0.09615707397460938, -0.09105682373046875, -0.08595657348632812, -0.0808563232421875, -0.07575607299804688, -0.07065582275390625, -0.06555557250976562, -0.060455322265625, -0.055355072021484375, -0.05025482177734375, -0.045154571533203125, -0.0400543212890625, -0.034954071044921875, -0.02985382080078125, -0.024753570556640625, -0.0196533203125, -0.014553070068359375, -0.00945281982421875, -0.004352569580078125, 0.0007476806640625, 0.005847930908203125, 0.01094818115234375, 0.016048431396484375, 0.021148681640625, 0.026248931884765625, 0.03134918212890625, 0.036449432373046875, 0.0415496826171875, 0.046649932861328125, 0.05175018310546875, 0.056850433349609375, 0.06195068359375, 0.06705093383789062, 0.07215118408203125, 0.07725143432617188, 0.0823516845703125, 0.08745193481445312, 0.09255218505859375, 0.09765243530273438, 0.102752685546875, 0.10785293579101562, 0.11295318603515625, 0.11805343627929688, 0.1231536865234375, 0.12825393676757812, 0.13335418701171875, 0.13845443725585938, 0.1435546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 15.0, 18.0, 27.0, 18.0, 18.0, 24.0, 34.0, 34.0, 43.0, 49.0, 46.0, 53.0, 53.0, 54.0, 61.0, 57.0, 43.0, 48.0, 41.0, 35.0, 39.0, 30.0, 26.0, 21.0, 15.0, 11.0, 23.0, 14.0, 6.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.166015625, -0.16160011291503906, -0.15718460083007812, -0.1527690887451172, -0.14835357666015625, -0.1439380645751953, -0.13952255249023438, -0.13510704040527344, -0.1306915283203125, -0.12627601623535156, -0.12186050415039062, -0.11744499206542969, -0.11302947998046875, -0.10861396789550781, -0.10419845581054688, -0.09978294372558594, -0.095367431640625, -0.09095191955566406, -0.08653640747070312, -0.08212089538574219, -0.07770538330078125, -0.07328987121582031, -0.06887435913085938, -0.06445884704589844, -0.0600433349609375, -0.05562782287597656, -0.051212310791015625, -0.04679679870605469, -0.04238128662109375, -0.03796577453613281, -0.033550262451171875, -0.029134750366210938, -0.02471923828125, -0.020303726196289062, -0.015888214111328125, -0.011472702026367188, -0.00705718994140625, -0.0026416778564453125, 0.001773834228515625, 0.0061893463134765625, 0.0106048583984375, 0.015020370483398438, 0.019435882568359375, 0.023851394653320312, 0.02826690673828125, 0.03268241882324219, 0.037097930908203125, 0.04151344299316406, 0.045928955078125, 0.05034446716308594, 0.054759979248046875, 0.05917549133300781, 0.06359100341796875, 0.06800651550292969, 0.07242202758789062, 0.07683753967285156, 0.0812530517578125, 0.08566856384277344, 0.09008407592773438, 0.09449958801269531, 0.09891510009765625, 0.10333061218261719, 0.10774612426757812, 0.11216163635253906, 0.1165771484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 9.0, 6.0, 10.0, 8.0, 11.0, 23.0, 23.0, 27.0, 34.0, 46.0, 68.0, 95.0, 122.0, 183.0, 259.0, 346.0, 625.0, 1065.0, 2029.0, 5347.0, 19912.0, 130526.0, 752660.0, 108036.0, 17560.0, 4700.0, 1960.0, 977.0, 615.0, 407.0, 253.0, 171.0, 115.0, 83.0, 53.0, 51.0, 35.0, 25.0, 13.0, 14.0, 10.0, 15.0, 10.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.39453125, -0.3815765380859375, -0.368621826171875, -0.3556671142578125, -0.34271240234375, -0.3297576904296875, -0.316802978515625, -0.3038482666015625, -0.2908935546875, -0.2779388427734375, -0.264984130859375, -0.2520294189453125, -0.23907470703125, -0.2261199951171875, -0.213165283203125, -0.2002105712890625, -0.187255859375, -0.1743011474609375, -0.161346435546875, -0.1483917236328125, -0.13543701171875, -0.1224822998046875, -0.109527587890625, -0.0965728759765625, -0.0836181640625, -0.0706634521484375, -0.057708740234375, -0.0447540283203125, -0.03179931640625, -0.0188446044921875, -0.005889892578125, 0.0070648193359375, 0.02001953125, 0.0329742431640625, 0.045928955078125, 0.0588836669921875, 0.07183837890625, 0.0847930908203125, 0.097747802734375, 0.1107025146484375, 0.1236572265625, 0.1366119384765625, 0.149566650390625, 0.1625213623046875, 0.17547607421875, 0.1884307861328125, 0.201385498046875, 0.2143402099609375, 0.227294921875, 0.2402496337890625, 0.253204345703125, 0.2661590576171875, 0.27911376953125, 0.2920684814453125, 0.305023193359375, 0.3179779052734375, 0.3309326171875, 0.3438873291015625, 0.356842041015625, 0.3697967529296875, 0.38275146484375, 0.3957061767578125, 0.408660888671875, 0.4216156005859375, 0.4345703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 11.0, 10.0, 12.0, 27.0, 19.0, 25.0, 31.0, 26.0, 35.0, 39.0, 47.0, 50.0, 50.0, 51.0, 63.0, 51.0, 52.0, 52.0, 56.0, 53.0, 43.0, 28.0, 30.0, 24.0, 20.0, 13.0, 16.0, 15.0, 6.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.546875, -0.5299606323242188, -0.5130462646484375, -0.49613189697265625, -0.479217529296875, -0.46230316162109375, -0.4453887939453125, -0.42847442626953125, -0.41156005859375, -0.39464569091796875, -0.3777313232421875, -0.36081695556640625, -0.343902587890625, -0.32698822021484375, -0.3100738525390625, -0.29315948486328125, -0.2762451171875, -0.25933074951171875, -0.2424163818359375, -0.22550201416015625, -0.208587646484375, -0.19167327880859375, -0.1747589111328125, -0.15784454345703125, -0.14093017578125, -0.12401580810546875, -0.1071014404296875, -0.09018707275390625, -0.073272705078125, -0.05635833740234375, -0.0394439697265625, -0.02252960205078125, -0.005615234375, 0.01129913330078125, 0.0282135009765625, 0.04512786865234375, 0.062042236328125, 0.07895660400390625, 0.0958709716796875, 0.11278533935546875, 0.12969970703125, 0.14661407470703125, 0.1635284423828125, 0.18044281005859375, 0.197357177734375, 0.21427154541015625, 0.2311859130859375, 0.24810028076171875, 0.2650146484375, 0.28192901611328125, 0.2988433837890625, 0.31575775146484375, 0.332672119140625, 0.34958648681640625, 0.3665008544921875, 0.38341522216796875, 0.40032958984375, 0.41724395751953125, 0.4341583251953125, 0.45107269287109375, 0.467987060546875, 0.48490142822265625, 0.5018157958984375, 0.5187301635742188, 0.53564453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 24.0, 49.0, 58.0, 128.0, 295.0, 684.0, 1946.0, 8636.0, 63590.0, 840574.0, 115296.0, 12947.0, 2804.0, 834.0, 322.0, 156.0, 67.0, 40.0, 31.0, 12.0, 5.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205810546875, -0.19950103759765625, -0.1931915283203125, -0.18688201904296875, -0.180572509765625, -0.17426300048828125, -0.1679534912109375, -0.16164398193359375, -0.15533447265625, -0.14902496337890625, -0.1427154541015625, -0.13640594482421875, -0.130096435546875, -0.12378692626953125, -0.1174774169921875, -0.11116790771484375, -0.1048583984375, -0.09854888916015625, -0.0922393798828125, -0.08592987060546875, -0.079620361328125, -0.07331085205078125, -0.0670013427734375, -0.06069183349609375, -0.05438232421875, -0.04807281494140625, -0.0417633056640625, -0.03545379638671875, -0.029144287109375, -0.02283477783203125, -0.0165252685546875, -0.01021575927734375, -0.00390625, 0.00240325927734375, 0.0087127685546875, 0.01502227783203125, 0.021331787109375, 0.02764129638671875, 0.0339508056640625, 0.04026031494140625, 0.04656982421875, 0.05287933349609375, 0.0591888427734375, 0.06549835205078125, 0.071807861328125, 0.07811737060546875, 0.0844268798828125, 0.09073638916015625, 0.0970458984375, 0.10335540771484375, 0.1096649169921875, 0.11597442626953125, 0.122283935546875, 0.12859344482421875, 0.1349029541015625, 0.14121246337890625, 0.14752197265625, 0.15383148193359375, 0.1601409912109375, 0.16645050048828125, 0.172760009765625, 0.17906951904296875, 0.1853790283203125, 0.19168853759765625, 0.197998046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 4.0, 6.0, 15.0, 23.0, 26.0, 29.0, 49.0, 72.0, 105.0, 181.0, 171.0, 112.0, 48.0, 39.0, 37.0, 19.0, 18.0, 12.0, 8.0, 6.0, 6.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.715557098388672e-05, -9.451154619455338e-05, -9.186752140522003e-05, -8.922349661588669e-05, -8.657947182655334e-05, -8.393544703722e-05, -8.129142224788666e-05, -7.864739745855331e-05, -7.600337266921997e-05, -7.335934787988663e-05, -7.071532309055328e-05, -6.807129830121994e-05, -6.54272735118866e-05, -6.278324872255325e-05, -6.013922393321991e-05, -5.7495199143886566e-05, -5.485117435455322e-05, -5.220714956521988e-05, -4.9563124775886536e-05, -4.691909998655319e-05, -4.427507519721985e-05, -4.1631050407886505e-05, -3.898702561855316e-05, -3.634300082921982e-05, -3.3698976039886475e-05, -3.105495125055313e-05, -2.8410926461219788e-05, -2.5766901671886444e-05, -2.31228768825531e-05, -2.0478852093219757e-05, -1.7834827303886414e-05, -1.519080251455307e-05, -1.2546777725219727e-05, -9.902752935886383e-06, -7.2587281465530396e-06, -4.614703357219696e-06, -1.9706785678863525e-06, 6.73346221446991e-07, 3.3173710107803345e-06, 5.961395800113678e-06, 8.605420589447021e-06, 1.1249445378780365e-05, 1.3893470168113708e-05, 1.6537494957447052e-05, 1.9181519746780396e-05, 2.182554453611374e-05, 2.4469569325447083e-05, 2.7113594114780426e-05, 2.975761890411377e-05, 3.240164369344711e-05, 3.5045668482780457e-05, 3.76896932721138e-05, 4.0333718061447144e-05, 4.297774285078049e-05, 4.562176764011383e-05, 4.8265792429447174e-05, 5.090981721878052e-05, 5.355384200811386e-05, 5.6197866797447205e-05, 5.884189158678055e-05, 6.148591637611389e-05, 6.412994116544724e-05, 6.677396595478058e-05, 6.941799074411392e-05, 7.206201553344727e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 8.0, 15.0, 21.0, 32.0, 58.0, 84.0, 135.0, 242.0, 396.0, 956.0, 2534.0, 10019.0, 70101.0, 796434.0, 144595.0, 16867.0, 3540.0, 1222.0, 579.0, 319.0, 157.0, 91.0, 63.0, 35.0, 23.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.158935546875, -0.15357589721679688, -0.14821624755859375, -0.14285659790039062, -0.1374969482421875, -0.13213729858398438, -0.12677764892578125, -0.12141799926757812, -0.116058349609375, -0.11069869995117188, -0.10533905029296875, -0.09997940063476562, -0.0946197509765625, -0.08926010131835938, -0.08390045166015625, -0.07854080200195312, -0.07318115234375, -0.06782150268554688, -0.06246185302734375, -0.057102203369140625, -0.0517425537109375, -0.046382904052734375, -0.04102325439453125, -0.035663604736328125, -0.030303955078125, -0.024944305419921875, -0.01958465576171875, -0.014225006103515625, -0.0088653564453125, -0.003505706787109375, 0.00185394287109375, 0.007213592529296875, 0.0125732421875, 0.017932891845703125, 0.02329254150390625, 0.028652191162109375, 0.0340118408203125, 0.039371490478515625, 0.04473114013671875, 0.050090789794921875, 0.055450439453125, 0.060810089111328125, 0.06616973876953125, 0.07152938842773438, 0.0768890380859375, 0.08224868774414062, 0.08760833740234375, 0.09296798706054688, 0.09832763671875, 0.10368728637695312, 0.10904693603515625, 0.11440658569335938, 0.1197662353515625, 0.12512588500976562, 0.13048553466796875, 0.13584518432617188, 0.141204833984375, 0.14656448364257812, 0.15192413330078125, 0.15728378295898438, 0.1626434326171875, 0.16800308227539062, 0.17336273193359375, 0.17872238159179688, 0.18408203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 7.0, 8.0, 6.0, 10.0, 11.0, 15.0, 13.0, 20.0, 26.0, 35.0, 45.0, 52.0, 74.0, 80.0, 87.0, 120.0, 93.0, 78.0, 39.0, 40.0, 33.0, 11.0, 23.0, 14.0, 12.0, 18.0, 4.0, 6.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1094970703125, -0.10543632507324219, -0.10137557983398438, -0.09731483459472656, -0.09325408935546875, -0.08919334411621094, -0.08513259887695312, -0.08107185363769531, -0.0770111083984375, -0.07295036315917969, -0.06888961791992188, -0.06482887268066406, -0.06076812744140625, -0.05670738220214844, -0.052646636962890625, -0.04858589172363281, -0.044525146484375, -0.04046440124511719, -0.036403656005859375, -0.03234291076660156, -0.02828216552734375, -0.024221420288085938, -0.020160675048828125, -0.016099929809570312, -0.0120391845703125, -0.007978439331054688, -0.003917694091796875, 0.0001430511474609375, 0.00420379638671875, 0.008264541625976562, 0.012325286865234375, 0.016386032104492188, 0.02044677734375, 0.024507522583007812, 0.028568267822265625, 0.03262901306152344, 0.03668975830078125, 0.04075050354003906, 0.044811248779296875, 0.04887199401855469, 0.0529327392578125, 0.05699348449707031, 0.061054229736328125, 0.06511497497558594, 0.06917572021484375, 0.07323646545410156, 0.07729721069335938, 0.08135795593261719, 0.085418701171875, 0.08947944641113281, 0.09354019165039062, 0.09760093688964844, 0.10166168212890625, 0.10572242736816406, 0.10978317260742188, 0.11384391784667969, 0.1179046630859375, 0.12196540832519531, 0.12602615356445312, 0.13008689880371094, 0.13414764404296875, 0.13820838928222656, 0.14226913452148438, 0.1463298797607422, 0.150390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 16.0, 33.0, 69.0, 163.0, 465.0, 148.0, 68.0, 22.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.906357765197754, -7.7283406257629395, -7.550323486328125, -7.372306823730469, -7.194289684295654, -7.01627254486084, -6.838255882263184, -6.660238742828369, -6.482221603393555, -6.30420446395874, -6.126187324523926, -5.9481706619262695, -5.770153522491455, -5.592136383056641, -5.414119720458984, -5.23610258102417, -5.0580854415893555, -4.880068302154541, -4.702051162719727, -4.52403450012207, -4.346017360687256, -4.168000221252441, -3.989983320236206, -3.8119664192199707, -3.6339492797851562, -3.455932140350342, -3.2779152393341064, -3.099898338317871, -2.9218811988830566, -2.743864059448242, -2.565847158432007, -2.3878302574157715, -2.209812879562378, -2.0317959785461426, -1.8537788391113281, -1.6757618188858032, -1.4977447986602783, -1.3197277784347534, -1.1417107582092285, -0.9636937379837036, -0.7856767177581787, -0.6076596975326538, -0.4296426773071289, -0.251625657081604, -0.0736086368560791, 0.1044083833694458, 0.2824254035949707, 0.4604424238204956, 0.6384594440460205, 0.8164764642715454, 0.9944934844970703, 1.1725105047225952, 1.3505275249481201, 1.528544545173645, 1.70656156539917, 1.8845785856246948, 2.0625956058502197, 2.240612506866455, 2.4186296463012695, 2.596646785736084, 2.7746636867523193, 2.9526805877685547, 3.130697727203369, 3.3087148666381836, 3.486731767654419]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 6.0, 6.0, 8.0, 5.0, 8.0, 11.0, 9.0, 19.0, 11.0, 22.0, 27.0, 19.0, 38.0, 28.0, 38.0, 27.0, 34.0, 78.0, 161.0, 119.0, 46.0, 33.0, 31.0, 30.0, 23.0, 26.0, 25.0, 20.0, 15.0, 11.0, 13.0, 8.0, 4.0, 9.0, 7.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.371966600418091, -2.29927659034729, -2.22658634185791, -2.1538963317871094, -2.0812060832977295, -2.0085160732269287, -1.9358258247375488, -1.863135814666748, -1.7904455661773682, -1.7177554368972778, -1.6450653076171875, -1.5723751783370972, -1.4996850490570068, -1.4269949197769165, -1.3543047904968262, -1.2816147804260254, -1.208924651145935, -1.1362345218658447, -1.0635443925857544, -0.9908542633056641, -0.9181641340255737, -0.8454740047454834, -0.7727839350700378, -0.7000938057899475, -0.6274036765098572, -0.5547135472297668, -0.4820234179496765, -0.40933331847190857, -0.33664318919181824, -0.2639530599117279, -0.19126296043395996, -0.11857283115386963, -0.0458827018737793, 0.026807419955730438, 0.09949754178524017, 0.1721876561641693, 0.24487778544425964, 0.31756791472435, 0.3902580142021179, 0.46294814348220825, 0.5356382727622986, 0.6083284020423889, 0.6810185313224792, 0.7537086009979248, 0.8263987302780151, 0.8990888595581055, 0.9717789888381958, 1.0444691181182861, 1.1171592473983765, 1.1898493766784668, 1.2625395059585571, 1.3352296352386475, 1.4079197645187378, 1.4806098937988281, 1.553299903869629, 1.6259901523590088, 1.6986801624298096, 1.7713702917099, 1.8440604209899902, 1.9167505502700806, 1.989440679550171, 2.0621306896209717, 2.1348209381103516, 2.2075109481811523, 2.2802011966705322]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 7.0, 17.0, 26.0, 42.0, 77.0, 118.0, 137.0, 278.0, 415.0, 650.0, 1172.0, 2028.0, 4121.0, 8952.0, 22393.0, 67032.0, 261119.0, 1053153.0, 1837309.0, 689170.0, 166388.0, 48054.0, 17030.0, 7098.0, 3307.0, 1724.0, 952.0, 615.0, 353.0, 198.0, 120.0, 77.0, 59.0, 28.0, 29.0, 11.0, 10.0, 5.0, 1.0, 4.0, 1.0], "bins": [-0.246337890625, -0.24037933349609375, -0.2344207763671875, -0.22846221923828125, -0.222503662109375, -0.21654510498046875, -0.2105865478515625, -0.20462799072265625, -0.19866943359375, -0.19271087646484375, -0.1867523193359375, -0.18079376220703125, -0.174835205078125, -0.16887664794921875, -0.1629180908203125, -0.15695953369140625, -0.1510009765625, -0.14504241943359375, -0.1390838623046875, -0.13312530517578125, -0.127166748046875, -0.12120819091796875, -0.1152496337890625, -0.10929107666015625, -0.10333251953125, -0.09737396240234375, -0.0914154052734375, -0.08545684814453125, -0.079498291015625, -0.07353973388671875, -0.0675811767578125, -0.06162261962890625, -0.0556640625, -0.04970550537109375, -0.0437469482421875, -0.03778839111328125, -0.031829833984375, -0.02587127685546875, -0.0199127197265625, -0.01395416259765625, -0.00799560546875, -0.00203704833984375, 0.0039215087890625, 0.00988006591796875, 0.015838623046875, 0.02179718017578125, 0.0277557373046875, 0.03371429443359375, 0.0396728515625, 0.04563140869140625, 0.0515899658203125, 0.05754852294921875, 0.063507080078125, 0.06946563720703125, 0.0754241943359375, 0.08138275146484375, 0.08734130859375, 0.09329986572265625, 0.0992584228515625, 0.10521697998046875, 0.111175537109375, 0.11713409423828125, 0.1230926513671875, 0.12905120849609375, 0.135009765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 11.0, 10.0, 16.0, 13.0, 19.0, 15.0, 32.0, 32.0, 41.0, 47.0, 57.0, 67.0, 47.0, 65.0, 52.0, 52.0, 45.0, 50.0, 47.0, 45.0, 31.0, 35.0, 35.0, 31.0, 24.0, 19.0, 18.0, 5.0, 14.0, 11.0, 1.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.174560546875, -0.1703643798828125, -0.166168212890625, -0.1619720458984375, -0.15777587890625, -0.1535797119140625, -0.149383544921875, -0.1451873779296875, -0.1409912109375, -0.1367950439453125, -0.132598876953125, -0.1284027099609375, -0.12420654296875, -0.1200103759765625, -0.115814208984375, -0.1116180419921875, -0.107421875, -0.1032257080078125, -0.099029541015625, -0.0948333740234375, -0.09063720703125, -0.0864410400390625, -0.082244873046875, -0.0780487060546875, -0.0738525390625, -0.0696563720703125, -0.065460205078125, -0.0612640380859375, -0.05706787109375, -0.0528717041015625, -0.048675537109375, -0.0444793701171875, -0.040283203125, -0.0360870361328125, -0.031890869140625, -0.0276947021484375, -0.02349853515625, -0.0193023681640625, -0.015106201171875, -0.0109100341796875, -0.0067138671875, -0.0025177001953125, 0.001678466796875, 0.0058746337890625, 0.01007080078125, 0.0142669677734375, 0.018463134765625, 0.0226593017578125, 0.02685546875, 0.0310516357421875, 0.035247802734375, 0.0394439697265625, 0.04364013671875, 0.0478363037109375, 0.052032470703125, 0.0562286376953125, 0.0604248046875, 0.0646209716796875, 0.068817138671875, 0.0730133056640625, 0.07720947265625, 0.0814056396484375, 0.085601806640625, 0.0897979736328125, 0.093994140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 12.0, 15.0, 23.0, 41.0, 58.0, 114.0, 180.0, 420.0, 1030.0, 4698.0, 2995929.0, 1186016.0, 3980.0, 901.0, 411.0, 182.0, 109.0, 63.0, 41.0, 20.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71484375, -1.6556396484375, -1.596435546875, -1.5372314453125, -1.47802734375, -1.4188232421875, -1.359619140625, -1.3004150390625, -1.2412109375, -1.1820068359375, -1.122802734375, -1.0635986328125, -1.00439453125, -0.9451904296875, -0.885986328125, -0.8267822265625, -0.767578125, -0.7083740234375, -0.649169921875, -0.5899658203125, -0.53076171875, -0.4715576171875, -0.412353515625, -0.3531494140625, -0.2939453125, -0.2347412109375, -0.175537109375, -0.1163330078125, -0.05712890625, 0.0020751953125, 0.061279296875, 0.1204833984375, 0.1796875, 0.2388916015625, 0.298095703125, 0.3572998046875, 0.41650390625, 0.4757080078125, 0.534912109375, 0.5941162109375, 0.6533203125, 0.7125244140625, 0.771728515625, 0.8309326171875, 0.89013671875, 0.9493408203125, 1.008544921875, 1.0677490234375, 1.126953125, 1.1861572265625, 1.245361328125, 1.3045654296875, 1.36376953125, 1.4229736328125, 1.482177734375, 1.5413818359375, 1.6005859375, 1.6597900390625, 1.718994140625, 1.7781982421875, 1.83740234375, 1.8966064453125, 1.955810546875, 2.0150146484375, 2.07421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 19.0, 28.0, 72.0, 176.0, 488.0, 1405.0, 1173.0, 442.0, 169.0, 68.0, 19.0, 7.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.48736572265625, -1.4434814453125, -1.39959716796875, -1.355712890625, -1.31182861328125, -1.2679443359375, -1.22406005859375, -1.18017578125, -1.13629150390625, -1.0924072265625, -1.04852294921875, -1.004638671875, -0.96075439453125, -0.9168701171875, -0.87298583984375, -0.8291015625, -0.78521728515625, -0.7413330078125, -0.69744873046875, -0.653564453125, -0.60968017578125, -0.5657958984375, -0.52191162109375, -0.47802734375, -0.43414306640625, -0.3902587890625, -0.34637451171875, -0.302490234375, -0.25860595703125, -0.2147216796875, -0.17083740234375, -0.126953125, -0.08306884765625, -0.0391845703125, 0.00469970703125, 0.048583984375, 0.09246826171875, 0.1363525390625, 0.18023681640625, 0.22412109375, 0.26800537109375, 0.3118896484375, 0.35577392578125, 0.399658203125, 0.44354248046875, 0.4874267578125, 0.53131103515625, 0.5751953125, 0.61907958984375, 0.6629638671875, 0.70684814453125, 0.750732421875, 0.79461669921875, 0.8385009765625, 0.88238525390625, 0.92626953125, 0.97015380859375, 1.0140380859375, 1.05792236328125, 1.101806640625, 1.14569091796875, 1.1895751953125, 1.23345947265625, 1.27734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 4.0, 5.0, 8.0, 28.0, 52.0, 84.0, 155.0, 215.0, 197.0, 105.0, 57.0, 31.0, 21.0, 12.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.203498840332031, -7.959491729736328, -7.715485095977783, -7.47147798538208, -7.227471351623535, -6.983464241027832, -6.739457130432129, -6.495450496673584, -6.251443386077881, -6.007436275482178, -5.763429641723633, -5.51942253112793, -5.275415897369385, -5.031408786773682, -4.787402153015137, -4.543395042419434, -4.2993879318237305, -4.055380821228027, -3.8113741874694824, -3.5673670768737793, -3.3233602046966553, -3.0793533325195312, -2.8353464603424072, -2.591339588165283, -2.3473329544067383, -2.1033260822296143, -1.8593190908432007, -1.6153122186660767, -1.371305227279663, -1.127298355102539, -0.883291482925415, -0.6392844915390015, -0.3952775001525879, -0.15127058327198029, 0.09273633360862732, 0.33674323558807373, 0.5807501673698425, 0.8247570991516113, 1.0687639713287354, 1.312770962715149, 1.556777834892273, 1.800784707069397, 2.0447916984558105, 2.2887985706329346, 2.5328054428100586, 2.7768125534057617, 3.0208191871643066, 3.2648262977600098, 3.508833169937134, 3.752840042114258, 3.996846914291382, 4.240853786468506, 4.484860897064209, 4.728867530822754, 4.972874641418457, 5.21688175201416, 5.460888385772705, 5.704895496368408, 5.948902130126953, 6.192909240722656, 6.436915874481201, 6.680922985076904, 6.924929618835449, 7.168936729431152, 7.4129438400268555]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 5.0, 9.0, 14.0, 16.0, 17.0, 32.0, 24.0, 31.0, 34.0, 46.0, 57.0, 61.0, 62.0, 55.0, 74.0, 62.0, 69.0, 43.0, 54.0, 36.0, 33.0, 28.0, 20.0, 27.0, 21.0, 13.0, 17.0, 7.0, 6.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.793348789215088, -2.6837520599365234, -2.574155569076538, -2.4645590782165527, -2.3549623489379883, -2.245365619659424, -2.1357691287994385, -2.026172637939453, -1.9165759086608887, -1.8069792985916138, -1.6973826885223389, -1.587786078453064, -1.478189468383789, -1.3685928583145142, -1.2589962482452393, -1.1493996381759644, -1.0398030281066895, -0.9302064180374146, -0.8206098079681396, -0.7110131978988647, -0.6014165878295898, -0.49181997776031494, -0.38222336769104004, -0.27262675762176514, -0.16303014755249023, -0.05343353748321533, 0.05616307258605957, 0.16575968265533447, 0.2753562927246094, 0.3849529027938843, 0.4945495128631592, 0.6041461229324341, 0.713742733001709, 0.8233393430709839, 0.9329359531402588, 1.0425325632095337, 1.1521291732788086, 1.2617257833480835, 1.3713223934173584, 1.4809190034866333, 1.5905156135559082, 1.700112223625183, 1.809708833694458, 1.919305443763733, 2.028902053833008, 2.1384987831115723, 2.2480952739715576, 2.357691764831543, 2.4672884941101074, 2.576885223388672, 2.6864817142486572, 2.7960782051086426, 2.905674934387207, 3.0152716636657715, 3.124868154525757, 3.234464645385742, 3.3440613746643066, 3.453658103942871, 3.5632545948028564, 3.672851085662842, 3.7824478149414062, 3.8920445442199707, 4.001641273498535, 4.111237525939941, 4.220834255218506]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 10.0, 10.0, 22.0, 28.0, 36.0, 64.0, 110.0, 198.0, 378.0, 791.0, 1857.0, 4885.0, 15358.0, 61019.0, 367122.0, 494357.0, 74346.0, 18266.0, 5708.0, 2170.0, 906.0, 401.0, 208.0, 86.0, 63.0, 58.0, 32.0, 8.0, 14.0, 7.0, 5.0, 5.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.394287109375, -0.38271331787109375, -0.3711395263671875, -0.35956573486328125, -0.347991943359375, -0.33641815185546875, -0.3248443603515625, -0.31327056884765625, -0.30169677734375, -0.29012298583984375, -0.2785491943359375, -0.26697540283203125, -0.255401611328125, -0.24382781982421875, -0.2322540283203125, -0.22068023681640625, -0.2091064453125, -0.19753265380859375, -0.1859588623046875, -0.17438507080078125, -0.162811279296875, -0.15123748779296875, -0.1396636962890625, -0.12808990478515625, -0.11651611328125, -0.10494232177734375, -0.0933685302734375, -0.08179473876953125, -0.070220947265625, -0.05864715576171875, -0.0470733642578125, -0.03549957275390625, -0.02392578125, -0.01235198974609375, -0.0007781982421875, 0.01079559326171875, 0.022369384765625, 0.03394317626953125, 0.0455169677734375, 0.05709075927734375, 0.06866455078125, 0.08023834228515625, 0.0918121337890625, 0.10338592529296875, 0.114959716796875, 0.12653350830078125, 0.1381072998046875, 0.14968109130859375, 0.1612548828125, 0.17282867431640625, 0.1844024658203125, 0.19597625732421875, 0.207550048828125, 0.21912384033203125, 0.2306976318359375, 0.24227142333984375, 0.25384521484375, 0.26541900634765625, 0.2769927978515625, 0.28856658935546875, 0.300140380859375, 0.31171417236328125, 0.3232879638671875, 0.33486175537109375, 0.346435546875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 6.0, 1.0, 10.0, 10.0, 8.0, 16.0, 20.0, 13.0, 37.0, 32.0, 32.0, 51.0, 71.0, 64.0, 62.0, 63.0, 73.0, 79.0, 54.0, 44.0, 40.0, 45.0, 44.0, 22.0, 25.0, 23.0, 19.0, 15.0, 6.0, 10.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1895751953125, -0.182830810546875, -0.17608642578125, -0.169342041015625, -0.16259765625, -0.155853271484375, -0.14910888671875, -0.142364501953125, -0.1356201171875, -0.128875732421875, -0.12213134765625, -0.115386962890625, -0.108642578125, -0.101898193359375, -0.09515380859375, -0.088409423828125, -0.0816650390625, -0.074920654296875, -0.06817626953125, -0.061431884765625, -0.0546875, -0.047943115234375, -0.04119873046875, -0.034454345703125, -0.0277099609375, -0.020965576171875, -0.01422119140625, -0.007476806640625, -0.000732421875, 0.006011962890625, 0.01275634765625, 0.019500732421875, 0.0262451171875, 0.032989501953125, 0.03973388671875, 0.046478271484375, 0.05322265625, 0.059967041015625, 0.06671142578125, 0.073455810546875, 0.0802001953125, 0.086944580078125, 0.09368896484375, 0.100433349609375, 0.107177734375, 0.113922119140625, 0.12066650390625, 0.127410888671875, 0.1341552734375, 0.140899658203125, 0.14764404296875, 0.154388427734375, 0.1611328125, 0.167877197265625, 0.17462158203125, 0.181365966796875, 0.1881103515625, 0.194854736328125, 0.20159912109375, 0.208343505859375, 0.215087890625, 0.221832275390625, 0.22857666015625, 0.235321044921875, 0.2420654296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 8.0, 8.0, 7.0, 19.0, 19.0, 36.0, 37.0, 44.0, 56.0, 89.0, 152.0, 199.0, 288.0, 527.0, 872.0, 1903.0, 5289.0, 20267.0, 121266.0, 824974.0, 54504.0, 11308.0, 3372.0, 1381.0, 713.0, 373.0, 234.0, 162.0, 124.0, 83.0, 55.0, 54.0, 31.0, 20.0, 19.0, 10.0, 10.0, 14.0, 9.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3949775695800781, -0.38346099853515625, -0.3719444274902344, -0.3604278564453125, -0.3489112854003906, -0.33739471435546875, -0.3258781433105469, -0.314361572265625, -0.3028450012207031, -0.29132843017578125, -0.2798118591308594, -0.2682952880859375, -0.2567787170410156, -0.24526214599609375, -0.23374557495117188, -0.22222900390625, -0.21071243286132812, -0.19919586181640625, -0.18767929077148438, -0.1761627197265625, -0.16464614868164062, -0.15312957763671875, -0.14161300659179688, -0.130096435546875, -0.11857986450195312, -0.10706329345703125, -0.09554672241210938, -0.0840301513671875, -0.07251358032226562, -0.06099700927734375, -0.049480438232421875, -0.0379638671875, -0.026447296142578125, -0.01493072509765625, -0.003414154052734375, 0.0081024169921875, 0.019618988037109375, 0.03113555908203125, 0.042652130126953125, 0.054168701171875, 0.06568527221679688, 0.07720184326171875, 0.08871841430664062, 0.1002349853515625, 0.11175155639648438, 0.12326812744140625, 0.13478469848632812, 0.14630126953125, 0.15781784057617188, 0.16933441162109375, 0.18085098266601562, 0.1923675537109375, 0.20388412475585938, 0.21540069580078125, 0.22691726684570312, 0.238433837890625, 0.24995040893554688, 0.26146697998046875, 0.2729835510253906, 0.2845001220703125, 0.2960166931152344, 0.30753326416015625, 0.3190498352050781, 0.33056640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 3.0, 2.0, 2.0, 7.0, 1.0, 8.0, 11.0, 6.0, 8.0, 9.0, 14.0, 13.0, 23.0, 18.0, 14.0, 20.0, 26.0, 28.0, 53.0, 41.0, 54.0, 70.0, 73.0, 87.0, 61.0, 56.0, 52.0, 30.0, 29.0, 29.0, 25.0, 26.0, 21.0, 11.0, 7.0, 16.0, 9.0, 7.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6468734741210938, -0.6272430419921875, -0.6076126098632812, -0.587982177734375, -0.5683517456054688, -0.5487213134765625, -0.5290908813476562, -0.50946044921875, -0.48983001708984375, -0.4701995849609375, -0.45056915283203125, -0.430938720703125, -0.41130828857421875, -0.3916778564453125, -0.37204742431640625, -0.3524169921875, -0.33278656005859375, -0.3131561279296875, -0.29352569580078125, -0.273895263671875, -0.25426483154296875, -0.2346343994140625, -0.21500396728515625, -0.19537353515625, -0.17574310302734375, -0.1561126708984375, -0.13648223876953125, -0.116851806640625, -0.09722137451171875, -0.0775909423828125, -0.05796051025390625, -0.038330078125, -0.01869964599609375, 0.0009307861328125, 0.02056121826171875, 0.040191650390625, 0.05982208251953125, 0.0794525146484375, 0.09908294677734375, 0.11871337890625, 0.13834381103515625, 0.1579742431640625, 0.17760467529296875, 0.197235107421875, 0.21686553955078125, 0.2364959716796875, 0.25612640380859375, 0.2757568359375, 0.29538726806640625, 0.3150177001953125, 0.33464813232421875, 0.354278564453125, 0.37390899658203125, 0.3935394287109375, 0.41316986083984375, 0.43280029296875, 0.45243072509765625, 0.4720611572265625, 0.49169158935546875, 0.511322021484375, 0.5309524536132812, 0.5505828857421875, 0.5702133178710938, 0.58984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 11.0, 5.0, 16.0, 19.0, 19.0, 29.0, 37.0, 56.0, 61.0, 97.0, 131.0, 224.0, 362.0, 648.0, 1238.0, 2653.0, 6214.0, 17469.0, 64501.0, 823005.0, 95667.0, 21855.0, 7707.0, 3172.0, 1468.0, 719.0, 401.0, 206.0, 134.0, 109.0, 70.0, 56.0, 45.0, 32.0, 20.0, 17.0, 14.0, 12.0, 12.0, 6.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07757568359375, -0.07512092590332031, -0.07266616821289062, -0.07021141052246094, -0.06775665283203125, -0.06530189514160156, -0.06284713745117188, -0.06039237976074219, -0.0579376220703125, -0.05548286437988281, -0.053028106689453125, -0.05057334899902344, -0.04811859130859375, -0.04566383361816406, -0.043209075927734375, -0.04075431823730469, -0.038299560546875, -0.03584480285644531, -0.033390045166015625, -0.030935287475585938, -0.02848052978515625, -0.026025772094726562, -0.023571014404296875, -0.021116256713867188, -0.0186614990234375, -0.016206741333007812, -0.013751983642578125, -0.011297225952148438, -0.00884246826171875, -0.0063877105712890625, -0.003932952880859375, -0.0014781951904296875, 0.0009765625, 0.0034313201904296875, 0.005886077880859375, 0.008340835571289062, 0.01079559326171875, 0.013250350952148438, 0.015705108642578125, 0.018159866333007812, 0.0206146240234375, 0.023069381713867188, 0.025524139404296875, 0.027978897094726562, 0.03043365478515625, 0.03288841247558594, 0.035343170166015625, 0.03779792785644531, 0.040252685546875, 0.04270744323730469, 0.045162200927734375, 0.04761695861816406, 0.05007171630859375, 0.05252647399902344, 0.054981231689453125, 0.05743598937988281, 0.0598907470703125, 0.06234550476074219, 0.06480026245117188, 0.06725502014160156, 0.06970977783203125, 0.07216453552246094, 0.07461929321289062, 0.07707405090332031, 0.07952880859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 1.0, 4.0, 5.0, 2.0, 8.0, 10.0, 6.0, 15.0, 10.0, 15.0, 18.0, 18.0, 23.0, 40.0, 50.0, 76.0, 106.0, 133.0, 104.0, 106.0, 62.0, 47.0, 33.0, 30.0, 21.0, 12.0, 8.0, 3.0, 5.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9637088775634766e-05, -3.838539123535156e-05, -3.713369369506836e-05, -3.5881996154785156e-05, -3.463029861450195e-05, -3.337860107421875e-05, -3.212690353393555e-05, -3.0875205993652344e-05, -2.962350845336914e-05, -2.8371810913085938e-05, -2.7120113372802734e-05, -2.586841583251953e-05, -2.4616718292236328e-05, -2.3365020751953125e-05, -2.2113323211669922e-05, -2.086162567138672e-05, -1.9609928131103516e-05, -1.8358230590820312e-05, -1.710653305053711e-05, -1.5854835510253906e-05, -1.4603137969970703e-05, -1.33514404296875e-05, -1.2099742889404297e-05, -1.0848045349121094e-05, -9.59634780883789e-06, -8.344650268554688e-06, -7.092952728271484e-06, -5.841255187988281e-06, -4.589557647705078e-06, -3.337860107421875e-06, -2.086162567138672e-06, -8.344650268554688e-07, 4.172325134277344e-07, 1.6689300537109375e-06, 2.9206275939941406e-06, 4.172325134277344e-06, 5.424022674560547e-06, 6.67572021484375e-06, 7.927417755126953e-06, 9.179115295410156e-06, 1.043081283569336e-05, 1.1682510375976562e-05, 1.2934207916259766e-05, 1.4185905456542969e-05, 1.5437602996826172e-05, 1.6689300537109375e-05, 1.7940998077392578e-05, 1.919269561767578e-05, 2.0444393157958984e-05, 2.1696090698242188e-05, 2.294778823852539e-05, 2.4199485778808594e-05, 2.5451183319091797e-05, 2.6702880859375e-05, 2.7954578399658203e-05, 2.9206275939941406e-05, 3.045797348022461e-05, 3.170967102050781e-05, 3.2961368560791016e-05, 3.421306610107422e-05, 3.546476364135742e-05, 3.6716461181640625e-05, 3.796815872192383e-05, 3.921985626220703e-05, 4.0471553802490234e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 11.0, 7.0, 10.0, 13.0, 24.0, 36.0, 47.0, 108.0, 188.0, 251.0, 476.0, 854.0, 1624.0, 3538.0, 8094.0, 21775.0, 89824.0, 811933.0, 76145.0, 19599.0, 7306.0, 3191.0, 1617.0, 802.0, 432.0, 257.0, 154.0, 96.0, 46.0, 29.0, 25.0, 15.0, 7.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08476734161376953, -0.08237648010253906, -0.0799856185913086, -0.07759475708007812, -0.07520389556884766, -0.07281303405761719, -0.07042217254638672, -0.06803131103515625, -0.06564044952392578, -0.06324958801269531, -0.060858726501464844, -0.058467864990234375, -0.056077003479003906, -0.05368614196777344, -0.05129528045654297, -0.0489044189453125, -0.04651355743408203, -0.04412269592285156, -0.041731834411621094, -0.039340972900390625, -0.036950111389160156, -0.03455924987792969, -0.03216838836669922, -0.02977752685546875, -0.02738666534423828, -0.024995803833007812, -0.022604942321777344, -0.020214080810546875, -0.017823219299316406, -0.015432357788085938, -0.013041496276855469, -0.010650634765625, -0.008259773254394531, -0.0058689117431640625, -0.0034780502319335938, -0.001087188720703125, 0.0013036727905273438, 0.0036945343017578125, 0.006085395812988281, 0.00847625732421875, 0.010867118835449219, 0.013257980346679688, 0.015648841857910156, 0.018039703369140625, 0.020430564880371094, 0.022821426391601562, 0.02521228790283203, 0.0276031494140625, 0.02999401092529297, 0.03238487243652344, 0.034775733947753906, 0.037166595458984375, 0.039557456970214844, 0.04194831848144531, 0.04433917999267578, 0.04673004150390625, 0.04912090301513672, 0.05151176452636719, 0.053902626037597656, 0.056293487548828125, 0.058684349060058594, 0.06107521057128906, 0.06346607208251953, 0.06585693359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 5.0, 6.0, 16.0, 7.0, 15.0, 11.0, 19.0, 41.0, 60.0, 59.0, 86.0, 103.0, 135.0, 99.0, 75.0, 60.0, 36.0, 31.0, 30.0, 14.0, 19.0, 12.0, 9.0, 1.0, 9.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0948486328125, -0.0922384262084961, -0.08962821960449219, -0.08701801300048828, -0.08440780639648438, -0.08179759979248047, -0.07918739318847656, -0.07657718658447266, -0.07396697998046875, -0.07135677337646484, -0.06874656677246094, -0.06613636016845703, -0.06352615356445312, -0.06091594696044922, -0.05830574035644531, -0.055695533752441406, -0.0530853271484375, -0.050475120544433594, -0.04786491394042969, -0.04525470733642578, -0.042644500732421875, -0.04003429412841797, -0.03742408752441406, -0.034813880920410156, -0.03220367431640625, -0.029593467712402344, -0.026983261108398438, -0.02437305450439453, -0.021762847900390625, -0.01915264129638672, -0.016542434692382812, -0.013932228088378906, -0.011322021484375, -0.008711814880371094, -0.0061016082763671875, -0.0034914016723632812, -0.000881195068359375, 0.0017290115356445312, 0.0043392181396484375, 0.006949424743652344, 0.00955963134765625, 0.012169837951660156, 0.014780044555664062, 0.01739025115966797, 0.020000457763671875, 0.02261066436767578, 0.025220870971679688, 0.027831077575683594, 0.0304412841796875, 0.033051490783691406, 0.03566169738769531, 0.03827190399169922, 0.040882110595703125, 0.04349231719970703, 0.04610252380371094, 0.048712730407714844, 0.05132293701171875, 0.053933143615722656, 0.05654335021972656, 0.05915355682373047, 0.061763763427734375, 0.06437397003173828, 0.06698417663574219, 0.0695943832397461, 0.07220458984375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 8.0, 17.0, 37.0, 91.0, 175.0, 483.0, 88.0, 44.0, 28.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.784217834472656, -5.656238079071045, -5.528258800506592, -5.4002790451049805, -5.272299766540527, -5.144320011138916, -5.016340732574463, -4.888360977172852, -4.760381698608398, -4.632401943206787, -4.504422664642334, -4.376442909240723, -4.2484636306762695, -4.120483875274658, -3.992504596710205, -3.8645248413085938, -3.7365453243255615, -3.6085658073425293, -3.480586290359497, -3.352606773376465, -3.2246272563934326, -3.0966477394104004, -2.968667984008789, -2.840688705444336, -2.7127089500427246, -2.5847294330596924, -2.45674991607666, -2.328770399093628, -2.2007908821105957, -2.0728113651275635, -1.9448317289352417, -1.8168522119522095, -1.6888728141784668, -1.5608932971954346, -1.4329137802124023, -1.3049342632293701, -1.176954746246338, -1.0489752292633057, -0.9209955930709839, -0.7930160760879517, -0.6650365591049194, -0.5370570421218872, -0.4090774953365326, -0.281097948551178, -0.15311843156814575, -0.025138914585113525, 0.10284066200256348, 0.2308201789855957, 0.35879969596862793, 0.48677921295166016, 0.6147587299346924, 0.7427383065223694, 0.8707178235054016, 0.9986973404884338, 1.1266769170761108, 1.254656434059143, 1.3826359510421753, 1.5106154680252075, 1.6385949850082397, 1.7665746212005615, 1.8945541381835938, 2.022533655166626, 2.150513172149658, 2.2784926891326904, 2.4064722061157227]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 7.0, 13.0, 10.0, 12.0, 17.0, 24.0, 21.0, 35.0, 28.0, 38.0, 39.0, 262.0, 227.0, 41.0, 32.0, 28.0, 33.0, 23.0, 18.0, 19.0, 17.0, 4.0, 7.0, 10.0, 12.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.729764938354492, -2.6596639156341553, -2.5895628929138184, -2.5194616317749023, -2.4493606090545654, -2.3792595863342285, -2.3091583251953125, -2.2390573024749756, -2.1689562797546387, -2.0988552570343018, -2.028754234313965, -1.9586529731750488, -1.888551950454712, -1.818450927734375, -1.7483497858047485, -1.678248643875122, -1.6081476211547852, -1.5380465984344482, -1.4679454565048218, -1.3978443145751953, -1.3277432918548584, -1.2576422691345215, -1.187541127204895, -1.1174399852752686, -1.0473389625549316, -0.97723788022995, -0.9071367979049683, -0.8370357155799866, -0.7669346332550049, -0.6968335509300232, -0.6267324686050415, -0.5566313862800598, -0.486530065536499, -0.41642898321151733, -0.34632790088653564, -0.27622681856155396, -0.20612573623657227, -0.13602465391159058, -0.06592357158660889, 0.004177510738372803, 0.07427859306335449, 0.14437967538833618, 0.21448075771331787, 0.28458184003829956, 0.35468292236328125, 0.42478400468826294, 0.49488508701324463, 0.5649861693382263, 0.635087251663208, 0.7051883339881897, 0.7752894163131714, 0.8453904986381531, 0.9154915809631348, 0.9855926632881165, 1.0556937456130981, 1.1257948875427246, 1.1958959102630615, 1.2659969329833984, 1.336098074913025, 1.4061992168426514, 1.4763002395629883, 1.5464012622833252, 1.6165024042129517, 1.6866035461425781, 1.756704568862915]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 13.0, 30.0, 40.0, 67.0, 88.0, 320.0, 228.0, 67.0, 59.0, 39.0, 21.0, 17.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5859375, -0.5712623596191406, -0.5565872192382812, -0.5419120788574219, -0.5272369384765625, -0.5125617980957031, -0.49788665771484375, -0.4832115173339844, -0.468536376953125, -0.4538612365722656, -0.43918609619140625, -0.4245109558105469, -0.4098358154296875, -0.3951606750488281, -0.38048553466796875, -0.3658103942871094, -0.35113525390625, -0.3364601135253906, -0.32178497314453125, -0.3071098327636719, -0.2924346923828125, -0.2777595520019531, -0.26308441162109375, -0.24840927124023438, -0.233734130859375, -0.21905899047851562, -0.20438385009765625, -0.18970870971679688, -0.1750335693359375, -0.16035842895507812, -0.14568328857421875, -0.13100814819335938, -0.1163330078125, -0.10165786743164062, -0.08698272705078125, -0.07230758666992188, -0.0576324462890625, -0.042957305908203125, -0.02828216552734375, -0.013607025146484375, 0.001068115234375, 0.015743255615234375, 0.03041839599609375, 0.045093536376953125, 0.0597686767578125, 0.07444381713867188, 0.08911895751953125, 0.10379409790039062, 0.11846923828125, 0.13314437866210938, 0.14781951904296875, 0.16249465942382812, 0.1771697998046875, 0.19184494018554688, 0.20652008056640625, 0.22119522094726562, 0.235870361328125, 0.2505455017089844, 0.26522064208984375, 0.2798957824707031, 0.2945709228515625, 0.3092460632324219, 0.32392120361328125, 0.3385963439941406, 0.353271484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 15.0, 12.0, 10.0, 14.0, 17.0, 29.0, 29.0, 27.0, 33.0, 50.0, 59.0, 127.0, 239.0, 486.0, 1082.0, 3718.0, 30261.0, 8336026.0, 12301.0, 2386.0, 755.0, 320.0, 192.0, 103.0, 59.0, 53.0, 48.0, 21.0, 17.0, 17.0, 15.0, 13.0, 10.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.1945393085479736, -2.1287035942077637, -2.0628676414489746, -1.9970319271087646, -1.9311962127685547, -1.8653603792190552, -1.7995245456695557, -1.7336888313293457, -1.6678531169891357, -1.6020172834396362, -1.5361815690994263, -1.4703457355499268, -1.4045100212097168, -1.3386741876602173, -1.2728383541107178, -1.2070026397705078, -1.1411668062210083, -1.0753309726715088, -1.0094952583312988, -0.9436594247817993, -0.8778237104415894, -0.8119878768920898, -0.7461521029472351, -0.6803163290023804, -0.6144805550575256, -0.5486447811126709, -0.48280900716781616, -0.41697320342063904, -0.3511374294757843, -0.28530165553092957, -0.21946585178375244, -0.1536300778388977, -0.08779430389404297, -0.021958522498607635, 0.0438772588968277, 0.10971304774284363, 0.17554882168769836, 0.2413845956325531, 0.3072203993797302, 0.37305617332458496, 0.4388919472694397, 0.5047277212142944, 0.5705634951591492, 0.6363992691040039, 0.7022351026535034, 0.7680708169937134, 0.8339066505432129, 0.8997424244880676, 0.9655781984329224, 1.0314140319824219, 1.0972497463226318, 1.1630855798721313, 1.2289212942123413, 1.2947571277618408, 1.3605928421020508, 1.4264286756515503, 1.4922645092010498, 1.5581003427505493, 1.6239360570907593, 1.6897718906402588, 1.7556076049804688, 1.8214434385299683, 1.8872792720794678, 1.9531149864196777, 2.0189507007598877]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 7.0, 3.0, 0.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3166910409927368, -1.2601501941680908, -1.2036092281341553, -1.1470683813095093, -1.0905274152755737, -1.0339865684509277, -0.977445662021637, -0.9209047555923462, -0.8643638491630554, -0.8078229427337646, -0.7512820363044739, -0.6947411298751831, -0.6382002830505371, -0.5816593170166016, -0.5251184701919556, -0.4685775637626648, -0.412036657333374, -0.35549575090408325, -0.2989548444747925, -0.2424139678478241, -0.18587306141853333, -0.12933215498924255, -0.07279127836227417, -0.0162503719329834, 0.04029053449630737, 0.09683143347501755, 0.15337233245372772, 0.2099132239818573, 0.26645413041114807, 0.32299503684043884, 0.3795359134674072, 0.436076819896698, 0.4926178455352783, 0.5491587519645691, 0.6056996583938599, 0.6622405052185059, 0.7187814712524414, 0.7753223180770874, 0.8318632245063782, 0.888404130935669, 0.9449450373649597, 1.0014859437942505, 1.0580267906188965, 1.114567756652832, 1.171108603477478, 1.2276495695114136, 1.2841904163360596, 1.3407313823699951, 1.3972722291946411, 1.453813076019287, 1.5103540420532227, 1.5668948888778687, 1.6234358549118042, 1.6799767017364502, 1.7365176677703857, 1.7930585145950317, 1.8495993614196777, 1.9061402082443237, 1.9626811742782593, 2.0192220211029053, 2.075762987136841, 2.1323039531707764, 2.188844680786133, 2.2453856468200684, 2.301926612854004]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 5.0, 11.0, 16.0, 14.0, 28.0, 50.0, 78.0, 103.0, 219.0, 395.0, 924.0, 2298.0, 8731.0, 58946.0, 339265.0, 95322.0, 12497.0, 3074.0, 1147.0, 507.0, 261.0, 142.0, 80.0, 54.0, 31.0, 29.0, 14.0, 10.0, 2.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.451171875, -3.34197998046875, -3.2327880859375, -3.12359619140625, -3.014404296875, -2.90521240234375, -2.7960205078125, -2.68682861328125, -2.57763671875, -2.46844482421875, -2.3592529296875, -2.25006103515625, -2.140869140625, -2.03167724609375, -1.9224853515625, -1.81329345703125, -1.7041015625, -1.59490966796875, -1.4857177734375, -1.37652587890625, -1.267333984375, -1.15814208984375, -1.0489501953125, -0.93975830078125, -0.83056640625, -0.72137451171875, -0.6121826171875, -0.50299072265625, -0.393798828125, -0.28460693359375, -0.1754150390625, -0.06622314453125, 0.04296875, 0.15216064453125, 0.2613525390625, 0.37054443359375, 0.479736328125, 0.58892822265625, 0.6981201171875, 0.80731201171875, 0.91650390625, 1.02569580078125, 1.1348876953125, 1.24407958984375, 1.353271484375, 1.46246337890625, 1.5716552734375, 1.68084716796875, 1.7900390625, 1.89923095703125, 2.0084228515625, 2.11761474609375, 2.226806640625, 2.33599853515625, 2.4451904296875, 2.55438232421875, 2.66357421875, 2.77276611328125, 2.8819580078125, 2.99114990234375, 3.100341796875, 3.20953369140625, 3.3187255859375, 3.42791748046875, 3.537109375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 10.0, 4.0, 21.0, 24.0, 33.0, 34.0, 54.0, 61.0, 80.0, 70.0, 73.0, 88.0, 84.0, 76.0, 56.0, 55.0, 40.0, 36.0, 23.0, 17.0, 16.0, 15.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.150390625, -0.14297866821289062, -0.13556671142578125, -0.12815475463867188, -0.1207427978515625, -0.11333084106445312, -0.10591888427734375, -0.09850692749023438, -0.091094970703125, -0.08368301391601562, -0.07627105712890625, -0.06885910034179688, -0.0614471435546875, -0.054035186767578125, -0.04662322998046875, -0.039211273193359375, -0.03179931640625, -0.024387359619140625, -0.01697540283203125, -0.009563446044921875, -0.0021514892578125, 0.005260467529296875, 0.01267242431640625, 0.020084381103515625, 0.027496337890625, 0.034908294677734375, 0.04232025146484375, 0.049732208251953125, 0.0571441650390625, 0.06455612182617188, 0.07196807861328125, 0.07938003540039062, 0.0867919921875, 0.09420394897460938, 0.10161590576171875, 0.10902786254882812, 0.1164398193359375, 0.12385177612304688, 0.13126373291015625, 0.13867568969726562, 0.146087646484375, 0.15349960327148438, 0.16091156005859375, 0.16832351684570312, 0.1757354736328125, 0.18314743041992188, 0.19055938720703125, 0.19797134399414062, 0.20538330078125, 0.21279525756835938, 0.22020721435546875, 0.22761917114257812, 0.2350311279296875, 0.24244308471679688, 0.24985504150390625, 0.2572669982910156, 0.264678955078125, 0.2720909118652344, 0.27950286865234375, 0.2869148254394531, 0.2943267822265625, 0.3017387390136719, 0.30915069580078125, 0.3165626525878906, 0.323974609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 7.0, 10.0, 13.0, 27.0, 71.0, 105.0, 116.0, 63.0, 24.0, 18.0, 4.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.656930923461914, -4.553699493408203, -4.450467586517334, -4.347235679626465, -4.244004249572754, -4.140772819519043, -4.037540912628174, -3.934309244155884, -3.8310775756835938, -3.7278459072113037, -3.6246142387390137, -3.5213825702667236, -3.4181509017944336, -3.3149192333221436, -3.2116875648498535, -3.1084558963775635, -3.0052242279052734, -2.9019925594329834, -2.7987608909606934, -2.6955292224884033, -2.5922975540161133, -2.4890658855438232, -2.385834217071533, -2.282602548599243, -2.179370880126953, -2.076139211654663, -1.972907543182373, -1.869675874710083, -1.766444206237793, -1.663212537765503, -1.559980869293213, -1.4567492008209229, -1.3535172939300537, -1.2502856254577637, -1.1470539569854736, -1.0438222885131836, -0.9405906200408936, -0.8373589515686035, -0.7341272830963135, -0.6308956146240234, -0.5276639461517334, -0.42443227767944336, -0.3212006092071533, -0.21796894073486328, -0.11473727226257324, -0.011505603790283203, 0.09172606468200684, 0.19495773315429688, 0.2981894016265869, 0.40142107009887695, 0.504652738571167, 0.607884407043457, 0.7111160755157471, 0.8143477439880371, 0.9175794124603271, 1.0208110809326172, 1.1240427494049072, 1.2272744178771973, 1.3305060863494873, 1.4337377548217773, 1.5369694232940674, 1.6402010917663574, 1.7434327602386475, 1.8466644287109375, 1.9498960971832275]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 6.0, 6.0, 7.0, 19.0, 42.0, 61.0, 103.0, 79.0, 59.0, 37.0, 16.0, 6.0, 4.0, 9.0, 3.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4236809015274048, -1.383976697921753, -1.3442723751068115, -1.3045681715011597, -1.2648639678955078, -1.2251596450805664, -1.1854554414749146, -1.1457512378692627, -1.1060469150543213, -1.0663427114486694, -1.026638388633728, -0.9869341850280762, -0.9472299218177795, -0.9075256586074829, -0.867821455001831, -0.8281171917915344, -0.7884129285812378, -0.7487086653709412, -0.7090044021606445, -0.6693001985549927, -0.629595935344696, -0.5898916721343994, -0.5501874685287476, -0.5104832053184509, -0.4707789421081543, -0.43107467889785767, -0.3913704454898834, -0.3516662120819092, -0.31196194887161255, -0.2722576856613159, -0.23255345225334167, -0.19284921884536743, -0.15314483642578125, -0.11344058811664581, -0.07373633980751038, -0.03403209149837494, 0.005672156810760498, 0.045376405119895935, 0.08508065342903137, 0.12478488683700562, 0.16448915004730225, 0.20419339835643768, 0.24389764666557312, 0.28360188007354736, 0.323306143283844, 0.3630104064941406, 0.40271463990211487, 0.4424188733100891, 0.48212313652038574, 0.5218273997306824, 0.561531662940979, 0.6012358665466309, 0.6409401297569275, 0.6806443929672241, 0.720348596572876, 0.7600528597831726, 0.7997571229934692, 0.8394613862037659, 0.8791656494140625, 0.9188698530197144, 0.958574116230011, 0.9982783794403076, 1.0379825830459595, 1.0776867866516113, 1.1173911094665527]}, "eval/loss": 4.7075324058532715, "eval/wer": 1.9290162633875447, "eval/runtime": 947.3, "eval/samples_per_second": 2.789, "eval/steps_per_second": 0.349} \ No newline at end of file +{"train/loss": 4.4733, "train/learning_rate": 6.137071651090343e-05, "train/epoch": 0.56, "train/global_step": 1000, "_runtime": 4976, "_timestamp": 1646159872, "_step": 1001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 21.0, 589.0, 401.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.412925720214844, -30.11447525024414, -19.816022872924805, -9.517570495605469, 0.7808799743652344, 11.079330444335938, 21.377784729003906, 31.676231384277344, 41.97468566894531, 52.273136138916016, 62.57158660888672, 72.87004089355469, 83.16848754882812, 93.4669418334961, 103.76539611816406, 114.0638427734375, 124.36229705810547, 134.66075134277344, 144.95919799804688, 155.25765991210938, 165.5561065673828, 175.85455322265625, 186.15301513671875, 196.45144653320312, 206.74990844726562, 217.04835510253906, 227.34681701660156, 237.645263671875, 247.94371032714844, 258.2421569824219, 268.5406188964844, 278.83905029296875, 289.1375427246094, 299.4360046386719, 309.73443603515625, 320.03289794921875, 330.33135986328125, 340.6297912597656, 350.9282531738281, 361.2266845703125, 371.525146484375, 381.8236083984375, 392.1220397949219, 402.4205017089844, 412.7189636230469, 423.01739501953125, 433.31585693359375, 443.61431884765625, 453.91278076171875, 464.21124267578125, 474.5096740722656, 484.8081359863281, 495.1065979003906, 505.405029296875, 515.7034912109375, 526.001953125, 536.3003540039062, 546.5988159179688, 556.8972778320312, 567.1956787109375, 577.494140625, 587.7926025390625, 598.091064453125, 608.3895263671875, 618.68798828125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 10.0, 10.0, 17.0, 18.0, 21.0, 14.0, 21.0, 25.0, 42.0, 31.0, 27.0, 25.0, 36.0, 28.0, 46.0, 48.0, 33.0, 34.0, 40.0, 36.0, 45.0, 52.0, 37.0, 34.0, 33.0, 30.0, 25.0, 26.0, 15.0, 23.0, 25.0, 11.0, 15.0, 13.0, 8.0, 6.0, 9.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.45861053466797, -62.272972106933594, -60.08733367919922, -57.901695251464844, -55.71605682373047, -53.530418395996094, -51.34477615356445, -49.15913772583008, -46.9734992980957, -44.78786087036133, -42.60222244262695, -40.41658401489258, -38.23094177246094, -36.04530334472656, -33.85966491699219, -31.674026489257812, -29.488388061523438, -27.302749633789062, -25.117111206054688, -22.93147087097168, -20.745832443237305, -18.56019401550293, -16.374553680419922, -14.188915252685547, -12.003276824951172, -9.817638397216797, -7.6319990158081055, -5.446360111236572, -3.260721206665039, -1.075082778930664, 1.1105566024780273, 3.2961959838867188, 5.4818267822265625, 7.667465686798096, 9.853104591369629, 12.03874397277832, 14.224382400512695, 16.41002082824707, 18.595661163330078, 20.781299591064453, 22.966938018798828, 25.152576446533203, 27.338214874267578, 29.523855209350586, 31.70949363708496, 33.89513397216797, 36.080772399902344, 38.26641082763672, 40.452049255371094, 42.63768768310547, 44.823326110839844, 47.00896453857422, 49.194602966308594, 51.38024139404297, 53.56588363647461, 55.751522064208984, 57.93716049194336, 60.122798919677734, 62.30843734741211, 64.49407958984375, 66.67971801757812, 68.8653564453125, 71.05099487304688, 73.23663330078125, 75.42227172851562]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 14.0, 15.0, 20.0, 22.0, 30.0, 32.0, 36.0, 43.0, 47.0, 28.0, 41.0, 58.0, 62.0, 49.0, 37.0, 53.0, 40.0, 49.0, 44.0, 42.0, 33.0, 40.0, 24.0, 29.0, 16.0, 16.0, 16.0, 9.0, 6.0, 7.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.734375, -2.645294189453125, -2.55621337890625, -2.467132568359375, -2.3780517578125, -2.288970947265625, -2.19989013671875, -2.110809326171875, -2.021728515625, -1.932647705078125, -1.84356689453125, -1.754486083984375, -1.6654052734375, -1.576324462890625, -1.48724365234375, -1.398162841796875, -1.30908203125, -1.220001220703125, -1.13092041015625, -1.041839599609375, -0.9527587890625, -0.863677978515625, -0.77459716796875, -0.685516357421875, -0.596435546875, -0.507354736328125, -0.41827392578125, -0.329193115234375, -0.2401123046875, -0.151031494140625, -0.06195068359375, 0.027130126953125, 0.1162109375, 0.205291748046875, 0.29437255859375, 0.383453369140625, 0.4725341796875, 0.561614990234375, 0.65069580078125, 0.739776611328125, 0.828857421875, 0.917938232421875, 1.00701904296875, 1.096099853515625, 1.1851806640625, 1.274261474609375, 1.36334228515625, 1.452423095703125, 1.54150390625, 1.630584716796875, 1.71966552734375, 1.808746337890625, 1.8978271484375, 1.986907958984375, 2.07598876953125, 2.165069580078125, 2.254150390625, 2.343231201171875, 2.43231201171875, 2.521392822265625, 2.6104736328125, 2.699554443359375, 2.78863525390625, 2.877716064453125, 2.966796875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 15.0, 14.0, 25.0, 30.0, 33.0, 63.0, 108.0, 149.0, 214.0, 343.0, 527.0, 912.0, 1704.0, 3699.0, 10559.0, 57512.0, 2071163.0, 1972051.0, 57030.0, 10622.0, 3488.0, 1655.0, 838.0, 516.0, 336.0, 217.0, 146.0, 103.0, 66.0, 33.0, 31.0, 26.0, 12.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.015625, -18.402099609375, -17.78857421875, -17.175048828125, -16.5615234375, -15.947998046875, -15.33447265625, -14.720947265625, -14.107421875, -13.493896484375, -12.88037109375, -12.266845703125, -11.6533203125, -11.039794921875, -10.42626953125, -9.812744140625, -9.19921875, -8.585693359375, -7.97216796875, -7.358642578125, -6.7451171875, -6.131591796875, -5.51806640625, -4.904541015625, -4.291015625, -3.677490234375, -3.06396484375, -2.450439453125, -1.8369140625, -1.223388671875, -0.60986328125, 0.003662109375, 0.6171875, 1.230712890625, 1.84423828125, 2.457763671875, 3.0712890625, 3.684814453125, 4.29833984375, 4.911865234375, 5.525390625, 6.138916015625, 6.75244140625, 7.365966796875, 7.9794921875, 8.593017578125, 9.20654296875, 9.820068359375, 10.43359375, 11.047119140625, 11.66064453125, 12.274169921875, 12.8876953125, 13.501220703125, 14.11474609375, 14.728271484375, 15.341796875, 15.955322265625, 16.56884765625, 17.182373046875, 17.7958984375, 18.409423828125, 19.02294921875, 19.636474609375, 20.25]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 3.0, 15.0, 13.0, 9.0, 27.0, 46.0, 69.0, 93.0, 129.0, 201.0, 321.0, 534.0, 665.0, 597.0, 443.0, 278.0, 183.0, 139.0, 99.0, 59.0, 45.0, 30.0, 19.0, 19.0, 9.0, 8.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.9140625, -15.513671875, -15.11328125, -14.712890625, -14.3125, -13.912109375, -13.51171875, -13.111328125, -12.7109375, -12.310546875, -11.91015625, -11.509765625, -11.109375, -10.708984375, -10.30859375, -9.908203125, -9.5078125, -9.107421875, -8.70703125, -8.306640625, -7.90625, -7.505859375, -7.10546875, -6.705078125, -6.3046875, -5.904296875, -5.50390625, -5.103515625, -4.703125, -4.302734375, -3.90234375, -3.501953125, -3.1015625, -2.701171875, -2.30078125, -1.900390625, -1.5, -1.099609375, -0.69921875, -0.298828125, 0.1015625, 0.501953125, 0.90234375, 1.302734375, 1.703125, 2.103515625, 2.50390625, 2.904296875, 3.3046875, 3.705078125, 4.10546875, 4.505859375, 4.90625, 5.306640625, 5.70703125, 6.107421875, 6.5078125, 6.908203125, 7.30859375, 7.708984375, 8.109375, 8.509765625, 8.91015625, 9.310546875, 9.7109375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 3.0, 15.0, 20.0, 19.0, 36.0, 57.0, 86.0, 142.0, 324.0, 496.0, 1173.0, 4704.0, 142913.0, 3959251.0, 78856.0, 3770.0, 1132.0, 550.0, 276.0, 164.0, 95.0, 67.0, 57.0, 25.0, 11.0, 7.0, 7.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.875, -46.443359375, -45.01171875, -43.580078125, -42.1484375, -40.716796875, -39.28515625, -37.853515625, -36.421875, -34.990234375, -33.55859375, -32.126953125, -30.6953125, -29.263671875, -27.83203125, -26.400390625, -24.96875, -23.537109375, -22.10546875, -20.673828125, -19.2421875, -17.810546875, -16.37890625, -14.947265625, -13.515625, -12.083984375, -10.65234375, -9.220703125, -7.7890625, -6.357421875, -4.92578125, -3.494140625, -2.0625, -0.630859375, 0.80078125, 2.232421875, 3.6640625, 5.095703125, 6.52734375, 7.958984375, 9.390625, 10.822265625, 12.25390625, 13.685546875, 15.1171875, 16.548828125, 17.98046875, 19.412109375, 20.84375, 22.275390625, 23.70703125, 25.138671875, 26.5703125, 28.001953125, 29.43359375, 30.865234375, 32.296875, 33.728515625, 35.16015625, 36.591796875, 38.0234375, 39.455078125, 40.88671875, 42.318359375, 43.75]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 70.0, 387.0, 424.0, 111.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.093505859375, -209.44091796875, -204.788330078125, -200.1357421875, -195.483154296875, -190.83056640625, -186.177978515625, -181.525390625, -176.872802734375, -172.22021484375, -167.567626953125, -162.9150390625, -158.262451171875, -153.60986328125, -148.957275390625, -144.3046875, -139.652099609375, -134.99951171875, -130.346923828125, -125.6943359375, -121.041748046875, -116.38916015625, -111.736572265625, -107.083984375, -102.431396484375, -97.77880859375, -93.126220703125, -88.4736328125, -83.821044921875, -79.16845703125, -74.515869140625, -69.86328125, -65.210693359375, -60.55810546875, -55.905517578125, -51.2529296875, -46.600341796875, -41.94775390625, -37.295166015625, -32.642578125, -27.989990234375, -23.33740234375, -18.684814453125, -14.0322265625, -9.379638671875, -4.72705078125, -0.074462890625, 4.578125, 9.230712890625, 13.88330078125, 18.535888671875, 23.1884765625, 27.841064453125, 32.49365234375, 37.146240234375, 41.798828125, 46.451416015625, 51.10400390625, 55.756591796875, 60.4091796875, 65.061767578125, 69.71435546875, 74.366943359375, 79.01953125, 83.672119140625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 12.0, 15.0, 18.0, 16.0, 16.0, 16.0, 20.0, 27.0, 37.0, 37.0, 44.0, 43.0, 50.0, 40.0, 50.0, 67.0, 44.0, 48.0, 48.0, 40.0, 34.0, 39.0, 35.0, 40.0, 21.0, 26.0, 27.0, 19.0, 10.0, 8.0, 11.0, 11.0, 5.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.13330078125, -49.707176208496094, -48.28105163574219, -46.85493087768555, -45.42880630493164, -44.002681732177734, -42.576560974121094, -41.15043640136719, -39.72431182861328, -38.298187255859375, -36.87206268310547, -35.44594192504883, -34.01981735229492, -32.593692779541016, -31.167570114135742, -29.74144744873047, -28.315322875976562, -26.889198303222656, -25.463075637817383, -24.03695297241211, -22.610828399658203, -21.184703826904297, -19.758581161499023, -18.33245849609375, -16.906333923339844, -15.480210304260254, -14.054086685180664, -12.627963066101074, -11.201839447021484, -9.775715827941895, -8.349592208862305, -6.923468589782715, -5.497344970703125, -4.071221351623535, -2.6450977325439453, -1.2189741134643555, 0.20714950561523438, 1.6332731246948242, 3.059396743774414, 4.485520362854004, 5.911643981933594, 7.337767601013184, 8.763891220092773, 10.190014839172363, 11.616138458251953, 13.042262077331543, 14.468385696411133, 15.894509315490723, 17.320632934570312, 18.74675750732422, 20.172880172729492, 21.599002838134766, 23.025127410888672, 24.451251983642578, 25.87737464904785, 27.303497314453125, 28.72962188720703, 30.155746459960938, 31.58186912536621, 33.007991790771484, 34.43411636352539, 35.8602409362793, 37.28636169433594, 38.712486267089844, 40.13861083984375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 8.0, 10.0, 13.0, 17.0, 13.0, 30.0, 30.0, 27.0, 27.0, 33.0, 32.0, 31.0, 38.0, 29.0, 35.0, 44.0, 34.0, 57.0, 35.0, 31.0, 44.0, 31.0, 44.0, 38.0, 34.0, 30.0, 26.0, 26.0, 31.0, 26.0, 17.0, 9.0, 11.0, 10.0, 4.0, 8.0, 1.0, 2.0, 6.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.5477294921875, -2.468505859375, -2.3892822265625, -2.31005859375, -2.2308349609375, -2.151611328125, -2.0723876953125, -1.9931640625, -1.9139404296875, -1.834716796875, -1.7554931640625, -1.67626953125, -1.5970458984375, -1.517822265625, -1.4385986328125, -1.359375, -1.2801513671875, -1.200927734375, -1.1217041015625, -1.04248046875, -0.9632568359375, -0.884033203125, -0.8048095703125, -0.7255859375, -0.6463623046875, -0.567138671875, -0.4879150390625, -0.40869140625, -0.3294677734375, -0.250244140625, -0.1710205078125, -0.091796875, -0.0125732421875, 0.066650390625, 0.1458740234375, 0.22509765625, 0.3043212890625, 0.383544921875, 0.4627685546875, 0.5419921875, 0.6212158203125, 0.700439453125, 0.7796630859375, 0.85888671875, 0.9381103515625, 1.017333984375, 1.0965576171875, 1.17578125, 1.2550048828125, 1.334228515625, 1.4134521484375, 1.49267578125, 1.5718994140625, 1.651123046875, 1.7303466796875, 1.8095703125, 1.8887939453125, 1.968017578125, 2.0472412109375, 2.12646484375, 2.2056884765625, 2.284912109375, 2.3641357421875, 2.443359375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 8.0, 6.0, 7.0, 12.0, 21.0, 34.0, 37.0, 59.0, 68.0, 84.0, 141.0, 202.0, 295.0, 421.0, 617.0, 977.0, 1374.0, 2157.0, 3153.0, 4884.0, 7619.0, 12182.0, 19371.0, 31397.0, 53306.0, 93433.0, 173153.0, 248511.0, 168673.0, 91351.0, 51309.0, 30818.0, 19053.0, 12050.0, 7515.0, 4920.0, 3070.0, 2099.0, 1376.0, 912.0, 645.0, 412.0, 275.0, 184.0, 131.0, 89.0, 54.0, 37.0, 27.0, 16.0, 8.0, 6.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.2435302734375, -0.2366657257080078, -0.22980117797851562, -0.22293663024902344, -0.21607208251953125, -0.20920753479003906, -0.20234298706054688, -0.1954784393310547, -0.1886138916015625, -0.1817493438720703, -0.17488479614257812, -0.16802024841308594, -0.16115570068359375, -0.15429115295410156, -0.14742660522460938, -0.1405620574951172, -0.133697509765625, -0.1268329620361328, -0.11996841430664062, -0.11310386657714844, -0.10623931884765625, -0.09937477111816406, -0.09251022338867188, -0.08564567565917969, -0.0787811279296875, -0.07191658020019531, -0.06505203247070312, -0.05818748474121094, -0.05132293701171875, -0.04445838928222656, -0.037593841552734375, -0.030729293823242188, -0.02386474609375, -0.017000198364257812, -0.010135650634765625, -0.0032711029052734375, 0.00359344482421875, 0.010457992553710938, 0.017322540283203125, 0.024187088012695312, 0.0310516357421875, 0.03791618347167969, 0.044780731201171875, 0.05164527893066406, 0.05850982666015625, 0.06537437438964844, 0.07223892211914062, 0.07910346984863281, 0.085968017578125, 0.09283256530761719, 0.09969711303710938, 0.10656166076660156, 0.11342620849609375, 0.12029075622558594, 0.12715530395507812, 0.1340198516845703, 0.1408843994140625, 0.1477489471435547, 0.15461349487304688, 0.16147804260253906, 0.16834259033203125, 0.17520713806152344, 0.18207168579101562, 0.1889362335205078, 0.19580078125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 7.0, 13.0, 16.0, 16.0, 16.0, 14.0, 23.0, 27.0, 28.0, 27.0, 38.0, 38.0, 42.0, 38.0, 37.0, 41.0, 1075.0, 51.0, 58.0, 43.0, 38.0, 43.0, 42.0, 39.0, 37.0, 26.0, 19.0, 21.0, 25.0, 9.0, 21.0, 12.0, 7.0, 8.0, 8.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.5247344970703125, -1.469390869140625, -1.4140472412109375, -1.35870361328125, -1.3033599853515625, -1.248016357421875, -1.1926727294921875, -1.1373291015625, -1.0819854736328125, -1.026641845703125, -0.9712982177734375, -0.91595458984375, -0.8606109619140625, -0.805267333984375, -0.7499237060546875, -0.694580078125, -0.6392364501953125, -0.583892822265625, -0.5285491943359375, -0.47320556640625, -0.4178619384765625, -0.362518310546875, -0.3071746826171875, -0.2518310546875, -0.1964874267578125, -0.141143798828125, -0.0858001708984375, -0.03045654296875, 0.0248870849609375, 0.080230712890625, 0.1355743408203125, 0.19091796875, 0.2462615966796875, 0.301605224609375, 0.3569488525390625, 0.41229248046875, 0.4676361083984375, 0.522979736328125, 0.5783233642578125, 0.6336669921875, 0.6890106201171875, 0.744354248046875, 0.7996978759765625, 0.85504150390625, 0.9103851318359375, 0.965728759765625, 1.0210723876953125, 1.076416015625, 1.1317596435546875, 1.187103271484375, 1.2424468994140625, 1.29779052734375, 1.3531341552734375, 1.408477783203125, 1.4638214111328125, 1.5191650390625, 1.5745086669921875, 1.629852294921875, 1.6851959228515625, 1.74053955078125, 1.7958831787109375, 1.851226806640625, 1.9065704345703125, 1.9619140625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 9.0, 9.0, 12.0, 22.0, 29.0, 37.0, 69.0, 102.0, 143.0, 212.0, 306.0, 597.0, 990.0, 1732.0, 3043.0, 5531.0, 10165.0, 18992.0, 35138.0, 66913.0, 127600.0, 221204.0, 1282206.0, 150548.0, 80078.0, 42225.0, 22149.0, 12068.0, 6563.0, 3484.0, 2058.0, 1121.0, 670.0, 397.0, 243.0, 169.0, 93.0, 67.0, 49.0, 24.0, 22.0, 9.0, 11.0, 4.0, 4.0, 9.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1783447265625, -0.17312049865722656, -0.16789627075195312, -0.1626720428466797, -0.15744781494140625, -0.1522235870361328, -0.14699935913085938, -0.14177513122558594, -0.1365509033203125, -0.13132667541503906, -0.12610244750976562, -0.12087821960449219, -0.11565399169921875, -0.11042976379394531, -0.10520553588867188, -0.09998130798339844, -0.094757080078125, -0.08953285217285156, -0.08430862426757812, -0.07908439636230469, -0.07386016845703125, -0.06863594055175781, -0.06341171264648438, -0.05818748474121094, -0.0529632568359375, -0.04773902893066406, -0.042514801025390625, -0.03729057312011719, -0.03206634521484375, -0.026842117309570312, -0.021617889404296875, -0.016393661499023438, -0.01116943359375, -0.0059452056884765625, -0.000720977783203125, 0.0045032501220703125, 0.00972747802734375, 0.014951705932617188, 0.020175933837890625, 0.025400161743164062, 0.0306243896484375, 0.03584861755371094, 0.041072845458984375, 0.04629707336425781, 0.05152130126953125, 0.05674552917480469, 0.061969757080078125, 0.06719398498535156, 0.072418212890625, 0.07764244079589844, 0.08286666870117188, 0.08809089660644531, 0.09331512451171875, 0.09853935241699219, 0.10376358032226562, 0.10898780822753906, 0.1142120361328125, 0.11943626403808594, 0.12466049194335938, 0.1298847198486328, 0.13510894775390625, 0.1403331756591797, 0.14555740356445312, 0.15078163146972656, 0.156005859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 11.0, 9.0, 15.0, 24.0, 26.0, 45.0, 61.0, 85.0, 90.0, 120.0, 122.0, 91.0, 79.0, 61.0, 28.0, 29.0, 21.0, 15.0, 10.0, 5.0, 12.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0009531974792480469, -0.0009189173579216003, -0.0008846372365951538, -0.0008503571152687073, -0.0008160769939422607, -0.0007817968726158142, -0.0007475167512893677, -0.0007132366299629211, -0.0006789565086364746, -0.0006446763873100281, -0.0006103962659835815, -0.000576116144657135, -0.0005418360233306885, -0.0005075559020042419, -0.0004732757806777954, -0.0004389956593513489, -0.00040471553802490234, -0.0003704354166984558, -0.0003361552953720093, -0.00030187517404556274, -0.0002675950527191162, -0.00023331493139266968, -0.00019903481006622314, -0.0001647546887397766, -0.00013047456741333008, -9.619444608688354e-05, -6.191432476043701e-05, -2.763420343399048e-05, 6.645917892456055e-06, 4.092603921890259e-05, 7.520616054534912e-05, 0.00010948628187179565, 0.0001437664031982422, 0.00017804652452468872, 0.00021232664585113525, 0.0002466067671775818, 0.0002808868885040283, 0.00031516700983047485, 0.0003494471311569214, 0.0003837272524833679, 0.00041800737380981445, 0.000452287495136261, 0.0004865676164627075, 0.000520847737789154, 0.0005551278591156006, 0.0005894079804420471, 0.0006236881017684937, 0.0006579682230949402, 0.0006922483444213867, 0.0007265284657478333, 0.0007608085870742798, 0.0007950887084007263, 0.0008293688297271729, 0.0008636489510536194, 0.0008979290723800659, 0.0009322091937065125, 0.000966489315032959, 0.0010007694363594055, 0.001035049557685852, 0.0010693296790122986, 0.0011036098003387451, 0.0011378899216651917, 0.0011721700429916382, 0.0012064501643180847, 0.0012407302856445312]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 8.0, 19.0, 27.0, 31.0, 42.0, 78.0, 108.0, 188.0, 276.0, 665.0, 4940.0, 1015576.0, 24641.0, 965.0, 366.0, 189.0, 128.0, 94.0, 55.0, 36.0, 24.0, 16.0, 11.0, 13.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0216522216796875, -0.020869731903076172, -0.020087242126464844, -0.019304752349853516, -0.018522262573242188, -0.01773977279663086, -0.01695728302001953, -0.016174793243408203, -0.015392303466796875, -0.014609813690185547, -0.013827323913574219, -0.01304483413696289, -0.012262344360351562, -0.011479854583740234, -0.010697364807128906, -0.009914875030517578, -0.00913238525390625, -0.008349895477294922, -0.007567405700683594, -0.006784915924072266, -0.0060024261474609375, -0.005219936370849609, -0.004437446594238281, -0.003654956817626953, -0.002872467041015625, -0.002089977264404297, -0.0013074874877929688, -0.0005249977111816406, 0.0002574920654296875, 0.0010399818420410156, 0.0018224716186523438, 0.002604961395263672, 0.003387451171875, 0.004169940948486328, 0.004952430725097656, 0.005734920501708984, 0.0065174102783203125, 0.007299900054931641, 0.008082389831542969, 0.008864879608154297, 0.009647369384765625, 0.010429859161376953, 0.011212348937988281, 0.01199483871459961, 0.012777328491210938, 0.013559818267822266, 0.014342308044433594, 0.015124797821044922, 0.01590728759765625, 0.016689777374267578, 0.017472267150878906, 0.018254756927490234, 0.019037246704101562, 0.01981973648071289, 0.02060222625732422, 0.021384716033935547, 0.022167205810546875, 0.022949695587158203, 0.02373218536376953, 0.02451467514038086, 0.025297164916992188, 0.026079654693603516, 0.026862144470214844, 0.027644634246826172, 0.0284271240234375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 930.0, 35.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013438841328024864, -0.013080080971121788, -0.012721321545541286, -0.01236256118863821, -0.012003800831735134, -0.011645041406154633, -0.011286281049251556, -0.01092752069234848, -0.010568760335445404, -0.010209999978542328, -0.009851240552961826, -0.00949248019605875, -0.009133719839155674, -0.008774960413575172, -0.008416200056672096, -0.00805743969976902, -0.0076986802741885185, -0.00733992038294673, -0.0069811600260436535, -0.006622400134801865, -0.0062636397778987885, -0.005904879886657, -0.005546119995415211, -0.0051873596385121346, -0.004828599747270346, -0.004469839856028557, -0.004111079499125481, -0.003752319607883692, -0.0033935594838112593, -0.0030347993597388268, -0.002676039468497038, -0.0023172793444246054, -0.0019585182890295982, -0.0015997581649571657, -0.001240998157300055, -0.0008822381496429443, -0.0005234780255705118, -0.0001647179014980793, 0.00019404198974370956, 0.0005528021138161421, 0.0009115622378885746, 0.0012703223619610071, 0.0016290823696181178, 0.0019878423772752285, 0.002346602501347661, 0.0027053626254200935, 0.0030641225166618824, 0.003422882640734315, 0.0037816427648067474, 0.004140402656048536, 0.0044991630129516125, 0.004857922904193401, 0.0052166832610964775, 0.005575443152338266, 0.005934203043580055, 0.006292963400483131, 0.00665172329172492, 0.007010483182966709, 0.007369243539869785, 0.007728003431111574, 0.008086763322353363, 0.00844552367925644, 0.008804284036159515, 0.009163043461740017, 0.009521803818643093]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 4.0, 6.0, 14.0, 10.0, 11.0, 14.0, 12.0, 17.0, 21.0, 42.0, 34.0, 41.0, 36.0, 42.0, 33.0, 48.0, 48.0, 51.0, 39.0, 44.0, 33.0, 41.0, 45.0, 40.0, 29.0, 32.0, 37.0, 27.0, 28.0, 25.0, 15.0, 18.0, 10.0, 9.0, 11.0, 6.0, 6.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0005055665969848633, -0.0004913890734314919, -0.0004772115498781204, -0.000463034026324749, -0.00044885650277137756, -0.00043467897921800613, -0.0004205014556646347, -0.0004063239321112633, -0.00039214640855789185, -0.0003779688850045204, -0.000363791361451149, -0.00034961383789777756, -0.00033543631434440613, -0.0003212587907910347, -0.00030708126723766327, -0.00029290374368429184, -0.0002787262201309204, -0.000264548696577549, -0.00025037117302417755, -0.00023619364947080612, -0.0002220161259174347, -0.00020783860236406326, -0.00019366107881069183, -0.0001794835552573204, -0.00016530603170394897, -0.00015112850815057755, -0.00013695098459720612, -0.00012277346104383469, -0.00010859593749046326, -9.441841393709183e-05, -8.02408903837204e-05, -6.606336683034897e-05, -5.188584327697754e-05, -3.770831972360611e-05, -2.353079617023468e-05, -9.35327261686325e-06, 4.824250936508179e-06, 1.9001774489879608e-05, 3.317929804325104e-05, 4.735682159662247e-05, 6.15343451499939e-05, 7.571186870336533e-05, 8.988939225673676e-05, 0.00010406691581010818, 0.00011824443936347961, 0.00013242196291685104, 0.00014659948647022247, 0.0001607770100235939, 0.00017495453357696533, 0.00018913205713033676, 0.0002033095806837082, 0.00021748710423707962, 0.00023166462779045105, 0.0002458421513438225, 0.0002600196748971939, 0.00027419719845056534, 0.00028837472200393677, 0.0003025522455573082, 0.0003167297691106796, 0.00033090729266405106, 0.0003450848162174225, 0.0003592623397707939, 0.00037343986332416534, 0.0003876173868775368, 0.0004017949104309082]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 8.0, 10.0, 13.0, 17.0, 13.0, 30.0, 30.0, 27.0, 27.0, 33.0, 32.0, 31.0, 38.0, 29.0, 35.0, 44.0, 34.0, 57.0, 35.0, 31.0, 44.0, 31.0, 44.0, 38.0, 34.0, 30.0, 26.0, 26.0, 31.0, 26.0, 17.0, 9.0, 11.0, 10.0, 4.0, 8.0, 1.0, 2.0, 6.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.5477294921875, -2.468505859375, -2.3892822265625, -2.31005859375, -2.2308349609375, -2.151611328125, -2.0723876953125, -1.9931640625, -1.9139404296875, -1.834716796875, -1.7554931640625, -1.67626953125, -1.5970458984375, -1.517822265625, -1.4385986328125, -1.359375, -1.2801513671875, -1.200927734375, -1.1217041015625, -1.04248046875, -0.9632568359375, -0.884033203125, -0.8048095703125, -0.7255859375, -0.6463623046875, -0.567138671875, -0.4879150390625, -0.40869140625, -0.3294677734375, -0.250244140625, -0.1710205078125, -0.091796875, -0.0125732421875, 0.066650390625, 0.1458740234375, 0.22509765625, 0.3043212890625, 0.383544921875, 0.4627685546875, 0.5419921875, 0.6212158203125, 0.700439453125, 0.7796630859375, 0.85888671875, 0.9381103515625, 1.017333984375, 1.0965576171875, 1.17578125, 1.2550048828125, 1.334228515625, 1.4134521484375, 1.49267578125, 1.5718994140625, 1.651123046875, 1.7303466796875, 1.8095703125, 1.8887939453125, 1.968017578125, 2.0472412109375, 2.12646484375, 2.2056884765625, 2.284912109375, 2.3641357421875, 2.443359375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 11.0, 18.0, 17.0, 35.0, 55.0, 86.0, 118.0, 155.0, 220.0, 324.0, 544.0, 846.0, 1287.0, 1863.0, 2831.0, 4734.0, 7999.0, 14792.0, 33846.0, 129959.0, 551673.0, 208686.0, 45980.0, 18071.0, 9431.0, 5503.0, 3290.0, 2075.0, 1386.0, 881.0, 585.0, 423.0, 278.0, 177.0, 132.0, 82.0, 53.0, 41.0, 21.0, 17.0, 10.0, 5.0, 1.0, 7.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.4146728515625, -9.126220703125, -8.8377685546875, -8.54931640625, -8.2608642578125, -7.972412109375, -7.6839599609375, -7.3955078125, -7.1070556640625, -6.818603515625, -6.5301513671875, -6.24169921875, -5.9532470703125, -5.664794921875, -5.3763427734375, -5.087890625, -4.7994384765625, -4.510986328125, -4.2225341796875, -3.93408203125, -3.6456298828125, -3.357177734375, -3.0687255859375, -2.7802734375, -2.4918212890625, -2.203369140625, -1.9149169921875, -1.62646484375, -1.3380126953125, -1.049560546875, -0.7611083984375, -0.47265625, -0.1842041015625, 0.104248046875, 0.3927001953125, 0.68115234375, 0.9696044921875, 1.258056640625, 1.5465087890625, 1.8349609375, 2.1234130859375, 2.411865234375, 2.7003173828125, 2.98876953125, 3.2772216796875, 3.565673828125, 3.8541259765625, 4.142578125, 4.4310302734375, 4.719482421875, 5.0079345703125, 5.29638671875, 5.5848388671875, 5.873291015625, 6.1617431640625, 6.4501953125, 6.7386474609375, 7.027099609375, 7.3155517578125, 7.60400390625, 7.8924560546875, 8.180908203125, 8.4693603515625, 8.7578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 5.0, 12.0, 9.0, 10.0, 10.0, 21.0, 16.0, 23.0, 19.0, 20.0, 26.0, 33.0, 34.0, 41.0, 36.0, 43.0, 65.0, 94.0, 241.0, 1518.0, 247.0, 89.0, 62.0, 36.0, 27.0, 37.0, 34.0, 28.0, 35.0, 19.0, 25.0, 24.0, 19.0, 17.0, 9.0, 9.0, 5.0, 11.0, 12.0, 7.0, 7.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.9140625, -7.6629638671875, -7.411865234375, -7.1607666015625, -6.90966796875, -6.6585693359375, -6.407470703125, -6.1563720703125, -5.9052734375, -5.6541748046875, -5.403076171875, -5.1519775390625, -4.90087890625, -4.6497802734375, -4.398681640625, -4.1475830078125, -3.896484375, -3.6453857421875, -3.394287109375, -3.1431884765625, -2.89208984375, -2.6409912109375, -2.389892578125, -2.1387939453125, -1.8876953125, -1.6365966796875, -1.385498046875, -1.1343994140625, -0.88330078125, -0.6322021484375, -0.381103515625, -0.1300048828125, 0.12109375, 0.3721923828125, 0.623291015625, 0.8743896484375, 1.12548828125, 1.3765869140625, 1.627685546875, 1.8787841796875, 2.1298828125, 2.3809814453125, 2.632080078125, 2.8831787109375, 3.13427734375, 3.3853759765625, 3.636474609375, 3.8875732421875, 4.138671875, 4.3897705078125, 4.640869140625, 4.8919677734375, 5.14306640625, 5.3941650390625, 5.645263671875, 5.8963623046875, 6.1474609375, 6.3985595703125, 6.649658203125, 6.9007568359375, 7.15185546875, 7.4029541015625, 7.654052734375, 7.9051513671875, 8.15625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 7.0, 12.0, 6.0, 7.0, 14.0, 8.0, 25.0, 20.0, 19.0, 18.0, 29.0, 28.0, 43.0, 42.0, 66.0, 100.0, 252.0, 763.0, 22058.0, 3107744.0, 13064.0, 696.0, 221.0, 103.0, 65.0, 49.0, 34.0, 34.0, 23.0, 19.0, 16.0, 29.0, 19.0, 10.0, 8.0, 7.0, 8.0, 10.0, 7.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-37.8125, -36.6474609375, -35.482421875, -34.3173828125, -33.15234375, -31.9873046875, -30.822265625, -29.6572265625, -28.4921875, -27.3271484375, -26.162109375, -24.9970703125, -23.83203125, -22.6669921875, -21.501953125, -20.3369140625, -19.171875, -18.0068359375, -16.841796875, -15.6767578125, -14.51171875, -13.3466796875, -12.181640625, -11.0166015625, -9.8515625, -8.6865234375, -7.521484375, -6.3564453125, -5.19140625, -4.0263671875, -2.861328125, -1.6962890625, -0.53125, 0.6337890625, 1.798828125, 2.9638671875, 4.12890625, 5.2939453125, 6.458984375, 7.6240234375, 8.7890625, 9.9541015625, 11.119140625, 12.2841796875, 13.44921875, 14.6142578125, 15.779296875, 16.9443359375, 18.109375, 19.2744140625, 20.439453125, 21.6044921875, 22.76953125, 23.9345703125, 25.099609375, 26.2646484375, 27.4296875, 28.5947265625, 29.759765625, 30.9248046875, 32.08984375, 33.2548828125, 34.419921875, 35.5849609375, 36.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 8.0, 149.0, 778.0, 77.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.42736530303955, -7.372426986694336, -4.317488670349121, -1.2625503540039062, 1.7923879623413086, 4.847326278686523, 7.902264595031738, 10.957201957702637, 14.012141227722168, 17.067079544067383, 20.12201690673828, 23.176956176757812, 26.231895446777344, 29.286832809448242, 32.34177017211914, 35.39670944213867, 38.4516487121582, 41.506587982177734, 44.5615234375, 47.61646270751953, 50.67140197753906, 53.726341247558594, 56.781280517578125, 59.83621597290039, 62.89115524291992, 65.94609069824219, 69.00102996826172, 72.05596923828125, 75.11090850830078, 78.16584777832031, 81.22078704833984, 84.27572631835938, 87.33065795898438, 90.3855972290039, 93.44053649902344, 96.49547576904297, 99.5504150390625, 102.6053466796875, 105.66028594970703, 108.71522521972656, 111.7701644897461, 114.82510375976562, 117.88004302978516, 120.93498229980469, 123.98991394042969, 127.04485321044922, 130.09979248046875, 133.15472412109375, 136.2096710205078, 139.2646026611328, 142.31954956054688, 145.37448120117188, 148.42942810058594, 151.48435974121094, 154.539306640625, 157.59423828125, 160.649169921875, 163.7041015625, 166.75904846191406, 169.81398010253906, 172.86892700195312, 175.92385864257812, 178.9788055419922, 182.0337371826172, 185.08868408203125]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 4.0, 13.0, 11.0, 23.0, 20.0, 13.0, 22.0, 37.0, 22.0, 37.0, 38.0, 33.0, 54.0, 36.0, 47.0, 35.0, 61.0, 46.0, 47.0, 43.0, 44.0, 36.0, 30.0, 51.0, 35.0, 30.0, 19.0, 20.0, 16.0, 24.0, 14.0, 7.0, 9.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.749897003173828, -28.776386260986328, -27.802875518798828, -26.829364776611328, -25.855854034423828, -24.882343292236328, -23.908832550048828, -22.935319900512695, -21.961809158325195, -20.988298416137695, -20.014787673950195, -19.041276931762695, -18.067766189575195, -17.094253540039062, -16.120742797851562, -15.147232055664062, -14.173722267150879, -13.200211524963379, -12.226700782775879, -11.253189086914062, -10.279678344726562, -9.306167602539062, -8.332656860351562, -7.359145641326904, -6.385634899139404, -5.412124156951904, -4.438612937927246, -3.465102195739746, -2.491591215133667, -1.518080234527588, -0.5445694923400879, 0.4289417266845703, 1.4024524688720703, 2.3759634494781494, 3.3494744300842285, 4.3229851722717285, 5.296496391296387, 6.270007133483887, 7.243517875671387, 8.217029571533203, 9.190540313720703, 10.164051055908203, 11.137561798095703, 12.111072540283203, 13.08458423614502, 14.05809497833252, 15.03160572052002, 16.005117416381836, 16.978626251220703, 17.952136993408203, 18.925647735595703, 19.899158477783203, 20.872669219970703, 21.846179962158203, 22.819690704345703, 23.793203353881836, 24.766714096069336, 25.740224838256836, 26.713735580444336, 27.687246322631836, 28.660757064819336, 29.63426971435547, 30.60778045654297, 31.58129119873047, 32.55480194091797]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 10.0, 15.0, 16.0, 16.0, 20.0, 22.0, 27.0, 30.0, 22.0, 38.0, 36.0, 33.0, 40.0, 28.0, 37.0, 47.0, 46.0, 41.0, 30.0, 42.0, 38.0, 43.0, 42.0, 31.0, 37.0, 24.0, 37.0, 22.0, 23.0, 17.0, 11.0, 13.0, 8.0, 10.0, 4.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.864105224609375, -2.77899169921875, -2.693878173828125, -2.6087646484375, -2.523651123046875, -2.43853759765625, -2.353424072265625, -2.268310546875, -2.183197021484375, -2.09808349609375, -2.012969970703125, -1.9278564453125, -1.842742919921875, -1.75762939453125, -1.672515869140625, -1.58740234375, -1.502288818359375, -1.41717529296875, -1.332061767578125, -1.2469482421875, -1.161834716796875, -1.07672119140625, -0.991607666015625, -0.906494140625, -0.821380615234375, -0.73626708984375, -0.651153564453125, -0.5660400390625, -0.480926513671875, -0.39581298828125, -0.310699462890625, -0.2255859375, -0.140472412109375, -0.05535888671875, 0.029754638671875, 0.1148681640625, 0.199981689453125, 0.28509521484375, 0.370208740234375, 0.455322265625, 0.540435791015625, 0.62554931640625, 0.710662841796875, 0.7957763671875, 0.880889892578125, 0.96600341796875, 1.051116943359375, 1.13623046875, 1.221343994140625, 1.30645751953125, 1.391571044921875, 1.4766845703125, 1.561798095703125, 1.64691162109375, 1.732025146484375, 1.817138671875, 1.902252197265625, 1.98736572265625, 2.072479248046875, 2.1575927734375, 2.242706298828125, 2.32781982421875, 2.412933349609375, 2.498046875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 5.0, 13.0, 15.0, 22.0, 32.0, 30.0, 47.0, 59.0, 59.0, 97.0, 123.0, 176.0, 224.0, 328.0, 593.0, 1219.0, 2859.0, 10175.0, 56046.0, 727446.0, 3146634.0, 211939.0, 26219.0, 5724.0, 1849.0, 817.0, 419.0, 272.0, 214.0, 134.0, 102.0, 99.0, 62.0, 43.0, 37.0, 29.0, 19.0, 13.0, 21.0, 10.0, 10.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.203125, -13.7633056640625, -13.323486328125, -12.8836669921875, -12.44384765625, -12.0040283203125, -11.564208984375, -11.1243896484375, -10.6845703125, -10.2447509765625, -9.804931640625, -9.3651123046875, -8.92529296875, -8.4854736328125, -8.045654296875, -7.6058349609375, -7.166015625, -6.7261962890625, -6.286376953125, -5.8465576171875, -5.40673828125, -4.9669189453125, -4.527099609375, -4.0872802734375, -3.6474609375, -3.2076416015625, -2.767822265625, -2.3280029296875, -1.88818359375, -1.4483642578125, -1.008544921875, -0.5687255859375, -0.12890625, 0.3109130859375, 0.750732421875, 1.1905517578125, 1.63037109375, 2.0701904296875, 2.510009765625, 2.9498291015625, 3.3896484375, 3.8294677734375, 4.269287109375, 4.7091064453125, 5.14892578125, 5.5887451171875, 6.028564453125, 6.4683837890625, 6.908203125, 7.3480224609375, 7.787841796875, 8.2276611328125, 8.66748046875, 9.1072998046875, 9.547119140625, 9.9869384765625, 10.4267578125, 10.8665771484375, 11.306396484375, 11.7462158203125, 12.18603515625, 12.6258544921875, 13.065673828125, 13.5054931640625, 13.9453125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 10.0, 16.0, 26.0, 36.0, 92.0, 126.0, 208.0, 310.0, 537.0, 826.0, 750.0, 470.0, 267.0, 164.0, 97.0, 56.0, 36.0, 22.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3984375, -14.8988037109375, -14.399169921875, -13.8995361328125, -13.39990234375, -12.9002685546875, -12.400634765625, -11.9010009765625, -11.4013671875, -10.9017333984375, -10.402099609375, -9.9024658203125, -9.40283203125, -8.9031982421875, -8.403564453125, -7.9039306640625, -7.404296875, -6.9046630859375, -6.405029296875, -5.9053955078125, -5.40576171875, -4.9061279296875, -4.406494140625, -3.9068603515625, -3.4072265625, -2.9075927734375, -2.407958984375, -1.9083251953125, -1.40869140625, -0.9090576171875, -0.409423828125, 0.0902099609375, 0.58984375, 1.0894775390625, 1.589111328125, 2.0887451171875, 2.58837890625, 3.0880126953125, 3.587646484375, 4.0872802734375, 4.5869140625, 5.0865478515625, 5.586181640625, 6.0858154296875, 6.58544921875, 7.0850830078125, 7.584716796875, 8.0843505859375, 8.583984375, 9.0836181640625, 9.583251953125, 10.0828857421875, 10.58251953125, 11.0821533203125, 11.581787109375, 12.0814208984375, 12.5810546875, 13.0806884765625, 13.580322265625, 14.0799560546875, 14.57958984375, 15.0792236328125, 15.578857421875, 16.0784912109375, 16.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 9.0, 10.0, 14.0, 21.0, 23.0, 23.0, 61.0, 98.0, 138.0, 246.0, 548.0, 1421.0, 6185.0, 62280.0, 1514179.0, 2503928.0, 93618.0, 8277.0, 1783.0, 654.0, 307.0, 149.0, 116.0, 52.0, 31.0, 28.0, 17.0, 22.0, 4.0, 8.0, 6.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.640625, -29.791259765625, -28.94189453125, -28.092529296875, -27.2431640625, -26.393798828125, -25.54443359375, -24.695068359375, -23.845703125, -22.996337890625, -22.14697265625, -21.297607421875, -20.4482421875, -19.598876953125, -18.74951171875, -17.900146484375, -17.05078125, -16.201416015625, -15.35205078125, -14.502685546875, -13.6533203125, -12.803955078125, -11.95458984375, -11.105224609375, -10.255859375, -9.406494140625, -8.55712890625, -7.707763671875, -6.8583984375, -6.009033203125, -5.15966796875, -4.310302734375, -3.4609375, -2.611572265625, -1.76220703125, -0.912841796875, -0.0634765625, 0.785888671875, 1.63525390625, 2.484619140625, 3.333984375, 4.183349609375, 5.03271484375, 5.882080078125, 6.7314453125, 7.580810546875, 8.43017578125, 9.279541015625, 10.12890625, 10.978271484375, 11.82763671875, 12.677001953125, 13.5263671875, 14.375732421875, 15.22509765625, 16.074462890625, 16.923828125, 17.773193359375, 18.62255859375, 19.471923828125, 20.3212890625, 21.170654296875, 22.02001953125, 22.869384765625, 23.71875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [3.0, 5.0, 165.0, 658.0, 178.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.931596755981445, -19.29599380493164, -11.660390853881836, -4.024787902832031, 3.6108150482177734, 11.246419906616211, 18.882020950317383, 26.517621994018555, 34.153228759765625, 41.78883361816406, 49.424434661865234, 57.060035705566406, 64.69564056396484, 72.33124542236328, 79.96684265136719, 87.60244750976562, 95.23805236816406, 102.8736572265625, 110.50926208496094, 118.14485931396484, 125.78046417236328, 133.41607666015625, 141.05166625976562, 148.68727111816406, 156.3228759765625, 163.95848083496094, 171.59408569335938, 179.2296905517578, 186.86529541015625, 194.50088500976562, 202.13648986816406, 209.7720947265625, 217.40768432617188, 225.0432891845703, 232.67889404296875, 240.3144989013672, 247.95010375976562, 255.585693359375, 263.2213134765625, 270.8569030761719, 278.49249267578125, 286.1280822753906, 293.7637023925781, 301.3992919921875, 309.034912109375, 316.6705017089844, 324.3061218261719, 331.94171142578125, 339.57733154296875, 347.2129211425781, 354.8485412597656, 362.484130859375, 370.1197509765625, 377.7553405761719, 385.3909606933594, 393.02655029296875, 400.66217041015625, 408.2977600097656, 415.9333801269531, 423.5689697265625, 431.20458984375, 438.8401794433594, 446.4757995605469, 454.11138916015625, 461.7469787597656]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 10.0, 7.0, 6.0, 12.0, 17.0, 7.0, 15.0, 17.0, 14.0, 19.0, 24.0, 23.0, 33.0, 27.0, 19.0, 36.0, 29.0, 33.0, 39.0, 38.0, 37.0, 37.0, 39.0, 34.0, 36.0, 28.0, 30.0, 32.0, 28.0, 36.0, 32.0, 29.0, 24.0, 23.0, 20.0, 15.0, 11.0, 9.0, 18.0, 10.0, 10.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-28.371917724609375, -27.49315643310547, -26.614395141601562, -25.735633850097656, -24.85687255859375, -23.978111267089844, -23.099349975585938, -22.22058868408203, -21.341827392578125, -20.46306610107422, -19.584304809570312, -18.705543518066406, -17.8267822265625, -16.948020935058594, -16.069259643554688, -15.190499305725098, -14.311738967895508, -13.432977676391602, -12.554216384887695, -11.675455093383789, -10.796693801879883, -9.917932510375977, -9.039172172546387, -8.16041088104248, -7.281649589538574, -6.402888298034668, -5.524127006530762, -4.645366191864014, -3.7666049003601074, -2.887843608856201, -2.009082794189453, -1.1303215026855469, -0.2515602111816406, 0.6272009611129761, 1.5059621334075928, 2.38472318649292, 3.263484477996826, 4.142245769500732, 5.0210065841674805, 5.899767875671387, 6.778529167175293, 7.657290458679199, 8.536051750183105, 9.414812088012695, 10.293573379516602, 11.172334671020508, 12.051095962524414, 12.92985725402832, 13.808618545532227, 14.687379837036133, 15.566141128540039, 16.444902420043945, 17.32366371154785, 18.202425003051758, 19.08118438720703, 19.959945678710938, 20.838706970214844, 21.71746826171875, 22.596229553222656, 23.474990844726562, 24.35375213623047, 25.232513427734375, 26.11127471923828, 26.990036010742188, 27.868797302246094]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 14.0, 8.0, 25.0, 9.0, 22.0, 17.0, 26.0, 26.0, 29.0, 24.0, 17.0, 28.0, 34.0, 23.0, 34.0, 43.0, 30.0, 35.0, 53.0, 39.0, 44.0, 31.0, 29.0, 35.0, 35.0, 24.0, 32.0, 25.0, 32.0, 30.0, 17.0, 15.0, 17.0, 13.0, 9.0, 7.0, 11.0, 13.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-2.544921875, -2.468170166015625, -2.39141845703125, -2.314666748046875, -2.2379150390625, -2.161163330078125, -2.08441162109375, -2.007659912109375, -1.930908203125, -1.854156494140625, -1.77740478515625, -1.700653076171875, -1.6239013671875, -1.547149658203125, -1.47039794921875, -1.393646240234375, -1.31689453125, -1.240142822265625, -1.16339111328125, -1.086639404296875, -1.0098876953125, -0.933135986328125, -0.85638427734375, -0.779632568359375, -0.702880859375, -0.626129150390625, -0.54937744140625, -0.472625732421875, -0.3958740234375, -0.319122314453125, -0.24237060546875, -0.165618896484375, -0.0888671875, -0.012115478515625, 0.06463623046875, 0.141387939453125, 0.2181396484375, 0.294891357421875, 0.37164306640625, 0.448394775390625, 0.525146484375, 0.601898193359375, 0.67864990234375, 0.755401611328125, 0.8321533203125, 0.908905029296875, 0.98565673828125, 1.062408447265625, 1.13916015625, 1.215911865234375, 1.29266357421875, 1.369415283203125, 1.4461669921875, 1.522918701171875, 1.59967041015625, 1.676422119140625, 1.753173828125, 1.829925537109375, 1.90667724609375, 1.983428955078125, 2.0601806640625, 2.136932373046875, 2.21368408203125, 2.290435791015625, 2.3671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 7.0, 7.0, 15.0, 12.0, 12.0, 19.0, 34.0, 31.0, 58.0, 95.0, 131.0, 178.0, 236.0, 341.0, 541.0, 777.0, 1171.0, 1693.0, 2504.0, 3587.0, 5513.0, 8014.0, 12266.0, 18679.0, 29485.0, 47676.0, 82687.0, 149147.0, 232548.0, 184865.0, 105210.0, 59111.0, 35677.0, 22323.0, 14493.0, 9364.0, 6274.0, 4378.0, 2974.0, 2036.0, 1404.0, 984.0, 626.0, 449.0, 285.0, 217.0, 139.0, 105.0, 63.0, 44.0, 35.0, 19.0, 10.0, 7.0, 2.0, 4.0], "bins": [-0.283935546875, -0.2761993408203125, -0.268463134765625, -0.2607269287109375, -0.25299072265625, -0.2452545166015625, -0.237518310546875, -0.2297821044921875, -0.2220458984375, -0.2143096923828125, -0.206573486328125, -0.1988372802734375, -0.19110107421875, -0.1833648681640625, -0.175628662109375, -0.1678924560546875, -0.16015625, -0.1524200439453125, -0.144683837890625, -0.1369476318359375, -0.12921142578125, -0.1214752197265625, -0.113739013671875, -0.1060028076171875, -0.0982666015625, -0.0905303955078125, -0.082794189453125, -0.0750579833984375, -0.06732177734375, -0.0595855712890625, -0.051849365234375, -0.0441131591796875, -0.036376953125, -0.0286407470703125, -0.020904541015625, -0.0131683349609375, -0.00543212890625, 0.0023040771484375, 0.010040283203125, 0.0177764892578125, 0.0255126953125, 0.0332489013671875, 0.040985107421875, 0.0487213134765625, 0.05645751953125, 0.0641937255859375, 0.071929931640625, 0.0796661376953125, 0.08740234375, 0.0951385498046875, 0.102874755859375, 0.1106109619140625, 0.11834716796875, 0.1260833740234375, 0.133819580078125, 0.1415557861328125, 0.1492919921875, 0.1570281982421875, 0.164764404296875, 0.1725006103515625, 0.18023681640625, 0.1879730224609375, 0.195709228515625, 0.2034454345703125, 0.211181640625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 9.0, 8.0, 4.0, 5.0, 10.0, 7.0, 11.0, 14.0, 19.0, 21.0, 24.0, 21.0, 20.0, 37.0, 30.0, 37.0, 38.0, 43.0, 44.0, 43.0, 44.0, 1069.0, 48.0, 44.0, 39.0, 38.0, 39.0, 37.0, 33.0, 20.0, 25.0, 19.0, 15.0, 15.0, 17.0, 9.0, 9.0, 19.0, 7.0, 10.0, 8.0, 5.0, 4.0, 5.0, 1.0, 0.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.6021881103515625, -1.546173095703125, -1.4901580810546875, -1.43414306640625, -1.3781280517578125, -1.322113037109375, -1.2660980224609375, -1.2100830078125, -1.1540679931640625, -1.098052978515625, -1.0420379638671875, -0.98602294921875, -0.9300079345703125, -0.873992919921875, -0.8179779052734375, -0.761962890625, -0.7059478759765625, -0.649932861328125, -0.5939178466796875, -0.53790283203125, -0.4818878173828125, -0.425872802734375, -0.3698577880859375, -0.3138427734375, -0.2578277587890625, -0.201812744140625, -0.1457977294921875, -0.08978271484375, -0.0337677001953125, 0.022247314453125, 0.0782623291015625, 0.13427734375, 0.1902923583984375, 0.246307373046875, 0.3023223876953125, 0.35833740234375, 0.4143524169921875, 0.470367431640625, 0.5263824462890625, 0.5823974609375, 0.6384124755859375, 0.694427490234375, 0.7504425048828125, 0.80645751953125, 0.8624725341796875, 0.918487548828125, 0.9745025634765625, 1.030517578125, 1.0865325927734375, 1.142547607421875, 1.1985626220703125, 1.25457763671875, 1.3105926513671875, 1.366607666015625, 1.4226226806640625, 1.4786376953125, 1.5346527099609375, 1.590667724609375, 1.6466827392578125, 1.70269775390625, 1.7587127685546875, 1.814727783203125, 1.8707427978515625, 1.9267578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 13.0, 15.0, 15.0, 35.0, 48.0, 64.0, 113.0, 158.0, 241.0, 405.0, 654.0, 1189.0, 2062.0, 3570.0, 6590.0, 12187.0, 23175.0, 44367.0, 88721.0, 173621.0, 1307868.0, 206966.0, 109967.0, 54435.0, 27844.0, 14699.0, 7868.0, 4406.0, 2356.0, 1342.0, 807.0, 468.0, 300.0, 182.0, 123.0, 55.0, 67.0, 42.0, 23.0, 19.0, 14.0, 6.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2137451171875, -0.20757675170898438, -0.20140838623046875, -0.19524002075195312, -0.1890716552734375, -0.18290328979492188, -0.17673492431640625, -0.17056655883789062, -0.164398193359375, -0.15822982788085938, -0.15206146240234375, -0.14589309692382812, -0.1397247314453125, -0.13355636596679688, -0.12738800048828125, -0.12121963500976562, -0.11505126953125, -0.10888290405273438, -0.10271453857421875, -0.09654617309570312, -0.0903778076171875, -0.08420944213867188, -0.07804107666015625, -0.07187271118164062, -0.065704345703125, -0.059535980224609375, -0.05336761474609375, -0.047199249267578125, -0.0410308837890625, -0.034862518310546875, -0.02869415283203125, -0.022525787353515625, -0.016357421875, -0.010189056396484375, -0.00402069091796875, 0.002147674560546875, 0.0083160400390625, 0.014484405517578125, 0.02065277099609375, 0.026821136474609375, 0.032989501953125, 0.039157867431640625, 0.04532623291015625, 0.051494598388671875, 0.0576629638671875, 0.06383132934570312, 0.06999969482421875, 0.07616806030273438, 0.08233642578125, 0.08850479125976562, 0.09467315673828125, 0.10084152221679688, 0.1070098876953125, 0.11317825317382812, 0.11934661865234375, 0.12551498413085938, 0.131683349609375, 0.13785171508789062, 0.14402008056640625, 0.15018844604492188, 0.1563568115234375, 0.16252517700195312, 0.16869354248046875, 0.17486190795898438, 0.1810302734375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 3.0, 8.0, 9.0, 20.0, 13.0, 40.0, 38.0, 86.0, 105.0, 173.0, 183.0, 105.0, 66.0, 41.0, 25.0, 19.0, 9.0, 11.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0035610198974609375, -0.003452986478805542, -0.0033449530601501465, -0.003236919641494751, -0.0031288862228393555, -0.00302085280418396, -0.0029128193855285645, -0.002804785966873169, -0.0026967525482177734, -0.002588719129562378, -0.0024806857109069824, -0.002372652292251587, -0.0022646188735961914, -0.002156585454940796, -0.0020485520362854004, -0.0019405186176300049, -0.0018324851989746094, -0.0017244517803192139, -0.0016164183616638184, -0.0015083849430084229, -0.0014003515243530273, -0.0012923181056976318, -0.0011842846870422363, -0.0010762512683868408, -0.0009682178497314453, -0.0008601844310760498, -0.0007521510124206543, -0.0006441175937652588, -0.0005360841751098633, -0.0004280507564544678, -0.00032001733779907227, -0.00021198391914367676, -0.00010395050048828125, 4.082918167114258e-06, 0.00011211633682250977, 0.00022014975547790527, 0.0003281831741333008, 0.0004362165927886963, 0.0005442500114440918, 0.0006522834300994873, 0.0007603168487548828, 0.0008683502674102783, 0.0009763836860656738, 0.0010844171047210693, 0.0011924505233764648, 0.0013004839420318604, 0.0014085173606872559, 0.0015165507793426514, 0.0016245841979980469, 0.0017326176166534424, 0.0018406510353088379, 0.0019486844539642334, 0.002056717872619629, 0.0021647512912750244, 0.00227278470993042, 0.0023808181285858154, 0.002488851547241211, 0.0025968849658966064, 0.002704918384552002, 0.0028129518032073975, 0.002920985221862793, 0.0030290186405181885, 0.003137052059173584, 0.0032450854778289795, 0.003353118896484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 6.0, 12.0, 4.0, 10.0, 10.0, 9.0, 21.0, 32.0, 34.0, 48.0, 45.0, 80.0, 111.0, 206.0, 490.0, 4564.0, 993054.0, 47787.0, 1221.0, 286.0, 155.0, 86.0, 54.0, 49.0, 23.0, 32.0, 12.0, 16.0, 15.0, 13.0, 13.0, 6.0, 5.0, 3.0, 5.0, 0.0, 7.0, 0.0, 0.0, 0.0, 4.0, 9.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.061370849609375, -0.05949735641479492, -0.057623863220214844, -0.055750370025634766, -0.05387687683105469, -0.05200338363647461, -0.05012989044189453, -0.04825639724731445, -0.046382904052734375, -0.0445094108581543, -0.04263591766357422, -0.04076242446899414, -0.03888893127441406, -0.037015438079833984, -0.035141944885253906, -0.03326845169067383, -0.03139495849609375, -0.029521465301513672, -0.027647972106933594, -0.025774478912353516, -0.023900985717773438, -0.02202749252319336, -0.02015399932861328, -0.018280506134033203, -0.016407012939453125, -0.014533519744873047, -0.012660026550292969, -0.01078653335571289, -0.008913040161132812, -0.007039546966552734, -0.005166053771972656, -0.003292560577392578, -0.0014190673828125, 0.0004544258117675781, 0.0023279190063476562, 0.004201412200927734, 0.0060749053955078125, 0.00794839859008789, 0.009821891784667969, 0.011695384979248047, 0.013568878173828125, 0.015442371368408203, 0.01731586456298828, 0.01918935775756836, 0.021062850952148438, 0.022936344146728516, 0.024809837341308594, 0.026683330535888672, 0.02855682373046875, 0.030430316925048828, 0.032303810119628906, 0.034177303314208984, 0.03605079650878906, 0.03792428970336914, 0.03979778289794922, 0.0416712760925293, 0.043544769287109375, 0.04541826248168945, 0.04729175567626953, 0.04916524887084961, 0.05103874206542969, 0.052912235260009766, 0.054785728454589844, 0.05665922164916992, 0.05853271484375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 8.0, 238.0, 729.0, 39.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00460351537913084, -0.0038577113300561905, -0.0031119072809815407, -0.0023661034647375345, -0.0016202994156628847, -0.0008744953665882349, -0.00012869155034422874, 0.0006171124987304211, 0.0013629165478050709, 0.0021087205968797207, 0.0028545246459543705, 0.0036003284621983767, 0.004346132278442383, 0.005091936327517033, 0.0058377403765916824, 0.006583544425666332, 0.007329348474740982, 0.008075152523815632, 0.008820956572890282, 0.009566760621964931, 0.010312564671039581, 0.011058368720114231, 0.011804172769188881, 0.012549975886940956, 0.01329578086733818, 0.01404158491641283, 0.01478738896548748, 0.01553319301456213, 0.01627899706363678, 0.017024800181388855, 0.01777060516178608, 0.018516408279538155, 0.01926221139729023, 0.020008014515042305, 0.02075381949543953, 0.021499622613191605, 0.02224542759358883, 0.022991230711340904, 0.02373703569173813, 0.024482838809490204, 0.02522864378988743, 0.025974446907639503, 0.026720251888036728, 0.027466055005788803, 0.028211859986186028, 0.028957663103938103, 0.029703468084335327, 0.030449271202087402, 0.031195074319839478, 0.03194087743759155, 0.03268668055534363, 0.033432487398386, 0.03417829051613808, 0.03492409363389015, 0.03566989675164223, 0.0364157035946846, 0.037161506712436676, 0.03790730983018875, 0.038653112947940826, 0.0393989197909832, 0.040144722908735275, 0.04089052602648735, 0.041636329144239426, 0.0423821359872818, 0.043127939105033875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 7.0, 5.0, 13.0, 30.0, 21.0, 24.0, 39.0, 42.0, 48.0, 65.0, 89.0, 64.0, 69.0, 72.0, 55.0, 67.0, 45.0, 51.0, 47.0, 27.0, 35.0, 25.0, 16.0, 23.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032212138175964355, -0.003138430416584015, -0.0030556470155715942, -0.0029728636145591736, -0.002890080213546753, -0.0028072968125343323, -0.0027245134115219116, -0.002641730010509491, -0.0025589466094970703, -0.0024761632084846497, -0.002393379807472229, -0.0023105964064598083, -0.0022278130054473877, -0.002145029604434967, -0.0020622462034225464, -0.0019794628024101257, -0.001896679401397705, -0.0018138960003852844, -0.0017311125993728638, -0.0016483291983604431, -0.0015655457973480225, -0.0014827623963356018, -0.0013999789953231812, -0.0013171955943107605, -0.0012344121932983398, -0.0011516287922859192, -0.0010688453912734985, -0.0009860619902610779, -0.0009032785892486572, -0.0008204951882362366, -0.0007377117872238159, -0.0006549283862113953, -0.0005721449851989746, -0.000489361584186554, -0.0004065781831741333, -0.00032379478216171265, -0.000241011381149292, -0.00015822798013687134, -7.544457912445068e-05, 7.338821887969971e-06, 9.012222290039062e-05, 0.00017290562391281128, 0.00025568902492523193, 0.0003384724259376526, 0.00042125582695007324, 0.0005040392279624939, 0.0005868226289749146, 0.0006696060299873352, 0.0007523894309997559, 0.0008351728320121765, 0.0009179562330245972, 0.0010007396340370178, 0.0010835230350494385, 0.0011663064360618591, 0.0012490898370742798, 0.0013318732380867004, 0.001414656639099121, 0.0014974400401115417, 0.0015802234411239624, 0.001663006842136383, 0.0017457902431488037, 0.0018285736441612244, 0.001911357045173645, 0.0019941404461860657, 0.0020769238471984863]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 14.0, 8.0, 25.0, 9.0, 22.0, 17.0, 26.0, 26.0, 29.0, 24.0, 17.0, 28.0, 34.0, 23.0, 34.0, 43.0, 31.0, 34.0, 53.0, 39.0, 44.0, 31.0, 29.0, 35.0, 35.0, 24.0, 32.0, 25.0, 32.0, 30.0, 17.0, 15.0, 17.0, 13.0, 9.0, 7.0, 11.0, 13.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-2.544921875, -2.468170166015625, -2.39141845703125, -2.314666748046875, -2.2379150390625, -2.161163330078125, -2.08441162109375, -2.007659912109375, -1.930908203125, -1.854156494140625, -1.77740478515625, -1.700653076171875, -1.6239013671875, -1.547149658203125, -1.47039794921875, -1.393646240234375, -1.31689453125, -1.240142822265625, -1.16339111328125, -1.086639404296875, -1.0098876953125, -0.933135986328125, -0.85638427734375, -0.779632568359375, -0.702880859375, -0.626129150390625, -0.54937744140625, -0.472625732421875, -0.3958740234375, -0.319122314453125, -0.24237060546875, -0.165618896484375, -0.0888671875, -0.012115478515625, 0.06463623046875, 0.141387939453125, 0.2181396484375, 0.294891357421875, 0.37164306640625, 0.448394775390625, 0.525146484375, 0.601898193359375, 0.67864990234375, 0.755401611328125, 0.8321533203125, 0.908905029296875, 0.98565673828125, 1.062408447265625, 1.13916015625, 1.215911865234375, 1.29266357421875, 1.369415283203125, 1.4461669921875, 1.522918701171875, 1.59967041015625, 1.676422119140625, 1.753173828125, 1.829925537109375, 1.90667724609375, 1.983428955078125, 2.0601806640625, 2.136932373046875, 2.21368408203125, 2.290435791015625, 2.3671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 8.0, 14.0, 11.0, 24.0, 23.0, 34.0, 44.0, 53.0, 70.0, 97.0, 126.0, 188.0, 289.0, 392.0, 569.0, 871.0, 1348.0, 2303.0, 4001.0, 7566.0, 15604.0, 34153.0, 82093.0, 221681.0, 402205.0, 158733.0, 61968.0, 26465.0, 12362.0, 6199.0, 3430.0, 1942.0, 1189.0, 775.0, 487.0, 328.0, 248.0, 184.0, 110.0, 71.0, 89.0, 56.0, 31.0, 28.0, 34.0, 13.0, 12.0, 6.0, 6.0, 3.0, 6.0, 3.0, 0.0, 4.0], "bins": [-2.890625, -2.80645751953125, -2.7222900390625, -2.63812255859375, -2.553955078125, -2.46978759765625, -2.3856201171875, -2.30145263671875, -2.21728515625, -2.13311767578125, -2.0489501953125, -1.96478271484375, -1.880615234375, -1.79644775390625, -1.7122802734375, -1.62811279296875, -1.5439453125, -1.45977783203125, -1.3756103515625, -1.29144287109375, -1.207275390625, -1.12310791015625, -1.0389404296875, -0.95477294921875, -0.87060546875, -0.78643798828125, -0.7022705078125, -0.61810302734375, -0.533935546875, -0.44976806640625, -0.3656005859375, -0.28143310546875, -0.197265625, -0.11309814453125, -0.0289306640625, 0.05523681640625, 0.139404296875, 0.22357177734375, 0.3077392578125, 0.39190673828125, 0.47607421875, 0.56024169921875, 0.6444091796875, 0.72857666015625, 0.812744140625, 0.89691162109375, 0.9810791015625, 1.06524658203125, 1.1494140625, 1.23358154296875, 1.3177490234375, 1.40191650390625, 1.486083984375, 1.57025146484375, 1.6544189453125, 1.73858642578125, 1.82275390625, 1.90692138671875, 1.9910888671875, 2.07525634765625, 2.159423828125, 2.24359130859375, 2.3277587890625, 2.41192626953125, 2.49609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 14.0, 6.0, 6.0, 8.0, 9.0, 20.0, 12.0, 17.0, 14.0, 19.0, 26.0, 29.0, 44.0, 34.0, 41.0, 42.0, 67.0, 64.0, 95.0, 245.0, 1635.0, 148.0, 64.0, 55.0, 38.0, 34.0, 33.0, 29.0, 28.0, 28.0, 23.0, 19.0, 16.0, 13.0, 12.0, 9.0, 13.0, 8.0, 3.0, 6.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5234375, -9.2283935546875, -8.933349609375, -8.6383056640625, -8.34326171875, -8.0482177734375, -7.753173828125, -7.4581298828125, -7.1630859375, -6.8680419921875, -6.572998046875, -6.2779541015625, -5.98291015625, -5.6878662109375, -5.392822265625, -5.0977783203125, -4.802734375, -4.5076904296875, -4.212646484375, -3.9176025390625, -3.62255859375, -3.3275146484375, -3.032470703125, -2.7374267578125, -2.4423828125, -2.1473388671875, -1.852294921875, -1.5572509765625, -1.26220703125, -0.9671630859375, -0.672119140625, -0.3770751953125, -0.08203125, 0.2130126953125, 0.508056640625, 0.8031005859375, 1.09814453125, 1.3931884765625, 1.688232421875, 1.9832763671875, 2.2783203125, 2.5733642578125, 2.868408203125, 3.1634521484375, 3.45849609375, 3.7535400390625, 4.048583984375, 4.3436279296875, 4.638671875, 4.9337158203125, 5.228759765625, 5.5238037109375, 5.81884765625, 6.1138916015625, 6.408935546875, 6.7039794921875, 6.9990234375, 7.2940673828125, 7.589111328125, 7.8841552734375, 8.17919921875, 8.4742431640625, 8.769287109375, 9.0643310546875, 9.359375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 5.0, 10.0, 10.0, 14.0, 9.0, 18.0, 10.0, 23.0, 32.0, 30.0, 48.0, 66.0, 79.0, 115.0, 292.0, 647.0, 2205.0, 42478.0, 3049931.0, 45684.0, 2436.0, 670.0, 285.0, 163.0, 94.0, 65.0, 54.0, 38.0, 37.0, 21.0, 16.0, 20.0, 17.0, 13.0, 10.0, 7.0, 6.0, 11.0, 7.0, 4.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-21.46875, -20.808349609375, -20.14794921875, -19.487548828125, -18.8271484375, -18.166748046875, -17.50634765625, -16.845947265625, -16.185546875, -15.525146484375, -14.86474609375, -14.204345703125, -13.5439453125, -12.883544921875, -12.22314453125, -11.562744140625, -10.90234375, -10.241943359375, -9.58154296875, -8.921142578125, -8.2607421875, -7.600341796875, -6.93994140625, -6.279541015625, -5.619140625, -4.958740234375, -4.29833984375, -3.637939453125, -2.9775390625, -2.317138671875, -1.65673828125, -0.996337890625, -0.3359375, 0.324462890625, 0.98486328125, 1.645263671875, 2.3056640625, 2.966064453125, 3.62646484375, 4.286865234375, 4.947265625, 5.607666015625, 6.26806640625, 6.928466796875, 7.5888671875, 8.249267578125, 8.90966796875, 9.570068359375, 10.23046875, 10.890869140625, 11.55126953125, 12.211669921875, 12.8720703125, 13.532470703125, 14.19287109375, 14.853271484375, 15.513671875, 16.174072265625, 16.83447265625, 17.494873046875, 18.1552734375, 18.815673828125, 19.47607421875, 20.136474609375, 20.796875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 14.0, 42.0, 160.0, 326.0, 298.0, 125.0, 31.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.325531005859375, -28.375564575195312, -27.42559814453125, -26.475629806518555, -25.525663375854492, -24.57569694519043, -23.625728607177734, -22.675762176513672, -21.72579574584961, -20.775829315185547, -19.825862884521484, -18.87589454650879, -17.925928115844727, -16.975961685180664, -16.02599334716797, -15.076026916503906, -14.126060485839844, -13.176094055175781, -12.226126670837402, -11.276159286499023, -10.326192855834961, -9.376226425170898, -8.42625904083252, -7.476292133331299, -6.526325225830078, -5.576358318328857, -4.626391410827637, -3.676424503326416, -2.7264575958251953, -1.7764906883239746, -0.8265237808227539, 0.1234431266784668, 1.0734100341796875, 2.023376941680908, 2.973343849182129, 3.9233107566833496, 4.87327766418457, 5.823244571685791, 6.773211479187012, 7.723178386688232, 8.673145294189453, 9.623111724853516, 10.573079109191895, 11.523046493530273, 12.473012924194336, 13.422979354858398, 14.372946739196777, 15.322914123535156, 16.27288055419922, 17.22284698486328, 18.172813415527344, 19.12278175354004, 20.0727481842041, 21.022714614868164, 21.97268295288086, 22.922649383544922, 23.872615814208984, 24.822582244873047, 25.77254867553711, 26.722517013549805, 27.672483444213867, 28.62244987487793, 29.572418212890625, 30.522384643554688, 31.47235107421875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 7.0, 10.0, 9.0, 9.0, 12.0, 12.0, 17.0, 12.0, 22.0, 21.0, 29.0, 17.0, 36.0, 20.0, 31.0, 35.0, 35.0, 29.0, 24.0, 43.0, 43.0, 39.0, 30.0, 41.0, 31.0, 36.0, 32.0, 39.0, 32.0, 30.0, 23.0, 25.0, 24.0, 18.0, 17.0, 8.0, 11.0, 12.0, 9.0, 11.0, 10.0, 8.0, 5.0, 4.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-26.812501907348633, -25.97269058227539, -25.13287925720215, -24.293067932128906, -23.453258514404297, -22.613447189331055, -21.773635864257812, -20.93382453918457, -20.094013214111328, -19.254201889038086, -18.414390563964844, -17.574581146240234, -16.734769821166992, -15.89495849609375, -15.055147171020508, -14.215335845947266, -13.375526428222656, -12.535715103149414, -11.695904731750488, -10.856093406677246, -10.01628303527832, -9.176471710205078, -8.336660385131836, -7.496849536895752, -6.657038688659668, -5.817227840423584, -4.9774169921875, -4.137605667114258, -3.297794818878174, -2.45798397064209, -1.6181726455688477, -0.7783617973327637, 0.0614471435546875, 0.901258111000061, 1.7410690784454346, 2.5808801651000977, 3.4206910133361816, 4.260501861572266, 5.100313186645508, 5.940124034881592, 6.779934883117676, 7.61974573135376, 8.459556579589844, 9.299367904663086, 10.139179229736328, 10.978989601135254, 11.818800926208496, 12.658611297607422, 13.498422622680664, 14.338233947753906, 15.178044319152832, 16.01785659790039, 16.857666015625, 17.697477340698242, 18.537288665771484, 19.377099990844727, 20.21691131591797, 21.05672264099121, 21.896533966064453, 22.736343383789062, 23.576154708862305, 24.415966033935547, 25.25577735900879, 26.09558868408203, 26.93539810180664]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 3.0, 13.0, 14.0, 16.0, 17.0, 20.0, 17.0, 27.0, 32.0, 29.0, 23.0, 23.0, 30.0, 23.0, 40.0, 44.0, 28.0, 26.0, 50.0, 41.0, 47.0, 36.0, 33.0, 33.0, 29.0, 30.0, 35.0, 30.0, 25.0, 23.0, 19.0, 25.0, 13.0, 15.0, 15.0, 9.0, 14.0, 7.0, 4.0, 9.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.53515625, -2.455078125, -2.375, -2.294921875, -2.21484375, -2.134765625, -2.0546875, -1.974609375, -1.89453125, -1.814453125, -1.734375, -1.654296875, -1.57421875, -1.494140625, -1.4140625, -1.333984375, -1.25390625, -1.173828125, -1.09375, -1.013671875, -0.93359375, -0.853515625, -0.7734375, -0.693359375, -0.61328125, -0.533203125, -0.453125, -0.373046875, -0.29296875, -0.212890625, -0.1328125, -0.052734375, 0.02734375, 0.107421875, 0.1875, 0.267578125, 0.34765625, 0.427734375, 0.5078125, 0.587890625, 0.66796875, 0.748046875, 0.828125, 0.908203125, 0.98828125, 1.068359375, 1.1484375, 1.228515625, 1.30859375, 1.388671875, 1.46875, 1.548828125, 1.62890625, 1.708984375, 1.7890625, 1.869140625, 1.94921875, 2.029296875, 2.109375, 2.189453125, 2.26953125, 2.349609375, 2.4296875, 2.509765625, 2.58984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 1.0, 11.0, 14.0, 16.0, 19.0, 21.0, 23.0, 39.0, 44.0, 43.0, 73.0, 70.0, 110.0, 134.0, 221.0, 430.0, 1088.0, 3812.0, 17741.0, 114773.0, 1596012.0, 2267064.0, 161560.0, 23669.0, 4698.0, 1237.0, 501.0, 235.0, 150.0, 84.0, 71.0, 53.0, 39.0, 51.0, 27.0, 24.0, 31.0, 21.0, 13.0, 9.0, 13.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.3046875, -10.9522705078125, -10.599853515625, -10.2474365234375, -9.89501953125, -9.5426025390625, -9.190185546875, -8.8377685546875, -8.4853515625, -8.1329345703125, -7.780517578125, -7.4281005859375, -7.07568359375, -6.7232666015625, -6.370849609375, -6.0184326171875, -5.666015625, -5.3135986328125, -4.961181640625, -4.6087646484375, -4.25634765625, -3.9039306640625, -3.551513671875, -3.1990966796875, -2.8466796875, -2.4942626953125, -2.141845703125, -1.7894287109375, -1.43701171875, -1.0845947265625, -0.732177734375, -0.3797607421875, -0.02734375, 0.3250732421875, 0.677490234375, 1.0299072265625, 1.38232421875, 1.7347412109375, 2.087158203125, 2.4395751953125, 2.7919921875, 3.1444091796875, 3.496826171875, 3.8492431640625, 4.20166015625, 4.5540771484375, 4.906494140625, 5.2589111328125, 5.611328125, 5.9637451171875, 6.316162109375, 6.6685791015625, 7.02099609375, 7.3734130859375, 7.725830078125, 8.0782470703125, 8.4306640625, 8.7830810546875, 9.135498046875, 9.4879150390625, 9.84033203125, 10.1927490234375, 10.545166015625, 10.8975830078125, 11.25]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 20.0, 23.0, 33.0, 47.0, 53.0, 56.0, 92.0, 126.0, 171.0, 262.0, 336.0, 390.0, 492.0, 455.0, 395.0, 300.0, 228.0, 150.0, 123.0, 78.0, 63.0, 43.0, 38.0, 18.0, 20.0, 11.0, 9.0, 9.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.8978271484375, -8.608154296875, -8.3184814453125, -8.02880859375, -7.7391357421875, -7.449462890625, -7.1597900390625, -6.8701171875, -6.5804443359375, -6.290771484375, -6.0010986328125, -5.71142578125, -5.4217529296875, -5.132080078125, -4.8424072265625, -4.552734375, -4.2630615234375, -3.973388671875, -3.6837158203125, -3.39404296875, -3.1043701171875, -2.814697265625, -2.5250244140625, -2.2353515625, -1.9456787109375, -1.656005859375, -1.3663330078125, -1.07666015625, -0.7869873046875, -0.497314453125, -0.2076416015625, 0.08203125, 0.3717041015625, 0.661376953125, 0.9510498046875, 1.24072265625, 1.5303955078125, 1.820068359375, 2.1097412109375, 2.3994140625, 2.6890869140625, 2.978759765625, 3.2684326171875, 3.55810546875, 3.8477783203125, 4.137451171875, 4.4271240234375, 4.716796875, 5.0064697265625, 5.296142578125, 5.5858154296875, 5.87548828125, 6.1651611328125, 6.454833984375, 6.7445068359375, 7.0341796875, 7.3238525390625, 7.613525390625, 7.9031982421875, 8.19287109375, 8.4825439453125, 8.772216796875, 9.0618896484375, 9.3515625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 15.0, 34.0, 47.0, 75.0, 161.0, 364.0, 826.0, 2984.0, 19067.0, 217629.0, 3157117.0, 739443.0, 48135.0, 6110.0, 1324.0, 483.0, 197.0, 119.0, 64.0, 21.0, 19.0, 11.0, 9.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-27.171875, -26.410888671875, -25.64990234375, -24.888916015625, -24.1279296875, -23.366943359375, -22.60595703125, -21.844970703125, -21.083984375, -20.322998046875, -19.56201171875, -18.801025390625, -18.0400390625, -17.279052734375, -16.51806640625, -15.757080078125, -14.99609375, -14.235107421875, -13.47412109375, -12.713134765625, -11.9521484375, -11.191162109375, -10.43017578125, -9.669189453125, -8.908203125, -8.147216796875, -7.38623046875, -6.625244140625, -5.8642578125, -5.103271484375, -4.34228515625, -3.581298828125, -2.8203125, -2.059326171875, -1.29833984375, -0.537353515625, 0.2236328125, 0.984619140625, 1.74560546875, 2.506591796875, 3.267578125, 4.028564453125, 4.78955078125, 5.550537109375, 6.3115234375, 7.072509765625, 7.83349609375, 8.594482421875, 9.35546875, 10.116455078125, 10.87744140625, 11.638427734375, 12.3994140625, 13.160400390625, 13.92138671875, 14.682373046875, 15.443359375, 16.204345703125, 16.96533203125, 17.726318359375, 18.4873046875, 19.248291015625, 20.00927734375, 20.770263671875, 21.53125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 12.0, 20.0, 24.0, 32.0, 49.0, 76.0, 97.0, 116.0, 102.0, 129.0, 112.0, 69.0, 65.0, 41.0, 23.0, 19.0, 9.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9039192199707, -33.48814392089844, -32.07236862182617, -30.65659523010254, -29.240821838378906, -27.82504653930664, -26.409271240234375, -24.99349594116211, -23.577722549438477, -22.16194725036621, -20.746173858642578, -19.330398559570312, -17.914623260498047, -16.498849868774414, -15.083074569702148, -13.6673002243042, -12.25152587890625, -10.8357515335083, -9.419977188110352, -8.004201889038086, -6.588427543640137, -5.1726531982421875, -3.756877899169922, -2.3411035537719727, -0.9253292083740234, 0.4904453754425049, 1.9062199592590332, 3.3219947814941406, 4.73776912689209, 6.153543472290039, 7.569318771362305, 8.985093116760254, 10.400867462158203, 11.816641807556152, 13.232416152954102, 14.648191452026367, 16.06396484375, 17.479740142822266, 18.89551544189453, 20.311290740966797, 21.72706413269043, 23.142839431762695, 24.558612823486328, 25.974388122558594, 27.39016342163086, 28.805936813354492, 30.221712112426758, 31.63748550415039, 33.053260803222656, 34.46903610229492, 35.88481140136719, 37.30058288574219, 38.71635818481445, 40.13213348388672, 41.547908782958984, 42.96368408203125, 44.37945556640625, 45.795230865478516, 47.21100616455078, 48.62677764892578, 50.04255294799805, 51.45832824707031, 52.87410354614258, 54.289878845214844, 55.70565414428711]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 6.0, 10.0, 13.0, 13.0, 15.0, 12.0, 19.0, 22.0, 23.0, 35.0, 27.0, 28.0, 36.0, 44.0, 39.0, 34.0, 30.0, 34.0, 28.0, 34.0, 35.0, 37.0, 37.0, 39.0, 28.0, 34.0, 28.0, 24.0, 28.0, 24.0, 22.0, 16.0, 14.0, 18.0, 13.0, 11.0, 7.0, 12.0, 6.0, 3.0, 10.0, 5.0, 1.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.523147583007812, -22.727962493896484, -21.932777404785156, -21.137592315673828, -20.3424072265625, -19.547222137451172, -18.752037048339844, -17.956851959228516, -17.161666870117188, -16.36648178100586, -15.571296691894531, -14.776111602783203, -13.980926513671875, -13.185741424560547, -12.390556335449219, -11.59537124633789, -10.800186157226562, -10.005001068115234, -9.209815979003906, -8.414630889892578, -7.61944580078125, -6.824260711669922, -6.029075622558594, -5.233890533447266, -4.4387054443359375, -3.6435203552246094, -2.8483352661132812, -2.053150177001953, -1.257965087890625, -0.4627799987792969, 0.33240509033203125, 1.1275901794433594, 1.9227752685546875, 2.7179603576660156, 3.5131454467773438, 4.308330535888672, 5.103515625, 5.898700714111328, 6.693885803222656, 7.489070892333984, 8.284255981445312, 9.07944107055664, 9.874626159667969, 10.669811248779297, 11.464996337890625, 12.260181427001953, 13.055366516113281, 13.85055160522461, 14.645736694335938, 15.440921783447266, 16.236106872558594, 17.031291961669922, 17.82647705078125, 18.621662139892578, 19.416847229003906, 20.212032318115234, 21.007217407226562, 21.80240249633789, 22.59758758544922, 23.392772674560547, 24.187957763671875, 24.983142852783203, 25.77832794189453, 26.57351303100586, 27.368698120117188]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 4.0, 11.0, 17.0, 16.0, 16.0, 13.0, 18.0, 34.0, 34.0, 37.0, 28.0, 36.0, 28.0, 40.0, 36.0, 34.0, 50.0, 41.0, 51.0, 35.0, 47.0, 35.0, 37.0, 35.0, 37.0, 36.0, 25.0, 22.0, 18.0, 27.0, 10.0, 17.0, 17.0, 9.0, 11.0, 3.0, 5.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.185546875, -3.0927734375, -3.0, -2.9072265625, -2.814453125, -2.7216796875, -2.62890625, -2.5361328125, -2.443359375, -2.3505859375, -2.2578125, -2.1650390625, -2.072265625, -1.9794921875, -1.88671875, -1.7939453125, -1.701171875, -1.6083984375, -1.515625, -1.4228515625, -1.330078125, -1.2373046875, -1.14453125, -1.0517578125, -0.958984375, -0.8662109375, -0.7734375, -0.6806640625, -0.587890625, -0.4951171875, -0.40234375, -0.3095703125, -0.216796875, -0.1240234375, -0.03125, 0.0615234375, 0.154296875, 0.2470703125, 0.33984375, 0.4326171875, 0.525390625, 0.6181640625, 0.7109375, 0.8037109375, 0.896484375, 0.9892578125, 1.08203125, 1.1748046875, 1.267578125, 1.3603515625, 1.453125, 1.5458984375, 1.638671875, 1.7314453125, 1.82421875, 1.9169921875, 2.009765625, 2.1025390625, 2.1953125, 2.2880859375, 2.380859375, 2.4736328125, 2.56640625, 2.6591796875, 2.751953125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 8.0, 5.0, 21.0, 12.0, 33.0, 39.0, 74.0, 99.0, 160.0, 235.0, 318.0, 476.0, 731.0, 1125.0, 1610.0, 2437.0, 3719.0, 5775.0, 9187.0, 14336.0, 23691.0, 40066.0, 71727.0, 133963.0, 236481.0, 220295.0, 121435.0, 64523.0, 36699.0, 21718.0, 13606.0, 8275.0, 5324.0, 3483.0, 2307.0, 1546.0, 1009.0, 673.0, 415.0, 314.0, 201.0, 133.0, 91.0, 69.0, 42.0, 28.0, 18.0, 11.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.292724609375, -0.28325653076171875, -0.2737884521484375, -0.26432037353515625, -0.254852294921875, -0.24538421630859375, -0.2359161376953125, -0.22644805908203125, -0.21697998046875, -0.20751190185546875, -0.1980438232421875, -0.18857574462890625, -0.179107666015625, -0.16963958740234375, -0.1601715087890625, -0.15070343017578125, -0.1412353515625, -0.13176727294921875, -0.1222991943359375, -0.11283111572265625, -0.103363037109375, -0.09389495849609375, -0.0844268798828125, -0.07495880126953125, -0.06549072265625, -0.05602264404296875, -0.0465545654296875, -0.03708648681640625, -0.027618408203125, -0.01815032958984375, -0.0086822509765625, 0.00078582763671875, 0.01025390625, 0.01972198486328125, 0.0291900634765625, 0.03865814208984375, 0.048126220703125, 0.05759429931640625, 0.0670623779296875, 0.07653045654296875, 0.08599853515625, 0.09546661376953125, 0.1049346923828125, 0.11440277099609375, 0.123870849609375, 0.13333892822265625, 0.1428070068359375, 0.15227508544921875, 0.1617431640625, 0.17121124267578125, 0.1806793212890625, 0.19014739990234375, 0.199615478515625, 0.20908355712890625, 0.2185516357421875, 0.22801971435546875, 0.23748779296875, 0.24695587158203125, 0.2564239501953125, 0.26589202880859375, 0.275360107421875, 0.28482818603515625, 0.2942962646484375, 0.30376434326171875, 0.313232421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 6.0, 12.0, 5.0, 9.0, 12.0, 23.0, 21.0, 23.0, 17.0, 32.0, 24.0, 32.0, 38.0, 39.0, 34.0, 44.0, 51.0, 45.0, 1071.0, 54.0, 38.0, 38.0, 45.0, 37.0, 28.0, 28.0, 28.0, 32.0, 22.0, 22.0, 14.0, 20.0, 14.0, 13.0, 5.0, 12.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.158203125, -2.0977630615234375, -2.037322998046875, -1.9768829345703125, -1.91644287109375, -1.8560028076171875, -1.795562744140625, -1.7351226806640625, -1.6746826171875, -1.6142425537109375, -1.553802490234375, -1.4933624267578125, -1.43292236328125, -1.3724822998046875, -1.312042236328125, -1.2516021728515625, -1.191162109375, -1.1307220458984375, -1.070281982421875, -1.0098419189453125, -0.94940185546875, -0.8889617919921875, -0.828521728515625, -0.7680816650390625, -0.7076416015625, -0.6472015380859375, -0.586761474609375, -0.5263214111328125, -0.46588134765625, -0.4054412841796875, -0.345001220703125, -0.2845611572265625, -0.22412109375, -0.1636810302734375, -0.103240966796875, -0.0428009033203125, 0.01763916015625, 0.0780792236328125, 0.138519287109375, 0.1989593505859375, 0.2593994140625, 0.3198394775390625, 0.380279541015625, 0.4407196044921875, 0.50115966796875, 0.5615997314453125, 0.622039794921875, 0.6824798583984375, 0.742919921875, 0.8033599853515625, 0.863800048828125, 0.9242401123046875, 0.98468017578125, 1.0451202392578125, 1.105560302734375, 1.1660003662109375, 1.2264404296875, 1.2868804931640625, 1.347320556640625, 1.4077606201171875, 1.46820068359375, 1.5286407470703125, 1.589080810546875, 1.6495208740234375, 1.7099609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 14.0, 25.0, 30.0, 41.0, 59.0, 99.0, 143.0, 221.0, 338.0, 524.0, 813.0, 1286.0, 2233.0, 3718.0, 6403.0, 11141.0, 19659.0, 36044.0, 67169.0, 126416.0, 235171.0, 1262165.0, 147987.0, 79118.0, 42227.0, 22762.0, 13100.0, 7227.0, 4427.0, 2487.0, 1516.0, 887.0, 564.0, 354.0, 233.0, 159.0, 107.0, 64.0, 44.0, 38.0, 25.0, 18.0, 18.0, 14.0, 12.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.19873046875, -0.19254493713378906, -0.18635940551757812, -0.1801738739013672, -0.17398834228515625, -0.1678028106689453, -0.16161727905273438, -0.15543174743652344, -0.1492462158203125, -0.14306068420410156, -0.13687515258789062, -0.1306896209716797, -0.12450408935546875, -0.11831855773925781, -0.11213302612304688, -0.10594749450683594, -0.099761962890625, -0.09357643127441406, -0.08739089965820312, -0.08120536804199219, -0.07501983642578125, -0.06883430480957031, -0.06264877319335938, -0.05646324157714844, -0.0502777099609375, -0.04409217834472656, -0.037906646728515625, -0.03172111511230469, -0.02553558349609375, -0.019350051879882812, -0.013164520263671875, -0.0069789886474609375, -0.00079345703125, 0.0053920745849609375, 0.011577606201171875, 0.017763137817382812, 0.02394866943359375, 0.030134201049804688, 0.036319732666015625, 0.04250526428222656, 0.0486907958984375, 0.05487632751464844, 0.061061859130859375, 0.06724739074707031, 0.07343292236328125, 0.07961845397949219, 0.08580398559570312, 0.09198951721191406, 0.098175048828125, 0.10436058044433594, 0.11054611206054688, 0.11673164367675781, 0.12291717529296875, 0.1291027069091797, 0.13528823852539062, 0.14147377014160156, 0.1476593017578125, 0.15384483337402344, 0.16003036499023438, 0.1662158966064453, 0.17240142822265625, 0.1785869598388672, 0.18477249145507812, 0.19095802307128906, 0.1971435546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 4.0, 7.0, 3.0, 8.0, 9.0, 9.0, 8.0, 9.0, 21.0, 19.0, 16.0, 19.0, 19.0, 25.0, 39.0, 41.0, 67.0, 99.0, 105.0, 96.0, 76.0, 50.0, 34.0, 34.0, 18.0, 27.0, 16.0, 16.0, 11.0, 9.0, 6.0, 10.0, 8.0, 4.0, 3.0, 5.0, 2.0, 11.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0022487640380859375, -0.002175241708755493, -0.002101719379425049, -0.0020281970500946045, -0.00195467472076416, -0.0018811523914337158, -0.0018076300621032715, -0.0017341077327728271, -0.0016605854034423828, -0.0015870630741119385, -0.0015135407447814941, -0.0014400184154510498, -0.0013664960861206055, -0.0012929737567901611, -0.0012194514274597168, -0.0011459290981292725, -0.0010724067687988281, -0.0009988844394683838, -0.0009253621101379395, -0.0008518397808074951, -0.0007783174514770508, -0.0007047951221466064, -0.0006312727928161621, -0.0005577504634857178, -0.00048422813415527344, -0.0004107058048248291, -0.00033718347549438477, -0.00026366114616394043, -0.0001901388168334961, -0.00011661648750305176, -4.309415817260742e-05, 3.0428171157836914e-05, 0.00010395050048828125, 0.00017747282981872559, 0.0002509951591491699, 0.00032451748847961426, 0.0003980398178100586, 0.00047156214714050293, 0.0005450844764709473, 0.0006186068058013916, 0.0006921291351318359, 0.0007656514644622803, 0.0008391737937927246, 0.0009126961231231689, 0.0009862184524536133, 0.0010597407817840576, 0.001133263111114502, 0.0012067854404449463, 0.0012803077697753906, 0.001353830099105835, 0.0014273524284362793, 0.0015008747577667236, 0.001574397087097168, 0.0016479194164276123, 0.0017214417457580566, 0.001794964075088501, 0.0018684864044189453, 0.0019420087337493896, 0.002015531063079834, 0.0020890533924102783, 0.0021625757217407227, 0.002236098051071167, 0.0023096203804016113, 0.0023831427097320557, 0.0024566650390625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 3.0, 8.0, 10.0, 10.0, 10.0, 12.0, 18.0, 24.0, 17.0, 33.0, 23.0, 24.0, 29.0, 44.0, 49.0, 57.0, 80.0, 91.0, 93.0, 161.0, 292.0, 718.0, 3818.0, 48131.0, 918087.0, 69776.0, 5046.0, 760.0, 296.0, 170.0, 124.0, 108.0, 80.0, 59.0, 44.0, 44.0, 26.0, 21.0, 18.0, 16.0, 15.0, 17.0, 8.0, 15.0, 14.0, 16.0, 6.0, 6.0, 6.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.036895751953125, -0.03568840026855469, -0.034481048583984375, -0.03327369689941406, -0.03206634521484375, -0.030858993530273438, -0.029651641845703125, -0.028444290161132812, -0.0272369384765625, -0.026029586791992188, -0.024822235107421875, -0.023614883422851562, -0.02240753173828125, -0.021200180053710938, -0.019992828369140625, -0.018785476684570312, -0.017578125, -0.016370773315429688, -0.015163421630859375, -0.013956069946289062, -0.01274871826171875, -0.011541366577148438, -0.010334014892578125, -0.009126663208007812, -0.0079193115234375, -0.0067119598388671875, -0.005504608154296875, -0.0042972564697265625, -0.00308990478515625, -0.0018825531005859375, -0.000675201416015625, 0.0005321502685546875, 0.001739501953125, 0.0029468536376953125, 0.004154205322265625, 0.0053615570068359375, 0.00656890869140625, 0.0077762603759765625, 0.008983612060546875, 0.010190963745117188, 0.0113983154296875, 0.012605667114257812, 0.013813018798828125, 0.015020370483398438, 0.01622772216796875, 0.017435073852539062, 0.018642425537109375, 0.019849777221679688, 0.02105712890625, 0.022264480590820312, 0.023471832275390625, 0.024679183959960938, 0.02588653564453125, 0.027093887329101562, 0.028301239013671875, 0.029508590698242188, 0.0307159423828125, 0.03192329406738281, 0.033130645751953125, 0.03433799743652344, 0.03554534912109375, 0.03675270080566406, 0.037960052490234375, 0.03916740417480469, 0.040374755859375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 9.0, 112.0, 753.0, 121.0, 17.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004986761137843132, -0.004076060838997364, -0.0031653600744903088, -0.002254659542813897, -0.0013439590111374855, -0.00043325871229171753, 0.00047744205221533775, 0.001388142816722393, 0.002298843115568161, 0.0032095436472445726, 0.004120244178920984, 0.0050309449434280396, 0.0059416452422738075, 0.0068523455411195755, 0.007763046305626631, 0.008673747070133686, 0.009584447368979454, 0.010495147667825222, 0.01140584796667099, 0.012316549196839333, 0.0132272494956851, 0.014137949794530869, 0.015048651024699211, 0.015959352254867554, 0.016870051622390747, 0.01778075285255909, 0.018691452220082283, 0.019602153450250626, 0.02051285281777382, 0.02142355404794216, 0.022334255278110504, 0.023244954645633698, 0.02415565401315689, 0.025066355243325233, 0.025977054610848427, 0.02688775584101677, 0.027798455208539963, 0.028709156438708305, 0.029619857668876648, 0.03053055703639984, 0.031441256403923035, 0.03235195577144623, 0.03326265886425972, 0.03417335823178291, 0.03508405759930611, 0.0359947606921196, 0.03690546005964279, 0.037816159427165985, 0.03872686251997948, 0.03963756188750267, 0.04054826498031616, 0.041458964347839355, 0.04236966371536255, 0.04328036308288574, 0.044191066175699234, 0.04510176554322243, 0.04601246863603592, 0.04692316800355911, 0.047833871096372604, 0.0487445704638958, 0.04965526983141899, 0.05056597292423248, 0.051476672291755676, 0.05238737165927887, 0.05329807102680206]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 13.0, 12.0, 22.0, 22.0, 28.0, 36.0, 48.0, 50.0, 48.0, 67.0, 55.0, 69.0, 66.0, 59.0, 77.0, 57.0, 52.0, 43.0, 60.0, 35.0, 19.0, 20.0, 12.0, 14.0, 5.0, 10.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005595088005065918, -0.005462699569761753, -0.005330311134457588, -0.005197922699153423, -0.005065534263849258, -0.0049331458285450935, -0.004800757393240929, -0.004668368957936764, -0.004535980522632599, -0.004403592087328434, -0.004271203652024269, -0.004138815216720104, -0.004006426781415939, -0.0038740383461117744, -0.0037416499108076096, -0.0036092614755034447, -0.00347687304019928, -0.003344484604895115, -0.00321209616959095, -0.003079707734286785, -0.0029473192989826202, -0.0028149308636784554, -0.0026825424283742905, -0.0025501539930701256, -0.0024177655577659607, -0.002285377122461796, -0.002152988687157631, -0.002020600251853466, -0.0018882118165493011, -0.0017558233812451363, -0.0016234349459409714, -0.0014910465106368065, -0.0013586580753326416, -0.0012262696400284767, -0.0010938812047243118, -0.0009614927694201469, -0.0008291043341159821, -0.0006967158988118172, -0.0005643274635076523, -0.0004319390282034874, -0.0002995505928993225, -0.00016716215759515762, -3.477372229099274e-05, 9.761471301317215e-05, 0.00023000314831733704, 0.0003623915836215019, 0.0004947800189256668, 0.0006271684542298317, 0.0007595568895339966, 0.0008919453248381615, 0.0010243337601423264, 0.0011567221954464912, 0.0012891106307506561, 0.001421499066054821, 0.001553887501358986, 0.0016862759366631508, 0.0018186643719673157, 0.0019510528072714806, 0.0020834412425756454, 0.0022158296778798103, 0.0023482181131839752, 0.00248060654848814, 0.002612994983792305, 0.00274538341909647, 0.0028777718544006348]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 4.0, 11.0, 17.0, 16.0, 16.0, 13.0, 18.0, 34.0, 34.0, 37.0, 28.0, 36.0, 28.0, 40.0, 36.0, 34.0, 50.0, 41.0, 51.0, 35.0, 47.0, 35.0, 37.0, 35.0, 37.0, 36.0, 25.0, 22.0, 18.0, 27.0, 10.0, 17.0, 17.0, 9.0, 11.0, 3.0, 5.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.185546875, -3.0927734375, -3.0, -2.9072265625, -2.814453125, -2.7216796875, -2.62890625, -2.5361328125, -2.443359375, -2.3505859375, -2.2578125, -2.1650390625, -2.072265625, -1.9794921875, -1.88671875, -1.7939453125, -1.701171875, -1.6083984375, -1.515625, -1.4228515625, -1.330078125, -1.2373046875, -1.14453125, -1.0517578125, -0.958984375, -0.8662109375, -0.7734375, -0.6806640625, -0.587890625, -0.4951171875, -0.40234375, -0.3095703125, -0.216796875, -0.1240234375, -0.03125, 0.0615234375, 0.154296875, 0.2470703125, 0.33984375, 0.4326171875, 0.525390625, 0.6181640625, 0.7109375, 0.8037109375, 0.896484375, 0.9892578125, 1.08203125, 1.1748046875, 1.267578125, 1.3603515625, 1.453125, 1.5458984375, 1.638671875, 1.7314453125, 1.82421875, 1.9169921875, 2.009765625, 2.1025390625, 2.1953125, 2.2880859375, 2.380859375, 2.4736328125, 2.56640625, 2.6591796875, 2.751953125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 11.0, 14.0, 24.0, 31.0, 36.0, 60.0, 107.0, 166.0, 226.0, 402.0, 591.0, 990.0, 1864.0, 3210.0, 6592.0, 14302.0, 36480.0, 140476.0, 611666.0, 161088.0, 39848.0, 15358.0, 6867.0, 3394.0, 1921.0, 1069.0, 631.0, 403.0, 260.0, 154.0, 97.0, 64.0, 41.0, 39.0, 19.0, 18.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.82489013671875, -4.6810302734375, -4.53717041015625, -4.393310546875, -4.24945068359375, -4.1055908203125, -3.96173095703125, -3.81787109375, -3.67401123046875, -3.5301513671875, -3.38629150390625, -3.242431640625, -3.09857177734375, -2.9547119140625, -2.81085205078125, -2.6669921875, -2.52313232421875, -2.3792724609375, -2.23541259765625, -2.091552734375, -1.94769287109375, -1.8038330078125, -1.65997314453125, -1.51611328125, -1.37225341796875, -1.2283935546875, -1.08453369140625, -0.940673828125, -0.79681396484375, -0.6529541015625, -0.50909423828125, -0.365234375, -0.22137451171875, -0.0775146484375, 0.06634521484375, 0.210205078125, 0.35406494140625, 0.4979248046875, 0.64178466796875, 0.78564453125, 0.92950439453125, 1.0733642578125, 1.21722412109375, 1.361083984375, 1.50494384765625, 1.6488037109375, 1.79266357421875, 1.9365234375, 2.08038330078125, 2.2242431640625, 2.36810302734375, 2.511962890625, 2.65582275390625, 2.7996826171875, 2.94354248046875, 3.08740234375, 3.23126220703125, 3.3751220703125, 3.51898193359375, 3.662841796875, 3.80670166015625, 3.9505615234375, 4.09442138671875, 4.23828125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 8.0, 8.0, 10.0, 15.0, 18.0, 17.0, 25.0, 39.0, 31.0, 38.0, 43.0, 36.0, 46.0, 53.0, 99.0, 197.0, 1698.0, 172.0, 79.0, 65.0, 49.0, 48.0, 33.0, 40.0, 24.0, 28.0, 29.0, 16.0, 13.0, 9.0, 12.0, 12.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7109375, -11.3265380859375, -10.942138671875, -10.5577392578125, -10.17333984375, -9.7889404296875, -9.404541015625, -9.0201416015625, -8.6357421875, -8.2513427734375, -7.866943359375, -7.4825439453125, -7.09814453125, -6.7137451171875, -6.329345703125, -5.9449462890625, -5.560546875, -5.1761474609375, -4.791748046875, -4.4073486328125, -4.02294921875, -3.6385498046875, -3.254150390625, -2.8697509765625, -2.4853515625, -2.1009521484375, -1.716552734375, -1.3321533203125, -0.94775390625, -0.5633544921875, -0.178955078125, 0.2054443359375, 0.58984375, 0.9742431640625, 1.358642578125, 1.7430419921875, 2.12744140625, 2.5118408203125, 2.896240234375, 3.2806396484375, 3.6650390625, 4.0494384765625, 4.433837890625, 4.8182373046875, 5.20263671875, 5.5870361328125, 5.971435546875, 6.3558349609375, 6.740234375, 7.1246337890625, 7.509033203125, 7.8934326171875, 8.27783203125, 8.6622314453125, 9.046630859375, 9.4310302734375, 9.8154296875, 10.1998291015625, 10.584228515625, 10.9686279296875, 11.35302734375, 11.7374267578125, 12.121826171875, 12.5062255859375, 12.890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 6.0, 10.0, 13.0, 11.0, 16.0, 16.0, 28.0, 30.0, 49.0, 64.0, 99.0, 136.0, 289.0, 566.0, 1308.0, 4736.0, 31559.0, 1162314.0, 1900350.0, 35809.0, 5369.0, 1496.0, 580.0, 256.0, 163.0, 96.0, 64.0, 44.0, 40.0, 31.0, 29.0, 22.0, 21.0, 7.0, 12.0, 11.0, 7.0, 11.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.171875, -15.61474609375, -15.0576171875, -14.50048828125, -13.943359375, -13.38623046875, -12.8291015625, -12.27197265625, -11.71484375, -11.15771484375, -10.6005859375, -10.04345703125, -9.486328125, -8.92919921875, -8.3720703125, -7.81494140625, -7.2578125, -6.70068359375, -6.1435546875, -5.58642578125, -5.029296875, -4.47216796875, -3.9150390625, -3.35791015625, -2.80078125, -2.24365234375, -1.6865234375, -1.12939453125, -0.572265625, -0.01513671875, 0.5419921875, 1.09912109375, 1.65625, 2.21337890625, 2.7705078125, 3.32763671875, 3.884765625, 4.44189453125, 4.9990234375, 5.55615234375, 6.11328125, 6.67041015625, 7.2275390625, 7.78466796875, 8.341796875, 8.89892578125, 9.4560546875, 10.01318359375, 10.5703125, 11.12744140625, 11.6845703125, 12.24169921875, 12.798828125, 13.35595703125, 13.9130859375, 14.47021484375, 15.02734375, 15.58447265625, 16.1416015625, 16.69873046875, 17.255859375, 17.81298828125, 18.3701171875, 18.92724609375, 19.484375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 13.0, 49.0, 113.0, 221.0, 279.0, 189.0, 87.0, 45.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.557430267333984, -58.18539810180664, -56.8133659362793, -55.44133758544922, -54.069305419921875, -52.69727325439453, -51.32524108886719, -49.953208923339844, -48.5811767578125, -47.209144592285156, -45.83711242675781, -44.46508026123047, -43.09305191040039, -41.72101974487305, -40.3489875793457, -38.97695541381836, -37.60492706298828, -36.23289489746094, -34.860862731933594, -33.48883056640625, -32.11680221557617, -30.744770050048828, -29.372737884521484, -28.00070571899414, -26.62867546081543, -25.256643295288086, -23.884613037109375, -22.51258087158203, -21.140548706054688, -19.768518447875977, -18.396486282348633, -17.024456024169922, -15.652423858642578, -14.28039264678955, -12.908361434936523, -11.53632926940918, -10.164298057556152, -8.792266845703125, -7.420234680175781, -6.048203468322754, -4.676172256469727, -3.30414080619812, -1.9321093559265137, -0.5600776672363281, 0.8119535446166992, 2.1839847564697266, 3.5560169219970703, 4.928048133850098, 6.300079345703125, 7.672110557556152, 9.04414176940918, 10.416173934936523, 11.78820514678955, 13.160236358642578, 14.532268524169922, 15.90429973602295, 17.276330947875977, 18.64836311340332, 20.02039337158203, 21.392425537109375, 22.76445770263672, 24.13648796081543, 25.508520126342773, 26.880550384521484, 28.252582550048828]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 9.0, 5.0, 16.0, 9.0, 16.0, 23.0, 13.0, 15.0, 17.0, 20.0, 22.0, 31.0, 37.0, 35.0, 35.0, 41.0, 46.0, 40.0, 44.0, 40.0, 45.0, 39.0, 43.0, 34.0, 45.0, 29.0, 32.0, 29.0, 31.0, 27.0, 25.0, 17.0, 11.0, 14.0, 10.0, 8.0, 10.0, 10.0, 8.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.66447830200195, -35.542518615722656, -34.420562744140625, -33.29860305786133, -32.17664337158203, -31.054683685302734, -29.93272590637207, -28.810768127441406, -27.68880844116211, -26.566848754882812, -25.44489097595215, -24.322933197021484, -23.200973510742188, -22.07901382446289, -20.957056045532227, -19.835098266601562, -18.713138580322266, -17.59117889404297, -16.469221115112305, -15.347262382507324, -14.225303649902344, -13.103344917297363, -11.981386184692383, -10.859427452087402, -9.737468719482422, -8.615509986877441, -7.493551254272461, -6.3715925216674805, -5.2496337890625, -4.1276750564575195, -3.005716323852539, -1.8837575912475586, -0.7618026733398438, 0.3601560592651367, 1.4821147918701172, 2.6040735244750977, 3.726032257080078, 4.847990989685059, 5.969949722290039, 7.0919084548950195, 8.2138671875, 9.33582592010498, 10.457784652709961, 11.579743385314941, 12.701702117919922, 13.823660850524902, 14.945619583129883, 16.067577362060547, 17.189537048339844, 18.31149673461914, 19.433454513549805, 20.55541229248047, 21.677371978759766, 22.799331665039062, 23.921289443969727, 25.04324722290039, 26.165206909179688, 27.287166595458984, 28.40912437438965, 29.531082153320312, 30.65304183959961, 31.775001525878906, 32.89695739746094, 34.018917083740234, 35.14087677001953]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 13.0, 4.0, 9.0, 13.0, 13.0, 18.0, 18.0, 24.0, 32.0, 30.0, 38.0, 34.0, 31.0, 38.0, 40.0, 37.0, 54.0, 38.0, 40.0, 26.0, 44.0, 39.0, 50.0, 41.0, 29.0, 37.0, 26.0, 38.0, 24.0, 19.0, 20.0, 13.0, 13.0, 9.0, 10.0, 11.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.21588134765625, -3.1153564453125, -3.01483154296875, -2.914306640625, -2.81378173828125, -2.7132568359375, -2.61273193359375, -2.51220703125, -2.41168212890625, -2.3111572265625, -2.21063232421875, -2.110107421875, -2.00958251953125, -1.9090576171875, -1.80853271484375, -1.7080078125, -1.60748291015625, -1.5069580078125, -1.40643310546875, -1.305908203125, -1.20538330078125, -1.1048583984375, -1.00433349609375, -0.90380859375, -0.80328369140625, -0.7027587890625, -0.60223388671875, -0.501708984375, -0.40118408203125, -0.3006591796875, -0.20013427734375, -0.099609375, 0.00091552734375, 0.1014404296875, 0.20196533203125, 0.302490234375, 0.40301513671875, 0.5035400390625, 0.60406494140625, 0.70458984375, 0.80511474609375, 0.9056396484375, 1.00616455078125, 1.106689453125, 1.20721435546875, 1.3077392578125, 1.40826416015625, 1.5087890625, 1.60931396484375, 1.7098388671875, 1.81036376953125, 1.910888671875, 2.01141357421875, 2.1119384765625, 2.21246337890625, 2.31298828125, 2.41351318359375, 2.5140380859375, 2.61456298828125, 2.715087890625, 2.81561279296875, 2.9161376953125, 3.01666259765625, 3.1171875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 5.0, 7.0, 5.0, 12.0, 11.0, 17.0, 24.0, 25.0, 30.0, 29.0, 43.0, 55.0, 86.0, 144.0, 216.0, 343.0, 964.0, 3053.0, 14913.0, 95836.0, 1242917.0, 2601142.0, 200004.0, 26793.0, 5076.0, 1297.0, 464.0, 225.0, 150.0, 84.0, 64.0, 49.0, 52.0, 27.0, 26.0, 21.0, 12.0, 7.0, 13.0, 13.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.6572265625, -11.283203125, -10.9091796875, -10.53515625, -10.1611328125, -9.787109375, -9.4130859375, -9.0390625, -8.6650390625, -8.291015625, -7.9169921875, -7.54296875, -7.1689453125, -6.794921875, -6.4208984375, -6.046875, -5.6728515625, -5.298828125, -4.9248046875, -4.55078125, -4.1767578125, -3.802734375, -3.4287109375, -3.0546875, -2.6806640625, -2.306640625, -1.9326171875, -1.55859375, -1.1845703125, -0.810546875, -0.4365234375, -0.0625, 0.3115234375, 0.685546875, 1.0595703125, 1.43359375, 1.8076171875, 2.181640625, 2.5556640625, 2.9296875, 3.3037109375, 3.677734375, 4.0517578125, 4.42578125, 4.7998046875, 5.173828125, 5.5478515625, 5.921875, 6.2958984375, 6.669921875, 7.0439453125, 7.41796875, 7.7919921875, 8.166015625, 8.5400390625, 8.9140625, 9.2880859375, 9.662109375, 10.0361328125, 10.41015625, 10.7841796875, 11.158203125, 11.5322265625, 11.90625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 7.0, 17.0, 19.0, 25.0, 33.0, 35.0, 48.0, 65.0, 88.0, 137.0, 172.0, 218.0, 282.0, 343.0, 438.0, 444.0, 391.0, 284.0, 292.0, 194.0, 128.0, 98.0, 73.0, 71.0, 39.0, 45.0, 19.0, 14.0, 8.0, 13.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.1605224609375, -7.899169921875, -7.6378173828125, -7.37646484375, -7.1151123046875, -6.853759765625, -6.5924072265625, -6.3310546875, -6.0697021484375, -5.808349609375, -5.5469970703125, -5.28564453125, -5.0242919921875, -4.762939453125, -4.5015869140625, -4.240234375, -3.9788818359375, -3.717529296875, -3.4561767578125, -3.19482421875, -2.9334716796875, -2.672119140625, -2.4107666015625, -2.1494140625, -1.8880615234375, -1.626708984375, -1.3653564453125, -1.10400390625, -0.8426513671875, -0.581298828125, -0.3199462890625, -0.05859375, 0.2027587890625, 0.464111328125, 0.7254638671875, 0.98681640625, 1.2481689453125, 1.509521484375, 1.7708740234375, 2.0322265625, 2.2935791015625, 2.554931640625, 2.8162841796875, 3.07763671875, 3.3389892578125, 3.600341796875, 3.8616943359375, 4.123046875, 4.3843994140625, 4.645751953125, 4.9071044921875, 5.16845703125, 5.4298095703125, 5.691162109375, 5.9525146484375, 6.2138671875, 6.4752197265625, 6.736572265625, 6.9979248046875, 7.25927734375, 7.5206298828125, 7.781982421875, 8.0433349609375, 8.3046875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 8.0, 6.0, 16.0, 31.0, 42.0, 50.0, 92.0, 160.0, 304.0, 561.0, 1344.0, 4228.0, 20197.0, 139482.0, 1596484.0, 2210729.0, 186693.0, 25690.0, 5237.0, 1568.0, 597.0, 281.0, 161.0, 121.0, 74.0, 35.0, 21.0, 19.0, 10.0, 12.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.234375, -20.611083984375, -19.98779296875, -19.364501953125, -18.7412109375, -18.117919921875, -17.49462890625, -16.871337890625, -16.248046875, -15.624755859375, -15.00146484375, -14.378173828125, -13.7548828125, -13.131591796875, -12.50830078125, -11.885009765625, -11.26171875, -10.638427734375, -10.01513671875, -9.391845703125, -8.7685546875, -8.145263671875, -7.52197265625, -6.898681640625, -6.275390625, -5.652099609375, -5.02880859375, -4.405517578125, -3.7822265625, -3.158935546875, -2.53564453125, -1.912353515625, -1.2890625, -0.665771484375, -0.04248046875, 0.580810546875, 1.2041015625, 1.827392578125, 2.45068359375, 3.073974609375, 3.697265625, 4.320556640625, 4.94384765625, 5.567138671875, 6.1904296875, 6.813720703125, 7.43701171875, 8.060302734375, 8.68359375, 9.306884765625, 9.93017578125, 10.553466796875, 11.1767578125, 11.800048828125, 12.42333984375, 13.046630859375, 13.669921875, 14.293212890625, 14.91650390625, 15.539794921875, 16.1630859375, 16.786376953125, 17.40966796875, 18.032958984375, 18.65625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 37.0, 70.0, 135.0, 217.0, 197.0, 175.0, 96.0, 47.0, 14.0, 9.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.51852416992188, -134.54905700683594, -131.57958984375, -128.61012268066406, -125.6406478881836, -122.67118072509766, -119.70171356201172, -116.73223876953125, -113.76277160644531, -110.79330444335938, -107.82383728027344, -104.85436248779297, -101.88489532470703, -98.9154281616211, -95.94596099853516, -92.97648620605469, -90.00701904296875, -87.03755187988281, -84.06808471679688, -81.0986099243164, -78.12914276123047, -75.15967559814453, -72.1902084350586, -69.22073364257812, -66.25127410888672, -63.28180694580078, -60.31233596801758, -57.34286880493164, -54.37339782714844, -51.4039306640625, -48.43446350097656, -45.46499252319336, -42.49551773071289, -39.52605056762695, -36.55657958984375, -33.58711242675781, -30.61764144897461, -27.648174285888672, -24.6787052154541, -21.70923614501953, -18.73976707458496, -15.77029800415039, -12.80082893371582, -9.831360816955566, -6.861891746520996, -3.892422676086426, -0.9229545593261719, 2.0465145111083984, 5.015983581542969, 7.985452651977539, 10.95492172241211, 13.924389839172363, 16.89385986328125, 19.863327026367188, 22.832796096801758, 25.802265167236328, 28.7717342376709, 31.74120330810547, 34.710670471191406, 37.68014144897461, 40.64960861206055, 43.61907958984375, 46.58854675292969, 49.558013916015625, 52.52748489379883]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 7.0, 5.0, 7.0, 13.0, 8.0, 19.0, 15.0, 21.0, 23.0, 20.0, 22.0, 27.0, 28.0, 42.0, 42.0, 36.0, 35.0, 38.0, 43.0, 43.0, 44.0, 36.0, 38.0, 29.0, 36.0, 34.0, 36.0, 27.0, 30.0, 19.0, 22.0, 22.0, 22.0, 21.0, 22.0, 14.0, 8.0, 13.0, 6.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.095977783203125, -29.192276000976562, -28.28857421875, -27.38487434387207, -26.481172561645508, -25.577470779418945, -24.673770904541016, -23.770069122314453, -22.86636734008789, -21.962665557861328, -21.058963775634766, -20.155263900756836, -19.251562118530273, -18.34786033630371, -17.44416046142578, -16.54045867919922, -15.636756896972656, -14.733055114746094, -13.829354286193848, -12.925653457641602, -12.021951675415039, -11.118249893188477, -10.21454906463623, -9.310848236083984, -8.407146453857422, -7.503445148468018, -6.599743843078613, -5.696042537689209, -4.792341232299805, -3.8886399269104004, -2.984938621520996, -2.081237316131592, -1.1775360107421875, -0.2738347053527832, 0.6298666000366211, 1.5335679054260254, 2.4372692108154297, 3.340970516204834, 4.244671821594238, 5.148373126983643, 6.052074432373047, 6.955775737762451, 7.8594770431518555, 8.763177871704102, 9.666879653930664, 10.570581436157227, 11.474282264709473, 12.377983093261719, 13.281684875488281, 14.185386657714844, 15.08908748626709, 15.992788314819336, 16.8964900970459, 17.80019187927246, 18.70389175415039, 19.607593536376953, 20.511295318603516, 21.414997100830078, 22.31869888305664, 23.22239875793457, 24.126100540161133, 25.029802322387695, 25.933502197265625, 26.837203979492188, 27.74090576171875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 6.0, 3.0, 4.0, 9.0, 4.0, 7.0, 15.0, 14.0, 22.0, 19.0, 24.0, 17.0, 31.0, 27.0, 34.0, 36.0, 36.0, 37.0, 44.0, 36.0, 48.0, 47.0, 34.0, 41.0, 52.0, 32.0, 43.0, 34.0, 32.0, 34.0, 22.0, 27.0, 25.0, 22.0, 15.0, 22.0, 9.0, 5.0, 6.0, 7.0, 6.0, 3.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.599609375, -3.494842529296875, -3.39007568359375, -3.285308837890625, -3.1805419921875, -3.075775146484375, -2.97100830078125, -2.866241455078125, -2.761474609375, -2.656707763671875, -2.55194091796875, -2.447174072265625, -2.3424072265625, -2.237640380859375, -2.13287353515625, -2.028106689453125, -1.92333984375, -1.818572998046875, -1.71380615234375, -1.609039306640625, -1.5042724609375, -1.399505615234375, -1.29473876953125, -1.189971923828125, -1.085205078125, -0.980438232421875, -0.87567138671875, -0.770904541015625, -0.6661376953125, -0.561370849609375, -0.45660400390625, -0.351837158203125, -0.2470703125, -0.142303466796875, -0.03753662109375, 0.067230224609375, 0.1719970703125, 0.276763916015625, 0.38153076171875, 0.486297607421875, 0.591064453125, 0.695831298828125, 0.80059814453125, 0.905364990234375, 1.0101318359375, 1.114898681640625, 1.21966552734375, 1.324432373046875, 1.42919921875, 1.533966064453125, 1.63873291015625, 1.743499755859375, 1.8482666015625, 1.953033447265625, 2.05780029296875, 2.162567138671875, 2.267333984375, 2.372100830078125, 2.47686767578125, 2.581634521484375, 2.6864013671875, 2.791168212890625, 2.89593505859375, 3.000701904296875, 3.10546875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 16.0, 19.0, 20.0, 43.0, 61.0, 93.0, 127.0, 200.0, 311.0, 448.0, 716.0, 1048.0, 1621.0, 2542.0, 4080.0, 6480.0, 10753.0, 18066.0, 32007.0, 61538.0, 130230.0, 268352.0, 255347.0, 121186.0, 58071.0, 30533.0, 17135.0, 10352.0, 6174.0, 3937.0, 2472.0, 1596.0, 1031.0, 658.0, 436.0, 267.0, 196.0, 118.0, 91.0, 64.0, 35.0, 26.0, 18.0, 9.0, 6.0, 10.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.350128173828125, -0.33843994140625, -0.326751708984375, -0.3150634765625, -0.303375244140625, -0.29168701171875, -0.279998779296875, -0.268310546875, -0.256622314453125, -0.24493408203125, -0.233245849609375, -0.2215576171875, -0.209869384765625, -0.19818115234375, -0.186492919921875, -0.1748046875, -0.163116455078125, -0.15142822265625, -0.139739990234375, -0.1280517578125, -0.116363525390625, -0.10467529296875, -0.092987060546875, -0.081298828125, -0.069610595703125, -0.05792236328125, -0.046234130859375, -0.0345458984375, -0.022857666015625, -0.01116943359375, 0.000518798828125, 0.01220703125, 0.023895263671875, 0.03558349609375, 0.047271728515625, 0.0589599609375, 0.070648193359375, 0.08233642578125, 0.094024658203125, 0.105712890625, 0.117401123046875, 0.12908935546875, 0.140777587890625, 0.1524658203125, 0.164154052734375, 0.17584228515625, 0.187530517578125, 0.19921875, 0.210906982421875, 0.22259521484375, 0.234283447265625, 0.2459716796875, 0.257659912109375, 0.26934814453125, 0.281036376953125, 0.292724609375, 0.304412841796875, 0.31610107421875, 0.327789306640625, 0.3394775390625, 0.351165771484375, 0.36285400390625, 0.374542236328125, 0.38623046875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 5.0, 14.0, 8.0, 9.0, 15.0, 18.0, 11.0, 22.0, 21.0, 28.0, 32.0, 31.0, 34.0, 36.0, 35.0, 34.0, 33.0, 46.0, 44.0, 1083.0, 32.0, 44.0, 37.0, 35.0, 33.0, 27.0, 32.0, 26.0, 17.0, 22.0, 30.0, 10.0, 16.0, 13.0, 13.0, 6.0, 15.0, 10.0, 9.0, 10.0, 11.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.064453125, -2.00067138671875, -1.9368896484375, -1.87310791015625, -1.809326171875, -1.74554443359375, -1.6817626953125, -1.61798095703125, -1.55419921875, -1.49041748046875, -1.4266357421875, -1.36285400390625, -1.299072265625, -1.23529052734375, -1.1715087890625, -1.10772705078125, -1.0439453125, -0.98016357421875, -0.9163818359375, -0.85260009765625, -0.788818359375, -0.72503662109375, -0.6612548828125, -0.59747314453125, -0.53369140625, -0.46990966796875, -0.4061279296875, -0.34234619140625, -0.278564453125, -0.21478271484375, -0.1510009765625, -0.08721923828125, -0.0234375, 0.04034423828125, 0.1041259765625, 0.16790771484375, 0.231689453125, 0.29547119140625, 0.3592529296875, 0.42303466796875, 0.48681640625, 0.55059814453125, 0.6143798828125, 0.67816162109375, 0.741943359375, 0.80572509765625, 0.8695068359375, 0.93328857421875, 0.9970703125, 1.06085205078125, 1.1246337890625, 1.18841552734375, 1.252197265625, 1.31597900390625, 1.3797607421875, 1.44354248046875, 1.50732421875, 1.57110595703125, 1.6348876953125, 1.69866943359375, 1.762451171875, 1.82623291015625, 1.8900146484375, 1.95379638671875, 2.017578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 8.0, 14.0, 26.0, 24.0, 36.0, 49.0, 71.0, 102.0, 156.0, 276.0, 423.0, 687.0, 1105.0, 1800.0, 3155.0, 5546.0, 9607.0, 16902.0, 30202.0, 55519.0, 100959.0, 179390.0, 1288066.0, 177950.0, 100362.0, 54763.0, 30310.0, 16793.0, 9348.0, 5450.0, 3253.0, 1811.0, 1105.0, 653.0, 412.0, 262.0, 167.0, 97.0, 78.0, 67.0, 35.0, 24.0, 20.0, 9.0, 10.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2012939453125, -0.19469261169433594, -0.18809127807617188, -0.1814899444580078, -0.17488861083984375, -0.1682872772216797, -0.16168594360351562, -0.15508460998535156, -0.1484832763671875, -0.14188194274902344, -0.13528060913085938, -0.1286792755126953, -0.12207794189453125, -0.11547660827636719, -0.10887527465820312, -0.10227394104003906, -0.095672607421875, -0.08907127380371094, -0.08246994018554688, -0.07586860656738281, -0.06926727294921875, -0.06266593933105469, -0.056064605712890625, -0.04946327209472656, -0.0428619384765625, -0.03626060485839844, -0.029659271240234375, -0.023057937622070312, -0.01645660400390625, -0.009855270385742188, -0.003253936767578125, 0.0033473968505859375, 0.00994873046875, 0.016550064086914062, 0.023151397705078125, 0.029752731323242188, 0.03635406494140625, 0.04295539855957031, 0.049556732177734375, 0.05615806579589844, 0.0627593994140625, 0.06936073303222656, 0.07596206665039062, 0.08256340026855469, 0.08916473388671875, 0.09576606750488281, 0.10236740112304688, 0.10896873474121094, 0.115570068359375, 0.12217140197753906, 0.12877273559570312, 0.1353740692138672, 0.14197540283203125, 0.1485767364501953, 0.15517807006835938, 0.16177940368652344, 0.1683807373046875, 0.17498207092285156, 0.18158340454101562, 0.1881847381591797, 0.19478607177734375, 0.2013874053955078, 0.20798873901367188, 0.21459007263183594, 0.22119140625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 7.0, 5.0, 9.0, 10.0, 13.0, 12.0, 25.0, 25.0, 54.0, 79.0, 135.0, 184.0, 140.0, 78.0, 56.0, 23.0, 22.0, 21.0, 11.0, 11.0, 12.0, 7.0, 4.0, 3.0, 10.0, 2.0, 2.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0021457672119140625, -0.0020547211170196533, -0.001963675022125244, -0.001872628927230835, -0.0017815828323364258, -0.0016905367374420166, -0.0015994906425476074, -0.0015084445476531982, -0.001417398452758789, -0.0013263523578643799, -0.0012353062629699707, -0.0011442601680755615, -0.0010532140731811523, -0.0009621679782867432, -0.000871121883392334, -0.0007800757884979248, -0.0006890296936035156, -0.0005979835987091064, -0.0005069375038146973, -0.0004158914089202881, -0.0003248453140258789, -0.00023379921913146973, -0.00014275312423706055, -5.170702934265137e-05, 3.933906555175781e-05, 0.000130385160446167, 0.00022143125534057617, 0.00031247735023498535, 0.00040352344512939453, 0.0004945695400238037, 0.0005856156349182129, 0.0006766617298126221, 0.0007677078247070312, 0.0008587539196014404, 0.0009498000144958496, 0.0010408461093902588, 0.001131892204284668, 0.0012229382991790771, 0.0013139843940734863, 0.0014050304889678955, 0.0014960765838623047, 0.0015871226787567139, 0.001678168773651123, 0.0017692148685455322, 0.0018602609634399414, 0.0019513070583343506, 0.0020423531532287598, 0.002133399248123169, 0.002224445343017578, 0.0023154914379119873, 0.0024065375328063965, 0.0024975836277008057, 0.002588629722595215, 0.002679675817489624, 0.002770721912384033, 0.0028617680072784424, 0.0029528141021728516, 0.0030438601970672607, 0.00313490629196167, 0.003225952386856079, 0.0033169984817504883, 0.0034080445766448975, 0.0034990906715393066, 0.003590136766433716, 0.003681182861328125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 7.0, 10.0, 15.0, 19.0, 15.0, 25.0, 32.0, 40.0, 59.0, 79.0, 100.0, 166.0, 398.0, 2016.0, 30921.0, 972549.0, 38813.0, 2231.0, 429.0, 176.0, 99.0, 71.0, 52.0, 37.0, 43.0, 26.0, 30.0, 19.0, 17.0, 12.0, 8.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.04718017578125, -0.045683860778808594, -0.04418754577636719, -0.04269123077392578, -0.041194915771484375, -0.03969860076904297, -0.03820228576660156, -0.036705970764160156, -0.03520965576171875, -0.033713340759277344, -0.03221702575683594, -0.03072071075439453, -0.029224395751953125, -0.02772808074951172, -0.026231765747070312, -0.024735450744628906, -0.0232391357421875, -0.021742820739746094, -0.020246505737304688, -0.01875019073486328, -0.017253875732421875, -0.01575756072998047, -0.014261245727539062, -0.012764930725097656, -0.01126861572265625, -0.009772300720214844, -0.008275985717773438, -0.006779670715332031, -0.005283355712890625, -0.0037870407104492188, -0.0022907257080078125, -0.0007944107055664062, 0.000701904296875, 0.0021982192993164062, 0.0036945343017578125, 0.005190849304199219, 0.006687164306640625, 0.008183479309082031, 0.009679794311523438, 0.011176109313964844, 0.01267242431640625, 0.014168739318847656, 0.015665054321289062, 0.01716136932373047, 0.018657684326171875, 0.02015399932861328, 0.021650314331054688, 0.023146629333496094, 0.0246429443359375, 0.026139259338378906, 0.027635574340820312, 0.02913188934326172, 0.030628204345703125, 0.03212451934814453, 0.03362083435058594, 0.035117149353027344, 0.03661346435546875, 0.038109779357910156, 0.03960609436035156, 0.04110240936279297, 0.042598724365234375, 0.04409503936767578, 0.04559135437011719, 0.047087669372558594, 0.048583984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 41.0, 154.0, 635.0, 135.0, 33.0, 9.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004613604862242937, -0.004061953630298376, -0.0035103026311844587, -0.0029586516320705414, -0.0024070004001259804, -0.0018553491681814194, -0.001303698169067502, -0.0007520471699535847, -0.00020039593800902367, 0.0003512551775202155, 0.0009029062930494547, 0.0014545574085786939, 0.002006208524107933, 0.002557859756052494, 0.0031095107551664114, 0.0036611617542803288, 0.00421281298622489, 0.004764464218169451, 0.0053161149844527245, 0.0058677662163972855, 0.0064194174483418465, 0.0069710686802864075, 0.0075227199122309685, 0.00807437114417553, 0.008626021444797516, 0.009177672676742077, 0.009729323908686638, 0.010280975140631199, 0.01083262637257576, 0.011384276673197746, 0.011935927905142307, 0.012487579137086868, 0.013039231300354004, 0.013590882532298565, 0.014142533764243126, 0.014694184996187687, 0.015245836228132248, 0.015797486528754234, 0.01634913869202137, 0.016900788992643356, 0.017452441155910492, 0.01800409145653248, 0.018555743619799614, 0.0191073939204216, 0.019659046083688736, 0.020210696384310722, 0.020762348547577858, 0.021313998848199844, 0.02186564914882183, 0.022417299449443817, 0.022968951612710953, 0.02352060191333294, 0.024072254076600075, 0.02462390437722206, 0.025175556540489197, 0.025727206841111183, 0.02627885714173317, 0.026830507442355156, 0.02738215960562229, 0.027933809906244278, 0.028485462069511414, 0.0290371123701334, 0.029588764533400536, 0.030140414834022522, 0.030692066997289658]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 9.0, 11.0, 9.0, 15.0, 13.0, 26.0, 27.0, 28.0, 34.0, 35.0, 33.0, 28.0, 58.0, 44.0, 46.0, 47.0, 39.0, 70.0, 58.0, 58.0, 46.0, 43.0, 35.0, 36.0, 25.0, 30.0, 18.0, 17.0, 14.0, 10.0, 9.0, 7.0, 11.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0026468634605407715, -0.002573644742369652, -0.002500426024198532, -0.0024272073060274124, -0.0023539885878562927, -0.002280769869685173, -0.0022075511515140533, -0.0021343324333429337, -0.002061113715171814, -0.0019878949970006943, -0.0019146762788295746, -0.001841457560658455, -0.0017682388424873352, -0.0016950201243162155, -0.0016218014061450958, -0.0015485826879739761, -0.0014753639698028564, -0.0014021452516317368, -0.001328926533460617, -0.0012557078152894974, -0.0011824890971183777, -0.001109270378947258, -0.0010360516607761383, -0.0009628329426050186, -0.0008896142244338989, -0.0008163955062627792, -0.0007431767880916595, -0.0006699580699205399, -0.0005967393517494202, -0.0005235206335783005, -0.0004503019154071808, -0.0003770831972360611, -0.0003038644790649414, -0.00023064576089382172, -0.00015742704272270203, -8.420832455158234e-05, -1.0989606380462646e-05, 6.222911179065704e-05, 0.00013544782996177673, 0.00020866654813289642, 0.0002818852663040161, 0.0003551039844751358, 0.0004283227026462555, 0.0005015414208173752, 0.0005747601389884949, 0.0006479788571596146, 0.0007211975753307343, 0.0007944162935018539, 0.0008676350116729736, 0.0009408537298440933, 0.001014072448015213, 0.0010872911661863327, 0.0011605098843574524, 0.001233728602528572, 0.0013069473206996918, 0.0013801660388708115, 0.0014533847570419312, 0.0015266034752130508, 0.0015998221933841705, 0.0016730409115552902, 0.00174625962972641, 0.0018194783478975296, 0.0018926970660686493, 0.001965915784239769, 0.0020391345024108887]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 6.0, 3.0, 4.0, 9.0, 4.0, 7.0, 15.0, 14.0, 22.0, 19.0, 24.0, 17.0, 31.0, 27.0, 34.0, 36.0, 36.0, 37.0, 44.0, 36.0, 48.0, 47.0, 34.0, 41.0, 52.0, 32.0, 43.0, 34.0, 32.0, 34.0, 22.0, 27.0, 25.0, 22.0, 15.0, 22.0, 9.0, 5.0, 6.0, 7.0, 6.0, 3.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.599609375, -3.494842529296875, -3.39007568359375, -3.285308837890625, -3.1805419921875, -3.075775146484375, -2.97100830078125, -2.866241455078125, -2.761474609375, -2.656707763671875, -2.55194091796875, -2.447174072265625, -2.3424072265625, -2.237640380859375, -2.13287353515625, -2.028106689453125, -1.92333984375, -1.818572998046875, -1.71380615234375, -1.609039306640625, -1.5042724609375, -1.399505615234375, -1.29473876953125, -1.189971923828125, -1.085205078125, -0.980438232421875, -0.87567138671875, -0.770904541015625, -0.6661376953125, -0.561370849609375, -0.45660400390625, -0.351837158203125, -0.2470703125, -0.142303466796875, -0.03753662109375, 0.067230224609375, 0.1719970703125, 0.276763916015625, 0.38153076171875, 0.486297607421875, 0.591064453125, 0.695831298828125, 0.80059814453125, 0.905364990234375, 1.0101318359375, 1.114898681640625, 1.21966552734375, 1.324432373046875, 1.42919921875, 1.533966064453125, 1.63873291015625, 1.743499755859375, 1.8482666015625, 1.953033447265625, 2.05780029296875, 2.162567138671875, 2.267333984375, 2.372100830078125, 2.47686767578125, 2.581634521484375, 2.6864013671875, 2.791168212890625, 2.89593505859375, 3.000701904296875, 3.10546875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 6.0, 10.0, 20.0, 31.0, 28.0, 39.0, 57.0, 103.0, 135.0, 200.0, 383.0, 523.0, 930.0, 1491.0, 2521.0, 4573.0, 8152.0, 15329.0, 31350.0, 78173.0, 277007.0, 426897.0, 116368.0, 41450.0, 19289.0, 10044.0, 5535.0, 3174.0, 1727.0, 1061.0, 691.0, 408.0, 257.0, 178.0, 112.0, 85.0, 51.0, 43.0, 33.0, 25.0, 13.0, 12.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-3.009765625, -2.9241943359375, -2.838623046875, -2.7530517578125, -2.66748046875, -2.5819091796875, -2.496337890625, -2.4107666015625, -2.3251953125, -2.2396240234375, -2.154052734375, -2.0684814453125, -1.98291015625, -1.8973388671875, -1.811767578125, -1.7261962890625, -1.640625, -1.5550537109375, -1.469482421875, -1.3839111328125, -1.29833984375, -1.2127685546875, -1.127197265625, -1.0416259765625, -0.9560546875, -0.8704833984375, -0.784912109375, -0.6993408203125, -0.61376953125, -0.5281982421875, -0.442626953125, -0.3570556640625, -0.271484375, -0.1859130859375, -0.100341796875, -0.0147705078125, 0.07080078125, 0.1563720703125, 0.241943359375, 0.3275146484375, 0.4130859375, 0.4986572265625, 0.584228515625, 0.6697998046875, 0.75537109375, 0.8409423828125, 0.926513671875, 1.0120849609375, 1.09765625, 1.1832275390625, 1.268798828125, 1.3543701171875, 1.43994140625, 1.5255126953125, 1.611083984375, 1.6966552734375, 1.7822265625, 1.8677978515625, 1.953369140625, 2.0389404296875, 2.12451171875, 2.2100830078125, 2.295654296875, 2.3812255859375, 2.466796875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 5.0, 14.0, 14.0, 4.0, 14.0, 16.0, 19.0, 23.0, 33.0, 28.0, 23.0, 25.0, 35.0, 51.0, 48.0, 55.0, 65.0, 117.0, 1572.0, 335.0, 92.0, 49.0, 47.0, 49.0, 31.0, 32.0, 39.0, 31.0, 28.0, 30.0, 18.0, 22.0, 7.0, 15.0, 11.0, 6.0, 11.0, 4.0, 4.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.1640625, -11.8048095703125, -11.445556640625, -11.0863037109375, -10.72705078125, -10.3677978515625, -10.008544921875, -9.6492919921875, -9.2900390625, -8.9307861328125, -8.571533203125, -8.2122802734375, -7.85302734375, -7.4937744140625, -7.134521484375, -6.7752685546875, -6.416015625, -6.0567626953125, -5.697509765625, -5.3382568359375, -4.97900390625, -4.6197509765625, -4.260498046875, -3.9012451171875, -3.5419921875, -3.1827392578125, -2.823486328125, -2.4642333984375, -2.10498046875, -1.7457275390625, -1.386474609375, -1.0272216796875, -0.66796875, -0.3087158203125, 0.050537109375, 0.4097900390625, 0.76904296875, 1.1282958984375, 1.487548828125, 1.8468017578125, 2.2060546875, 2.5653076171875, 2.924560546875, 3.2838134765625, 3.64306640625, 4.0023193359375, 4.361572265625, 4.7208251953125, 5.080078125, 5.4393310546875, 5.798583984375, 6.1578369140625, 6.51708984375, 6.8763427734375, 7.235595703125, 7.5948486328125, 7.9541015625, 8.3133544921875, 8.672607421875, 9.0318603515625, 9.39111328125, 9.7503662109375, 10.109619140625, 10.4688720703125, 10.828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 12.0, 21.0, 26.0, 30.0, 52.0, 101.0, 198.0, 391.0, 1037.0, 4610.0, 153395.0, 2970869.0, 12111.0, 1645.0, 590.0, 246.0, 138.0, 78.0, 45.0, 28.0, 28.0, 9.0, 12.0, 9.0, 9.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.5, -32.490966796875, -31.48193359375, -30.472900390625, -29.4638671875, -28.454833984375, -27.44580078125, -26.436767578125, -25.427734375, -24.418701171875, -23.40966796875, -22.400634765625, -21.3916015625, -20.382568359375, -19.37353515625, -18.364501953125, -17.35546875, -16.346435546875, -15.33740234375, -14.328369140625, -13.3193359375, -12.310302734375, -11.30126953125, -10.292236328125, -9.283203125, -8.274169921875, -7.26513671875, -6.256103515625, -5.2470703125, -4.238037109375, -3.22900390625, -2.219970703125, -1.2109375, -0.201904296875, 0.80712890625, 1.816162109375, 2.8251953125, 3.834228515625, 4.84326171875, 5.852294921875, 6.861328125, 7.870361328125, 8.87939453125, 9.888427734375, 10.8974609375, 11.906494140625, 12.91552734375, 13.924560546875, 14.93359375, 15.942626953125, 16.95166015625, 17.960693359375, 18.9697265625, 19.978759765625, 20.98779296875, 21.996826171875, 23.005859375, 24.014892578125, 25.02392578125, 26.032958984375, 27.0419921875, 28.051025390625, 29.06005859375, 30.069091796875, 31.078125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 358.0, 647.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-294.6358337402344, -289.2885437011719, -283.9412536621094, -278.5939636230469, -273.2466735839844, -267.8994140625, -262.5521240234375, -257.204833984375, -251.8575439453125, -246.51025390625, -241.1629638671875, -235.815673828125, -230.46839904785156, -225.12110900878906, -219.77381896972656, -214.42652893066406, -209.07923889160156, -203.73194885253906, -198.38465881347656, -193.03738403320312, -187.69009399414062, -182.34280395507812, -176.99551391601562, -171.64822387695312, -166.30093383789062, -160.95364379882812, -155.60635375976562, -150.25906372070312, -144.9117889404297, -139.5644989013672, -134.2172088623047, -128.8699188232422, -123.52263641357422, -118.17534637451172, -112.82806396484375, -107.48077392578125, -102.13348388671875, -96.78620147705078, -91.43891143798828, -86.09162902832031, -80.74433898925781, -75.39704895019531, -70.04976654052734, -64.70247650146484, -59.35519027709961, -54.007904052734375, -48.660614013671875, -43.31332778930664, -37.966041564941406, -32.61875534057617, -27.271467208862305, -21.924179077148438, -16.576892852783203, -11.229606628417969, -5.882316589355469, -0.5350303649902344, 4.812255859375, 10.15954303741455, 15.506830215454102, 20.85411834716797, 26.201404571533203, 31.548690795898438, 36.89598083496094, 42.24326705932617, 47.590553283691406]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 13.0, 9.0, 11.0, 19.0, 20.0, 17.0, 20.0, 14.0, 18.0, 23.0, 15.0, 28.0, 33.0, 30.0, 29.0, 32.0, 28.0, 34.0, 34.0, 55.0, 38.0, 47.0, 40.0, 37.0, 33.0, 32.0, 30.0, 25.0, 30.0, 25.0, 24.0, 21.0, 16.0, 15.0, 15.0, 14.0, 12.0, 13.0, 11.0, 7.0, 6.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.08755111694336, -28.069482803344727, -27.051414489746094, -26.033348083496094, -25.01527976989746, -23.997211456298828, -22.979145050048828, -21.961076736450195, -20.943008422851562, -19.92494010925293, -18.906871795654297, -17.888805389404297, -16.870737075805664, -15.852668762207031, -14.834601402282715, -13.816534042358398, -12.798465728759766, -11.780397415161133, -10.762330055236816, -9.7442626953125, -8.726194381713867, -7.708126544952393, -6.690058708190918, -5.671990871429443, -4.653923034667969, -3.635855197906494, -2.6177873611450195, -1.599719524383545, -0.5816516876220703, 0.4364161491394043, 1.454483985900879, 2.4725518226623535, 3.4906234741210938, 4.508691310882568, 5.526759147644043, 6.544826984405518, 7.562894821166992, 8.580963134765625, 9.599030494689941, 10.617097854614258, 11.63516616821289, 12.653234481811523, 13.67130184173584, 14.689369201660156, 15.707437515258789, 16.725505828857422, 17.743572235107422, 18.761640548706055, 19.779708862304688, 20.79777717590332, 21.815845489501953, 22.833911895751953, 23.851980209350586, 24.87004852294922, 25.88811492919922, 26.90618324279785, 27.924251556396484, 28.942319869995117, 29.96038818359375, 30.97845458984375, 31.996522903442383, 33.014591217041016, 34.032657623291016, 35.05072784423828, 36.06879425048828]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 6.0, 7.0, 7.0, 15.0, 18.0, 20.0, 24.0, 25.0, 26.0, 23.0, 36.0, 32.0, 44.0, 35.0, 34.0, 48.0, 47.0, 48.0, 49.0, 45.0, 44.0, 41.0, 40.0, 32.0, 36.0, 25.0, 22.0, 31.0, 20.0, 25.0, 22.0, 10.0, 10.0, 6.0, 6.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.59375, -3.48291015625, -3.3720703125, -3.26123046875, -3.150390625, -3.03955078125, -2.9287109375, -2.81787109375, -2.70703125, -2.59619140625, -2.4853515625, -2.37451171875, -2.263671875, -2.15283203125, -2.0419921875, -1.93115234375, -1.8203125, -1.70947265625, -1.5986328125, -1.48779296875, -1.376953125, -1.26611328125, -1.1552734375, -1.04443359375, -0.93359375, -0.82275390625, -0.7119140625, -0.60107421875, -0.490234375, -0.37939453125, -0.2685546875, -0.15771484375, -0.046875, 0.06396484375, 0.1748046875, 0.28564453125, 0.396484375, 0.50732421875, 0.6181640625, 0.72900390625, 0.83984375, 0.95068359375, 1.0615234375, 1.17236328125, 1.283203125, 1.39404296875, 1.5048828125, 1.61572265625, 1.7265625, 1.83740234375, 1.9482421875, 2.05908203125, 2.169921875, 2.28076171875, 2.3916015625, 2.50244140625, 2.61328125, 2.72412109375, 2.8349609375, 2.94580078125, 3.056640625, 3.16748046875, 3.2783203125, 3.38916015625, 3.5]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 12.0, 8.0, 10.0, 12.0, 25.0, 33.0, 35.0, 39.0, 62.0, 116.0, 209.0, 377.0, 823.0, 1998.0, 5383.0, 16121.0, 53869.0, 228023.0, 1517171.0, 1954252.0, 315540.0, 69236.0, 19942.0, 6688.0, 2398.0, 921.0, 389.0, 220.0, 114.0, 64.0, 47.0, 27.0, 22.0, 27.0, 19.0, 14.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.375, -8.12933349609375, -7.8836669921875, -7.63800048828125, -7.392333984375, -7.14666748046875, -6.9010009765625, -6.65533447265625, -6.40966796875, -6.16400146484375, -5.9183349609375, -5.67266845703125, -5.427001953125, -5.18133544921875, -4.9356689453125, -4.69000244140625, -4.4443359375, -4.19866943359375, -3.9530029296875, -3.70733642578125, -3.461669921875, -3.21600341796875, -2.9703369140625, -2.72467041015625, -2.47900390625, -2.23333740234375, -1.9876708984375, -1.74200439453125, -1.496337890625, -1.25067138671875, -1.0050048828125, -0.75933837890625, -0.513671875, -0.26800537109375, -0.0223388671875, 0.22332763671875, 0.468994140625, 0.71466064453125, 0.9603271484375, 1.20599365234375, 1.45166015625, 1.69732666015625, 1.9429931640625, 2.18865966796875, 2.434326171875, 2.67999267578125, 2.9256591796875, 3.17132568359375, 3.4169921875, 3.66265869140625, 3.9083251953125, 4.15399169921875, 4.399658203125, 4.64532470703125, 4.8909912109375, 5.13665771484375, 5.38232421875, 5.62799072265625, 5.8736572265625, 6.11932373046875, 6.364990234375, 6.61065673828125, 6.8563232421875, 7.10198974609375, 7.34765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 18.0, 18.0, 25.0, 23.0, 51.0, 79.0, 124.0, 193.0, 317.0, 475.0, 666.0, 645.0, 535.0, 330.0, 201.0, 143.0, 96.0, 47.0, 26.0, 22.0, 7.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-19.421875, -18.9993896484375, -18.576904296875, -18.1544189453125, -17.73193359375, -17.3094482421875, -16.886962890625, -16.4644775390625, -16.0419921875, -15.6195068359375, -15.197021484375, -14.7745361328125, -14.35205078125, -13.9295654296875, -13.507080078125, -13.0845947265625, -12.662109375, -12.2396240234375, -11.817138671875, -11.3946533203125, -10.97216796875, -10.5496826171875, -10.127197265625, -9.7047119140625, -9.2822265625, -8.8597412109375, -8.437255859375, -8.0147705078125, -7.59228515625, -7.1697998046875, -6.747314453125, -6.3248291015625, -5.90234375, -5.4798583984375, -5.057373046875, -4.6348876953125, -4.21240234375, -3.7899169921875, -3.367431640625, -2.9449462890625, -2.5224609375, -2.0999755859375, -1.677490234375, -1.2550048828125, -0.83251953125, -0.4100341796875, 0.012451171875, 0.4349365234375, 0.857421875, 1.2799072265625, 1.702392578125, 2.1248779296875, 2.54736328125, 2.9698486328125, 3.392333984375, 3.8148193359375, 4.2373046875, 4.6597900390625, 5.082275390625, 5.5047607421875, 5.92724609375, 6.3497314453125, 6.772216796875, 7.1947021484375, 7.6171875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 10.0, 11.0, 23.0, 25.0, 48.0, 65.0, 103.0, 185.0, 392.0, 878.0, 2766.0, 11635.0, 72255.0, 712208.0, 2999076.0, 343505.0, 40583.0, 7227.0, 1889.0, 686.0, 280.0, 136.0, 101.0, 62.0, 49.0, 23.0, 18.0, 17.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.4375, -16.800048828125, -16.16259765625, -15.525146484375, -14.8876953125, -14.250244140625, -13.61279296875, -12.975341796875, -12.337890625, -11.700439453125, -11.06298828125, -10.425537109375, -9.7880859375, -9.150634765625, -8.51318359375, -7.875732421875, -7.23828125, -6.600830078125, -5.96337890625, -5.325927734375, -4.6884765625, -4.051025390625, -3.41357421875, -2.776123046875, -2.138671875, -1.501220703125, -0.86376953125, -0.226318359375, 0.4111328125, 1.048583984375, 1.68603515625, 2.323486328125, 2.9609375, 3.598388671875, 4.23583984375, 4.873291015625, 5.5107421875, 6.148193359375, 6.78564453125, 7.423095703125, 8.060546875, 8.697998046875, 9.33544921875, 9.972900390625, 10.6103515625, 11.247802734375, 11.88525390625, 12.522705078125, 13.16015625, 13.797607421875, 14.43505859375, 15.072509765625, 15.7099609375, 16.347412109375, 16.98486328125, 17.622314453125, 18.259765625, 18.897216796875, 19.53466796875, 20.172119140625, 20.8095703125, 21.447021484375, 22.08447265625, 22.721923828125, 23.359375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 9.0, 7.0, 15.0, 27.0, 34.0, 42.0, 58.0, 81.0, 84.0, 85.0, 93.0, 88.0, 78.0, 75.0, 68.0, 38.0, 40.0, 24.0, 14.0, 18.0, 12.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.35121536254883, -57.99974822998047, -56.648284912109375, -55.296817779541016, -53.945350646972656, -52.5938835144043, -51.24241638183594, -49.890953063964844, -48.539485931396484, -47.188018798828125, -45.83655548095703, -44.48508834838867, -43.13362121582031, -41.78215408325195, -40.430686950683594, -39.0792236328125, -37.72775650024414, -36.37628936767578, -35.02482604980469, -33.67335891723633, -32.32189178466797, -30.97042465209961, -29.618959426879883, -28.267494201660156, -26.916027069091797, -25.564559936523438, -24.21309471130371, -22.861629486083984, -21.510162353515625, -20.158695220947266, -18.80722999572754, -17.455764770507812, -16.10429573059082, -14.752829551696777, -13.401363372802734, -12.049897193908691, -10.698431015014648, -9.346964836120605, -7.9954986572265625, -6.6440324783325195, -5.292566299438477, -3.9411001205444336, -2.5896339416503906, -1.2381677627563477, 0.11329841613769531, 1.4647645950317383, 2.8162307739257812, 4.167696952819824, 5.519163131713867, 6.87062931060791, 8.222095489501953, 9.573561668395996, 10.925027847290039, 12.276494026184082, 13.627960205078125, 14.979426383972168, 16.33089256286621, 17.682357788085938, 19.033824920654297, 20.385292053222656, 21.736757278442383, 23.08822250366211, 24.43968963623047, 25.791156768798828, 27.142621994018555]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 8.0, 13.0, 9.0, 10.0, 9.0, 9.0, 19.0, 16.0, 21.0, 18.0, 20.0, 23.0, 23.0, 33.0, 29.0, 31.0, 35.0, 30.0, 32.0, 40.0, 41.0, 40.0, 40.0, 36.0, 34.0, 55.0, 35.0, 34.0, 25.0, 34.0, 23.0, 19.0, 25.0, 20.0, 20.0, 13.0, 11.0, 13.0, 8.0, 7.0, 12.0, 6.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.69448471069336, -29.775320053100586, -28.856155395507812, -27.936988830566406, -27.017824172973633, -26.09865951538086, -25.179494857788086, -24.260330200195312, -23.341163635253906, -22.421998977661133, -21.50283432006836, -20.583667755126953, -19.66450309753418, -18.745338439941406, -17.826173782348633, -16.90700912475586, -15.98784351348877, -15.068678855895996, -14.149513244628906, -13.230348587036133, -12.311182975769043, -11.39201831817627, -10.47285270690918, -9.553688049316406, -8.634523391723633, -7.715358257293701, -6.7961931228637695, -5.877028465270996, -4.957862854003906, -4.038698196411133, -3.119533061981201, -2.2003679275512695, -1.2812023162841797, -0.3620372414588928, 0.557127833366394, 1.4762928485870361, 2.3954579830169678, 3.3146228790283203, 4.233788013458252, 5.152953147888184, 6.072118282318115, 6.991283416748047, 7.9104485511779785, 8.82961368560791, 9.748778343200684, 10.667943954467773, 11.587108612060547, 12.50627326965332, 13.42543888092041, 14.344603538513184, 15.263769149780273, 16.182933807373047, 17.10209846496582, 18.021263122558594, 18.9404296875, 19.859594345092773, 20.778759002685547, 21.69792366027832, 22.617088317871094, 23.5362548828125, 24.455419540405273, 25.374584197998047, 26.29374885559082, 27.212913513183594, 28.132080078125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 1.0, 7.0, 7.0, 7.0, 12.0, 8.0, 7.0, 26.0, 15.0, 29.0, 34.0, 30.0, 31.0, 34.0, 35.0, 48.0, 50.0, 40.0, 44.0, 51.0, 40.0, 53.0, 42.0, 34.0, 37.0, 43.0, 39.0, 26.0, 33.0, 22.0, 19.0, 26.0, 14.0, 12.0, 8.0, 13.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.676300048828125, -3.55572509765625, -3.435150146484375, -3.3145751953125, -3.194000244140625, -3.07342529296875, -2.952850341796875, -2.832275390625, -2.711700439453125, -2.59112548828125, -2.470550537109375, -2.3499755859375, -2.229400634765625, -2.10882568359375, -1.988250732421875, -1.86767578125, -1.747100830078125, -1.62652587890625, -1.505950927734375, -1.3853759765625, -1.264801025390625, -1.14422607421875, -1.023651123046875, -0.903076171875, -0.782501220703125, -0.66192626953125, -0.541351318359375, -0.4207763671875, -0.300201416015625, -0.17962646484375, -0.059051513671875, 0.0615234375, 0.182098388671875, 0.30267333984375, 0.423248291015625, 0.5438232421875, 0.664398193359375, 0.78497314453125, 0.905548095703125, 1.026123046875, 1.146697998046875, 1.26727294921875, 1.387847900390625, 1.5084228515625, 1.628997802734375, 1.74957275390625, 1.870147705078125, 1.99072265625, 2.111297607421875, 2.23187255859375, 2.352447509765625, 2.4730224609375, 2.593597412109375, 2.71417236328125, 2.834747314453125, 2.955322265625, 3.075897216796875, 3.19647216796875, 3.317047119140625, 3.4376220703125, 3.558197021484375, 3.67877197265625, 3.799346923828125, 3.919921875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 8.0, 11.0, 14.0, 23.0, 32.0, 57.0, 72.0, 104.0, 148.0, 221.0, 326.0, 487.0, 779.0, 1126.0, 1727.0, 2744.0, 4255.0, 6390.0, 10092.0, 16375.0, 27268.0, 47397.0, 88357.0, 177140.0, 268134.0, 181908.0, 91217.0, 48277.0, 27909.0, 16776.0, 10547.0, 6591.0, 4196.0, 2613.0, 1751.0, 1171.0, 763.0, 486.0, 340.0, 254.0, 136.0, 120.0, 75.0, 39.0, 30.0, 19.0, 19.0, 7.0, 10.0, 11.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.38134765625, -0.36962127685546875, -0.3578948974609375, -0.34616851806640625, -0.334442138671875, -0.32271575927734375, -0.3109893798828125, -0.29926300048828125, -0.28753662109375, -0.27581024169921875, -0.2640838623046875, -0.25235748291015625, -0.240631103515625, -0.22890472412109375, -0.2171783447265625, -0.20545196533203125, -0.1937255859375, -0.18199920654296875, -0.1702728271484375, -0.15854644775390625, -0.146820068359375, -0.13509368896484375, -0.1233673095703125, -0.11164093017578125, -0.09991455078125, -0.08818817138671875, -0.0764617919921875, -0.06473541259765625, -0.053009033203125, -0.04128265380859375, -0.0295562744140625, -0.01782989501953125, -0.006103515625, 0.00562286376953125, 0.0173492431640625, 0.02907562255859375, 0.040802001953125, 0.05252838134765625, 0.0642547607421875, 0.07598114013671875, 0.08770751953125, 0.09943389892578125, 0.1111602783203125, 0.12288665771484375, 0.134613037109375, 0.14633941650390625, 0.1580657958984375, 0.16979217529296875, 0.1815185546875, 0.19324493408203125, 0.2049713134765625, 0.21669769287109375, 0.228424072265625, 0.24015045166015625, 0.2518768310546875, 0.26360321044921875, 0.27532958984375, 0.28705596923828125, 0.2987823486328125, 0.31050872802734375, 0.322235107421875, 0.33396148681640625, 0.3456878662109375, 0.35741424560546875, 0.369140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 7.0, 6.0, 4.0, 7.0, 7.0, 10.0, 13.0, 23.0, 17.0, 21.0, 27.0, 24.0, 23.0, 36.0, 34.0, 41.0, 36.0, 41.0, 47.0, 37.0, 1061.0, 34.0, 43.0, 37.0, 39.0, 37.0, 22.0, 32.0, 27.0, 24.0, 35.0, 18.0, 18.0, 27.0, 18.0, 14.0, 14.0, 17.0, 8.0, 7.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.9722900390625, -1.901611328125, -1.8309326171875, -1.76025390625, -1.6895751953125, -1.618896484375, -1.5482177734375, -1.4775390625, -1.4068603515625, -1.336181640625, -1.2655029296875, -1.19482421875, -1.1241455078125, -1.053466796875, -0.9827880859375, -0.912109375, -0.8414306640625, -0.770751953125, -0.7000732421875, -0.62939453125, -0.5587158203125, -0.488037109375, -0.4173583984375, -0.3466796875, -0.2760009765625, -0.205322265625, -0.1346435546875, -0.06396484375, 0.0067138671875, 0.077392578125, 0.1480712890625, 0.21875, 0.2894287109375, 0.360107421875, 0.4307861328125, 0.50146484375, 0.5721435546875, 0.642822265625, 0.7135009765625, 0.7841796875, 0.8548583984375, 0.925537109375, 0.9962158203125, 1.06689453125, 1.1375732421875, 1.208251953125, 1.2789306640625, 1.349609375, 1.4202880859375, 1.490966796875, 1.5616455078125, 1.63232421875, 1.7030029296875, 1.773681640625, 1.8443603515625, 1.9150390625, 1.9857177734375, 2.056396484375, 2.1270751953125, 2.19775390625, 2.2684326171875, 2.339111328125, 2.4097900390625, 2.48046875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 10.0, 15.0, 19.0, 27.0, 27.0, 41.0, 74.0, 84.0, 137.0, 199.0, 334.0, 498.0, 840.0, 1360.0, 2282.0, 3981.0, 7005.0, 12526.0, 22797.0, 41902.0, 75468.0, 136617.0, 743214.0, 742445.0, 136474.0, 74942.0, 41424.0, 22842.0, 12726.0, 6871.0, 4000.0, 2331.0, 1338.0, 803.0, 505.0, 327.0, 217.0, 136.0, 93.0, 50.0, 33.0, 36.0, 27.0, 18.0, 10.0, 9.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21747207641601562, -0.21045684814453125, -0.20344161987304688, -0.1964263916015625, -0.18941116333007812, -0.18239593505859375, -0.17538070678710938, -0.168365478515625, -0.16135025024414062, -0.15433502197265625, -0.14731979370117188, -0.1403045654296875, -0.13328933715820312, -0.12627410888671875, -0.11925888061523438, -0.11224365234375, -0.10522842407226562, -0.09821319580078125, -0.09119796752929688, -0.0841827392578125, -0.07716751098632812, -0.07015228271484375, -0.06313705444335938, -0.056121826171875, -0.049106597900390625, -0.04209136962890625, -0.035076141357421875, -0.0280609130859375, -0.021045684814453125, -0.01403045654296875, -0.007015228271484375, 0.0, 0.007015228271484375, 0.01403045654296875, 0.021045684814453125, 0.0280609130859375, 0.035076141357421875, 0.04209136962890625, 0.049106597900390625, 0.056121826171875, 0.06313705444335938, 0.07015228271484375, 0.07716751098632812, 0.0841827392578125, 0.09119796752929688, 0.09821319580078125, 0.10522842407226562, 0.11224365234375, 0.11925888061523438, 0.12627410888671875, 0.13328933715820312, 0.1403045654296875, 0.14731979370117188, 0.15433502197265625, 0.16135025024414062, 0.168365478515625, 0.17538070678710938, 0.18239593505859375, 0.18941116333007812, 0.1964263916015625, 0.20344161987304688, 0.21045684814453125, 0.21747207641601562, 0.2244873046875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 6.0, 10.0, 8.0, 12.0, 7.0, 18.0, 20.0, 26.0, 33.0, 44.0, 96.0, 131.0, 162.0, 108.0, 73.0, 54.0, 28.0, 20.0, 26.0, 11.0, 12.0, 7.0, 8.0, 7.0, 12.0, 3.0, 6.0, 4.0, 4.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005901336669921875, -0.005724668502807617, -0.005548000335693359, -0.0053713321685791016, -0.005194664001464844, -0.005017995834350586, -0.004841327667236328, -0.00466465950012207, -0.0044879913330078125, -0.004311323165893555, -0.004134654998779297, -0.003957986831665039, -0.0037813186645507812, -0.0036046504974365234, -0.0034279823303222656, -0.003251314163208008, -0.00307464599609375, -0.002897977828979492, -0.0027213096618652344, -0.0025446414947509766, -0.0023679733276367188, -0.002191305160522461, -0.002014636993408203, -0.0018379688262939453, -0.0016613006591796875, -0.0014846324920654297, -0.0013079643249511719, -0.001131296157836914, -0.0009546279907226562, -0.0007779598236083984, -0.0006012916564941406, -0.0004246234893798828, -0.000247955322265625, -7.128715515136719e-05, 0.00010538101196289062, 0.00028204917907714844, 0.00045871734619140625, 0.0006353855133056641, 0.0008120536804199219, 0.0009887218475341797, 0.0011653900146484375, 0.0013420581817626953, 0.0015187263488769531, 0.001695394515991211, 0.0018720626831054688, 0.0020487308502197266, 0.0022253990173339844, 0.002402067184448242, 0.0025787353515625, 0.002755403518676758, 0.0029320716857910156, 0.0031087398529052734, 0.0032854080200195312, 0.003462076187133789, 0.003638744354248047, 0.0038154125213623047, 0.0039920806884765625, 0.00416874885559082, 0.004345417022705078, 0.004522085189819336, 0.004698753356933594, 0.0048754215240478516, 0.005052089691162109, 0.005228757858276367, 0.005405426025390625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 10.0, 8.0, 15.0, 6.0, 9.0, 13.0, 24.0, 19.0, 33.0, 45.0, 56.0, 66.0, 114.0, 193.0, 362.0, 1274.0, 13215.0, 970061.0, 59100.0, 2621.0, 562.0, 239.0, 137.0, 79.0, 54.0, 42.0, 39.0, 31.0, 25.0, 15.0, 18.0, 15.0, 7.0, 10.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07989501953125, -0.07720470428466797, -0.07451438903808594, -0.0718240737915039, -0.06913375854492188, -0.06644344329833984, -0.06375312805175781, -0.06106281280517578, -0.05837249755859375, -0.05568218231201172, -0.05299186706542969, -0.050301551818847656, -0.047611236572265625, -0.044920921325683594, -0.04223060607910156, -0.03954029083251953, -0.0368499755859375, -0.03415966033935547, -0.03146934509277344, -0.028779029846191406, -0.026088714599609375, -0.023398399353027344, -0.020708084106445312, -0.01801776885986328, -0.01532745361328125, -0.012637138366699219, -0.009946823120117188, -0.007256507873535156, -0.004566192626953125, -0.0018758773803710938, 0.0008144378662109375, 0.0035047531127929688, 0.006195068359375, 0.008885383605957031, 0.011575698852539062, 0.014266014099121094, 0.016956329345703125, 0.019646644592285156, 0.022336959838867188, 0.02502727508544922, 0.02771759033203125, 0.03040790557861328, 0.03309822082519531, 0.035788536071777344, 0.038478851318359375, 0.041169166564941406, 0.04385948181152344, 0.04654979705810547, 0.0492401123046875, 0.05193042755126953, 0.05462074279785156, 0.057311058044433594, 0.060001373291015625, 0.06269168853759766, 0.06538200378417969, 0.06807231903076172, 0.07076263427734375, 0.07345294952392578, 0.07614326477050781, 0.07883358001708984, 0.08152389526367188, 0.0842142105102539, 0.08690452575683594, 0.08959484100341797, 0.09228515625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [8.0, 75.0, 800.0, 119.0, 15.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004419796168804169, -0.00264784786850214, -0.000875899801030755, 0.00089604826644063, 0.0026679965667426586, 0.0044399444013834, 0.006211892701685429, 0.007983841001987457, 0.009755789302289486, 0.011527737602591515, 0.013299685902893543, 0.015071634203195572, 0.016843581572175026, 0.01861552894115448, 0.020387478172779083, 0.022159427404403687, 0.02393137477338314, 0.025703322142362595, 0.027475271373987198, 0.029247218742966652, 0.031019167974591255, 0.03279111534357071, 0.03456306457519531, 0.036335013806819916, 0.03810695931315422, 0.039878908544778824, 0.04165085405111313, 0.04342280328273773, 0.045194752514362335, 0.04696670174598694, 0.04873864725232124, 0.05051059648394585, 0.05228254571557045, 0.05405449494719505, 0.05582644045352936, 0.05759838968515396, 0.059370338916778564, 0.06114228814840317, 0.06291423738002777, 0.06468617916107178, 0.06645812839269638, 0.06823007762432098, 0.07000202685594559, 0.07177397608757019, 0.0735459178686142, 0.0753178671002388, 0.0770898163318634, 0.078861765563488, 0.08063371479511261, 0.08240566402673721, 0.08417761325836182, 0.08594956248998642, 0.08772150427103043, 0.08949345350265503, 0.09126540273427963, 0.09303735196590424, 0.09480930119752884, 0.09658125042915344, 0.09835319966077805, 0.10012514889240265, 0.10189709067344666, 0.10366903990507126, 0.10544098913669586, 0.10721293836832047, 0.10898488759994507]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 7.0, 8.0, 14.0, 12.0, 16.0, 31.0, 37.0, 54.0, 37.0, 31.0, 47.0, 50.0, 48.0, 49.0, 42.0, 51.0, 53.0, 40.0, 59.0, 37.0, 48.0, 28.0, 31.0, 39.0, 26.0, 20.0, 16.0, 10.0, 14.0, 7.0, 7.0, 7.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00777125358581543, -0.007561325095593929, -0.007351396605372429, -0.0071414681151509285, -0.006931539624929428, -0.006721611134707928, -0.006511682644486427, -0.006301754154264927, -0.0060918256640434265, -0.005881897173821926, -0.005671968683600426, -0.005462040193378925, -0.005252111703157425, -0.0050421832129359245, -0.004832254722714424, -0.004622326232492924, -0.004412397742271423, -0.004202469252049923, -0.0039925407618284225, -0.003782612271606922, -0.0035726837813854218, -0.0033627552911639214, -0.003152826800942421, -0.0029428983107209206, -0.00273296982049942, -0.0025230413302779198, -0.0023131128400564194, -0.002103184349834919, -0.0018932558596134186, -0.0016833273693919182, -0.0014733988791704178, -0.0012634703889489174, -0.001053541898727417, -0.0008436134085059166, -0.0006336849182844162, -0.0004237564280629158, -0.0002138279378414154, -3.8994476199150085e-06, 0.0002060290426015854, 0.0004159575328230858, 0.0006258860230445862, 0.0008358145132660866, 0.001045743003487587, 0.0012556714937090874, 0.0014655999839305878, 0.0016755284741520882, 0.0018854569643735886, 0.002095385454595089, 0.0023053139448165894, 0.0025152424350380898, 0.00272517092525959, 0.0029350994154810905, 0.003145027905702591, 0.0033549563959240913, 0.0035648848861455917, 0.003774813376367092, 0.0039847418665885925, 0.004194670356810093, 0.004404598847031593, 0.004614527337253094, 0.004824455827474594, 0.0050343843176960945, 0.005244312807917595, 0.005454241298139095, 0.005664169788360596]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 1.0, 7.0, 7.0, 7.0, 12.0, 8.0, 7.0, 26.0, 16.0, 28.0, 33.0, 31.0, 31.0, 34.0, 35.0, 48.0, 50.0, 40.0, 44.0, 51.0, 40.0, 53.0, 42.0, 34.0, 37.0, 43.0, 39.0, 26.0, 33.0, 22.0, 19.0, 26.0, 14.0, 12.0, 8.0, 13.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.676300048828125, -3.55572509765625, -3.435150146484375, -3.3145751953125, -3.194000244140625, -3.07342529296875, -2.952850341796875, -2.832275390625, -2.711700439453125, -2.59112548828125, -2.470550537109375, -2.3499755859375, -2.229400634765625, -2.10882568359375, -1.988250732421875, -1.86767578125, -1.747100830078125, -1.62652587890625, -1.505950927734375, -1.3853759765625, -1.264801025390625, -1.14422607421875, -1.023651123046875, -0.903076171875, -0.782501220703125, -0.66192626953125, -0.541351318359375, -0.4207763671875, -0.300201416015625, -0.17962646484375, -0.059051513671875, 0.0615234375, 0.182098388671875, 0.30267333984375, 0.423248291015625, 0.5438232421875, 0.664398193359375, 0.78497314453125, 0.905548095703125, 1.026123046875, 1.146697998046875, 1.26727294921875, 1.387847900390625, 1.5084228515625, 1.628997802734375, 1.74957275390625, 1.870147705078125, 1.99072265625, 2.111297607421875, 2.23187255859375, 2.352447509765625, 2.4730224609375, 2.593597412109375, 2.71417236328125, 2.834747314453125, 2.955322265625, 3.075897216796875, 3.19647216796875, 3.317047119140625, 3.4376220703125, 3.558197021484375, 3.67877197265625, 3.799346923828125, 3.919921875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 14.0, 11.0, 17.0, 30.0, 36.0, 44.0, 60.0, 112.0, 156.0, 201.0, 297.0, 433.0, 730.0, 1139.0, 1711.0, 2930.0, 4907.0, 8622.0, 15599.0, 29793.0, 63009.0, 148960.0, 354177.0, 234576.0, 91179.0, 41695.0, 20646.0, 11266.0, 6429.0, 3697.0, 2171.0, 1359.0, 823.0, 581.0, 332.0, 237.0, 166.0, 124.0, 81.0, 74.0, 46.0, 25.0, 21.0, 12.0, 8.0, 4.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.8818359375, -1.8225250244140625, -1.763214111328125, -1.7039031982421875, -1.64459228515625, -1.5852813720703125, -1.525970458984375, -1.4666595458984375, -1.4073486328125, -1.3480377197265625, -1.288726806640625, -1.2294158935546875, -1.17010498046875, -1.1107940673828125, -1.051483154296875, -0.9921722412109375, -0.932861328125, -0.8735504150390625, -0.814239501953125, -0.7549285888671875, -0.69561767578125, -0.6363067626953125, -0.576995849609375, -0.5176849365234375, -0.4583740234375, -0.3990631103515625, -0.339752197265625, -0.2804412841796875, -0.22113037109375, -0.1618194580078125, -0.102508544921875, -0.0431976318359375, 0.01611328125, 0.0754241943359375, 0.134735107421875, 0.1940460205078125, 0.25335693359375, 0.3126678466796875, 0.371978759765625, 0.4312896728515625, 0.4906005859375, 0.5499114990234375, 0.609222412109375, 0.6685333251953125, 0.72784423828125, 0.7871551513671875, 0.846466064453125, 0.9057769775390625, 0.965087890625, 1.0243988037109375, 1.083709716796875, 1.1430206298828125, 1.20233154296875, 1.2616424560546875, 1.320953369140625, 1.3802642822265625, 1.4395751953125, 1.4988861083984375, 1.558197021484375, 1.6175079345703125, 1.67681884765625, 1.7361297607421875, 1.795440673828125, 1.8547515869140625, 1.9140625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 4.0, 7.0, 6.0, 8.0, 25.0, 29.0, 20.0, 19.0, 27.0, 24.0, 24.0, 31.0, 32.0, 39.0, 53.0, 55.0, 65.0, 129.0, 1660.0, 241.0, 96.0, 54.0, 46.0, 44.0, 35.0, 43.0, 30.0, 29.0, 28.0, 19.0, 14.0, 16.0, 21.0, 14.0, 12.0, 7.0, 5.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2578125, -11.8717041015625, -11.485595703125, -11.0994873046875, -10.71337890625, -10.3272705078125, -9.941162109375, -9.5550537109375, -9.1689453125, -8.7828369140625, -8.396728515625, -8.0106201171875, -7.62451171875, -7.2384033203125, -6.852294921875, -6.4661865234375, -6.080078125, -5.6939697265625, -5.307861328125, -4.9217529296875, -4.53564453125, -4.1495361328125, -3.763427734375, -3.3773193359375, -2.9912109375, -2.6051025390625, -2.218994140625, -1.8328857421875, -1.44677734375, -1.0606689453125, -0.674560546875, -0.2884521484375, 0.09765625, 0.4837646484375, 0.869873046875, 1.2559814453125, 1.64208984375, 2.0281982421875, 2.414306640625, 2.8004150390625, 3.1865234375, 3.5726318359375, 3.958740234375, 4.3448486328125, 4.73095703125, 5.1170654296875, 5.503173828125, 5.8892822265625, 6.275390625, 6.6614990234375, 7.047607421875, 7.4337158203125, 7.81982421875, 8.2059326171875, 8.592041015625, 8.9781494140625, 9.3642578125, 9.7503662109375, 10.136474609375, 10.5225830078125, 10.90869140625, 11.2947998046875, 11.680908203125, 12.0670166015625, 12.453125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 8.0, 7.0, 7.0, 8.0, 13.0, 20.0, 24.0, 20.0, 23.0, 29.0, 56.0, 69.0, 98.0, 148.0, 256.0, 396.0, 862.0, 2261.0, 12402.0, 674661.0, 2431478.0, 17836.0, 2766.0, 916.0, 509.0, 239.0, 153.0, 111.0, 68.0, 38.0, 44.0, 25.0, 33.0, 27.0, 23.0, 16.0, 6.0, 8.0, 5.0, 5.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.567626953125, -16.96337890625, -16.359130859375, -15.7548828125, -15.150634765625, -14.54638671875, -13.942138671875, -13.337890625, -12.733642578125, -12.12939453125, -11.525146484375, -10.9208984375, -10.316650390625, -9.71240234375, -9.108154296875, -8.50390625, -7.899658203125, -7.29541015625, -6.691162109375, -6.0869140625, -5.482666015625, -4.87841796875, -4.274169921875, -3.669921875, -3.065673828125, -2.46142578125, -1.857177734375, -1.2529296875, -0.648681640625, -0.04443359375, 0.559814453125, 1.1640625, 1.768310546875, 2.37255859375, 2.976806640625, 3.5810546875, 4.185302734375, 4.78955078125, 5.393798828125, 5.998046875, 6.602294921875, 7.20654296875, 7.810791015625, 8.4150390625, 9.019287109375, 9.62353515625, 10.227783203125, 10.83203125, 11.436279296875, 12.04052734375, 12.644775390625, 13.2490234375, 13.853271484375, 14.45751953125, 15.061767578125, 15.666015625, 16.270263671875, 16.87451171875, 17.478759765625, 18.0830078125, 18.687255859375, 19.29150390625, 19.895751953125, 20.5]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 72.0, 348.0, 447.0, 124.0, 13.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-117.26617431640625, -115.05855560302734, -112.85093688964844, -110.64331817626953, -108.43569946289062, -106.22808837890625, -104.02046203613281, -101.81285095214844, -99.60523223876953, -97.39761352539062, -95.18999481201172, -92.98237609863281, -90.7747573852539, -88.567138671875, -86.35952758789062, -84.15190887451172, -81.94429016113281, -79.7366714477539, -77.529052734375, -75.3214340209961, -73.11381530761719, -70.90620422363281, -68.69857788085938, -66.490966796875, -64.28334045410156, -62.075721740722656, -59.86810302734375, -57.660484313964844, -55.4528694152832, -53.2452507019043, -51.03763198852539, -48.830013275146484, -46.622398376464844, -44.41477966308594, -42.20716094970703, -39.999542236328125, -37.791927337646484, -35.58430862426758, -33.37668991088867, -31.169071197509766, -28.961456298828125, -26.75383758544922, -24.546220779418945, -22.33860206604004, -20.130985260009766, -17.92336654663086, -15.715747833251953, -13.508130073547363, -11.300512313842773, -9.092894554138184, -6.8852763175964355, -4.6776580810546875, -2.4700403213500977, -0.2624225616455078, 1.9451961517333984, 4.152813911437988, 6.360431671142578, 8.568049430847168, 10.775667190551758, 12.983285903930664, 15.190903663635254, 17.398521423339844, 19.60614013671875, 21.813758850097656, 24.02137565612793]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 10.0, 15.0, 12.0, 19.0, 18.0, 30.0, 24.0, 29.0, 27.0, 39.0, 32.0, 36.0, 35.0, 43.0, 33.0, 52.0, 39.0, 58.0, 43.0, 50.0, 36.0, 46.0, 29.0, 27.0, 27.0, 19.0, 27.0, 26.0, 18.0, 15.0, 19.0, 13.0, 4.0, 9.0, 10.0, 1.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.27018737792969, -34.985939025878906, -33.701690673828125, -32.41743850708008, -31.133190155029297, -29.848941802978516, -28.564693450927734, -27.280445098876953, -25.99619483947754, -24.711946487426758, -23.427696228027344, -22.143447875976562, -20.85919952392578, -19.574949264526367, -18.290700912475586, -17.006450653076172, -15.72220230102539, -14.437952995300293, -13.153703689575195, -11.869455337524414, -10.585206031799316, -9.300956726074219, -8.016708374023438, -6.73245906829834, -5.448209762573242, -4.1639604568481445, -2.879711627960205, -1.5954625606536865, -0.31121349334716797, 0.9730358123779297, 2.257284641265869, 3.5415334701538086, 4.825778961181641, 6.110028266906738, 7.394277095794678, 8.678525924682617, 9.962775230407715, 11.247024536132812, 12.531272888183594, 13.815522193908691, 15.099771499633789, 16.38401985168457, 17.668270111083984, 18.952518463134766, 20.236766815185547, 21.52101707458496, 22.805265426635742, 24.089515686035156, 25.373764038085938, 26.65801239013672, 27.942262649536133, 29.226511001586914, 30.510761260986328, 31.79500961303711, 33.07925796508789, 34.36350631713867, 35.64775848388672, 36.9320068359375, 38.21625518798828, 39.50050735473633, 40.78475570678711, 42.06900405883789, 43.35325241088867, 44.63750076293945, 45.921749114990234]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 8.0, 8.0, 9.0, 10.0, 5.0, 16.0, 23.0, 23.0, 27.0, 28.0, 34.0, 29.0, 41.0, 36.0, 45.0, 47.0, 48.0, 52.0, 50.0, 48.0, 39.0, 40.0, 45.0, 40.0, 36.0, 33.0, 32.0, 28.0, 20.0, 22.0, 12.0, 18.0, 11.0, 7.0, 9.0, 8.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.751861572265625, -3.62677001953125, -3.501678466796875, -3.3765869140625, -3.251495361328125, -3.12640380859375, -3.001312255859375, -2.876220703125, -2.751129150390625, -2.62603759765625, -2.500946044921875, -2.3758544921875, -2.250762939453125, -2.12567138671875, -2.000579833984375, -1.87548828125, -1.750396728515625, -1.62530517578125, -1.500213623046875, -1.3751220703125, -1.250030517578125, -1.12493896484375, -0.999847412109375, -0.874755859375, -0.749664306640625, -0.62457275390625, -0.499481201171875, -0.3743896484375, -0.249298095703125, -0.12420654296875, 0.000885009765625, 0.1259765625, 0.251068115234375, 0.37615966796875, 0.501251220703125, 0.6263427734375, 0.751434326171875, 0.87652587890625, 1.001617431640625, 1.126708984375, 1.251800537109375, 1.37689208984375, 1.501983642578125, 1.6270751953125, 1.752166748046875, 1.87725830078125, 2.002349853515625, 2.12744140625, 2.252532958984375, 2.37762451171875, 2.502716064453125, 2.6278076171875, 2.752899169921875, 2.87799072265625, 3.003082275390625, 3.128173828125, 3.253265380859375, 3.37835693359375, 3.503448486328125, 3.6285400390625, 3.753631591796875, 3.87872314453125, 4.003814697265625, 4.12890625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 10.0, 9.0, 7.0, 5.0, 13.0, 15.0, 15.0, 20.0, 25.0, 39.0, 53.0, 100.0, 182.0, 447.0, 1282.0, 4463.0, 17470.0, 84433.0, 713191.0, 2851817.0, 441216.0, 61076.0, 13115.0, 3466.0, 1059.0, 325.0, 146.0, 80.0, 53.0, 33.0, 33.0, 18.0, 14.0, 7.0, 16.0, 8.0, 4.0, 9.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.34375, -11.004150390625, -10.66455078125, -10.324951171875, -9.9853515625, -9.645751953125, -9.30615234375, -8.966552734375, -8.626953125, -8.287353515625, -7.94775390625, -7.608154296875, -7.2685546875, -6.928955078125, -6.58935546875, -6.249755859375, -5.91015625, -5.570556640625, -5.23095703125, -4.891357421875, -4.5517578125, -4.212158203125, -3.87255859375, -3.532958984375, -3.193359375, -2.853759765625, -2.51416015625, -2.174560546875, -1.8349609375, -1.495361328125, -1.15576171875, -0.816162109375, -0.4765625, -0.136962890625, 0.20263671875, 0.542236328125, 0.8818359375, 1.221435546875, 1.56103515625, 1.900634765625, 2.240234375, 2.579833984375, 2.91943359375, 3.259033203125, 3.5986328125, 3.938232421875, 4.27783203125, 4.617431640625, 4.95703125, 5.296630859375, 5.63623046875, 5.975830078125, 6.3154296875, 6.655029296875, 6.99462890625, 7.334228515625, 7.673828125, 8.013427734375, 8.35302734375, 8.692626953125, 9.0322265625, 9.371826171875, 9.71142578125, 10.051025390625, 10.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 9.0, 7.0, 9.0, 9.0, 13.0, 31.0, 28.0, 40.0, 62.0, 85.0, 113.0, 151.0, 232.0, 344.0, 407.0, 500.0, 552.0, 442.0, 292.0, 214.0, 169.0, 115.0, 75.0, 45.0, 38.0, 22.0, 16.0, 13.0, 14.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0078125, -9.6732177734375, -9.338623046875, -9.0040283203125, -8.66943359375, -8.3348388671875, -8.000244140625, -7.6656494140625, -7.3310546875, -6.9964599609375, -6.661865234375, -6.3272705078125, -5.99267578125, -5.6580810546875, -5.323486328125, -4.9888916015625, -4.654296875, -4.3197021484375, -3.985107421875, -3.6505126953125, -3.31591796875, -2.9813232421875, -2.646728515625, -2.3121337890625, -1.9775390625, -1.6429443359375, -1.308349609375, -0.9737548828125, -0.63916015625, -0.3045654296875, 0.030029296875, 0.3646240234375, 0.69921875, 1.0338134765625, 1.368408203125, 1.7030029296875, 2.03759765625, 2.3721923828125, 2.706787109375, 3.0413818359375, 3.3759765625, 3.7105712890625, 4.045166015625, 4.3797607421875, 4.71435546875, 5.0489501953125, 5.383544921875, 5.7181396484375, 6.052734375, 6.3873291015625, 6.721923828125, 7.0565185546875, 7.39111328125, 7.7257080078125, 8.060302734375, 8.3948974609375, 8.7294921875, 9.0640869140625, 9.398681640625, 9.7332763671875, 10.06787109375, 10.4024658203125, 10.737060546875, 11.0716552734375, 11.40625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 13.0, 10.0, 26.0, 35.0, 40.0, 64.0, 134.0, 197.0, 415.0, 777.0, 1998.0, 6264.0, 26808.0, 158493.0, 1471535.0, 2245096.0, 232848.0, 36968.0, 8053.0, 2336.0, 1012.0, 483.0, 258.0, 153.0, 84.0, 56.0, 37.0, 27.0, 10.0, 11.0, 9.0, 9.0, 5.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.609619140625, -18.04736328125, -17.485107421875, -16.9228515625, -16.360595703125, -15.79833984375, -15.236083984375, -14.673828125, -14.111572265625, -13.54931640625, -12.987060546875, -12.4248046875, -11.862548828125, -11.30029296875, -10.738037109375, -10.17578125, -9.613525390625, -9.05126953125, -8.489013671875, -7.9267578125, -7.364501953125, -6.80224609375, -6.239990234375, -5.677734375, -5.115478515625, -4.55322265625, -3.990966796875, -3.4287109375, -2.866455078125, -2.30419921875, -1.741943359375, -1.1796875, -0.617431640625, -0.05517578125, 0.507080078125, 1.0693359375, 1.631591796875, 2.19384765625, 2.756103515625, 3.318359375, 3.880615234375, 4.44287109375, 5.005126953125, 5.5673828125, 6.129638671875, 6.69189453125, 7.254150390625, 7.81640625, 8.378662109375, 8.94091796875, 9.503173828125, 10.0654296875, 10.627685546875, 11.18994140625, 11.752197265625, 12.314453125, 12.876708984375, 13.43896484375, 14.001220703125, 14.5634765625, 15.125732421875, 15.68798828125, 16.250244140625, 16.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 11.0, 16.0, 30.0, 53.0, 95.0, 163.0, 164.0, 195.0, 123.0, 85.0, 35.0, 28.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.38919830322266, -91.76712036132812, -89.14505004882812, -86.5229721069336, -83.90089416503906, -81.27882385253906, -78.65674591064453, -76.03466796875, -73.41259765625, -70.79051971435547, -68.16844940185547, -65.54637145996094, -62.924293518066406, -60.30221939086914, -57.680145263671875, -55.058067321777344, -52.43598937988281, -49.81391525268555, -47.191837310791016, -44.56976318359375, -41.94768524169922, -39.32561111450195, -36.70353698730469, -34.081459045410156, -31.45938491821289, -28.837308883666992, -26.215232849121094, -23.593158721923828, -20.97108268737793, -18.34900665283203, -15.72693157196045, -13.104856491088867, -10.482780456542969, -7.8607048988342285, -5.238629341125488, -2.616553783416748, 0.0055217742919921875, 2.6275978088378906, 5.249672889709473, 7.871747970581055, 10.493824005126953, 13.115900039672852, 15.737975120544434, 18.360050201416016, 20.982126235961914, 23.604202270507812, 26.226276397705078, 28.848352432250977, 31.470428466796875, 34.09250259399414, 36.71458053588867, 39.33665466308594, 41.95873260498047, 44.580806732177734, 47.202880859375, 49.82495880126953, 52.4470329284668, 55.06910705566406, 57.691184997558594, 60.31325912475586, 62.935333251953125, 65.55741119384766, 68.17948913574219, 70.80155944824219, 73.42363739013672]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 11.0, 7.0, 10.0, 16.0, 9.0, 14.0, 14.0, 15.0, 18.0, 19.0, 26.0, 27.0, 22.0, 23.0, 32.0, 45.0, 26.0, 30.0, 46.0, 38.0, 31.0, 43.0, 23.0, 37.0, 32.0, 30.0, 30.0, 26.0, 38.0, 25.0, 29.0, 29.0, 32.0, 18.0, 16.0, 13.0, 15.0, 15.0, 14.0, 8.0, 3.0, 3.0, 8.0, 9.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-29.889083862304688, -28.96579360961914, -28.042503356933594, -27.119213104248047, -26.1959228515625, -25.272632598876953, -24.34934425354004, -23.426054000854492, -22.502763748168945, -21.5794734954834, -20.65618324279785, -19.732892990112305, -18.80960464477539, -17.886314392089844, -16.963024139404297, -16.03973388671875, -15.116443634033203, -14.193153381347656, -13.26986312866211, -12.346573829650879, -11.423283576965332, -10.499993324279785, -9.576704025268555, -8.653413772583008, -7.730123519897461, -6.806833267211914, -5.883543491363525, -4.960253715515137, -4.03696346282959, -3.113673210144043, -2.1903834342956543, -1.2670936584472656, -0.34380340576171875, 0.579486608505249, 1.5027766227722168, 2.4260666370391846, 3.3493566513061523, 4.272646903991699, 5.195936679840088, 6.119226455688477, 7.042516708374023, 7.96580696105957, 8.889097213745117, 9.812386512756348, 10.735676765441895, 11.658967018127441, 12.582256317138672, 13.505546569824219, 14.428836822509766, 15.352127075195312, 16.27541732788086, 17.198707580566406, 18.121997833251953, 19.0452880859375, 19.968576431274414, 20.89186668395996, 21.815156936645508, 22.738447189331055, 23.6617374420166, 24.58502769470215, 25.508316040039062, 26.43160629272461, 27.354896545410156, 28.278186798095703, 29.20147705078125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 11.0, 4.0, 8.0, 10.0, 10.0, 8.0, 18.0, 15.0, 15.0, 22.0, 27.0, 21.0, 30.0, 33.0, 35.0, 48.0, 53.0, 44.0, 45.0, 50.0, 46.0, 50.0, 46.0, 42.0, 38.0, 39.0, 32.0, 27.0, 24.0, 29.0, 20.0, 26.0, 12.0, 16.0, 12.0, 10.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9384765625, -3.814453125, -3.6904296875, -3.56640625, -3.4423828125, -3.318359375, -3.1943359375, -3.0703125, -2.9462890625, -2.822265625, -2.6982421875, -2.57421875, -2.4501953125, -2.326171875, -2.2021484375, -2.078125, -1.9541015625, -1.830078125, -1.7060546875, -1.58203125, -1.4580078125, -1.333984375, -1.2099609375, -1.0859375, -0.9619140625, -0.837890625, -0.7138671875, -0.58984375, -0.4658203125, -0.341796875, -0.2177734375, -0.09375, 0.0302734375, 0.154296875, 0.2783203125, 0.40234375, 0.5263671875, 0.650390625, 0.7744140625, 0.8984375, 1.0224609375, 1.146484375, 1.2705078125, 1.39453125, 1.5185546875, 1.642578125, 1.7666015625, 1.890625, 2.0146484375, 2.138671875, 2.2626953125, 2.38671875, 2.5107421875, 2.634765625, 2.7587890625, 2.8828125, 3.0068359375, 3.130859375, 3.2548828125, 3.37890625, 3.5029296875, 3.626953125, 3.7509765625, 3.875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 12.0, 15.0, 15.0, 28.0, 38.0, 58.0, 72.0, 122.0, 163.0, 239.0, 363.0, 491.0, 740.0, 987.0, 1517.0, 2274.0, 3267.0, 4937.0, 7248.0, 11273.0, 16924.0, 26741.0, 41357.0, 67137.0, 113194.0, 185021.0, 206415.0, 137387.0, 81003.0, 49249.0, 30810.0, 19895.0, 13141.0, 8627.0, 5898.0, 3808.0, 2551.0, 1703.0, 1196.0, 815.0, 559.0, 353.0, 285.0, 185.0, 142.0, 95.0, 48.0, 51.0, 40.0, 22.0, 19.0, 11.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.345703125, -0.3349609375, -0.32421875, -0.3134765625, -0.302734375, -0.2919921875, -0.28125, -0.2705078125, -0.259765625, -0.2490234375, -0.23828125, -0.2275390625, -0.216796875, -0.2060546875, -0.1953125, -0.1845703125, -0.173828125, -0.1630859375, -0.15234375, -0.1416015625, -0.130859375, -0.1201171875, -0.109375, -0.0986328125, -0.087890625, -0.0771484375, -0.06640625, -0.0556640625, -0.044921875, -0.0341796875, -0.0234375, -0.0126953125, -0.001953125, 0.0087890625, 0.01953125, 0.0302734375, 0.041015625, 0.0517578125, 0.0625, 0.0732421875, 0.083984375, 0.0947265625, 0.10546875, 0.1162109375, 0.126953125, 0.1376953125, 0.1484375, 0.1591796875, 0.169921875, 0.1806640625, 0.19140625, 0.2021484375, 0.212890625, 0.2236328125, 0.234375, 0.2451171875, 0.255859375, 0.2666015625, 0.27734375, 0.2880859375, 0.298828125, 0.3095703125, 0.3203125, 0.3310546875, 0.341796875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 10.0, 10.0, 6.0, 12.0, 11.0, 10.0, 17.0, 28.0, 17.0, 23.0, 27.0, 24.0, 30.0, 23.0, 37.0, 40.0, 49.0, 46.0, 40.0, 1067.0, 42.0, 33.0, 46.0, 51.0, 38.0, 41.0, 25.0, 32.0, 26.0, 30.0, 17.0, 15.0, 23.0, 12.0, 13.0, 11.0, 8.0, 5.0, 5.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.470916748046875, -2.39105224609375, -2.311187744140625, -2.2313232421875, -2.151458740234375, -2.07159423828125, -1.991729736328125, -1.911865234375, -1.832000732421875, -1.75213623046875, -1.672271728515625, -1.5924072265625, -1.512542724609375, -1.43267822265625, -1.352813720703125, -1.27294921875, -1.193084716796875, -1.11322021484375, -1.033355712890625, -0.9534912109375, -0.873626708984375, -0.79376220703125, -0.713897705078125, -0.634033203125, -0.554168701171875, -0.47430419921875, -0.394439697265625, -0.3145751953125, -0.234710693359375, -0.15484619140625, -0.074981689453125, 0.0048828125, 0.084747314453125, 0.16461181640625, 0.244476318359375, 0.3243408203125, 0.404205322265625, 0.48406982421875, 0.563934326171875, 0.643798828125, 0.723663330078125, 0.80352783203125, 0.883392333984375, 0.9632568359375, 1.043121337890625, 1.12298583984375, 1.202850341796875, 1.28271484375, 1.362579345703125, 1.44244384765625, 1.522308349609375, 1.6021728515625, 1.682037353515625, 1.76190185546875, 1.841766357421875, 1.921630859375, 2.001495361328125, 2.08135986328125, 2.161224365234375, 2.2410888671875, 2.320953369140625, 2.40081787109375, 2.480682373046875, 2.560546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 6.0, 11.0, 13.0, 27.0, 26.0, 39.0, 69.0, 92.0, 126.0, 222.0, 303.0, 464.0, 812.0, 1384.0, 2254.0, 3971.0, 6871.0, 12497.0, 22942.0, 41899.0, 79403.0, 146302.0, 1232424.0, 262621.0, 129863.0, 69236.0, 37272.0, 19861.0, 11181.0, 6190.0, 3450.0, 2067.0, 1263.0, 715.0, 434.0, 267.0, 179.0, 122.0, 78.0, 52.0, 39.0, 24.0, 15.0, 19.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.2415771484375, -0.23375892639160156, -0.22594070434570312, -0.2181224822998047, -0.21030426025390625, -0.2024860382080078, -0.19466781616210938, -0.18684959411621094, -0.1790313720703125, -0.17121315002441406, -0.16339492797851562, -0.1555767059326172, -0.14775848388671875, -0.1399402618408203, -0.13212203979492188, -0.12430381774902344, -0.116485595703125, -0.10866737365722656, -0.10084915161132812, -0.09303092956542969, -0.08521270751953125, -0.07739448547363281, -0.06957626342773438, -0.06175804138183594, -0.0539398193359375, -0.04612159729003906, -0.038303375244140625, -0.030485153198242188, -0.02266693115234375, -0.014848709106445312, -0.007030487060546875, 0.0007877349853515625, 0.00860595703125, 0.016424179077148438, 0.024242401123046875, 0.03206062316894531, 0.03987884521484375, 0.04769706726074219, 0.055515289306640625, 0.06333351135253906, 0.0711517333984375, 0.07896995544433594, 0.08678817749023438, 0.09460639953613281, 0.10242462158203125, 0.11024284362792969, 0.11806106567382812, 0.12587928771972656, 0.133697509765625, 0.14151573181152344, 0.14933395385742188, 0.1571521759033203, 0.16497039794921875, 0.1727886199951172, 0.18060684204101562, 0.18842506408691406, 0.1962432861328125, 0.20406150817871094, 0.21187973022460938, 0.2196979522705078, 0.22751617431640625, 0.2353343963623047, 0.24315261840820312, 0.25097084045410156, 0.2587890625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 8.0, 4.0, 9.0, 13.0, 12.0, 13.0, 24.0, 31.0, 45.0, 47.0, 82.0, 161.0, 155.0, 111.0, 71.0, 42.0, 28.0, 26.0, 25.0, 15.0, 14.0, 13.0, 11.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008209228515625, -0.007962405681610107, -0.007715582847595215, -0.007468760013580322, -0.00722193717956543, -0.006975114345550537, -0.0067282915115356445, -0.006481468677520752, -0.006234645843505859, -0.005987823009490967, -0.005741000175476074, -0.005494177341461182, -0.005247354507446289, -0.0050005316734313965, -0.004753708839416504, -0.004506886005401611, -0.004260063171386719, -0.004013240337371826, -0.0037664175033569336, -0.003519594669342041, -0.0032727718353271484, -0.003025949001312256, -0.0027791261672973633, -0.0025323033332824707, -0.002285480499267578, -0.0020386576652526855, -0.001791834831237793, -0.0015450119972229004, -0.0012981891632080078, -0.0010513663291931152, -0.0008045434951782227, -0.0005577206611633301, -0.0003108978271484375, -6.407499313354492e-05, 0.00018274784088134766, 0.00042957067489624023, 0.0006763935089111328, 0.0009232163429260254, 0.001170039176940918, 0.0014168620109558105, 0.0016636848449707031, 0.0019105076789855957, 0.0021573305130004883, 0.002404153347015381, 0.0026509761810302734, 0.002897799015045166, 0.0031446218490600586, 0.003391444683074951, 0.0036382675170898438, 0.0038850903511047363, 0.004131913185119629, 0.0043787360191345215, 0.004625558853149414, 0.004872381687164307, 0.005119204521179199, 0.005366027355194092, 0.005612850189208984, 0.005859673023223877, 0.0061064958572387695, 0.006353318691253662, 0.006600141525268555, 0.006846964359283447, 0.00709378719329834, 0.007340610027313232, 0.007587432861328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 5.0, 25.0, 24.0, 34.0, 44.0, 66.0, 106.0, 172.0, 300.0, 773.0, 9133.0, 976638.0, 58613.0, 1588.0, 398.0, 215.0, 126.0, 75.0, 48.0, 43.0, 24.0, 14.0, 13.0, 11.0, 4.0, 9.0, 7.0, 5.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11456298828125, -0.11083221435546875, -0.1071014404296875, -0.10337066650390625, -0.099639892578125, -0.09590911865234375, -0.0921783447265625, -0.08844757080078125, -0.084716796875, -0.08098602294921875, -0.0772552490234375, -0.07352447509765625, -0.069793701171875, -0.06606292724609375, -0.0623321533203125, -0.05860137939453125, -0.05487060546875, -0.05113983154296875, -0.0474090576171875, -0.04367828369140625, -0.039947509765625, -0.03621673583984375, -0.0324859619140625, -0.02875518798828125, -0.0250244140625, -0.02129364013671875, -0.0175628662109375, -0.01383209228515625, -0.010101318359375, -0.00637054443359375, -0.0026397705078125, 0.00109100341796875, 0.00482177734375, 0.00855255126953125, 0.0122833251953125, 0.01601409912109375, 0.019744873046875, 0.02347564697265625, 0.0272064208984375, 0.03093719482421875, 0.03466796875, 0.03839874267578125, 0.0421295166015625, 0.04586029052734375, 0.049591064453125, 0.05332183837890625, 0.0570526123046875, 0.06078338623046875, 0.06451416015625, 0.06824493408203125, 0.0719757080078125, 0.07570648193359375, 0.079437255859375, 0.08316802978515625, 0.0868988037109375, 0.09062957763671875, 0.0943603515625, 0.09809112548828125, 0.1018218994140625, 0.10555267333984375, 0.109283447265625, 0.11301422119140625, 0.1167449951171875, 0.12047576904296875, 0.12420654296875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 25.0, 669.0, 303.0, 17.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006496635731309652, -0.004209447652101517, -0.0019222591072320938, 0.0003649289719760418, 0.0026521175168454647, 0.004939306061714888, 0.007226493675261736, 0.009513681754469872, 0.011800870299339294, 0.014088058844208717, 0.01637524738907814, 0.018662434071302414, 0.020949624478816986, 0.02323681116104126, 0.025523999705910683, 0.027811188250780106, 0.03009837679564953, 0.03238556534051895, 0.034672752022743225, 0.0369599424302578, 0.03924712911248207, 0.04153431951999664, 0.04382150620222092, 0.04610869288444519, 0.04839588329195976, 0.050683069974184036, 0.05297026038169861, 0.05525744706392288, 0.057544637471437454, 0.05983182415366173, 0.0621190145611763, 0.06440620124340057, 0.06669338792562485, 0.06898057460784912, 0.0712677612900734, 0.07355495542287827, 0.07584214210510254, 0.07812932878732681, 0.08041651546955109, 0.08270370960235596, 0.08499089628458023, 0.0872780829668045, 0.08956526964902878, 0.09185246378183365, 0.09413965046405792, 0.0964268371462822, 0.09871402382850647, 0.10100121796131134, 0.10328839719295502, 0.10557558387517929, 0.10786277055740356, 0.11014996469020844, 0.11243715137243271, 0.11472433805465698, 0.11701152473688126, 0.11929871141910553, 0.1215859055519104, 0.12387309223413467, 0.12616027891635895, 0.12844747304916382, 0.1307346522808075, 0.13302184641361237, 0.13530904054641724, 0.1375962197780609, 0.13988341391086578]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 6.0, 14.0, 21.0, 19.0, 31.0, 26.0, 24.0, 39.0, 31.0, 35.0, 60.0, 55.0, 60.0, 51.0, 66.0, 55.0, 52.0, 49.0, 33.0, 38.0, 54.0, 36.0, 21.0, 26.0, 24.0, 24.0, 9.0, 14.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009534597396850586, -0.009262402541935444, -0.008990207687020302, -0.00871801283210516, -0.008445817977190018, -0.008173623122274876, -0.007901428267359734, -0.0076292334124445915, -0.0073570385575294495, -0.007084843702614307, -0.006812648847699165, -0.006540453992784023, -0.006268259137868881, -0.005996064282953739, -0.005723869428038597, -0.005451674573123455, -0.005179479718208313, -0.004907284863293171, -0.004635090008378029, -0.004362895153462887, -0.004090700298547745, -0.0038185054436326027, -0.0035463105887174606, -0.0032741157338023186, -0.0030019208788871765, -0.0027297260239720345, -0.0024575311690568924, -0.0021853363141417503, -0.0019131414592266083, -0.0016409466043114662, -0.0013687517493963242, -0.001096556894481182, -0.00082436203956604, -0.000552167184650898, -0.0002799723297357559, -7.777474820613861e-06, 0.0002644173800945282, 0.0005366122350096703, 0.0008088070899248123, 0.0010810019448399544, 0.0013531967997550964, 0.0016253916546702385, 0.0018975865095853806, 0.0021697813645005226, 0.0024419762194156647, 0.0027141710743308067, 0.002986365929245949, 0.003258560784161091, 0.003530755639076233, 0.003802950493991375, 0.004075145348906517, 0.004347340203821659, 0.004619535058736801, 0.004891729913651943, 0.005163924768567085, 0.005436119623482227, 0.005708314478397369, 0.0059805093333125114, 0.0062527041882276535, 0.0065248990431427956, 0.006797093898057938, 0.00706928875297308, 0.007341483607888222, 0.007613678462803364, 0.007885873317718506]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 11.0, 4.0, 9.0, 9.0, 10.0, 10.0, 16.0, 15.0, 15.0, 22.0, 27.0, 21.0, 31.0, 32.0, 35.0, 48.0, 53.0, 44.0, 45.0, 51.0, 47.0, 49.0, 45.0, 42.0, 38.0, 40.0, 31.0, 27.0, 24.0, 29.0, 21.0, 25.0, 13.0, 15.0, 12.0, 10.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.938446044921875, -3.81439208984375, -3.690338134765625, -3.5662841796875, -3.442230224609375, -3.31817626953125, -3.194122314453125, -3.070068359375, -2.946014404296875, -2.82196044921875, -2.697906494140625, -2.5738525390625, -2.449798583984375, -2.32574462890625, -2.201690673828125, -2.07763671875, -1.953582763671875, -1.82952880859375, -1.705474853515625, -1.5814208984375, -1.457366943359375, -1.33331298828125, -1.209259033203125, -1.085205078125, -0.961151123046875, -0.83709716796875, -0.713043212890625, -0.5889892578125, -0.464935302734375, -0.34088134765625, -0.216827392578125, -0.0927734375, 0.031280517578125, 0.15533447265625, 0.279388427734375, 0.4034423828125, 0.527496337890625, 0.65155029296875, 0.775604248046875, 0.899658203125, 1.023712158203125, 1.14776611328125, 1.271820068359375, 1.3958740234375, 1.519927978515625, 1.64398193359375, 1.768035888671875, 1.89208984375, 2.016143798828125, 2.14019775390625, 2.264251708984375, 2.3883056640625, 2.512359619140625, 2.63641357421875, 2.760467529296875, 2.884521484375, 3.008575439453125, 3.13262939453125, 3.256683349609375, 3.3807373046875, 3.504791259765625, 3.62884521484375, 3.752899169921875, 3.876953125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 16.0, 27.0, 18.0, 43.0, 53.0, 79.0, 117.0, 208.0, 297.0, 441.0, 738.0, 1193.0, 1893.0, 3187.0, 5282.0, 8922.0, 15504.0, 28474.0, 58024.0, 148787.0, 440539.0, 190376.0, 69004.0, 32703.0, 17575.0, 9937.0, 5874.0, 3406.0, 2202.0, 1354.0, 814.0, 522.0, 296.0, 198.0, 159.0, 95.0, 60.0, 39.0, 26.0, 22.0, 12.0, 9.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.78125, -2.68402099609375, -2.5867919921875, -2.48956298828125, -2.392333984375, -2.29510498046875, -2.1978759765625, -2.10064697265625, -2.00341796875, -1.90618896484375, -1.8089599609375, -1.71173095703125, -1.614501953125, -1.51727294921875, -1.4200439453125, -1.32281494140625, -1.2255859375, -1.12835693359375, -1.0311279296875, -0.93389892578125, -0.836669921875, -0.73944091796875, -0.6422119140625, -0.54498291015625, -0.44775390625, -0.35052490234375, -0.2532958984375, -0.15606689453125, -0.058837890625, 0.03839111328125, 0.1356201171875, 0.23284912109375, 0.330078125, 0.42730712890625, 0.5245361328125, 0.62176513671875, 0.718994140625, 0.81622314453125, 0.9134521484375, 1.01068115234375, 1.10791015625, 1.20513916015625, 1.3023681640625, 1.39959716796875, 1.496826171875, 1.59405517578125, 1.6912841796875, 1.78851318359375, 1.8857421875, 1.98297119140625, 2.0802001953125, 2.17742919921875, 2.274658203125, 2.37188720703125, 2.4691162109375, 2.56634521484375, 2.66357421875, 2.76080322265625, 2.8580322265625, 2.95526123046875, 3.052490234375, 3.14971923828125, 3.2469482421875, 3.34417724609375, 3.44140625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 3.0, 5.0, 14.0, 9.0, 13.0, 10.0, 18.0, 14.0, 14.0, 25.0, 28.0, 28.0, 24.0, 21.0, 28.0, 32.0, 38.0, 38.0, 64.0, 74.0, 194.0, 1607.0, 210.0, 84.0, 63.0, 47.0, 43.0, 30.0, 33.0, 35.0, 23.0, 26.0, 21.0, 17.0, 12.0, 22.0, 18.0, 12.0, 10.0, 7.0, 6.0, 3.0, 2.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.921875, -11.54345703125, -11.1650390625, -10.78662109375, -10.408203125, -10.02978515625, -9.6513671875, -9.27294921875, -8.89453125, -8.51611328125, -8.1376953125, -7.75927734375, -7.380859375, -7.00244140625, -6.6240234375, -6.24560546875, -5.8671875, -5.48876953125, -5.1103515625, -4.73193359375, -4.353515625, -3.97509765625, -3.5966796875, -3.21826171875, -2.83984375, -2.46142578125, -2.0830078125, -1.70458984375, -1.326171875, -0.94775390625, -0.5693359375, -0.19091796875, 0.1875, 0.56591796875, 0.9443359375, 1.32275390625, 1.701171875, 2.07958984375, 2.4580078125, 2.83642578125, 3.21484375, 3.59326171875, 3.9716796875, 4.35009765625, 4.728515625, 5.10693359375, 5.4853515625, 5.86376953125, 6.2421875, 6.62060546875, 6.9990234375, 7.37744140625, 7.755859375, 8.13427734375, 8.5126953125, 8.89111328125, 9.26953125, 9.64794921875, 10.0263671875, 10.40478515625, 10.783203125, 11.16162109375, 11.5400390625, 11.91845703125, 12.296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 10.0, 11.0, 22.0, 19.0, 34.0, 34.0, 43.0, 64.0, 85.0, 119.0, 238.0, 366.0, 761.0, 2544.0, 26239.0, 2695401.0, 405884.0, 10686.0, 1610.0, 598.0, 282.0, 163.0, 101.0, 86.0, 72.0, 58.0, 39.0, 31.0, 20.0, 16.0, 15.0, 15.0, 7.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.34375, -27.5302734375, -26.716796875, -25.9033203125, -25.08984375, -24.2763671875, -23.462890625, -22.6494140625, -21.8359375, -21.0224609375, -20.208984375, -19.3955078125, -18.58203125, -17.7685546875, -16.955078125, -16.1416015625, -15.328125, -14.5146484375, -13.701171875, -12.8876953125, -12.07421875, -11.2607421875, -10.447265625, -9.6337890625, -8.8203125, -8.0068359375, -7.193359375, -6.3798828125, -5.56640625, -4.7529296875, -3.939453125, -3.1259765625, -2.3125, -1.4990234375, -0.685546875, 0.1279296875, 0.94140625, 1.7548828125, 2.568359375, 3.3818359375, 4.1953125, 5.0087890625, 5.822265625, 6.6357421875, 7.44921875, 8.2626953125, 9.076171875, 9.8896484375, 10.703125, 11.5166015625, 12.330078125, 13.1435546875, 13.95703125, 14.7705078125, 15.583984375, 16.3974609375, 17.2109375, 18.0244140625, 18.837890625, 19.6513671875, 20.46484375, 21.2783203125, 22.091796875, 22.9052734375, 23.71875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 106.0, 841.0, 69.0, 1.0, 0.0, 1.0], "bins": [-433.6553955078125, -426.35809326171875, -419.0607604980469, -411.7634582519531, -404.4661560058594, -397.1688232421875, -389.87152099609375, -382.57421875, -375.2768859863281, -367.9795837402344, -360.6822509765625, -353.38494873046875, -346.087646484375, -338.7903137207031, -331.4930114746094, -324.1957092285156, -316.89837646484375, -309.60107421875, -302.3037414550781, -295.0064392089844, -287.7091369628906, -280.41180419921875, -273.114501953125, -265.81719970703125, -258.5198974609375, -251.2225799560547, -243.92527770996094, -236.62796020507812, -229.3306427001953, -222.0333251953125, -214.73602294921875, -207.43870544433594, -200.14138793945312, -192.8440704345703, -185.54676818847656, -178.24945068359375, -170.95213317871094, -163.65481567382812, -156.35751342773438, -149.06019592285156, -141.7628936767578, -134.465576171875, -127.16826629638672, -119.87095642089844, -112.57363891601562, -105.27632904052734, -97.97901916503906, -90.68170166015625, -83.38439178466797, -76.08708190917969, -68.78976440429688, -61.492454528808594, -54.19514083862305, -46.8978271484375, -39.60051727294922, -32.30320358276367, -25.005889892578125, -17.708576202392578, -10.411264419555664, -3.11395263671875, 4.183361053466797, 11.480674743652344, 18.777984619140625, 26.075298309326172, 33.37261199951172]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 6.0, 4.0, 7.0, 11.0, 7.0, 17.0, 16.0, 19.0, 23.0, 27.0, 21.0, 36.0, 42.0, 47.0, 41.0, 41.0, 46.0, 45.0, 39.0, 38.0, 35.0, 43.0, 33.0, 34.0, 37.0, 35.0, 25.0, 27.0, 35.0, 24.0, 22.0, 26.0, 12.0, 11.0, 16.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.166595458984375, -34.896400451660156, -33.62620162963867, -32.35600280761719, -31.08580780029297, -29.815610885620117, -28.545413970947266, -27.275217056274414, -26.005020141601562, -24.73482322692871, -23.46462631225586, -22.194429397583008, -20.924232482910156, -19.654035568237305, -18.383838653564453, -17.1136417388916, -15.84344482421875, -14.573247909545898, -13.303050994873047, -12.032854080200195, -10.762657165527344, -9.492460250854492, -8.22226333618164, -6.952066421508789, -5.6818695068359375, -4.411672592163086, -3.1414756774902344, -1.8712787628173828, -0.6010818481445312, 0.6691150665283203, 1.9393119812011719, 3.2095088958740234, 4.479705810546875, 5.749902725219727, 7.020099639892578, 8.29029655456543, 9.560493469238281, 10.830690383911133, 12.100887298583984, 13.371084213256836, 14.641281127929688, 15.911478042602539, 17.18167495727539, 18.451871871948242, 19.722068786621094, 20.992265701293945, 22.262462615966797, 23.53265953063965, 24.8028564453125, 26.07305335998535, 27.343250274658203, 28.613447189331055, 29.883644104003906, 31.153841018676758, 32.42403793334961, 33.694236755371094, 34.96443176269531, 36.23462677001953, 37.504825592041016, 38.7750244140625, 40.04521942138672, 41.31541442871094, 42.58561325073242, 43.855812072753906, 45.126007080078125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 9.0, 10.0, 6.0, 10.0, 10.0, 12.0, 12.0, 11.0, 7.0, 29.0, 19.0, 33.0, 25.0, 31.0, 37.0, 45.0, 49.0, 47.0, 51.0, 37.0, 50.0, 49.0, 53.0, 35.0, 42.0, 44.0, 29.0, 37.0, 19.0, 27.0, 15.0, 22.0, 16.0, 21.0, 9.0, 9.0, 13.0, 9.0, 4.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.203125, -4.0758056640625, -3.948486328125, -3.8211669921875, -3.69384765625, -3.5665283203125, -3.439208984375, -3.3118896484375, -3.1845703125, -3.0572509765625, -2.929931640625, -2.8026123046875, -2.67529296875, -2.5479736328125, -2.420654296875, -2.2933349609375, -2.166015625, -2.0386962890625, -1.911376953125, -1.7840576171875, -1.65673828125, -1.5294189453125, -1.402099609375, -1.2747802734375, -1.1474609375, -1.0201416015625, -0.892822265625, -0.7655029296875, -0.63818359375, -0.5108642578125, -0.383544921875, -0.2562255859375, -0.12890625, -0.0015869140625, 0.125732421875, 0.2530517578125, 0.38037109375, 0.5076904296875, 0.635009765625, 0.7623291015625, 0.8896484375, 1.0169677734375, 1.144287109375, 1.2716064453125, 1.39892578125, 1.5262451171875, 1.653564453125, 1.7808837890625, 1.908203125, 2.0355224609375, 2.162841796875, 2.2901611328125, 2.41748046875, 2.5447998046875, 2.672119140625, 2.7994384765625, 2.9267578125, 3.0540771484375, 3.181396484375, 3.3087158203125, 3.43603515625, 3.5633544921875, 3.690673828125, 3.8179931640625, 3.9453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 14.0, 14.0, 20.0, 31.0, 41.0, 55.0, 86.0, 116.0, 187.0, 293.0, 481.0, 674.0, 1087.0, 1690.0, 2721.0, 4673.0, 7918.0, 14066.0, 25269.0, 48459.0, 99017.0, 225907.0, 591658.0, 1271775.0, 1086364.0, 456828.0, 181724.0, 81786.0, 40833.0, 21649.0, 11910.0, 6659.0, 3930.0, 2381.0, 1456.0, 898.0, 560.0, 365.0, 241.0, 139.0, 109.0, 58.0, 44.0, 37.0, 22.0, 17.0, 7.0, 2.0, 3.0, 4.0, 3.0, 4.0], "bins": [-4.765625, -4.63275146484375, -4.4998779296875, -4.36700439453125, -4.234130859375, -4.10125732421875, -3.9683837890625, -3.83551025390625, -3.70263671875, -3.56976318359375, -3.4368896484375, -3.30401611328125, -3.171142578125, -3.03826904296875, -2.9053955078125, -2.77252197265625, -2.6396484375, -2.50677490234375, -2.3739013671875, -2.24102783203125, -2.108154296875, -1.97528076171875, -1.8424072265625, -1.70953369140625, -1.57666015625, -1.44378662109375, -1.3109130859375, -1.17803955078125, -1.045166015625, -0.91229248046875, -0.7794189453125, -0.64654541015625, -0.513671875, -0.38079833984375, -0.2479248046875, -0.11505126953125, 0.017822265625, 0.15069580078125, 0.2835693359375, 0.41644287109375, 0.54931640625, 0.68218994140625, 0.8150634765625, 0.94793701171875, 1.080810546875, 1.21368408203125, 1.3465576171875, 1.47943115234375, 1.6123046875, 1.74517822265625, 1.8780517578125, 2.01092529296875, 2.143798828125, 2.27667236328125, 2.4095458984375, 2.54241943359375, 2.67529296875, 2.80816650390625, 2.9410400390625, 3.07391357421875, 3.206787109375, 3.33966064453125, 3.4725341796875, 3.60540771484375, 3.73828125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 8.0, 3.0, 5.0, 10.0, 9.0, 22.0, 29.0, 39.0, 45.0, 68.0, 106.0, 166.0, 240.0, 336.0, 513.0, 600.0, 544.0, 387.0, 291.0, 217.0, 145.0, 86.0, 75.0, 45.0, 28.0, 13.0, 10.0, 7.0, 8.0, 9.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.90625, -14.5308837890625, -14.155517578125, -13.7801513671875, -13.40478515625, -13.0294189453125, -12.654052734375, -12.2786865234375, -11.9033203125, -11.5279541015625, -11.152587890625, -10.7772216796875, -10.40185546875, -10.0264892578125, -9.651123046875, -9.2757568359375, -8.900390625, -8.5250244140625, -8.149658203125, -7.7742919921875, -7.39892578125, -7.0235595703125, -6.648193359375, -6.2728271484375, -5.8974609375, -5.5220947265625, -5.146728515625, -4.7713623046875, -4.39599609375, -4.0206298828125, -3.645263671875, -3.2698974609375, -2.89453125, -2.5191650390625, -2.143798828125, -1.7684326171875, -1.39306640625, -1.0177001953125, -0.642333984375, -0.2669677734375, 0.1083984375, 0.4837646484375, 0.859130859375, 1.2344970703125, 1.60986328125, 1.9852294921875, 2.360595703125, 2.7359619140625, 3.111328125, 3.4866943359375, 3.862060546875, 4.2374267578125, 4.61279296875, 4.9881591796875, 5.363525390625, 5.7388916015625, 6.1142578125, 6.4896240234375, 6.864990234375, 7.2403564453125, 7.61572265625, 7.9910888671875, 8.366455078125, 8.7418212890625, 9.1171875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 3.0, 15.0, 13.0, 29.0, 28.0, 39.0, 51.0, 85.0, 132.0, 188.0, 332.0, 629.0, 1451.0, 3389.0, 10843.0, 42034.0, 203692.0, 1369674.0, 2156465.0, 320206.0, 61794.0, 15094.0, 4678.0, 1600.0, 739.0, 407.0, 224.0, 147.0, 76.0, 72.0, 40.0, 26.0, 27.0, 12.0, 16.0, 9.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5390625, -15.055419921875, -14.57177734375, -14.088134765625, -13.6044921875, -13.120849609375, -12.63720703125, -12.153564453125, -11.669921875, -11.186279296875, -10.70263671875, -10.218994140625, -9.7353515625, -9.251708984375, -8.76806640625, -8.284423828125, -7.80078125, -7.317138671875, -6.83349609375, -6.349853515625, -5.8662109375, -5.382568359375, -4.89892578125, -4.415283203125, -3.931640625, -3.447998046875, -2.96435546875, -2.480712890625, -1.9970703125, -1.513427734375, -1.02978515625, -0.546142578125, -0.0625, 0.421142578125, 0.90478515625, 1.388427734375, 1.8720703125, 2.355712890625, 2.83935546875, 3.322998046875, 3.806640625, 4.290283203125, 4.77392578125, 5.257568359375, 5.7412109375, 6.224853515625, 6.70849609375, 7.192138671875, 7.67578125, 8.159423828125, 8.64306640625, 9.126708984375, 9.6103515625, 10.093994140625, 10.57763671875, 11.061279296875, 11.544921875, 12.028564453125, 12.51220703125, 12.995849609375, 13.4794921875, 13.963134765625, 14.44677734375, 14.930419921875, 15.4140625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 26.0, 48.0, 87.0, 124.0, 158.0, 175.0, 138.0, 109.0, 67.0, 34.0, 14.0, 10.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-135.07627868652344, -132.4461669921875, -129.81605529785156, -127.18595123291016, -124.55584716796875, -121.92573547363281, -119.29562377929688, -116.66551971435547, -114.03540802001953, -111.4052963256836, -108.77519226074219, -106.14508056640625, -103.51497650146484, -100.8848648071289, -98.2547607421875, -95.62464904785156, -92.99453735351562, -90.36442565917969, -87.73432159423828, -85.10420989990234, -82.47410583496094, -79.843994140625, -77.21388244628906, -74.58377838134766, -71.95367431640625, -69.32356262207031, -66.6934585571289, -64.06334686279297, -61.4332389831543, -58.803131103515625, -56.17302322387695, -53.54291534423828, -50.91280746459961, -48.28269958496094, -45.652591705322266, -43.022483825683594, -40.392372131347656, -37.762264251708984, -35.13215637207031, -32.502044677734375, -29.871938705444336, -27.241830825805664, -24.61172103881836, -21.981613159179688, -19.351505279541016, -16.72139549255371, -14.091287612915039, -11.461177825927734, -8.831069946289062, -6.200961112976074, -3.570852756500244, -0.9407444000244141, 1.6893644332885742, 4.3194732666015625, 6.949581146240234, 9.579690933227539, 12.209798812866211, 14.8399076461792, 17.470016479492188, 20.10012435913086, 22.73023223876953, 25.360342025756836, 27.990449905395508, 30.620559692382812, 33.250667572021484]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 8.0, 5.0, 21.0, 9.0, 9.0, 19.0, 16.0, 23.0, 22.0, 23.0, 22.0, 23.0, 27.0, 31.0, 43.0, 24.0, 35.0, 43.0, 31.0, 36.0, 39.0, 29.0, 29.0, 37.0, 32.0, 34.0, 32.0, 38.0, 25.0, 34.0, 41.0, 16.0, 23.0, 21.0, 12.0, 10.0, 9.0, 6.0, 11.0, 6.0, 5.0, 8.0, 3.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-31.04693603515625, -30.109779357910156, -29.172624588012695, -28.2354679107666, -27.29831314086914, -26.361156463623047, -25.423999786376953, -24.486845016479492, -23.54969024658203, -22.612533569335938, -21.675378799438477, -20.738222122192383, -19.801067352294922, -18.863910675048828, -17.926753997802734, -16.989599227905273, -16.05244255065918, -15.115286827087402, -14.178131103515625, -13.240974426269531, -12.30381965637207, -11.366662979125977, -10.4295072555542, -9.492351531982422, -8.555195808410645, -7.618040084838867, -6.68088436126709, -5.743728160858154, -4.806572437286377, -3.8694167137145996, -2.932260513305664, -1.9951047897338867, -1.0579490661621094, -0.12079322338104248, 0.8163626194000244, 1.7535185813903809, 2.690674304962158, 3.6278300285339355, 4.564986228942871, 5.502141952514648, 6.439297676086426, 7.376453399658203, 8.31360912322998, 9.250764846801758, 10.187921524047852, 11.125076293945312, 12.062232971191406, 12.999388694763184, 13.936544418334961, 14.873700141906738, 15.810855865478516, 16.74801254272461, 17.68516731262207, 18.622323989868164, 19.559478759765625, 20.49663543701172, 21.433792114257812, 22.370948791503906, 23.308103561401367, 24.24526023864746, 25.182415008544922, 26.119571685791016, 27.05672836303711, 27.99388313293457, 28.93103790283203]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 6.0, 7.0, 9.0, 9.0, 13.0, 19.0, 13.0, 14.0, 23.0, 16.0, 26.0, 25.0, 24.0, 45.0, 42.0, 40.0, 50.0, 55.0, 47.0, 50.0, 39.0, 42.0, 37.0, 48.0, 42.0, 35.0, 31.0, 26.0, 35.0, 27.0, 22.0, 10.0, 23.0, 7.0, 16.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.8203125, -4.68719482421875, -4.5540771484375, -4.42095947265625, -4.287841796875, -4.15472412109375, -4.0216064453125, -3.88848876953125, -3.75537109375, -3.62225341796875, -3.4891357421875, -3.35601806640625, -3.222900390625, -3.08978271484375, -2.9566650390625, -2.82354736328125, -2.6904296875, -2.55731201171875, -2.4241943359375, -2.29107666015625, -2.157958984375, -2.02484130859375, -1.8917236328125, -1.75860595703125, -1.62548828125, -1.49237060546875, -1.3592529296875, -1.22613525390625, -1.093017578125, -0.95989990234375, -0.8267822265625, -0.69366455078125, -0.560546875, -0.42742919921875, -0.2943115234375, -0.16119384765625, -0.028076171875, 0.10504150390625, 0.2381591796875, 0.37127685546875, 0.50439453125, 0.63751220703125, 0.7706298828125, 0.90374755859375, 1.036865234375, 1.16998291015625, 1.3031005859375, 1.43621826171875, 1.5693359375, 1.70245361328125, 1.8355712890625, 1.96868896484375, 2.101806640625, 2.23492431640625, 2.3680419921875, 2.50115966796875, 2.63427734375, 2.76739501953125, 2.9005126953125, 3.03363037109375, 3.166748046875, 3.29986572265625, 3.4329833984375, 3.56610107421875, 3.69921875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 4.0, 0.0, 8.0, 14.0, 21.0, 25.0, 30.0, 54.0, 77.0, 121.0, 184.0, 271.0, 428.0, 648.0, 873.0, 1391.0, 2081.0, 2982.0, 4474.0, 6684.0, 10425.0, 15541.0, 24045.0, 37938.0, 61385.0, 102102.0, 174045.0, 217230.0, 149888.0, 87642.0, 53084.0, 32907.0, 21069.0, 13866.0, 8869.0, 5996.0, 4015.0, 2640.0, 1854.0, 1213.0, 811.0, 547.0, 397.0, 236.0, 155.0, 84.0, 72.0, 40.0, 42.0, 20.0, 12.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.388916015625, -0.3765106201171875, -0.364105224609375, -0.3516998291015625, -0.33929443359375, -0.3268890380859375, -0.314483642578125, -0.3020782470703125, -0.2896728515625, -0.2772674560546875, -0.264862060546875, -0.2524566650390625, -0.24005126953125, -0.2276458740234375, -0.215240478515625, -0.2028350830078125, -0.1904296875, -0.1780242919921875, -0.165618896484375, -0.1532135009765625, -0.14080810546875, -0.1284027099609375, -0.115997314453125, -0.1035919189453125, -0.0911865234375, -0.0787811279296875, -0.066375732421875, -0.0539703369140625, -0.04156494140625, -0.0291595458984375, -0.016754150390625, -0.0043487548828125, 0.008056640625, 0.0204620361328125, 0.032867431640625, 0.0452728271484375, 0.05767822265625, 0.0700836181640625, 0.082489013671875, 0.0948944091796875, 0.1072998046875, 0.1197052001953125, 0.132110595703125, 0.1445159912109375, 0.15692138671875, 0.1693267822265625, 0.181732177734375, 0.1941375732421875, 0.20654296875, 0.2189483642578125, 0.231353759765625, 0.2437591552734375, 0.25616455078125, 0.2685699462890625, 0.280975341796875, 0.2933807373046875, 0.3057861328125, 0.3181915283203125, 0.330596923828125, 0.3430023193359375, 0.35540771484375, 0.3678131103515625, 0.380218505859375, 0.3926239013671875, 0.405029296875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 6.0, 7.0, 12.0, 11.0, 18.0, 17.0, 22.0, 32.0, 24.0, 27.0, 14.0, 22.0, 31.0, 32.0, 33.0, 33.0, 37.0, 42.0, 35.0, 1055.0, 41.0, 37.0, 34.0, 30.0, 34.0, 24.0, 37.0, 31.0, 27.0, 32.0, 29.0, 17.0, 25.0, 16.0, 13.0, 12.0, 7.0, 5.0, 5.0, 13.0, 9.0, 3.0, 5.0, 0.0, 4.0, 5.0, 4.0, 1.0, 4.0, 3.0], "bins": [-2.595703125, -2.51934814453125, -2.4429931640625, -2.36663818359375, -2.290283203125, -2.21392822265625, -2.1375732421875, -2.06121826171875, -1.98486328125, -1.90850830078125, -1.8321533203125, -1.75579833984375, -1.679443359375, -1.60308837890625, -1.5267333984375, -1.45037841796875, -1.3740234375, -1.29766845703125, -1.2213134765625, -1.14495849609375, -1.068603515625, -0.99224853515625, -0.9158935546875, -0.83953857421875, -0.76318359375, -0.68682861328125, -0.6104736328125, -0.53411865234375, -0.457763671875, -0.38140869140625, -0.3050537109375, -0.22869873046875, -0.15234375, -0.07598876953125, 0.0003662109375, 0.07672119140625, 0.153076171875, 0.22943115234375, 0.3057861328125, 0.38214111328125, 0.45849609375, 0.53485107421875, 0.6112060546875, 0.68756103515625, 0.763916015625, 0.84027099609375, 0.9166259765625, 0.99298095703125, 1.0693359375, 1.14569091796875, 1.2220458984375, 1.29840087890625, 1.374755859375, 1.45111083984375, 1.5274658203125, 1.60382080078125, 1.68017578125, 1.75653076171875, 1.8328857421875, 1.90924072265625, 1.985595703125, 2.06195068359375, 2.1383056640625, 2.21466064453125, 2.291015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 14.0, 23.0, 20.0, 21.0, 31.0, 47.0, 103.0, 121.0, 222.0, 379.0, 609.0, 1050.0, 1710.0, 3081.0, 5494.0, 9684.0, 18199.0, 34124.0, 65689.0, 125938.0, 235264.0, 1265267.0, 154700.0, 82622.0, 42740.0, 22358.0, 12052.0, 6703.0, 3637.0, 2092.0, 1188.0, 730.0, 424.0, 265.0, 165.0, 121.0, 67.0, 46.0, 38.0, 22.0, 24.0, 15.0, 12.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23753929138183594, -0.22910690307617188, -0.2206745147705078, -0.21224212646484375, -0.2038097381591797, -0.19537734985351562, -0.18694496154785156, -0.1785125732421875, -0.17008018493652344, -0.16164779663085938, -0.1532154083251953, -0.14478302001953125, -0.1363506317138672, -0.12791824340820312, -0.11948585510253906, -0.111053466796875, -0.10262107849121094, -0.09418869018554688, -0.08575630187988281, -0.07732391357421875, -0.06889152526855469, -0.060459136962890625, -0.05202674865722656, -0.0435943603515625, -0.03516197204589844, -0.026729583740234375, -0.018297195434570312, -0.00986480712890625, -0.0014324188232421875, 0.006999969482421875, 0.015432357788085938, 0.02386474609375, 0.03229713439941406, 0.040729522705078125, 0.04916191101074219, 0.05759429931640625, 0.06602668762207031, 0.07445907592773438, 0.08289146423339844, 0.0913238525390625, 0.09975624084472656, 0.10818862915039062, 0.11662101745605469, 0.12505340576171875, 0.1334857940673828, 0.14191818237304688, 0.15035057067871094, 0.158782958984375, 0.16721534729003906, 0.17564773559570312, 0.1840801239013672, 0.19251251220703125, 0.2009449005126953, 0.20937728881835938, 0.21780967712402344, 0.2262420654296875, 0.23467445373535156, 0.24310684204101562, 0.2515392303466797, 0.25997161865234375, 0.2684040069580078, 0.2768363952636719, 0.28526878356933594, 0.293701171875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 4.0, 0.0, 9.0, 0.0, 5.0, 10.0, 11.0, 13.0, 9.0, 16.0, 12.0, 27.0, 37.0, 40.0, 40.0, 49.0, 39.0, 57.0, 100.0, 92.0, 53.0, 68.0, 60.0, 34.0, 38.0, 35.0, 27.0, 18.0, 12.0, 20.0, 12.0, 7.0, 5.0, 7.0, 7.0, 1.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0087127685546875, -0.008456230163574219, -0.008199691772460938, -0.007943153381347656, -0.007686614990234375, -0.007430076599121094, -0.0071735382080078125, -0.006916999816894531, -0.00666046142578125, -0.006403923034667969, -0.0061473846435546875, -0.005890846252441406, -0.005634307861328125, -0.005377769470214844, -0.0051212310791015625, -0.004864692687988281, -0.004608154296875, -0.004351615905761719, -0.0040950775146484375, -0.0038385391235351562, -0.003582000732421875, -0.0033254623413085938, -0.0030689239501953125, -0.0028123855590820312, -0.00255584716796875, -0.0022993087768554688, -0.0020427703857421875, -0.0017862319946289062, -0.001529693603515625, -0.0012731552124023438, -0.0010166168212890625, -0.0007600784301757812, -0.0005035400390625, -0.00024700164794921875, 9.5367431640625e-06, 0.00026607513427734375, 0.000522613525390625, 0.0007791519165039062, 0.0010356903076171875, 0.0012922286987304688, 0.00154876708984375, 0.0018053054809570312, 0.0020618438720703125, 0.0023183822631835938, 0.002574920654296875, 0.0028314590454101562, 0.0030879974365234375, 0.0033445358276367188, 0.00360107421875, 0.0038576126098632812, 0.0041141510009765625, 0.004370689392089844, 0.004627227783203125, 0.004883766174316406, 0.0051403045654296875, 0.005396842956542969, 0.00565338134765625, 0.005909919738769531, 0.0061664581298828125, 0.006422996520996094, 0.006679534912109375, 0.006936073303222656, 0.0071926116943359375, 0.007449150085449219, 0.0077056884765625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 4.0, 8.0, 15.0, 16.0, 19.0, 26.0, 34.0, 50.0, 68.0, 85.0, 140.0, 192.0, 376.0, 846.0, 6272.0, 733826.0, 300372.0, 4440.0, 732.0, 348.0, 200.0, 127.0, 104.0, 53.0, 42.0, 30.0, 31.0, 17.0, 17.0, 9.0, 12.0, 3.0, 3.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1358642578125, -0.13161087036132812, -0.12735748291015625, -0.12310409545898438, -0.1188507080078125, -0.11459732055664062, -0.11034393310546875, -0.10609054565429688, -0.101837158203125, -0.09758377075195312, -0.09333038330078125, -0.08907699584960938, -0.0848236083984375, -0.08057022094726562, -0.07631683349609375, -0.07206344604492188, -0.06781005859375, -0.06355667114257812, -0.05930328369140625, -0.055049896240234375, -0.0507965087890625, -0.046543121337890625, -0.04228973388671875, -0.038036346435546875, -0.033782958984375, -0.029529571533203125, -0.02527618408203125, -0.021022796630859375, -0.0167694091796875, -0.012516021728515625, -0.00826263427734375, -0.004009246826171875, 0.000244140625, 0.004497528076171875, 0.00875091552734375, 0.013004302978515625, 0.0172576904296875, 0.021511077880859375, 0.02576446533203125, 0.030017852783203125, 0.034271240234375, 0.038524627685546875, 0.04277801513671875, 0.047031402587890625, 0.0512847900390625, 0.055538177490234375, 0.05979156494140625, 0.06404495239257812, 0.06829833984375, 0.07255172729492188, 0.07680511474609375, 0.08105850219726562, 0.0853118896484375, 0.08956527709960938, 0.09381866455078125, 0.09807205200195312, 0.102325439453125, 0.10657882690429688, 0.11083221435546875, 0.11508560180664062, 0.1193389892578125, 0.12359237670898438, 0.12784576416015625, 0.13209915161132812, 0.1363525390625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 174.0, 793.0, 44.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013901765458285809, -0.00959918275475502, -0.005296600982546806, -0.000994018279016018, 0.003308563493192196, 0.00761114526540041, 0.011913728900253773, 0.01621631160378456, 0.020518891513347626, 0.02482147328555584, 0.029124055057764053, 0.033426638692617416, 0.03772921860218048, 0.042031802237033844, 0.04633438587188721, 0.05063696950674057, 0.054939549416303635, 0.059242133051157, 0.06354471296072006, 0.06784729659557343, 0.07214988023042679, 0.07645246386528015, 0.08075504004955292, 0.08505762368440628, 0.08936020731925964, 0.093662790954113, 0.09796537458896637, 0.10226795077323914, 0.1065705344080925, 0.11087311804294586, 0.11517570167779922, 0.11947828531265259, 0.12378086149692535, 0.12808343768119812, 0.13238602876663208, 0.13668860495090485, 0.1409911960363388, 0.14529377222061157, 0.14959636330604553, 0.1538989394903183, 0.15820151567459106, 0.16250409185886383, 0.1668066829442978, 0.17110925912857056, 0.17541185021400452, 0.17971442639827728, 0.18401700258255005, 0.188319593667984, 0.19262218475341797, 0.19692476093769073, 0.2012273520231247, 0.20552992820739746, 0.20983251929283142, 0.2141350954771042, 0.21843767166137695, 0.2227402627468109, 0.22704283893108368, 0.23134541511535645, 0.2356480062007904, 0.23995058238506317, 0.24425317347049713, 0.2485557496547699, 0.25285834074020386, 0.25716090202331543, 0.2614634931087494]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 5.0, 14.0, 11.0, 20.0, 26.0, 24.0, 30.0, 36.0, 40.0, 41.0, 47.0, 38.0, 50.0, 53.0, 60.0, 45.0, 62.0, 50.0, 60.0, 45.0, 38.0, 30.0, 28.0, 30.0, 30.0, 17.0, 11.0, 13.0, 14.0, 8.0, 2.0, 3.0, 1.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.017148256301879883, -0.016681604087352753, -0.016214951872825623, -0.015748299658298492, -0.015281647443771362, -0.014814995229244232, -0.014348343014717102, -0.013881690800189972, -0.013415038585662842, -0.012948386371135712, -0.012481734156608582, -0.012015081942081451, -0.011548429727554321, -0.011081777513027191, -0.010615125298500061, -0.010148473083972931, -0.0096818208694458, -0.00921516865491867, -0.00874851644039154, -0.00828186422586441, -0.00781521201133728, -0.00734855979681015, -0.00688190758228302, -0.00641525536775589, -0.00594860315322876, -0.00548195093870163, -0.0050152987241744995, -0.004548646509647369, -0.004081994295120239, -0.003615342080593109, -0.003148689866065979, -0.002682037651538849, -0.0022153854370117188, -0.0017487332224845886, -0.0012820810079574585, -0.0008154287934303284, -0.00034877657890319824, 0.00011787563562393188, 0.000584527850151062, 0.0010511800646781921, 0.0015178322792053223, 0.0019844844937324524, 0.0024511367082595825, 0.0029177889227867126, 0.0033844411373138428, 0.003851093351840973, 0.004317745566368103, 0.004784397780895233, 0.005251049995422363, 0.005717702209949493, 0.0061843544244766235, 0.006651006639003754, 0.007117658853530884, 0.007584311068058014, 0.008050963282585144, 0.008517615497112274, 0.008984267711639404, 0.009450919926166534, 0.009917572140693665, 0.010384224355220795, 0.010850876569747925, 0.011317528784275055, 0.011784180998802185, 0.012250833213329315, 0.012717485427856445]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 6.0, 7.0, 9.0, 9.0, 13.0, 19.0, 13.0, 14.0, 23.0, 16.0, 26.0, 25.0, 25.0, 43.0, 43.0, 40.0, 50.0, 55.0, 47.0, 50.0, 39.0, 42.0, 37.0, 48.0, 42.0, 35.0, 31.0, 26.0, 35.0, 27.0, 22.0, 10.0, 23.0, 7.0, 16.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.8203125, -4.68719482421875, -4.5540771484375, -4.42095947265625, -4.287841796875, -4.15472412109375, -4.0216064453125, -3.88848876953125, -3.75537109375, -3.62225341796875, -3.4891357421875, -3.35601806640625, -3.222900390625, -3.08978271484375, -2.9566650390625, -2.82354736328125, -2.6904296875, -2.55731201171875, -2.4241943359375, -2.29107666015625, -2.157958984375, -2.02484130859375, -1.8917236328125, -1.75860595703125, -1.62548828125, -1.49237060546875, -1.3592529296875, -1.22613525390625, -1.093017578125, -0.95989990234375, -0.8267822265625, -0.69366455078125, -0.560546875, -0.42742919921875, -0.2943115234375, -0.16119384765625, -0.028076171875, 0.10504150390625, 0.2381591796875, 0.37127685546875, 0.50439453125, 0.63751220703125, 0.7706298828125, 0.90374755859375, 1.036865234375, 1.16998291015625, 1.3031005859375, 1.43621826171875, 1.5693359375, 1.70245361328125, 1.8355712890625, 1.96868896484375, 2.101806640625, 2.23492431640625, 2.3680419921875, 2.50115966796875, 2.63427734375, 2.76739501953125, 2.9005126953125, 3.03363037109375, 3.166748046875, 3.29986572265625, 3.4329833984375, 3.56610107421875, 3.69921875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 4.0, 3.0, 2.0, 10.0, 9.0, 15.0, 26.0, 29.0, 40.0, 56.0, 82.0, 99.0, 137.0, 207.0, 282.0, 428.0, 571.0, 790.0, 1371.0, 1986.0, 3347.0, 5921.0, 11115.0, 23077.0, 53860.0, 142657.0, 383963.0, 255761.0, 89755.0, 35927.0, 16449.0, 8157.0, 4558.0, 2689.0, 1683.0, 1145.0, 698.0, 514.0, 355.0, 233.0, 160.0, 109.0, 81.0, 53.0, 40.0, 33.0, 23.0, 17.0, 9.0, 8.0, 7.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.314453125, -3.21630859375, -3.1181640625, -3.02001953125, -2.921875, -2.82373046875, -2.7255859375, -2.62744140625, -2.529296875, -2.43115234375, -2.3330078125, -2.23486328125, -2.13671875, -2.03857421875, -1.9404296875, -1.84228515625, -1.744140625, -1.64599609375, -1.5478515625, -1.44970703125, -1.3515625, -1.25341796875, -1.1552734375, -1.05712890625, -0.958984375, -0.86083984375, -0.7626953125, -0.66455078125, -0.56640625, -0.46826171875, -0.3701171875, -0.27197265625, -0.173828125, -0.07568359375, 0.0224609375, 0.12060546875, 0.21875, 0.31689453125, 0.4150390625, 0.51318359375, 0.611328125, 0.70947265625, 0.8076171875, 0.90576171875, 1.00390625, 1.10205078125, 1.2001953125, 1.29833984375, 1.396484375, 1.49462890625, 1.5927734375, 1.69091796875, 1.7890625, 1.88720703125, 1.9853515625, 2.08349609375, 2.181640625, 2.27978515625, 2.3779296875, 2.47607421875, 2.57421875, 2.67236328125, 2.7705078125, 2.86865234375, 2.966796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 6.0, 5.0, 8.0, 7.0, 14.0, 10.0, 11.0, 10.0, 7.0, 16.0, 19.0, 19.0, 25.0, 37.0, 23.0, 24.0, 32.0, 44.0, 43.0, 53.0, 81.0, 123.0, 1420.0, 391.0, 121.0, 79.0, 50.0, 45.0, 38.0, 45.0, 35.0, 28.0, 29.0, 17.0, 24.0, 30.0, 15.0, 12.0, 9.0, 6.0, 7.0, 5.0, 8.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.1328125, -13.717041015625, -13.30126953125, -12.885498046875, -12.4697265625, -12.053955078125, -11.63818359375, -11.222412109375, -10.806640625, -10.390869140625, -9.97509765625, -9.559326171875, -9.1435546875, -8.727783203125, -8.31201171875, -7.896240234375, -7.48046875, -7.064697265625, -6.64892578125, -6.233154296875, -5.8173828125, -5.401611328125, -4.98583984375, -4.570068359375, -4.154296875, -3.738525390625, -3.32275390625, -2.906982421875, -2.4912109375, -2.075439453125, -1.65966796875, -1.243896484375, -0.828125, -0.412353515625, 0.00341796875, 0.419189453125, 0.8349609375, 1.250732421875, 1.66650390625, 2.082275390625, 2.498046875, 2.913818359375, 3.32958984375, 3.745361328125, 4.1611328125, 4.576904296875, 4.99267578125, 5.408447265625, 5.82421875, 6.239990234375, 6.65576171875, 7.071533203125, 7.4873046875, 7.903076171875, 8.31884765625, 8.734619140625, 9.150390625, 9.566162109375, 9.98193359375, 10.397705078125, 10.8134765625, 11.229248046875, 11.64501953125, 12.060791015625, 12.4765625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 12.0, 10.0, 11.0, 12.0, 14.0, 29.0, 43.0, 49.0, 79.0, 113.0, 191.0, 310.0, 586.0, 1916.0, 24049.0, 3032197.0, 80946.0, 3418.0, 716.0, 339.0, 175.0, 131.0, 111.0, 64.0, 44.0, 30.0, 15.0, 19.0, 21.0, 13.0, 10.0, 7.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.945068359375, -39.82763671875, -38.710205078125, -37.5927734375, -36.475341796875, -35.35791015625, -34.240478515625, -33.123046875, -32.005615234375, -30.88818359375, -29.770751953125, -28.6533203125, -27.535888671875, -26.41845703125, -25.301025390625, -24.18359375, -23.066162109375, -21.94873046875, -20.831298828125, -19.7138671875, -18.596435546875, -17.47900390625, -16.361572265625, -15.244140625, -14.126708984375, -13.00927734375, -11.891845703125, -10.7744140625, -9.656982421875, -8.53955078125, -7.422119140625, -6.3046875, -5.187255859375, -4.06982421875, -2.952392578125, -1.8349609375, -0.717529296875, 0.39990234375, 1.517333984375, 2.634765625, 3.752197265625, 4.86962890625, 5.987060546875, 7.1044921875, 8.221923828125, 9.33935546875, 10.456787109375, 11.57421875, 12.691650390625, 13.80908203125, 14.926513671875, 16.0439453125, 17.161376953125, 18.27880859375, 19.396240234375, 20.513671875, 21.631103515625, 22.74853515625, 23.865966796875, 24.9833984375, 26.100830078125, 27.21826171875, 28.335693359375, 29.453125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [19.0, 501.0, 491.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.02536392211914, -6.010832786560059, 0.0036983489990234375, 6.018230438232422, 12.032760620117188, 18.047290802001953, 24.061824798583984, 30.07635498046875, 36.090885162353516, 42.10541534423828, 48.11994934082031, 54.13447952270508, 60.149009704589844, 66.16354370117188, 72.17807006835938, 78.1926040649414, 84.20713806152344, 90.22167205810547, 96.23619842529297, 102.250732421875, 108.2652587890625, 114.27979278564453, 120.29432678222656, 126.30885314941406, 132.32337951660156, 138.33790588378906, 144.35244750976562, 150.36697387695312, 156.38150024414062, 162.39602661132812, 168.4105682373047, 174.4250946044922, 180.43963623046875, 186.45416259765625, 192.4687042236328, 198.4832305908203, 204.4977569580078, 210.51229858398438, 216.52682495117188, 222.54135131835938, 228.55587768554688, 234.57040405273438, 240.58494567871094, 246.59947204589844, 252.61399841308594, 258.6285400390625, 264.64306640625, 270.6575927734375, 276.672119140625, 282.6866455078125, 288.701171875, 294.7156982421875, 300.7302551269531, 306.7447814941406, 312.7593078613281, 318.7738342285156, 324.78839111328125, 330.80291748046875, 336.81744384765625, 342.83197021484375, 348.8465270996094, 354.8610534667969, 360.8755798339844, 366.8901062011719, 372.9046325683594]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 7.0, 13.0, 15.0, 16.0, 20.0, 14.0, 16.0, 21.0, 32.0, 29.0, 31.0, 31.0, 27.0, 41.0, 37.0, 39.0, 48.0, 53.0, 48.0, 42.0, 43.0, 33.0, 37.0, 25.0, 37.0, 28.0, 33.0, 25.0, 14.0, 12.0, 22.0, 20.0, 17.0, 16.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.34980392456055, -38.12963104248047, -36.909454345703125, -35.68927764892578, -34.4691047668457, -33.248931884765625, -32.02875518798828, -30.80858039855957, -29.58840560913086, -28.36823081970215, -27.148056030273438, -25.927881240844727, -24.707706451416016, -23.487531661987305, -22.267356872558594, -21.047182083129883, -19.827007293701172, -18.60683250427246, -17.38665771484375, -16.16648292541504, -14.946308135986328, -13.726133346557617, -12.505958557128906, -11.285783767700195, -10.065608978271484, -8.845434188842773, -7.6252593994140625, -6.405084609985352, -5.184909820556641, -3.9647350311279297, -2.7445602416992188, -1.5243854522705078, -0.3042106628417969, 0.9159641265869141, 2.136138916015625, 3.356313705444336, 4.576488494873047, 5.796663284301758, 7.016838073730469, 8.23701286315918, 9.45718765258789, 10.677362442016602, 11.897537231445312, 13.117712020874023, 14.337886810302734, 15.558061599731445, 16.778236389160156, 17.998411178588867, 19.218585968017578, 20.43876075744629, 21.658935546875, 22.87911033630371, 24.099285125732422, 25.319459915161133, 26.539634704589844, 27.759809494018555, 28.979984283447266, 30.200159072875977, 31.420333862304688, 32.64051055908203, 33.86068344116211, 35.08085632324219, 36.30103302001953, 37.521209716796875, 38.74138259887695]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 4.0, 5.0, 6.0, 6.0, 13.0, 13.0, 13.0, 16.0, 21.0, 19.0, 16.0, 29.0, 30.0, 29.0, 35.0, 45.0, 46.0, 43.0, 47.0, 45.0, 43.0, 40.0, 55.0, 41.0, 40.0, 44.0, 20.0, 36.0, 26.0, 36.0, 28.0, 29.0, 12.0, 14.0, 17.0, 9.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.5316162109375, -4.395263671875, -4.2589111328125, -4.12255859375, -3.9862060546875, -3.849853515625, -3.7135009765625, -3.5771484375, -3.4407958984375, -3.304443359375, -3.1680908203125, -3.03173828125, -2.8953857421875, -2.759033203125, -2.6226806640625, -2.486328125, -2.3499755859375, -2.213623046875, -2.0772705078125, -1.94091796875, -1.8045654296875, -1.668212890625, -1.5318603515625, -1.3955078125, -1.2591552734375, -1.122802734375, -0.9864501953125, -0.85009765625, -0.7137451171875, -0.577392578125, -0.4410400390625, -0.3046875, -0.1683349609375, -0.031982421875, 0.1043701171875, 0.24072265625, 0.3770751953125, 0.513427734375, 0.6497802734375, 0.7861328125, 0.9224853515625, 1.058837890625, 1.1951904296875, 1.33154296875, 1.4678955078125, 1.604248046875, 1.7406005859375, 1.876953125, 2.0133056640625, 2.149658203125, 2.2860107421875, 2.42236328125, 2.5587158203125, 2.695068359375, 2.8314208984375, 2.9677734375, 3.1041259765625, 3.240478515625, 3.3768310546875, 3.51318359375, 3.6495361328125, 3.785888671875, 3.9222412109375, 4.05859375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 3.0, 5.0, 6.0, 6.0, 5.0, 11.0, 12.0, 20.0, 27.0, 32.0, 29.0, 47.0, 54.0, 102.0, 152.0, 378.0, 1282.0, 5877.0, 36845.0, 418726.0, 3236820.0, 447720.0, 38117.0, 5819.0, 1288.0, 398.0, 154.0, 85.0, 69.0, 45.0, 31.0, 29.0, 18.0, 12.0, 13.0, 10.0, 9.0, 7.0, 5.0, 5.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.96875, -15.4921875, -15.015625, -14.5390625, -14.0625, -13.5859375, -13.109375, -12.6328125, -12.15625, -11.6796875, -11.203125, -10.7265625, -10.25, -9.7734375, -9.296875, -8.8203125, -8.34375, -7.8671875, -7.390625, -6.9140625, -6.4375, -5.9609375, -5.484375, -5.0078125, -4.53125, -4.0546875, -3.578125, -3.1015625, -2.625, -2.1484375, -1.671875, -1.1953125, -0.71875, -0.2421875, 0.234375, 0.7109375, 1.1875, 1.6640625, 2.140625, 2.6171875, 3.09375, 3.5703125, 4.046875, 4.5234375, 5.0, 5.4765625, 5.953125, 6.4296875, 6.90625, 7.3828125, 7.859375, 8.3359375, 8.8125, 9.2890625, 9.765625, 10.2421875, 10.71875, 11.1953125, 11.671875, 12.1484375, 12.625, 13.1015625, 13.578125, 14.0546875, 14.53125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 9.0, 14.0, 17.0, 21.0, 29.0, 35.0, 66.0, 81.0, 137.0, 164.0, 222.0, 311.0, 461.0, 505.0, 509.0, 420.0, 317.0, 227.0, 162.0, 118.0, 72.0, 50.0, 39.0, 15.0, 18.0, 19.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-12.9921875, -12.6392822265625, -12.286376953125, -11.9334716796875, -11.58056640625, -11.2276611328125, -10.874755859375, -10.5218505859375, -10.1689453125, -9.8160400390625, -9.463134765625, -9.1102294921875, -8.75732421875, -8.4044189453125, -8.051513671875, -7.6986083984375, -7.345703125, -6.9927978515625, -6.639892578125, -6.2869873046875, -5.93408203125, -5.5811767578125, -5.228271484375, -4.8753662109375, -4.5224609375, -4.1695556640625, -3.816650390625, -3.4637451171875, -3.11083984375, -2.7579345703125, -2.405029296875, -2.0521240234375, -1.69921875, -1.3463134765625, -0.993408203125, -0.6405029296875, -0.28759765625, 0.0653076171875, 0.418212890625, 0.7711181640625, 1.1240234375, 1.4769287109375, 1.829833984375, 2.1827392578125, 2.53564453125, 2.8885498046875, 3.241455078125, 3.5943603515625, 3.947265625, 4.3001708984375, 4.653076171875, 5.0059814453125, 5.35888671875, 5.7117919921875, 6.064697265625, 6.4176025390625, 6.7705078125, 7.1234130859375, 7.476318359375, 7.8292236328125, 8.18212890625, 8.5350341796875, 8.887939453125, 9.2408447265625, 9.59375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 13.0, 19.0, 29.0, 23.0, 43.0, 66.0, 120.0, 210.0, 418.0, 888.0, 3205.0, 25794.0, 552711.0, 3402139.0, 193097.0, 12001.0, 1981.0, 700.0, 331.0, 155.0, 116.0, 69.0, 43.0, 35.0, 23.0, 17.0, 14.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.953125, -26.03466796875, -25.1162109375, -24.19775390625, -23.279296875, -22.36083984375, -21.4423828125, -20.52392578125, -19.60546875, -18.68701171875, -17.7685546875, -16.85009765625, -15.931640625, -15.01318359375, -14.0947265625, -13.17626953125, -12.2578125, -11.33935546875, -10.4208984375, -9.50244140625, -8.583984375, -7.66552734375, -6.7470703125, -5.82861328125, -4.91015625, -3.99169921875, -3.0732421875, -2.15478515625, -1.236328125, -0.31787109375, 0.6005859375, 1.51904296875, 2.4375, 3.35595703125, 4.2744140625, 5.19287109375, 6.111328125, 7.02978515625, 7.9482421875, 8.86669921875, 9.78515625, 10.70361328125, 11.6220703125, 12.54052734375, 13.458984375, 14.37744140625, 15.2958984375, 16.21435546875, 17.1328125, 18.05126953125, 18.9697265625, 19.88818359375, 20.806640625, 21.72509765625, 22.6435546875, 23.56201171875, 24.48046875, 25.39892578125, 26.3173828125, 27.23583984375, 28.154296875, 29.07275390625, 29.9912109375, 30.90966796875, 31.828125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 4.0, 9.0, 11.0, 18.0, 17.0, 30.0, 39.0, 28.0, 46.0, 78.0, 68.0, 72.0, 94.0, 89.0, 77.0, 77.0, 59.0, 56.0, 31.0, 35.0, 22.0, 12.0, 17.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-64.56389617919922, -63.1259651184082, -61.68803787231445, -60.25010681152344, -58.81217956542969, -57.37424850463867, -55.936317443847656, -54.498390197753906, -53.06045913696289, -51.622528076171875, -50.184600830078125, -48.74666976928711, -47.308738708496094, -45.870811462402344, -44.43288040161133, -42.99494934082031, -41.55702209472656, -40.11909103393555, -38.6811637878418, -37.24323272705078, -35.80530548095703, -34.367374420166016, -32.929443359375, -31.491514205932617, -30.053585052490234, -28.61565589904785, -27.17772674560547, -25.739795684814453, -24.30186653137207, -22.863937377929688, -21.426006317138672, -19.98807716369629, -18.550151824951172, -17.11222267150879, -15.67429256439209, -14.23636245727539, -12.798433303833008, -11.360504150390625, -9.922574043273926, -8.484643936157227, -7.046714782714844, -5.608785152435303, -4.170855522155762, -2.7329258918762207, -1.2949962615966797, 0.14293336868286133, 1.5808629989624023, 3.0187931060791016, 4.456722259521484, 5.894651889801025, 7.332581520080566, 8.770511627197266, 10.208440780639648, 11.646369934082031, 13.08430004119873, 14.52223014831543, 15.960159301757812, 17.398088455200195, 18.836017608642578, 20.273948669433594, 21.711877822875977, 23.14980697631836, 24.587738037109375, 26.025667190551758, 27.46359634399414]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 9.0, 5.0, 4.0, 7.0, 6.0, 5.0, 10.0, 8.0, 16.0, 17.0, 20.0, 13.0, 19.0, 28.0, 22.0, 32.0, 25.0, 36.0, 39.0, 33.0, 40.0, 37.0, 38.0, 38.0, 29.0, 46.0, 40.0, 27.0, 42.0, 38.0, 27.0, 38.0, 25.0, 29.0, 33.0, 19.0, 10.0, 17.0, 13.0, 10.0, 13.0, 12.0, 9.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-28.962432861328125, -28.05179786682129, -27.14116096496582, -26.230525970458984, -25.319889068603516, -24.40925407409668, -23.498619079589844, -22.587982177734375, -21.677345275878906, -20.76671028137207, -19.8560733795166, -18.945438385009766, -18.034801483154297, -17.12416648864746, -16.213531494140625, -15.302894592285156, -14.39225959777832, -13.481623649597168, -12.570987701416016, -11.66035270690918, -10.749715805053711, -9.839080810546875, -8.928444862365723, -8.01780891418457, -7.107172966003418, -6.196537017822266, -5.285901069641113, -4.375265598297119, -3.464629650115967, -2.5539937019348145, -1.6433582305908203, -0.732722282409668, 0.17791366577148438, 1.0885494947433472, 1.99918532371521, 2.909821033477783, 3.8204569816589355, 4.731092929840088, 5.641728401184082, 6.552364349365234, 7.463000297546387, 8.373636245727539, 9.284272193908691, 10.194908142089844, 11.10554313659668, 12.016180038452148, 12.926815032958984, 13.837450981140137, 14.748086929321289, 15.658722877502441, 16.569358825683594, 17.47999382019043, 18.3906307220459, 19.301265716552734, 20.211902618408203, 21.12253761291504, 22.033172607421875, 22.94380760192871, 23.85444450378418, 24.765079498291016, 25.675716400146484, 26.58635139465332, 27.496986389160156, 28.407623291015625, 29.318260192871094]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 3.0, 4.0, 11.0, 7.0, 8.0, 12.0, 10.0, 15.0, 13.0, 18.0, 29.0, 25.0, 24.0, 33.0, 33.0, 31.0, 40.0, 34.0, 42.0, 44.0, 44.0, 42.0, 47.0, 38.0, 43.0, 36.0, 29.0, 38.0, 32.0, 35.0, 27.0, 19.0, 20.0, 32.0, 14.0, 20.0, 16.0, 13.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.265625, -4.13348388671875, -4.0013427734375, -3.86920166015625, -3.737060546875, -3.60491943359375, -3.4727783203125, -3.34063720703125, -3.20849609375, -3.07635498046875, -2.9442138671875, -2.81207275390625, -2.679931640625, -2.54779052734375, -2.4156494140625, -2.28350830078125, -2.1513671875, -2.01922607421875, -1.8870849609375, -1.75494384765625, -1.622802734375, -1.49066162109375, -1.3585205078125, -1.22637939453125, -1.09423828125, -0.96209716796875, -0.8299560546875, -0.69781494140625, -0.565673828125, -0.43353271484375, -0.3013916015625, -0.16925048828125, -0.037109375, 0.09503173828125, 0.2271728515625, 0.35931396484375, 0.491455078125, 0.62359619140625, 0.7557373046875, 0.88787841796875, 1.02001953125, 1.15216064453125, 1.2843017578125, 1.41644287109375, 1.548583984375, 1.68072509765625, 1.8128662109375, 1.94500732421875, 2.0771484375, 2.20928955078125, 2.3414306640625, 2.47357177734375, 2.605712890625, 2.73785400390625, 2.8699951171875, 3.00213623046875, 3.13427734375, 3.26641845703125, 3.3985595703125, 3.53070068359375, 3.662841796875, 3.79498291015625, 3.9271240234375, 4.05926513671875, 4.19140625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 6.0, 7.0, 10.0, 15.0, 25.0, 31.0, 37.0, 70.0, 84.0, 112.0, 192.0, 272.0, 376.0, 488.0, 740.0, 1025.0, 1553.0, 2318.0, 3352.0, 4849.0, 6980.0, 10320.0, 14538.0, 21596.0, 32189.0, 49091.0, 78578.0, 131487.0, 198249.0, 180106.0, 110888.0, 67408.0, 42961.0, 28027.0, 18757.0, 13094.0, 8901.0, 6206.0, 4257.0, 2772.0, 2025.0, 1398.0, 943.0, 664.0, 484.0, 331.0, 236.0, 140.0, 123.0, 73.0, 55.0, 31.0, 34.0, 23.0, 13.0, 9.0, 7.0, 4.0, 2.0, 0.0, 4.0], "bins": [-0.354248046875, -0.3431205749511719, -0.33199310302734375, -0.3208656311035156, -0.3097381591796875, -0.2986106872558594, -0.28748321533203125, -0.2763557434082031, -0.265228271484375, -0.2541007995605469, -0.24297332763671875, -0.23184585571289062, -0.2207183837890625, -0.20959091186523438, -0.19846343994140625, -0.18733596801757812, -0.17620849609375, -0.16508102416992188, -0.15395355224609375, -0.14282608032226562, -0.1316986083984375, -0.12057113647460938, -0.10944366455078125, -0.09831619262695312, -0.087188720703125, -0.07606124877929688, -0.06493377685546875, -0.053806304931640625, -0.0426788330078125, -0.031551361083984375, -0.02042388916015625, -0.009296417236328125, 0.0018310546875, 0.012958526611328125, 0.02408599853515625, 0.035213470458984375, 0.0463409423828125, 0.057468414306640625, 0.06859588623046875, 0.07972335815429688, 0.090850830078125, 0.10197830200195312, 0.11310577392578125, 0.12423324584960938, 0.1353607177734375, 0.14648818969726562, 0.15761566162109375, 0.16874313354492188, 0.17987060546875, 0.19099807739257812, 0.20212554931640625, 0.21325302124023438, 0.2243804931640625, 0.23550796508789062, 0.24663543701171875, 0.2577629089355469, 0.268890380859375, 0.2800178527832031, 0.29114532470703125, 0.3022727966308594, 0.3134002685546875, 0.3245277404785156, 0.33565521240234375, 0.3467826843261719, 0.35791015625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 9.0, 7.0, 3.0, 11.0, 13.0, 18.0, 24.0, 15.0, 28.0, 16.0, 23.0, 21.0, 27.0, 40.0, 34.0, 28.0, 46.0, 38.0, 44.0, 27.0, 1067.0, 47.0, 33.0, 37.0, 33.0, 36.0, 44.0, 25.0, 27.0, 29.0, 26.0, 21.0, 21.0, 17.0, 11.0, 13.0, 10.0, 11.0, 7.0, 7.0, 10.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.724609375, -2.645355224609375, -2.56610107421875, -2.486846923828125, -2.4075927734375, -2.328338623046875, -2.24908447265625, -2.169830322265625, -2.090576171875, -2.011322021484375, -1.93206787109375, -1.852813720703125, -1.7735595703125, -1.694305419921875, -1.61505126953125, -1.535797119140625, -1.45654296875, -1.377288818359375, -1.29803466796875, -1.218780517578125, -1.1395263671875, -1.060272216796875, -0.98101806640625, -0.901763916015625, -0.822509765625, -0.743255615234375, -0.66400146484375, -0.584747314453125, -0.5054931640625, -0.426239013671875, -0.34698486328125, -0.267730712890625, -0.1884765625, -0.109222412109375, -0.02996826171875, 0.049285888671875, 0.1285400390625, 0.207794189453125, 0.28704833984375, 0.366302490234375, 0.445556640625, 0.524810791015625, 0.60406494140625, 0.683319091796875, 0.7625732421875, 0.841827392578125, 0.92108154296875, 1.000335693359375, 1.07958984375, 1.158843994140625, 1.23809814453125, 1.317352294921875, 1.3966064453125, 1.475860595703125, 1.55511474609375, 1.634368896484375, 1.713623046875, 1.792877197265625, 1.87213134765625, 1.951385498046875, 2.0306396484375, 2.109893798828125, 2.18914794921875, 2.268402099609375, 2.34765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 12.0, 11.0, 22.0, 11.0, 22.0, 27.0, 56.0, 68.0, 97.0, 158.0, 219.0, 345.0, 529.0, 827.0, 1348.0, 2241.0, 3645.0, 5880.0, 10001.0, 16575.0, 28317.0, 48186.0, 83791.0, 140390.0, 1200773.0, 243038.0, 127551.0, 75514.0, 43470.0, 25743.0, 14965.0, 8970.0, 5557.0, 3299.0, 2024.0, 1225.0, 762.0, 458.0, 313.0, 231.0, 133.0, 108.0, 62.0, 34.0, 43.0, 21.0, 17.0, 11.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.229736328125, -0.2223033905029297, -0.21487045288085938, -0.20743751525878906, -0.20000457763671875, -0.19257164001464844, -0.18513870239257812, -0.1777057647705078, -0.1702728271484375, -0.1628398895263672, -0.15540695190429688, -0.14797401428222656, -0.14054107666015625, -0.13310813903808594, -0.12567520141601562, -0.11824226379394531, -0.110809326171875, -0.10337638854980469, -0.09594345092773438, -0.08851051330566406, -0.08107757568359375, -0.07364463806152344, -0.06621170043945312, -0.05877876281738281, -0.0513458251953125, -0.04391288757324219, -0.036479949951171875, -0.029047012329101562, -0.02161407470703125, -0.014181137084960938, -0.006748199462890625, 0.0006847381591796875, 0.00811767578125, 0.015550613403320312, 0.022983551025390625, 0.030416488647460938, 0.03784942626953125, 0.04528236389160156, 0.052715301513671875, 0.06014823913574219, 0.0675811767578125, 0.07501411437988281, 0.08244705200195312, 0.08987998962402344, 0.09731292724609375, 0.10474586486816406, 0.11217880249023438, 0.11961174011230469, 0.127044677734375, 0.1344776153564453, 0.14191055297851562, 0.14934349060058594, 0.15677642822265625, 0.16420936584472656, 0.17164230346679688, 0.1790752410888672, 0.1865081787109375, 0.1939411163330078, 0.20137405395507812, 0.20880699157714844, 0.21623992919921875, 0.22367286682128906, 0.23110580444335938, 0.2385387420654297, 0.2459716796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 3.0, 5.0, 8.0, 8.0, 5.0, 18.0, 29.0, 20.0, 36.0, 37.0, 36.0, 65.0, 72.0, 76.0, 75.0, 85.0, 70.0, 63.0, 68.0, 44.0, 36.0, 37.0, 21.0, 21.0, 10.0, 14.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00603485107421875, -0.005817413330078125, -0.0055999755859375, -0.005382537841796875, -0.00516510009765625, -0.004947662353515625, -0.004730224609375, -0.004512786865234375, -0.00429534912109375, -0.004077911376953125, -0.0038604736328125, -0.003643035888671875, -0.00342559814453125, -0.003208160400390625, -0.00299072265625, -0.002773284912109375, -0.00255584716796875, -0.002338409423828125, -0.0021209716796875, -0.001903533935546875, -0.00168609619140625, -0.001468658447265625, -0.001251220703125, -0.001033782958984375, -0.00081634521484375, -0.000598907470703125, -0.0003814697265625, -0.000164031982421875, 5.340576171875e-05, 0.000270843505859375, 0.00048828125, 0.000705718994140625, 0.00092315673828125, 0.001140594482421875, 0.0013580322265625, 0.001575469970703125, 0.00179290771484375, 0.002010345458984375, 0.002227783203125, 0.002445220947265625, 0.00266265869140625, 0.002880096435546875, 0.0030975341796875, 0.003314971923828125, 0.00353240966796875, 0.003749847412109375, 0.00396728515625, 0.004184722900390625, 0.00440216064453125, 0.004619598388671875, 0.0048370361328125, 0.005054473876953125, 0.00527191162109375, 0.005489349365234375, 0.005706787109375, 0.005924224853515625, 0.00614166259765625, 0.006359100341796875, 0.0065765380859375, 0.006793975830078125, 0.00701141357421875, 0.007228851318359375, 0.0074462890625, 0.007663726806640625, 0.00788116455078125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 4.0, 10.0, 15.0, 17.0, 22.0, 24.0, 56.0, 71.0, 121.0, 145.0, 270.0, 470.0, 1651.0, 26314.0, 977278.0, 38743.0, 2027.0, 532.0, 262.0, 144.0, 102.0, 71.0, 51.0, 31.0, 26.0, 24.0, 15.0, 14.0, 9.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.12646484375, -0.1231842041015625, -0.119903564453125, -0.1166229248046875, -0.11334228515625, -0.1100616455078125, -0.106781005859375, -0.1035003662109375, -0.1002197265625, -0.0969390869140625, -0.093658447265625, -0.0903778076171875, -0.08709716796875, -0.0838165283203125, -0.080535888671875, -0.0772552490234375, -0.073974609375, -0.0706939697265625, -0.067413330078125, -0.0641326904296875, -0.06085205078125, -0.0575714111328125, -0.054290771484375, -0.0510101318359375, -0.0477294921875, -0.0444488525390625, -0.041168212890625, -0.0378875732421875, -0.03460693359375, -0.0313262939453125, -0.028045654296875, -0.0247650146484375, -0.021484375, -0.0182037353515625, -0.014923095703125, -0.0116424560546875, -0.00836181640625, -0.0050811767578125, -0.001800537109375, 0.0014801025390625, 0.0047607421875, 0.0080413818359375, 0.011322021484375, 0.0146026611328125, 0.01788330078125, 0.0211639404296875, 0.024444580078125, 0.0277252197265625, 0.031005859375, 0.0342864990234375, 0.037567138671875, 0.0408477783203125, 0.04412841796875, 0.0474090576171875, 0.050689697265625, 0.0539703369140625, 0.0572509765625, 0.0605316162109375, 0.063812255859375, 0.0670928955078125, 0.07037353515625, 0.0736541748046875, 0.076934814453125, 0.0802154541015625, 0.08349609375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 27.0, 503.0, 452.0, 26.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015099737793207169, -0.012585761956870556, -0.010071786120533943, -0.007557809352874756, -0.005043833516538143, -0.0025298576802015305, -1.588091254234314e-05, 0.002498093992471695, 0.005012070760130882, 0.007526046596467495, 0.010040022432804108, 0.012553999200463295, 0.015067975036799908, 0.01758195087313652, 0.020095927640795708, 0.022609902545809746, 0.025123879313468933, 0.02763785608112812, 0.03015183098614216, 0.032665807753801346, 0.035179782658815384, 0.03769376128911972, 0.04020773619413376, 0.0427217110991478, 0.045235686004161835, 0.04774966090917587, 0.05026363953948021, 0.05277761444449425, 0.055291589349508286, 0.05780556797981262, 0.06031954288482666, 0.0628335177898407, 0.06534750014543533, 0.06786147505044937, 0.07037544995546341, 0.07288943231105804, 0.07540340721607208, 0.07791738212108612, 0.08043135702610016, 0.0829453319311142, 0.08545930683612823, 0.08797328174114227, 0.09048725664615631, 0.09300123155117035, 0.09551521390676498, 0.09802918881177902, 0.10054316371679306, 0.1030571386218071, 0.10557112097740173, 0.10808509588241577, 0.11059907078742981, 0.11311304569244385, 0.11562702804803848, 0.11814100295305252, 0.12065497785806656, 0.1231689527630806, 0.12568292021751404, 0.12819689512252808, 0.13071087002754211, 0.13322484493255615, 0.1357388198375702, 0.13825279474258423, 0.14076676964759827, 0.1432807445526123, 0.14579473435878754]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 5.0, 9.0, 7.0, 7.0, 15.0, 10.0, 23.0, 23.0, 24.0, 35.0, 20.0, 44.0, 31.0, 34.0, 38.0, 33.0, 45.0, 37.0, 52.0, 48.0, 42.0, 42.0, 37.0, 52.0, 33.0, 24.0, 33.0, 23.0, 31.0, 26.0, 22.0, 23.0, 18.0, 11.0, 12.0, 11.0, 6.0, 1.0, 8.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00953984260559082, -0.009259789250791073, -0.008979735895991325, -0.008699682541191578, -0.00841962918639183, -0.008139575831592083, -0.007859522476792336, -0.007579469121992588, -0.007299415767192841, -0.007019362412393093, -0.006739309057593346, -0.006459255702793598, -0.006179202347993851, -0.005899148993194103, -0.005619095638394356, -0.005339042283594608, -0.005058988928794861, -0.004778935573995113, -0.004498882219195366, -0.0042188288643956184, -0.003938775509595871, -0.0036587221547961235, -0.003378668799996376, -0.0030986154451966286, -0.002818562090396881, -0.0025385087355971336, -0.002258455380797386, -0.0019784020259976387, -0.0016983486711978912, -0.0014182953163981438, -0.0011382419615983963, -0.0008581886067986488, -0.0005781352519989014, -0.0002980818971991539, -1.8028542399406433e-05, 0.00026202481240034103, 0.0005420781672000885, 0.000822131521999836, 0.0011021848767995834, 0.001382238231599331, 0.0016622915863990784, 0.0019423449411988258, 0.0022223982959985733, 0.0025024516507983208, 0.0027825050055980682, 0.0030625583603978157, 0.003342611715197563, 0.0036226650699973106, 0.003902718424797058, 0.004182771779596806, 0.004462825134396553, 0.0047428784891963005, 0.005022931843996048, 0.0053029851987957954, 0.005583038553595543, 0.00586309190839529, 0.006143145263195038, 0.006423198617994785, 0.006703251972794533, 0.00698330532759428, 0.007263358682394028, 0.007543412037193775, 0.007823465391993523, 0.00810351874679327, 0.008383572101593018]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 3.0, 5.0, 11.0, 6.0, 8.0, 12.0, 10.0, 16.0, 12.0, 19.0, 28.0, 25.0, 25.0, 33.0, 32.0, 31.0, 40.0, 36.0, 40.0, 45.0, 45.0, 41.0, 46.0, 38.0, 46.0, 33.0, 31.0, 36.0, 32.0, 36.0, 27.0, 18.0, 20.0, 32.0, 14.0, 20.0, 16.0, 13.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.129638671875, -3.99755859375, -3.865478515625, -3.7333984375, -3.601318359375, -3.46923828125, -3.337158203125, -3.205078125, -3.072998046875, -2.94091796875, -2.808837890625, -2.6767578125, -2.544677734375, -2.41259765625, -2.280517578125, -2.1484375, -2.016357421875, -1.88427734375, -1.752197265625, -1.6201171875, -1.488037109375, -1.35595703125, -1.223876953125, -1.091796875, -0.959716796875, -0.82763671875, -0.695556640625, -0.5634765625, -0.431396484375, -0.29931640625, -0.167236328125, -0.03515625, 0.096923828125, 0.22900390625, 0.361083984375, 0.4931640625, 0.625244140625, 0.75732421875, 0.889404296875, 1.021484375, 1.153564453125, 1.28564453125, 1.417724609375, 1.5498046875, 1.681884765625, 1.81396484375, 1.946044921875, 2.078125, 2.210205078125, 2.34228515625, 2.474365234375, 2.6064453125, 2.738525390625, 2.87060546875, 3.002685546875, 3.134765625, 3.266845703125, 3.39892578125, 3.531005859375, 3.6630859375, 3.795166015625, 3.92724609375, 4.059326171875, 4.19140625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 10.0, 13.0, 19.0, 41.0, 42.0, 66.0, 85.0, 159.0, 201.0, 320.0, 507.0, 861.0, 1308.0, 2062.0, 3238.0, 5586.0, 9373.0, 15831.0, 28875.0, 54207.0, 112145.0, 301497.0, 284770.0, 107912.0, 52737.0, 27924.0, 15761.0, 8941.0, 5364.0, 3282.0, 1967.0, 1230.0, 757.0, 493.0, 352.0, 206.0, 136.0, 96.0, 56.0, 47.0, 20.0, 12.0, 19.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.005859375, -2.90557861328125, -2.8052978515625, -2.70501708984375, -2.604736328125, -2.50445556640625, -2.4041748046875, -2.30389404296875, -2.20361328125, -2.10333251953125, -2.0030517578125, -1.90277099609375, -1.802490234375, -1.70220947265625, -1.6019287109375, -1.50164794921875, -1.4013671875, -1.30108642578125, -1.2008056640625, -1.10052490234375, -1.000244140625, -0.89996337890625, -0.7996826171875, -0.69940185546875, -0.59912109375, -0.49884033203125, -0.3985595703125, -0.29827880859375, -0.197998046875, -0.09771728515625, 0.0025634765625, 0.10284423828125, 0.203125, 0.30340576171875, 0.4036865234375, 0.50396728515625, 0.604248046875, 0.70452880859375, 0.8048095703125, 0.90509033203125, 1.00537109375, 1.10565185546875, 1.2059326171875, 1.30621337890625, 1.406494140625, 1.50677490234375, 1.6070556640625, 1.70733642578125, 1.8076171875, 1.90789794921875, 2.0081787109375, 2.10845947265625, 2.208740234375, 2.30902099609375, 2.4093017578125, 2.50958251953125, 2.60986328125, 2.71014404296875, 2.8104248046875, 2.91070556640625, 3.010986328125, 3.11126708984375, 3.2115478515625, 3.31182861328125, 3.412109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 13.0, 10.0, 12.0, 7.0, 16.0, 26.0, 20.0, 19.0, 25.0, 29.0, 35.0, 36.0, 29.0, 42.0, 47.0, 87.0, 181.0, 1464.0, 316.0, 125.0, 71.0, 43.0, 39.0, 43.0, 45.0, 34.0, 29.0, 30.0, 20.0, 22.0, 28.0, 12.0, 13.0, 9.0, 8.0, 7.0, 8.0, 6.0, 4.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8203125, -14.3681640625, -13.916015625, -13.4638671875, -13.01171875, -12.5595703125, -12.107421875, -11.6552734375, -11.203125, -10.7509765625, -10.298828125, -9.8466796875, -9.39453125, -8.9423828125, -8.490234375, -8.0380859375, -7.5859375, -7.1337890625, -6.681640625, -6.2294921875, -5.77734375, -5.3251953125, -4.873046875, -4.4208984375, -3.96875, -3.5166015625, -3.064453125, -2.6123046875, -2.16015625, -1.7080078125, -1.255859375, -0.8037109375, -0.3515625, 0.1005859375, 0.552734375, 1.0048828125, 1.45703125, 1.9091796875, 2.361328125, 2.8134765625, 3.265625, 3.7177734375, 4.169921875, 4.6220703125, 5.07421875, 5.5263671875, 5.978515625, 6.4306640625, 6.8828125, 7.3349609375, 7.787109375, 8.2392578125, 8.69140625, 9.1435546875, 9.595703125, 10.0478515625, 10.5, 10.9521484375, 11.404296875, 11.8564453125, 12.30859375, 12.7607421875, 13.212890625, 13.6650390625, 14.1171875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 9.0, 17.0, 21.0, 22.0, 29.0, 45.0, 60.0, 107.0, 163.0, 237.0, 395.0, 992.0, 11946.0, 3021730.0, 106401.0, 2118.0, 557.0, 296.0, 199.0, 120.0, 63.0, 49.0, 27.0, 31.0, 17.0, 12.0, 12.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.59375, -40.23974609375, -38.8857421875, -37.53173828125, -36.177734375, -34.82373046875, -33.4697265625, -32.11572265625, -30.76171875, -29.40771484375, -28.0537109375, -26.69970703125, -25.345703125, -23.99169921875, -22.6376953125, -21.28369140625, -19.9296875, -18.57568359375, -17.2216796875, -15.86767578125, -14.513671875, -13.15966796875, -11.8056640625, -10.45166015625, -9.09765625, -7.74365234375, -6.3896484375, -5.03564453125, -3.681640625, -2.32763671875, -0.9736328125, 0.38037109375, 1.734375, 3.08837890625, 4.4423828125, 5.79638671875, 7.150390625, 8.50439453125, 9.8583984375, 11.21240234375, 12.56640625, 13.92041015625, 15.2744140625, 16.62841796875, 17.982421875, 19.33642578125, 20.6904296875, 22.04443359375, 23.3984375, 24.75244140625, 26.1064453125, 27.46044921875, 28.814453125, 30.16845703125, 31.5224609375, 32.87646484375, 34.23046875, 35.58447265625, 36.9384765625, 38.29248046875, 39.646484375, 41.00048828125, 42.3544921875, 43.70849609375, 45.0625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 12.0, 16.0, 30.0, 88.0, 116.0, 136.0, 169.0, 150.0, 110.0, 90.0, 51.0, 20.0, 12.0, 5.0, 2.0, 0.0, 1.0], "bins": [-56.37644958496094, -55.32145309448242, -54.26646041870117, -53.211463928222656, -52.156471252441406, -51.10147476196289, -50.046478271484375, -48.991485595703125, -47.93648910522461, -46.881492614746094, -45.826499938964844, -44.77150344848633, -43.71650695800781, -42.66151428222656, -41.60651779174805, -40.5515251159668, -39.49652862548828, -38.441532135009766, -37.386539459228516, -36.33154296875, -35.27655029296875, -34.221553802490234, -33.16655731201172, -32.11156463623047, -31.056568145751953, -30.00157356262207, -28.946578979492188, -27.891582489013672, -26.83658790588379, -25.781593322753906, -24.72659683227539, -23.671602249145508, -22.616607666015625, -21.561613082885742, -20.50661849975586, -19.451622009277344, -18.39662742614746, -17.341632843017578, -16.286636352539062, -15.23164176940918, -14.176648139953613, -13.121652603149414, -12.066658020019531, -11.011663436889648, -9.95666790008545, -8.90167236328125, -7.846677780151367, -6.791682720184326, -5.736687660217285, -4.681692600250244, -3.626697540283203, -2.571702480316162, -1.516707420349121, -0.4617123603820801, 0.5932826995849609, 1.648277759552002, 2.703272819519043, 3.758267879486084, 4.813262939453125, 5.868257999420166, 6.923253059387207, 7.978248119354248, 9.033243179321289, 10.088237762451172, 11.143233299255371]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 9.0, 7.0, 7.0, 10.0, 19.0, 24.0, 22.0, 20.0, 29.0, 29.0, 35.0, 18.0, 35.0, 54.0, 46.0, 32.0, 58.0, 55.0, 42.0, 42.0, 51.0, 41.0, 44.0, 39.0, 30.0, 24.0, 29.0, 20.0, 24.0, 12.0, 20.0, 12.0, 15.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.029823303222656, -45.411128997802734, -43.79243469238281, -42.173744201660156, -40.555049896240234, -38.93635559082031, -37.31766128540039, -35.69896697998047, -34.08027648925781, -32.46158218383789, -30.8428897857666, -29.22419548034668, -27.60550308227539, -25.98680877685547, -24.368114471435547, -22.749420166015625, -21.130725860595703, -19.51203155517578, -17.893339157104492, -16.27464485168457, -14.655951499938965, -13.03725814819336, -11.418563842773438, -9.799870491027832, -8.181177139282227, -6.562483787536621, -4.943789958953857, -3.3250961303710938, -1.7064027786254883, -0.08770942687988281, 1.530984878540039, 3.1496782302856445, 4.768375396728516, 6.387068748474121, 8.005762100219727, 9.624456405639648, 11.243149757385254, 12.86184310913086, 14.480537414550781, 16.099231719970703, 17.717924118041992, 19.336618423461914, 20.955310821533203, 22.574005126953125, 24.192699432373047, 25.811391830444336, 27.430086135864258, 29.048778533935547, 30.66747283935547, 32.28616714477539, 33.90486145019531, 35.52355194091797, 37.14224624633789, 38.76094055175781, 40.379634857177734, 41.998329162597656, 43.61701965332031, 45.235713958740234, 46.854408264160156, 48.47309875488281, 50.091793060302734, 51.710487365722656, 53.32918167114258, 54.9478759765625, 56.56657028198242]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 5.0, 6.0, 7.0, 9.0, 11.0, 10.0, 21.0, 10.0, 17.0, 24.0, 29.0, 34.0, 26.0, 30.0, 33.0, 41.0, 29.0, 38.0, 54.0, 36.0, 40.0, 46.0, 38.0, 38.0, 41.0, 49.0, 29.0, 34.0, 28.0, 24.0, 24.0, 22.0, 21.0, 23.0, 24.0, 10.0, 11.0, 9.0, 2.0, 4.0, 1.0, 7.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.18646240234375, -4.0487060546875, -3.91094970703125, -3.773193359375, -3.63543701171875, -3.4976806640625, -3.35992431640625, -3.22216796875, -3.08441162109375, -2.9466552734375, -2.80889892578125, -2.671142578125, -2.53338623046875, -2.3956298828125, -2.25787353515625, -2.1201171875, -1.98236083984375, -1.8446044921875, -1.70684814453125, -1.569091796875, -1.43133544921875, -1.2935791015625, -1.15582275390625, -1.01806640625, -0.88031005859375, -0.7425537109375, -0.60479736328125, -0.467041015625, -0.32928466796875, -0.1915283203125, -0.05377197265625, 0.083984375, 0.22174072265625, 0.3594970703125, 0.49725341796875, 0.635009765625, 0.77276611328125, 0.9105224609375, 1.04827880859375, 1.18603515625, 1.32379150390625, 1.4615478515625, 1.59930419921875, 1.737060546875, 1.87481689453125, 2.0125732421875, 2.15032958984375, 2.2880859375, 2.42584228515625, 2.5635986328125, 2.70135498046875, 2.839111328125, 2.97686767578125, 3.1146240234375, 3.25238037109375, 3.39013671875, 3.52789306640625, 3.6656494140625, 3.80340576171875, 3.941162109375, 4.07891845703125, 4.2166748046875, 4.35443115234375, 4.4921875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 6.0, 4.0, 7.0, 7.0, 7.0, 8.0, 16.0, 18.0, 21.0, 32.0, 41.0, 45.0, 78.0, 107.0, 140.0, 211.0, 342.0, 554.0, 871.0, 1648.0, 2988.0, 5336.0, 10611.0, 21523.0, 46161.0, 108253.0, 287733.0, 841265.0, 1461887.0, 882009.0, 312735.0, 114376.0, 48730.0, 22610.0, 11111.0, 5683.0, 2971.0, 1619.0, 896.0, 569.0, 347.0, 205.0, 143.0, 88.0, 67.0, 52.0, 36.0, 33.0, 27.0, 16.0, 12.0, 10.0, 11.0, 7.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.25, -5.08349609375, -4.9169921875, -4.75048828125, -4.583984375, -4.41748046875, -4.2509765625, -4.08447265625, -3.91796875, -3.75146484375, -3.5849609375, -3.41845703125, -3.251953125, -3.08544921875, -2.9189453125, -2.75244140625, -2.5859375, -2.41943359375, -2.2529296875, -2.08642578125, -1.919921875, -1.75341796875, -1.5869140625, -1.42041015625, -1.25390625, -1.08740234375, -0.9208984375, -0.75439453125, -0.587890625, -0.42138671875, -0.2548828125, -0.08837890625, 0.078125, 0.24462890625, 0.4111328125, 0.57763671875, 0.744140625, 0.91064453125, 1.0771484375, 1.24365234375, 1.41015625, 1.57666015625, 1.7431640625, 1.90966796875, 2.076171875, 2.24267578125, 2.4091796875, 2.57568359375, 2.7421875, 2.90869140625, 3.0751953125, 3.24169921875, 3.408203125, 3.57470703125, 3.7412109375, 3.90771484375, 4.07421875, 4.24072265625, 4.4072265625, 4.57373046875, 4.740234375, 4.90673828125, 5.0732421875, 5.23974609375, 5.40625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 6.0, 9.0, 10.0, 12.0, 19.0, 26.0, 34.0, 35.0, 47.0, 66.0, 68.0, 92.0, 131.0, 177.0, 215.0, 278.0, 362.0, 400.0, 395.0, 353.0, 306.0, 259.0, 164.0, 136.0, 111.0, 74.0, 69.0, 60.0, 36.0, 38.0, 24.0, 14.0, 11.0, 7.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.7340087890625, -8.452392578125, -8.1707763671875, -7.88916015625, -7.6075439453125, -7.325927734375, -7.0443115234375, -6.7626953125, -6.4810791015625, -6.199462890625, -5.9178466796875, -5.63623046875, -5.3546142578125, -5.072998046875, -4.7913818359375, -4.509765625, -4.2281494140625, -3.946533203125, -3.6649169921875, -3.38330078125, -3.1016845703125, -2.820068359375, -2.5384521484375, -2.2568359375, -1.9752197265625, -1.693603515625, -1.4119873046875, -1.13037109375, -0.8487548828125, -0.567138671875, -0.2855224609375, -0.00390625, 0.2777099609375, 0.559326171875, 0.8409423828125, 1.12255859375, 1.4041748046875, 1.685791015625, 1.9674072265625, 2.2490234375, 2.5306396484375, 2.812255859375, 3.0938720703125, 3.37548828125, 3.6571044921875, 3.938720703125, 4.2203369140625, 4.501953125, 4.7835693359375, 5.065185546875, 5.3468017578125, 5.62841796875, 5.9100341796875, 6.191650390625, 6.4732666015625, 6.7548828125, 7.0364990234375, 7.318115234375, 7.5997314453125, 7.88134765625, 8.1629638671875, 8.444580078125, 8.7261962890625, 9.0078125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 15.0, 30.0, 33.0, 34.0, 58.0, 82.0, 161.0, 241.0, 455.0, 1118.0, 3946.0, 20825.0, 184741.0, 2413744.0, 1441626.0, 108900.0, 13621.0, 2748.0, 862.0, 430.0, 194.0, 120.0, 79.0, 61.0, 39.0, 21.0, 28.0, 14.0, 6.0, 10.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.234375, -19.557373046875, -18.88037109375, -18.203369140625, -17.5263671875, -16.849365234375, -16.17236328125, -15.495361328125, -14.818359375, -14.141357421875, -13.46435546875, -12.787353515625, -12.1103515625, -11.433349609375, -10.75634765625, -10.079345703125, -9.40234375, -8.725341796875, -8.04833984375, -7.371337890625, -6.6943359375, -6.017333984375, -5.34033203125, -4.663330078125, -3.986328125, -3.309326171875, -2.63232421875, -1.955322265625, -1.2783203125, -0.601318359375, 0.07568359375, 0.752685546875, 1.4296875, 2.106689453125, 2.78369140625, 3.460693359375, 4.1376953125, 4.814697265625, 5.49169921875, 6.168701171875, 6.845703125, 7.522705078125, 8.19970703125, 8.876708984375, 9.5537109375, 10.230712890625, 10.90771484375, 11.584716796875, 12.26171875, 12.938720703125, 13.61572265625, 14.292724609375, 14.9697265625, 15.646728515625, 16.32373046875, 17.000732421875, 17.677734375, 18.354736328125, 19.03173828125, 19.708740234375, 20.3857421875, 21.062744140625, 21.73974609375, 22.416748046875, 23.09375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 14.0, 12.0, 19.0, 38.0, 62.0, 85.0, 125.0, 135.0, 128.0, 123.0, 104.0, 67.0, 38.0, 24.0, 19.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.57677459716797, -82.36090850830078, -80.1450424194336, -77.92918395996094, -75.71331787109375, -73.49745178222656, -71.28158569335938, -69.06571960449219, -66.849853515625, -64.63398742675781, -62.41812515258789, -60.2022590637207, -57.98639678955078, -55.770530700683594, -53.554664611816406, -51.33879852294922, -49.12294006347656, -46.907073974609375, -44.69121170043945, -42.475345611572266, -40.259483337402344, -38.043617248535156, -35.82775115966797, -33.61188507080078, -31.39602279663086, -29.180158615112305, -26.96429443359375, -24.748428344726562, -22.532564163208008, -20.316699981689453, -18.100833892822266, -15.884969711303711, -13.669105529785156, -11.453241348266602, -9.23737621307373, -7.021511554718018, -4.805646896362305, -2.58978271484375, -0.3739175796508789, 1.8419475555419922, 4.057811737060547, 6.27367639541626, 8.489541053771973, 10.705406188964844, 12.921270370483398, 15.137134552001953, 17.35300064086914, 19.568864822387695, 21.78472900390625, 24.000593185424805, 26.21645736694336, 28.432323455810547, 30.6481876373291, 32.864051818847656, 35.079917907714844, 37.29578399658203, 39.51164627075195, 41.72751235961914, 43.94337463378906, 46.15924072265625, 48.37510681152344, 50.59096908569336, 52.80683517456055, 55.02269744873047, 57.238563537597656]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 0.0, 3.0, 4.0, 2.0, 6.0, 6.0, 12.0, 10.0, 15.0, 12.0, 17.0, 22.0, 31.0, 29.0, 29.0, 28.0, 38.0, 33.0, 55.0, 38.0, 49.0, 44.0, 49.0, 44.0, 37.0, 37.0, 29.0, 45.0, 36.0, 32.0, 33.0, 31.0, 22.0, 18.0, 26.0, 17.0, 6.0, 11.0, 8.0, 14.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.7362060546875, -35.65469741821289, -34.57318878173828, -33.49168014526367, -32.41017150878906, -31.328662872314453, -30.247156143188477, -29.165647506713867, -28.084138870239258, -27.00263023376465, -25.92112159729004, -24.83961296081543, -23.758106231689453, -22.676597595214844, -21.595088958740234, -20.513580322265625, -19.432071685791016, -18.350563049316406, -17.269054412841797, -16.187545776367188, -15.106038093566895, -14.024529457092285, -12.943021774291992, -11.861513137817383, -10.780004501342773, -9.698495864868164, -8.616987228393555, -7.535479545593262, -6.453970909118652, -5.372462272644043, -4.290954113006592, -3.2094459533691406, -2.1279373168945312, -1.046428918838501, 0.0350794792175293, 1.1165878772735596, 2.19809627532959, 3.279604911804199, 4.36111307144165, 5.442621231079102, 6.524129867553711, 7.60563850402832, 8.68714714050293, 9.768654823303223, 10.850163459777832, 11.931672096252441, 13.013179779052734, 14.094688415527344, 15.176197052001953, 16.257705688476562, 17.339214324951172, 18.42072296142578, 19.50223159790039, 20.583740234375, 21.665246963500977, 22.746755599975586, 23.828264236450195, 24.909772872924805, 25.991281509399414, 27.072790145874023, 28.154296875, 29.23580551147461, 30.31731414794922, 31.398822784423828, 32.48033142089844]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 8.0, 13.0, 12.0, 8.0, 13.0, 15.0, 17.0, 19.0, 27.0, 23.0, 35.0, 40.0, 31.0, 49.0, 37.0, 45.0, 48.0, 38.0, 49.0, 38.0, 46.0, 44.0, 42.0, 23.0, 48.0, 42.0, 22.0, 25.0, 21.0, 19.0, 16.0, 18.0, 10.0, 14.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.32464599609375, -4.1805419921875, -4.03643798828125, -3.892333984375, -3.74822998046875, -3.6041259765625, -3.46002197265625, -3.31591796875, -3.17181396484375, -3.0277099609375, -2.88360595703125, -2.739501953125, -2.59539794921875, -2.4512939453125, -2.30718994140625, -2.1630859375, -2.01898193359375, -1.8748779296875, -1.73077392578125, -1.586669921875, -1.44256591796875, -1.2984619140625, -1.15435791015625, -1.01025390625, -0.86614990234375, -0.7220458984375, -0.57794189453125, -0.433837890625, -0.28973388671875, -0.1456298828125, -0.00152587890625, 0.142578125, 0.28668212890625, 0.4307861328125, 0.57489013671875, 0.718994140625, 0.86309814453125, 1.0072021484375, 1.15130615234375, 1.29541015625, 1.43951416015625, 1.5836181640625, 1.72772216796875, 1.871826171875, 2.01593017578125, 2.1600341796875, 2.30413818359375, 2.4482421875, 2.59234619140625, 2.7364501953125, 2.88055419921875, 3.024658203125, 3.16876220703125, 3.3128662109375, 3.45697021484375, 3.60107421875, 3.74517822265625, 3.8892822265625, 4.03338623046875, 4.177490234375, 4.32159423828125, 4.4656982421875, 4.60980224609375, 4.75390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 4.0, 6.0, 9.0, 13.0, 25.0, 24.0, 48.0, 78.0, 99.0, 140.0, 212.0, 326.0, 478.0, 697.0, 1031.0, 1631.0, 2268.0, 3400.0, 5259.0, 7898.0, 12020.0, 18271.0, 28653.0, 48022.0, 84580.0, 157402.0, 241460.0, 185206.0, 100014.0, 55689.0, 33116.0, 20562.0, 13431.0, 8757.0, 5878.0, 3973.0, 2565.0, 1726.0, 1166.0, 769.0, 555.0, 373.0, 234.0, 152.0, 115.0, 76.0, 49.0, 34.0, 27.0, 16.0, 10.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.428955078125, -0.41448211669921875, -0.4000091552734375, -0.38553619384765625, -0.371063232421875, -0.35659027099609375, -0.3421173095703125, -0.32764434814453125, -0.31317138671875, -0.29869842529296875, -0.2842254638671875, -0.26975250244140625, -0.255279541015625, -0.24080657958984375, -0.2263336181640625, -0.21186065673828125, -0.1973876953125, -0.18291473388671875, -0.1684417724609375, -0.15396881103515625, -0.139495849609375, -0.12502288818359375, -0.1105499267578125, -0.09607696533203125, -0.08160400390625, -0.06713104248046875, -0.0526580810546875, -0.03818511962890625, -0.023712158203125, -0.00923919677734375, 0.0052337646484375, 0.01970672607421875, 0.0341796875, 0.04865264892578125, 0.0631256103515625, 0.07759857177734375, 0.092071533203125, 0.10654449462890625, 0.1210174560546875, 0.13549041748046875, 0.14996337890625, 0.16443634033203125, 0.1789093017578125, 0.19338226318359375, 0.207855224609375, 0.22232818603515625, 0.2368011474609375, 0.25127410888671875, 0.2657470703125, 0.28022003173828125, 0.2946929931640625, 0.30916595458984375, 0.323638916015625, 0.33811187744140625, 0.3525848388671875, 0.36705780029296875, 0.38153076171875, 0.39600372314453125, 0.4104766845703125, 0.42494964599609375, 0.439422607421875, 0.45389556884765625, 0.4683685302734375, 0.48284149169921875, 0.497314453125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 5.0, 2.0, 4.0, 11.0, 5.0, 12.0, 12.0, 19.0, 15.0, 16.0, 25.0, 22.0, 21.0, 35.0, 29.0, 42.0, 33.0, 37.0, 40.0, 36.0, 33.0, 1063.0, 33.0, 26.0, 32.0, 35.0, 43.0, 41.0, 41.0, 31.0, 27.0, 36.0, 19.0, 20.0, 19.0, 17.0, 13.0, 14.0, 10.0, 13.0, 12.0, 3.0, 6.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0], "bins": [-2.87890625, -2.796112060546875, -2.71331787109375, -2.630523681640625, -2.5477294921875, -2.464935302734375, -2.38214111328125, -2.299346923828125, -2.216552734375, -2.133758544921875, -2.05096435546875, -1.968170166015625, -1.8853759765625, -1.802581787109375, -1.71978759765625, -1.636993408203125, -1.55419921875, -1.471405029296875, -1.38861083984375, -1.305816650390625, -1.2230224609375, -1.140228271484375, -1.05743408203125, -0.974639892578125, -0.891845703125, -0.809051513671875, -0.72625732421875, -0.643463134765625, -0.5606689453125, -0.477874755859375, -0.39508056640625, -0.312286376953125, -0.2294921875, -0.146697998046875, -0.06390380859375, 0.018890380859375, 0.1016845703125, 0.184478759765625, 0.26727294921875, 0.350067138671875, 0.432861328125, 0.515655517578125, 0.59844970703125, 0.681243896484375, 0.7640380859375, 0.846832275390625, 0.92962646484375, 1.012420654296875, 1.09521484375, 1.178009033203125, 1.26080322265625, 1.343597412109375, 1.4263916015625, 1.509185791015625, 1.59197998046875, 1.674774169921875, 1.757568359375, 1.840362548828125, 1.92315673828125, 2.005950927734375, 2.0887451171875, 2.171539306640625, 2.25433349609375, 2.337127685546875, 2.419921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 12.0, 6.0, 18.0, 23.0, 33.0, 67.0, 91.0, 99.0, 218.0, 325.0, 587.0, 1043.0, 1836.0, 3410.0, 6351.0, 12536.0, 24741.0, 49781.0, 100491.0, 195957.0, 1316761.0, 189642.0, 96028.0, 47572.0, 23901.0, 11911.0, 6239.0, 3233.0, 1781.0, 989.0, 553.0, 347.0, 196.0, 107.0, 79.0, 56.0, 39.0, 22.0, 15.0, 8.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.300048828125, -0.2898674011230469, -0.27968597412109375, -0.2695045471191406, -0.2593231201171875, -0.24914169311523438, -0.23896026611328125, -0.22877883911132812, -0.218597412109375, -0.20841598510742188, -0.19823455810546875, -0.18805313110351562, -0.1778717041015625, -0.16769027709960938, -0.15750885009765625, -0.14732742309570312, -0.13714599609375, -0.12696456909179688, -0.11678314208984375, -0.10660171508789062, -0.0964202880859375, -0.08623886108398438, -0.07605743408203125, -0.06587600708007812, -0.055694580078125, -0.045513153076171875, -0.03533172607421875, -0.025150299072265625, -0.0149688720703125, -0.004787445068359375, 0.00539398193359375, 0.015575408935546875, 0.0257568359375, 0.035938262939453125, 0.04611968994140625, 0.056301116943359375, 0.0664825439453125, 0.07666397094726562, 0.08684539794921875, 0.09702682495117188, 0.107208251953125, 0.11738967895507812, 0.12757110595703125, 0.13775253295898438, 0.1479339599609375, 0.15811538696289062, 0.16829681396484375, 0.17847824096679688, 0.18865966796875, 0.19884109497070312, 0.20902252197265625, 0.21920394897460938, 0.2293853759765625, 0.23956680297851562, 0.24974822998046875, 0.2599296569824219, 0.270111083984375, 0.2802925109863281, 0.29047393798828125, 0.3006553649902344, 0.3108367919921875, 0.3210182189941406, 0.33119964599609375, 0.3413810729980469, 0.3515625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 6.0, 6.0, 8.0, 8.0, 17.0, 15.0, 12.0, 23.0, 33.0, 46.0, 48.0, 72.0, 117.0, 125.0, 111.0, 82.0, 51.0, 40.0, 27.0, 27.0, 20.0, 20.0, 13.0, 12.0, 7.0, 8.0, 5.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.008544921875, -0.008317232131958008, -0.008089542388916016, -0.007861852645874023, -0.007634162902832031, -0.007406473159790039, -0.007178783416748047, -0.006951093673706055, -0.0067234039306640625, -0.00649571418762207, -0.006268024444580078, -0.006040334701538086, -0.005812644958496094, -0.0055849552154541016, -0.005357265472412109, -0.005129575729370117, -0.004901885986328125, -0.004674196243286133, -0.004446506500244141, -0.0042188167572021484, -0.003991127014160156, -0.003763437271118164, -0.003535747528076172, -0.0033080577850341797, -0.0030803680419921875, -0.0028526782989501953, -0.002624988555908203, -0.002397298812866211, -0.0021696090698242188, -0.0019419193267822266, -0.0017142295837402344, -0.0014865398406982422, -0.00125885009765625, -0.0010311603546142578, -0.0008034706115722656, -0.0005757808685302734, -0.00034809112548828125, -0.00012040138244628906, 0.00010728836059570312, 0.0003349781036376953, 0.0005626678466796875, 0.0007903575897216797, 0.0010180473327636719, 0.001245737075805664, 0.0014734268188476562, 0.0017011165618896484, 0.0019288063049316406, 0.002156496047973633, 0.002384185791015625, 0.002611875534057617, 0.0028395652770996094, 0.0030672550201416016, 0.0032949447631835938, 0.003522634506225586, 0.003750324249267578, 0.00397801399230957, 0.0042057037353515625, 0.004433393478393555, 0.004661083221435547, 0.004888772964477539, 0.005116462707519531, 0.0053441524505615234, 0.005571842193603516, 0.005799531936645508, 0.0060272216796875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 2.0, 7.0, 1.0, 3.0, 5.0, 5.0, 10.0, 10.0, 9.0, 11.0, 24.0, 29.0, 31.0, 53.0, 64.0, 100.0, 148.0, 218.0, 559.0, 3426.0, 81554.0, 935275.0, 24321.0, 1650.0, 388.0, 206.0, 150.0, 86.0, 56.0, 29.0, 20.0, 23.0, 17.0, 17.0, 8.0, 13.0, 12.0, 5.0, 2.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08843994140625, -0.0850820541381836, -0.08172416687011719, -0.07836627960205078, -0.07500839233398438, -0.07165050506591797, -0.06829261779785156, -0.06493473052978516, -0.06157684326171875, -0.058218955993652344, -0.05486106872558594, -0.05150318145751953, -0.048145294189453125, -0.04478740692138672, -0.04142951965332031, -0.038071632385253906, -0.0347137451171875, -0.031355857849121094, -0.027997970581054688, -0.02464008331298828, -0.021282196044921875, -0.01792430877685547, -0.014566421508789062, -0.011208534240722656, -0.00785064697265625, -0.004492759704589844, -0.0011348724365234375, 0.0022230148315429688, 0.005580902099609375, 0.008938789367675781, 0.012296676635742188, 0.015654563903808594, 0.019012451171875, 0.022370338439941406, 0.025728225708007812, 0.02908611297607422, 0.032444000244140625, 0.03580188751220703, 0.03915977478027344, 0.042517662048339844, 0.04587554931640625, 0.049233436584472656, 0.05259132385253906, 0.05594921112060547, 0.059307098388671875, 0.06266498565673828, 0.06602287292480469, 0.0693807601928711, 0.0727386474609375, 0.0760965347290039, 0.07945442199707031, 0.08281230926513672, 0.08617019653320312, 0.08952808380126953, 0.09288597106933594, 0.09624385833740234, 0.09960174560546875, 0.10295963287353516, 0.10631752014160156, 0.10967540740966797, 0.11303329467773438, 0.11639118194580078, 0.11974906921386719, 0.1231069564819336, 0.12646484375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 20.0, 109.0, 674.0, 182.0, 18.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00816649105399847, -0.005901330150663853, -0.0036361697129905224, -0.001371009275317192, 0.0008941516280174255, 0.003159312531352043, 0.005424472503364086, 0.007689633406698704, 0.009954794310033321, 0.012219955213367939, 0.014485115185379982, 0.0167502760887146, 0.019015436992049217, 0.021280597895383835, 0.023545756936073303, 0.02581091970205307, 0.02807607874274254, 0.030341239646077156, 0.032606400549411774, 0.03487155959010124, 0.03713672235608101, 0.03940188139677048, 0.041667044162750244, 0.04393220320343971, 0.04619736596941948, 0.04846252501010895, 0.050727687776088715, 0.05299284681677818, 0.05525800958275795, 0.05752316862344742, 0.059788331389427185, 0.06205349043011665, 0.06431864947080612, 0.06658381223678589, 0.06884896755218506, 0.07111413031816483, 0.07337929308414459, 0.07564445585012436, 0.07790961116552353, 0.0801747739315033, 0.08243993669748306, 0.08470509946346283, 0.086970254778862, 0.08923541754484177, 0.09150058031082153, 0.0937657430768013, 0.09603089839220047, 0.09829606115818024, 0.1005612164735794, 0.10282637923955917, 0.10509153455495834, 0.10735669732093811, 0.10962186008691788, 0.11188702285289764, 0.11415217816829681, 0.11641734093427658, 0.11868250370025635, 0.12094766646623611, 0.12321282178163528, 0.12547798454761505, 0.12774313986301422, 0.13000831007957458, 0.13227346539497375, 0.13453862071037292, 0.1368037909269333]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 14.0, 12.0, 14.0, 15.0, 21.0, 20.0, 30.0, 27.0, 37.0, 39.0, 31.0, 42.0, 49.0, 46.0, 49.0, 58.0, 63.0, 59.0, 45.0, 37.0, 53.0, 36.0, 30.0, 36.0, 27.0, 28.0, 22.0, 9.0, 11.0, 8.0, 10.0, 6.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009418964385986328, -0.009087435901165009, -0.008755907416343689, -0.00842437893152237, -0.00809285044670105, -0.00776132196187973, -0.007429793477058411, -0.007098264992237091, -0.0067667365074157715, -0.006435208022594452, -0.006103679537773132, -0.005772151052951813, -0.005440622568130493, -0.005109094083309174, -0.004777565598487854, -0.004446037113666534, -0.004114508628845215, -0.0037829801440238953, -0.0034514516592025757, -0.003119923174381256, -0.0027883946895599365, -0.002456866204738617, -0.0021253377199172974, -0.0017938092350959778, -0.0014622807502746582, -0.0011307522654533386, -0.000799223780632019, -0.00046769529581069946, -0.00013616681098937988, 0.0001953616738319397, 0.0005268901586532593, 0.0008584186434745789, 0.0011899471282958984, 0.001521475613117218, 0.0018530040979385376, 0.002184532582759857, 0.0025160610675811768, 0.0028475895524024963, 0.003179118037223816, 0.0035106465220451355, 0.003842175006866455, 0.004173703491687775, 0.004505231976509094, 0.004836760461330414, 0.005168288946151733, 0.005499817430973053, 0.0058313459157943726, 0.006162874400615692, 0.006494402885437012, 0.006825931370258331, 0.007157459855079651, 0.0074889883399009705, 0.00782051682472229, 0.00815204530954361, 0.00848357379436493, 0.008815102279186249, 0.009146630764007568, 0.009478159248828888, 0.009809687733650208, 0.010141216218471527, 0.010472744703292847, 0.010804273188114166, 0.011135801672935486, 0.011467330157756805, 0.011798858642578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 8.0, 13.0, 12.0, 8.0, 13.0, 15.0, 17.0, 19.0, 27.0, 23.0, 35.0, 40.0, 31.0, 49.0, 37.0, 45.0, 48.0, 38.0, 49.0, 38.0, 46.0, 44.0, 42.0, 23.0, 48.0, 42.0, 22.0, 25.0, 21.0, 19.0, 16.0, 18.0, 10.0, 14.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.32464599609375, -4.1805419921875, -4.03643798828125, -3.892333984375, -3.74822998046875, -3.6041259765625, -3.46002197265625, -3.31591796875, -3.17181396484375, -3.0277099609375, -2.88360595703125, -2.739501953125, -2.59539794921875, -2.4512939453125, -2.30718994140625, -2.1630859375, -2.01898193359375, -1.8748779296875, -1.73077392578125, -1.586669921875, -1.44256591796875, -1.2984619140625, -1.15435791015625, -1.01025390625, -0.86614990234375, -0.7220458984375, -0.57794189453125, -0.433837890625, -0.28973388671875, -0.1456298828125, -0.00152587890625, 0.142578125, 0.28668212890625, 0.4307861328125, 0.57489013671875, 0.718994140625, 0.86309814453125, 1.0072021484375, 1.15130615234375, 1.29541015625, 1.43951416015625, 1.5836181640625, 1.72772216796875, 1.871826171875, 2.01593017578125, 2.1600341796875, 2.30413818359375, 2.4482421875, 2.59234619140625, 2.7364501953125, 2.88055419921875, 3.024658203125, 3.16876220703125, 3.3128662109375, 3.45697021484375, 3.60107421875, 3.74517822265625, 3.8892822265625, 4.03338623046875, 4.177490234375, 4.32159423828125, 4.4656982421875, 4.60980224609375, 4.75390625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 16.0, 17.0, 12.0, 19.0, 36.0, 48.0, 56.0, 70.0, 101.0, 153.0, 189.0, 299.0, 431.0, 689.0, 1215.0, 2121.0, 4046.0, 7635.0, 15883.0, 35068.0, 86250.0, 253084.0, 401393.0, 140518.0, 53002.0, 23075.0, 10675.0, 5341.0, 2823.0, 1567.0, 902.0, 567.0, 373.0, 259.0, 181.0, 107.0, 100.0, 56.0, 39.0, 39.0, 27.0, 17.0, 20.0, 10.0, 6.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.2265625, -4.095458984375, -3.96435546875, -3.833251953125, -3.7021484375, -3.571044921875, -3.43994140625, -3.308837890625, -3.177734375, -3.046630859375, -2.91552734375, -2.784423828125, -2.6533203125, -2.522216796875, -2.39111328125, -2.260009765625, -2.12890625, -1.997802734375, -1.86669921875, -1.735595703125, -1.6044921875, -1.473388671875, -1.34228515625, -1.211181640625, -1.080078125, -0.948974609375, -0.81787109375, -0.686767578125, -0.5556640625, -0.424560546875, -0.29345703125, -0.162353515625, -0.03125, 0.099853515625, 0.23095703125, 0.362060546875, 0.4931640625, 0.624267578125, 0.75537109375, 0.886474609375, 1.017578125, 1.148681640625, 1.27978515625, 1.410888671875, 1.5419921875, 1.673095703125, 1.80419921875, 1.935302734375, 2.06640625, 2.197509765625, 2.32861328125, 2.459716796875, 2.5908203125, 2.721923828125, 2.85302734375, 2.984130859375, 3.115234375, 3.246337890625, 3.37744140625, 3.508544921875, 3.6396484375, 3.770751953125, 3.90185546875, 4.032958984375, 4.1640625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 10.0, 17.0, 10.0, 22.0, 18.0, 26.0, 32.0, 28.0, 49.0, 44.0, 53.0, 65.0, 99.0, 225.0, 1622.0, 226.0, 85.0, 52.0, 48.0, 42.0, 39.0, 42.0, 34.0, 25.0, 27.0, 23.0, 18.0, 14.0, 5.0, 11.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.328125, -17.7265625, -17.125, -16.5234375, -15.921875, -15.3203125, -14.71875, -14.1171875, -13.515625, -12.9140625, -12.3125, -11.7109375, -11.109375, -10.5078125, -9.90625, -9.3046875, -8.703125, -8.1015625, -7.5, -6.8984375, -6.296875, -5.6953125, -5.09375, -4.4921875, -3.890625, -3.2890625, -2.6875, -2.0859375, -1.484375, -0.8828125, -0.28125, 0.3203125, 0.921875, 1.5234375, 2.125, 2.7265625, 3.328125, 3.9296875, 4.53125, 5.1328125, 5.734375, 6.3359375, 6.9375, 7.5390625, 8.140625, 8.7421875, 9.34375, 9.9453125, 10.546875, 11.1484375, 11.75, 12.3515625, 12.953125, 13.5546875, 14.15625, 14.7578125, 15.359375, 15.9609375, 16.5625, 17.1640625, 17.765625, 18.3671875, 18.96875, 19.5703125, 20.171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 3.0, 9.0, 8.0, 19.0, 27.0, 39.0, 41.0, 57.0, 66.0, 103.0, 111.0, 184.0, 257.0, 477.0, 1670.0, 19461.0, 3045412.0, 73368.0, 2751.0, 617.0, 308.0, 185.0, 141.0, 97.0, 85.0, 58.0, 29.0, 24.0, 14.0, 17.0, 17.0, 12.0, 8.0, 8.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.90625, -43.5712890625, -42.236328125, -40.9013671875, -39.56640625, -38.2314453125, -36.896484375, -35.5615234375, -34.2265625, -32.8916015625, -31.556640625, -30.2216796875, -28.88671875, -27.5517578125, -26.216796875, -24.8818359375, -23.546875, -22.2119140625, -20.876953125, -19.5419921875, -18.20703125, -16.8720703125, -15.537109375, -14.2021484375, -12.8671875, -11.5322265625, -10.197265625, -8.8623046875, -7.52734375, -6.1923828125, -4.857421875, -3.5224609375, -2.1875, -0.8525390625, 0.482421875, 1.8173828125, 3.15234375, 4.4873046875, 5.822265625, 7.1572265625, 8.4921875, 9.8271484375, 11.162109375, 12.4970703125, 13.83203125, 15.1669921875, 16.501953125, 17.8369140625, 19.171875, 20.5068359375, 21.841796875, 23.1767578125, 24.51171875, 25.8466796875, 27.181640625, 28.5166015625, 29.8515625, 31.1865234375, 32.521484375, 33.8564453125, 35.19140625, 36.5263671875, 37.861328125, 39.1962890625, 40.53125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 342.0, 618.0, 52.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.135183334350586, -13.119504928588867, -7.103827476501465, -1.0881500244140625, 4.927528381347656, 10.943206787109375, 16.95888328552246, 22.97456169128418, 28.9902400970459, 35.005916595458984, 41.0215950012207, 47.03727340698242, 53.05295181274414, 59.06863021850586, 65.08430480957031, 71.09998321533203, 77.11566162109375, 83.13134002685547, 89.14701843261719, 95.1626968383789, 101.17837524414062, 107.19405364990234, 113.20973205566406, 119.22540283203125, 125.2410888671875, 131.2567596435547, 137.27244567871094, 143.28811645507812, 149.30380249023438, 155.31947326660156, 161.3351593017578, 167.350830078125, 173.3665008544922, 179.38217163085938, 185.39785766601562, 191.4135284423828, 197.42921447753906, 203.44488525390625, 209.4605712890625, 215.4762420654297, 221.49192810058594, 227.50759887695312, 233.52328491210938, 239.53895568847656, 245.5546417236328, 251.5703125, 257.58599853515625, 263.6016845703125, 269.6173400878906, 275.6330261230469, 281.648681640625, 287.66436767578125, 293.6800537109375, 299.69573974609375, 305.7113952636719, 311.7270812988281, 317.7427673339844, 323.7584533691406, 329.77410888671875, 335.789794921875, 341.80548095703125, 347.8211669921875, 353.8368225097656, 359.8525085449219, 365.8681945800781]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 9.0, 9.0, 13.0, 11.0, 15.0, 15.0, 28.0, 30.0, 23.0, 25.0, 27.0, 40.0, 21.0, 31.0, 41.0, 37.0, 35.0, 42.0, 44.0, 40.0, 44.0, 43.0, 37.0, 33.0, 24.0, 35.0, 29.0, 33.0, 31.0, 21.0, 24.0, 19.0, 13.0, 13.0, 16.0, 7.0, 6.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.2802734375, -35.06113052368164, -33.84198760986328, -32.622840881347656, -31.403697967529297, -30.184555053710938, -28.965412139892578, -27.74626922607422, -26.527124404907227, -25.307981491088867, -24.088836669921875, -22.869693756103516, -21.650550842285156, -20.431406021118164, -19.212263107299805, -17.993118286132812, -16.773975372314453, -15.554831504821777, -14.335687637329102, -13.116544723510742, -11.897400856018066, -10.67825698852539, -9.459114074707031, -8.239970207214355, -7.02082633972168, -5.801682472229004, -4.582539081573486, -3.3633954524993896, -2.144251823425293, -0.9251079559326172, 0.2940354347229004, 1.513178825378418, 2.7323226928710938, 3.9514663219451904, 5.170609951019287, 6.389753341674805, 7.6088972091674805, 8.828041076660156, 10.047183990478516, 11.266327857971191, 12.485471725463867, 13.704615592956543, 14.923759460449219, 16.142902374267578, 17.362045288085938, 18.58119010925293, 19.80033302307129, 21.01947784423828, 22.23862075805664, 23.457763671875, 24.676908493041992, 25.89605140686035, 27.115196228027344, 28.334339141845703, 29.553482055664062, 30.772624969482422, 31.991769790649414, 33.210914611816406, 34.430057525634766, 35.649200439453125, 36.868343353271484, 38.087486267089844, 39.30663299560547, 40.52577590942383, 41.74491882324219]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 7.0, 5.0, 6.0, 14.0, 11.0, 13.0, 17.0, 16.0, 21.0, 16.0, 18.0, 22.0, 36.0, 39.0, 40.0, 34.0, 44.0, 40.0, 43.0, 42.0, 31.0, 42.0, 41.0, 38.0, 26.0, 37.0, 44.0, 45.0, 19.0, 27.0, 29.0, 26.0, 13.0, 15.0, 21.0, 9.0, 9.0, 9.0, 7.0, 4.0, 5.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.93829345703125, -3.7984619140625, -3.65863037109375, -3.518798828125, -3.37896728515625, -3.2391357421875, -3.09930419921875, -2.95947265625, -2.81964111328125, -2.6798095703125, -2.53997802734375, -2.400146484375, -2.26031494140625, -2.1204833984375, -1.98065185546875, -1.8408203125, -1.70098876953125, -1.5611572265625, -1.42132568359375, -1.281494140625, -1.14166259765625, -1.0018310546875, -0.86199951171875, -0.72216796875, -0.58233642578125, -0.4425048828125, -0.30267333984375, -0.162841796875, -0.02301025390625, 0.1168212890625, 0.25665283203125, 0.396484375, 0.53631591796875, 0.6761474609375, 0.81597900390625, 0.955810546875, 1.09564208984375, 1.2354736328125, 1.37530517578125, 1.51513671875, 1.65496826171875, 1.7947998046875, 1.93463134765625, 2.074462890625, 2.21429443359375, 2.3541259765625, 2.49395751953125, 2.6337890625, 2.77362060546875, 2.9134521484375, 3.05328369140625, 3.193115234375, 3.33294677734375, 3.4727783203125, 3.61260986328125, 3.75244140625, 3.89227294921875, 4.0321044921875, 4.17193603515625, 4.311767578125, 4.45159912109375, 4.5914306640625, 4.73126220703125, 4.87109375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 10.0, 4.0, 6.0, 8.0, 9.0, 8.0, 18.0, 19.0, 18.0, 39.0, 28.0, 56.0, 118.0, 164.0, 364.0, 844.0, 3016.0, 16339.0, 141538.0, 2124175.0, 1774474.0, 115315.0, 13605.0, 2584.0, 733.0, 292.0, 156.0, 96.0, 62.0, 35.0, 27.0, 29.0, 19.0, 12.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.7503662109375, -13.258544921875, -12.7667236328125, -12.27490234375, -11.7830810546875, -11.291259765625, -10.7994384765625, -10.3076171875, -9.8157958984375, -9.323974609375, -8.8321533203125, -8.34033203125, -7.8485107421875, -7.356689453125, -6.8648681640625, -6.373046875, -5.8812255859375, -5.389404296875, -4.8975830078125, -4.40576171875, -3.9139404296875, -3.422119140625, -2.9302978515625, -2.4384765625, -1.9466552734375, -1.454833984375, -0.9630126953125, -0.47119140625, 0.0206298828125, 0.512451171875, 1.0042724609375, 1.49609375, 1.9879150390625, 2.479736328125, 2.9715576171875, 3.46337890625, 3.9552001953125, 4.447021484375, 4.9388427734375, 5.4306640625, 5.9224853515625, 6.414306640625, 6.9061279296875, 7.39794921875, 7.8897705078125, 8.381591796875, 8.8734130859375, 9.365234375, 9.8570556640625, 10.348876953125, 10.8406982421875, 11.33251953125, 11.8243408203125, 12.316162109375, 12.8079833984375, 13.2998046875, 13.7916259765625, 14.283447265625, 14.7752685546875, 15.26708984375, 15.7589111328125, 16.250732421875, 16.7425537109375, 17.234375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 17.0, 16.0, 19.0, 45.0, 69.0, 95.0, 168.0, 263.0, 381.0, 586.0, 693.0, 625.0, 385.0, 278.0, 177.0, 88.0, 63.0, 39.0, 17.0, 17.0, 11.0, 7.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.28125, -16.794189453125, -16.30712890625, -15.820068359375, -15.3330078125, -14.845947265625, -14.35888671875, -13.871826171875, -13.384765625, -12.897705078125, -12.41064453125, -11.923583984375, -11.4365234375, -10.949462890625, -10.46240234375, -9.975341796875, -9.48828125, -9.001220703125, -8.51416015625, -8.027099609375, -7.5400390625, -7.052978515625, -6.56591796875, -6.078857421875, -5.591796875, -5.104736328125, -4.61767578125, -4.130615234375, -3.6435546875, -3.156494140625, -2.66943359375, -2.182373046875, -1.6953125, -1.208251953125, -0.72119140625, -0.234130859375, 0.2529296875, 0.739990234375, 1.22705078125, 1.714111328125, 2.201171875, 2.688232421875, 3.17529296875, 3.662353515625, 4.1494140625, 4.636474609375, 5.12353515625, 5.610595703125, 6.09765625, 6.584716796875, 7.07177734375, 7.558837890625, 8.0458984375, 8.532958984375, 9.02001953125, 9.507080078125, 9.994140625, 10.481201171875, 10.96826171875, 11.455322265625, 11.9423828125, 12.429443359375, 12.91650390625, 13.403564453125, 13.890625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 7.0, 14.0, 17.0, 37.0, 45.0, 66.0, 95.0, 213.0, 367.0, 812.0, 2758.0, 28328.0, 1021170.0, 3049922.0, 83108.0, 5225.0, 1033.0, 467.0, 223.0, 144.0, 92.0, 52.0, 32.0, 21.0, 14.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.421875, -27.412841796875, -26.40380859375, -25.394775390625, -24.3857421875, -23.376708984375, -22.36767578125, -21.358642578125, -20.349609375, -19.340576171875, -18.33154296875, -17.322509765625, -16.3134765625, -15.304443359375, -14.29541015625, -13.286376953125, -12.27734375, -11.268310546875, -10.25927734375, -9.250244140625, -8.2412109375, -7.232177734375, -6.22314453125, -5.214111328125, -4.205078125, -3.196044921875, -2.18701171875, -1.177978515625, -0.1689453125, 0.840087890625, 1.84912109375, 2.858154296875, 3.8671875, 4.876220703125, 5.88525390625, 6.894287109375, 7.9033203125, 8.912353515625, 9.92138671875, 10.930419921875, 11.939453125, 12.948486328125, 13.95751953125, 14.966552734375, 15.9755859375, 16.984619140625, 17.99365234375, 19.002685546875, 20.01171875, 21.020751953125, 22.02978515625, 23.038818359375, 24.0478515625, 25.056884765625, 26.06591796875, 27.074951171875, 28.083984375, 29.093017578125, 30.10205078125, 31.111083984375, 32.1201171875, 33.129150390625, 34.13818359375, 35.147216796875, 36.15625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 7.0, 16.0, 17.0, 18.0, 36.0, 40.0, 45.0, 37.0, 81.0, 61.0, 53.0, 72.0, 61.0, 65.0, 62.0, 70.0, 44.0, 41.0, 42.0, 30.0, 24.0, 16.0, 15.0, 14.0, 9.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-45.99741744995117, -44.876564025878906, -43.755714416503906, -42.63486099243164, -41.514007568359375, -40.393157958984375, -39.27230453491211, -38.151451110839844, -37.030601501464844, -35.90974807739258, -34.78889846801758, -33.66804504394531, -32.54719161987305, -31.426340103149414, -30.30548858642578, -29.184635162353516, -28.06378173828125, -26.942930221557617, -25.82207679748535, -24.70122528076172, -23.580371856689453, -22.45952033996582, -21.338668823242188, -20.217815399169922, -19.09696388244629, -17.976112365722656, -16.85525894165039, -15.734407424926758, -14.613554954528809, -13.49270248413086, -12.371850967407227, -11.250998497009277, -10.130144119262695, -9.009291648864746, -7.888439655303955, -6.767587661743164, -5.646735191345215, -4.525882720947266, -3.4050307273864746, -2.2841787338256836, -1.1633262634277344, -0.04247403144836426, 1.0783782005310059, 2.199230432510376, 3.320082664489746, 4.440935134887695, 5.561787128448486, 6.682639122009277, 7.803491592407227, 8.924344062805176, 10.045196533203125, 11.166048049926758, 12.286900520324707, 13.407752990722656, 14.528604507446289, 15.649456977844238, 16.770309448242188, 17.89116096496582, 19.012014389038086, 20.13286590576172, 21.253719329833984, 22.374570846557617, 23.49542236328125, 24.616275787353516, 25.73712730407715]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 7.0, 5.0, 8.0, 10.0, 11.0, 7.0, 9.0, 16.0, 21.0, 26.0, 20.0, 18.0, 27.0, 26.0, 33.0, 32.0, 34.0, 36.0, 44.0, 43.0, 31.0, 42.0, 34.0, 40.0, 33.0, 40.0, 47.0, 37.0, 40.0, 34.0, 28.0, 18.0, 20.0, 20.0, 27.0, 12.0, 12.0, 9.0, 12.0, 5.0, 6.0, 8.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.520980834960938, -27.49746322631836, -26.47394371032715, -25.45042610168457, -24.42690658569336, -23.40338897705078, -22.379871368408203, -21.356353759765625, -20.332834243774414, -19.309316635131836, -18.285797119140625, -17.262279510498047, -16.23876190185547, -15.215242385864258, -14.19172477722168, -13.168206214904785, -12.14468765258789, -11.121169090270996, -10.097650527954102, -9.074132919311523, -8.050614356994629, -7.027095794677734, -6.003577709197998, -4.980059623718262, -3.956541061401367, -2.9330227375030518, -1.9095044136047363, -0.8859860897064209, 0.13753223419189453, 1.161050796508789, 2.1845688819885254, 3.2080869674682617, 4.231605529785156, 5.255124092102051, 6.278642177581787, 7.302160263061523, 8.325678825378418, 9.349197387695312, 10.37271499633789, 11.396233558654785, 12.41975212097168, 13.443270683288574, 14.466789245605469, 15.490306854248047, 16.513824462890625, 17.537343978881836, 18.560861587524414, 19.584381103515625, 20.607898712158203, 21.63141632080078, 22.654935836791992, 23.67845344543457, 24.70197296142578, 25.72549057006836, 26.749008178710938, 27.772525787353516, 28.796045303344727, 29.819562911987305, 30.843082427978516, 31.866600036621094, 32.89011764526367, 33.91363525390625, 34.937156677246094, 35.96067428588867, 36.98419189453125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 2.0, 7.0, 6.0, 8.0, 13.0, 12.0, 11.0, 21.0, 17.0, 32.0, 19.0, 26.0, 27.0, 30.0, 31.0, 36.0, 35.0, 40.0, 37.0, 41.0, 42.0, 51.0, 46.0, 34.0, 36.0, 25.0, 37.0, 33.0, 36.0, 26.0, 30.0, 24.0, 12.0, 24.0, 17.0, 14.0, 11.0, 11.0, 3.0, 9.0, 8.0, 6.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.09765625, -3.96026611328125, -3.8228759765625, -3.68548583984375, -3.548095703125, -3.41070556640625, -3.2733154296875, -3.13592529296875, -2.99853515625, -2.86114501953125, -2.7237548828125, -2.58636474609375, -2.448974609375, -2.31158447265625, -2.1741943359375, -2.03680419921875, -1.8994140625, -1.76202392578125, -1.6246337890625, -1.48724365234375, -1.349853515625, -1.21246337890625, -1.0750732421875, -0.93768310546875, -0.80029296875, -0.66290283203125, -0.5255126953125, -0.38812255859375, -0.250732421875, -0.11334228515625, 0.0240478515625, 0.16143798828125, 0.298828125, 0.43621826171875, 0.5736083984375, 0.71099853515625, 0.848388671875, 0.98577880859375, 1.1231689453125, 1.26055908203125, 1.39794921875, 1.53533935546875, 1.6727294921875, 1.81011962890625, 1.947509765625, 2.08489990234375, 2.2222900390625, 2.35968017578125, 2.4970703125, 2.63446044921875, 2.7718505859375, 2.90924072265625, 3.046630859375, 3.18402099609375, 3.3214111328125, 3.45880126953125, 3.59619140625, 3.73358154296875, 3.8709716796875, 4.00836181640625, 4.145751953125, 4.28314208984375, 4.4205322265625, 4.55792236328125, 4.6953125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 11.0, 7.0, 24.0, 35.0, 50.0, 80.0, 121.0, 176.0, 267.0, 397.0, 682.0, 958.0, 1531.0, 2068.0, 3281.0, 4775.0, 7137.0, 11288.0, 16991.0, 27396.0, 45257.0, 81808.0, 161270.0, 266367.0, 186119.0, 94503.0, 50896.0, 30429.0, 18871.0, 12140.0, 7981.0, 5171.0, 3524.0, 2277.0, 1619.0, 1017.0, 668.0, 513.0, 284.0, 191.0, 148.0, 62.0, 62.0, 38.0, 30.0, 16.0, 6.0, 7.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5146484375, -0.497833251953125, -0.48101806640625, -0.464202880859375, -0.4473876953125, -0.430572509765625, -0.41375732421875, -0.396942138671875, -0.380126953125, -0.363311767578125, -0.34649658203125, -0.329681396484375, -0.3128662109375, -0.296051025390625, -0.27923583984375, -0.262420654296875, -0.24560546875, -0.228790283203125, -0.21197509765625, -0.195159912109375, -0.1783447265625, -0.161529541015625, -0.14471435546875, -0.127899169921875, -0.111083984375, -0.094268798828125, -0.07745361328125, -0.060638427734375, -0.0438232421875, -0.027008056640625, -0.01019287109375, 0.006622314453125, 0.0234375, 0.040252685546875, 0.05706787109375, 0.073883056640625, 0.0906982421875, 0.107513427734375, 0.12432861328125, 0.141143798828125, 0.157958984375, 0.174774169921875, 0.19158935546875, 0.208404541015625, 0.2252197265625, 0.242034912109375, 0.25885009765625, 0.275665283203125, 0.29248046875, 0.309295654296875, 0.32611083984375, 0.342926025390625, 0.3597412109375, 0.376556396484375, 0.39337158203125, 0.410186767578125, 0.427001953125, 0.443817138671875, 0.46063232421875, 0.477447509765625, 0.4942626953125, 0.511077880859375, 0.52789306640625, 0.544708251953125, 0.5615234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 8.0, 11.0, 9.0, 12.0, 18.0, 21.0, 24.0, 22.0, 25.0, 26.0, 38.0, 38.0, 34.0, 29.0, 42.0, 34.0, 32.0, 1058.0, 44.0, 37.0, 34.0, 41.0, 35.0, 30.0, 31.0, 39.0, 23.0, 42.0, 25.0, 24.0, 21.0, 20.0, 16.0, 10.0, 7.0, 9.0, 5.0, 9.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.716796875, -2.631866455078125, -2.54693603515625, -2.462005615234375, -2.3770751953125, -2.292144775390625, -2.20721435546875, -2.122283935546875, -2.037353515625, -1.952423095703125, -1.86749267578125, -1.782562255859375, -1.6976318359375, -1.612701416015625, -1.52777099609375, -1.442840576171875, -1.35791015625, -1.272979736328125, -1.18804931640625, -1.103118896484375, -1.0181884765625, -0.933258056640625, -0.84832763671875, -0.763397216796875, -0.678466796875, -0.593536376953125, -0.50860595703125, -0.423675537109375, -0.3387451171875, -0.253814697265625, -0.16888427734375, -0.083953857421875, 0.0009765625, 0.085906982421875, 0.17083740234375, 0.255767822265625, 0.3406982421875, 0.425628662109375, 0.51055908203125, 0.595489501953125, 0.680419921875, 0.765350341796875, 0.85028076171875, 0.935211181640625, 1.0201416015625, 1.105072021484375, 1.19000244140625, 1.274932861328125, 1.35986328125, 1.444793701171875, 1.52972412109375, 1.614654541015625, 1.6995849609375, 1.784515380859375, 1.86944580078125, 1.954376220703125, 2.039306640625, 2.124237060546875, 2.20916748046875, 2.294097900390625, 2.3790283203125, 2.463958740234375, 2.54888916015625, 2.633819580078125, 2.71875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 10.0, 12.0, 13.0, 12.0, 24.0, 36.0, 40.0, 68.0, 98.0, 161.0, 212.0, 336.0, 559.0, 857.0, 1451.0, 2200.0, 3678.0, 6348.0, 10495.0, 18123.0, 32645.0, 58950.0, 106056.0, 178527.0, 1270561.0, 172935.0, 101765.0, 56370.0, 31432.0, 17530.0, 10193.0, 5979.0, 3656.0, 2077.0, 1343.0, 850.0, 521.0, 344.0, 211.0, 139.0, 95.0, 74.0, 37.0, 31.0, 14.0, 14.0, 15.0, 8.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.26171875, -0.2531280517578125, -0.244537353515625, -0.2359466552734375, -0.22735595703125, -0.2187652587890625, -0.210174560546875, -0.2015838623046875, -0.1929931640625, -0.1844024658203125, -0.175811767578125, -0.1672210693359375, -0.15863037109375, -0.1500396728515625, -0.141448974609375, -0.1328582763671875, -0.124267578125, -0.1156768798828125, -0.107086181640625, -0.0984954833984375, -0.08990478515625, -0.0813140869140625, -0.072723388671875, -0.0641326904296875, -0.0555419921875, -0.0469512939453125, -0.038360595703125, -0.0297698974609375, -0.02117919921875, -0.0125885009765625, -0.003997802734375, 0.0045928955078125, 0.01318359375, 0.0217742919921875, 0.030364990234375, 0.0389556884765625, 0.04754638671875, 0.0561370849609375, 0.064727783203125, 0.0733184814453125, 0.0819091796875, 0.0904998779296875, 0.099090576171875, 0.1076812744140625, 0.11627197265625, 0.1248626708984375, 0.133453369140625, 0.1420440673828125, 0.150634765625, 0.1592254638671875, 0.167816162109375, 0.1764068603515625, 0.18499755859375, 0.1935882568359375, 0.202178955078125, 0.2107696533203125, 0.2193603515625, 0.2279510498046875, 0.236541748046875, 0.2451324462890625, 0.25372314453125, 0.2623138427734375, 0.270904541015625, 0.2794952392578125, 0.2880859375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 4.0, 7.0, 4.0, 11.0, 9.0, 8.0, 8.0, 10.0, 15.0, 24.0, 26.0, 23.0, 30.0, 34.0, 52.0, 68.0, 112.0, 105.0, 90.0, 59.0, 54.0, 36.0, 44.0, 28.0, 17.0, 19.0, 12.0, 5.0, 14.0, 5.0, 7.0, 11.0, 7.0, 7.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.005084991455078125, -0.004905402660369873, -0.004725813865661621, -0.004546225070953369, -0.004366636276245117, -0.004187047481536865, -0.004007458686828613, -0.0038278698921203613, -0.0036482810974121094, -0.0034686923027038574, -0.0032891035079956055, -0.0031095147132873535, -0.0029299259185791016, -0.0027503371238708496, -0.0025707483291625977, -0.0023911595344543457, -0.0022115707397460938, -0.002031981945037842, -0.0018523931503295898, -0.0016728043556213379, -0.001493215560913086, -0.001313626766204834, -0.001134037971496582, -0.0009544491767883301, -0.0007748603820800781, -0.0005952715873718262, -0.0004156827926635742, -0.00023609399795532227, -5.650520324707031e-05, 0.00012308359146118164, 0.0003026723861694336, 0.00048226118087768555, 0.0006618499755859375, 0.0008414387702941895, 0.0010210275650024414, 0.0012006163597106934, 0.0013802051544189453, 0.0015597939491271973, 0.0017393827438354492, 0.0019189715385437012, 0.002098560333251953, 0.002278149127960205, 0.002457737922668457, 0.002637326717376709, 0.002816915512084961, 0.002996504306793213, 0.003176093101501465, 0.003355681896209717, 0.0035352706909179688, 0.0037148594856262207, 0.0038944482803344727, 0.004074037075042725, 0.0042536258697509766, 0.0044332146644592285, 0.0046128034591674805, 0.004792392253875732, 0.004971981048583984, 0.005151569843292236, 0.005331158638000488, 0.00551074743270874, 0.005690336227416992, 0.005869925022125244, 0.006049513816833496, 0.006229102611541748, 0.00640869140625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 3.0, 5.0, 8.0, 9.0, 13.0, 9.0, 16.0, 15.0, 27.0, 31.0, 46.0, 67.0, 88.0, 170.0, 402.0, 2752.0, 51646.0, 930400.0, 58770.0, 3099.0, 409.0, 177.0, 120.0, 70.0, 43.0, 27.0, 23.0, 19.0, 11.0, 9.0, 11.0, 9.0, 6.0, 6.0, 6.0, 0.0, 2.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.1259765625, -0.12242984771728516, -0.11888313293457031, -0.11533641815185547, -0.11178970336914062, -0.10824298858642578, -0.10469627380371094, -0.1011495590209961, -0.09760284423828125, -0.0940561294555664, -0.09050941467285156, -0.08696269989013672, -0.08341598510742188, -0.07986927032470703, -0.07632255554199219, -0.07277584075927734, -0.0692291259765625, -0.06568241119384766, -0.06213569641113281, -0.05858898162841797, -0.055042266845703125, -0.05149555206298828, -0.04794883728027344, -0.044402122497558594, -0.04085540771484375, -0.037308692932128906, -0.03376197814941406, -0.03021526336669922, -0.026668548583984375, -0.02312183380126953, -0.019575119018554688, -0.016028404235839844, -0.012481689453125, -0.008934974670410156, -0.0053882598876953125, -0.0018415451049804688, 0.001705169677734375, 0.005251884460449219, 0.008798599243164062, 0.012345314025878906, 0.01589202880859375, 0.019438743591308594, 0.022985458374023438, 0.02653217315673828, 0.030078887939453125, 0.03362560272216797, 0.03717231750488281, 0.040719032287597656, 0.0442657470703125, 0.047812461853027344, 0.05135917663574219, 0.05490589141845703, 0.058452606201171875, 0.06199932098388672, 0.06554603576660156, 0.0690927505493164, 0.07263946533203125, 0.0761861801147461, 0.07973289489746094, 0.08327960968017578, 0.08682632446289062, 0.09037303924560547, 0.09391975402832031, 0.09746646881103516, 0.10101318359375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [9.0, 36.0, 160.0, 589.0, 150.0, 47.0, 14.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007822678424417973, -0.005590456537902355, -0.0033582341857254505, -0.0011260118335485458, 0.0011062100529670715, 0.003338431939482689, 0.005570654757320881, 0.007802876643836498, 0.010035098530352116, 0.012267320416867733, 0.014499543234705925, 0.016731765121221542, 0.01896398700773716, 0.021196208894252777, 0.023428432643413544, 0.025660652667284012, 0.02789287641644478, 0.030125098302960396, 0.03235732018947601, 0.03458954393863678, 0.03682176396250725, 0.039053987711668015, 0.04128620773553848, 0.04351843148469925, 0.04575065150856972, 0.047982875257730484, 0.05021509528160095, 0.05244731903076172, 0.05467953905463219, 0.056911762803792953, 0.05914398282766342, 0.06137620657682419, 0.06360843032598495, 0.06584065407514572, 0.06807287782430649, 0.07030509412288666, 0.07253731787204742, 0.07476954162120819, 0.07700176537036896, 0.07923398911952972, 0.0814662054181099, 0.08369842916727066, 0.08593065291643143, 0.0881628692150116, 0.09039509296417236, 0.09262731671333313, 0.0948595404624939, 0.09709176421165466, 0.09932398796081543, 0.1015562117099762, 0.10378843545913696, 0.10602065175771713, 0.1082528755068779, 0.11048509925603867, 0.11271732300519943, 0.1149495393037796, 0.11718176305294037, 0.11941398680210114, 0.1216462105512619, 0.12387842684984207, 0.12611065804958344, 0.128342866897583, 0.13057509064674377, 0.13280731439590454, 0.1350395381450653]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 8.0, 5.0, 9.0, 11.0, 17.0, 10.0, 20.0, 26.0, 16.0, 25.0, 28.0, 22.0, 31.0, 37.0, 35.0, 56.0, 42.0, 53.0, 60.0, 40.0, 47.0, 46.0, 31.0, 27.0, 36.0, 30.0, 25.0, 36.0, 25.0, 22.0, 26.0, 23.0, 17.0, 12.0, 9.0, 14.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.008260905742645264, -0.008003235794603825, -0.0077455658465623856, -0.0074878958985209465, -0.0072302259504795074, -0.006972556002438068, -0.006714886054396629, -0.00645721610635519, -0.006199546158313751, -0.005941876210272312, -0.005684206262230873, -0.005426536314189434, -0.005168866366147995, -0.004911196418106556, -0.004653526470065117, -0.004395856522023678, -0.004138186573982239, -0.0038805166259407997, -0.0036228466778993607, -0.0033651767298579216, -0.0031075067818164825, -0.0028498368337750435, -0.0025921668857336044, -0.0023344969376921654, -0.0020768269896507263, -0.0018191570416092873, -0.0015614870935678482, -0.0013038171455264091, -0.00104614719748497, -0.000788477249443531, -0.000530807301402092, -0.0002731373533606529, -1.5467405319213867e-05, 0.0002422025427222252, 0.0004998724907636642, 0.0007575424388051033, 0.0010152123868465424, 0.0012728823348879814, 0.0015305522829294205, 0.0017882222309708595, 0.0020458921790122986, 0.0023035621270537376, 0.0025612320750951767, 0.0028189020231366158, 0.003076571971178055, 0.003334241919219494, 0.003591911867260933, 0.003849581815302372, 0.004107251763343811, 0.00436492171138525, 0.004622591659426689, 0.004880261607468128, 0.005137931555509567, 0.005395601503551006, 0.005653271451592445, 0.005910941399633884, 0.0061686113476753235, 0.0064262812957167625, 0.006683951243758202, 0.006941621191799641, 0.00719929113984108, 0.007456961087882519, 0.007714631035923958, 0.007972300983965397, 0.008229970932006836]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 2.0, 7.0, 6.0, 8.0, 13.0, 12.0, 11.0, 21.0, 18.0, 31.0, 19.0, 26.0, 27.0, 30.0, 31.0, 36.0, 35.0, 40.0, 37.0, 41.0, 42.0, 51.0, 45.0, 34.0, 37.0, 25.0, 37.0, 33.0, 36.0, 26.0, 30.0, 24.0, 12.0, 24.0, 17.0, 14.0, 11.0, 11.0, 3.0, 9.0, 8.0, 6.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.09765625, -3.96026611328125, -3.8228759765625, -3.68548583984375, -3.548095703125, -3.41070556640625, -3.2733154296875, -3.13592529296875, -2.99853515625, -2.86114501953125, -2.7237548828125, -2.58636474609375, -2.448974609375, -2.31158447265625, -2.1741943359375, -2.03680419921875, -1.8994140625, -1.76202392578125, -1.6246337890625, -1.48724365234375, -1.349853515625, -1.21246337890625, -1.0750732421875, -0.93768310546875, -0.80029296875, -0.66290283203125, -0.5255126953125, -0.38812255859375, -0.250732421875, -0.11334228515625, 0.0240478515625, 0.16143798828125, 0.298828125, 0.43621826171875, 0.5736083984375, 0.71099853515625, 0.848388671875, 0.98577880859375, 1.1231689453125, 1.26055908203125, 1.39794921875, 1.53533935546875, 1.6727294921875, 1.81011962890625, 1.947509765625, 2.08489990234375, 2.2222900390625, 2.35968017578125, 2.4970703125, 2.63446044921875, 2.7718505859375, 2.90924072265625, 3.046630859375, 3.18402099609375, 3.3214111328125, 3.45880126953125, 3.59619140625, 3.73358154296875, 3.8709716796875, 4.00836181640625, 4.145751953125, 4.28314208984375, 4.4205322265625, 4.55792236328125, 4.6953125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 14.0, 25.0, 42.0, 90.0, 121.0, 261.0, 389.0, 599.0, 1114.0, 1969.0, 3443.0, 6594.0, 13356.0, 27295.0, 60112.0, 149167.0, 451685.0, 194687.0, 72203.0, 32502.0, 15596.0, 7902.0, 4096.0, 2235.0, 1239.0, 728.0, 441.0, 259.0, 144.0, 100.0, 60.0, 28.0, 29.0, 11.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.44732666015625, -5.2852783203125, -5.12322998046875, -4.961181640625, -4.79913330078125, -4.6370849609375, -4.47503662109375, -4.31298828125, -4.15093994140625, -3.9888916015625, -3.82684326171875, -3.664794921875, -3.50274658203125, -3.3406982421875, -3.17864990234375, -3.0166015625, -2.85455322265625, -2.6925048828125, -2.53045654296875, -2.368408203125, -2.20635986328125, -2.0443115234375, -1.88226318359375, -1.72021484375, -1.55816650390625, -1.3961181640625, -1.23406982421875, -1.072021484375, -0.90997314453125, -0.7479248046875, -0.58587646484375, -0.423828125, -0.26177978515625, -0.0997314453125, 0.06231689453125, 0.224365234375, 0.38641357421875, 0.5484619140625, 0.71051025390625, 0.87255859375, 1.03460693359375, 1.1966552734375, 1.35870361328125, 1.520751953125, 1.68280029296875, 1.8448486328125, 2.00689697265625, 2.1689453125, 2.33099365234375, 2.4930419921875, 2.65509033203125, 2.817138671875, 2.97918701171875, 3.1412353515625, 3.30328369140625, 3.46533203125, 3.62738037109375, 3.7894287109375, 3.95147705078125, 4.113525390625, 4.27557373046875, 4.4376220703125, 4.59967041015625, 4.76171875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 10.0, 7.0, 15.0, 16.0, 17.0, 23.0, 18.0, 21.0, 32.0, 36.0, 34.0, 28.0, 32.0, 31.0, 62.0, 92.0, 158.0, 1408.0, 358.0, 143.0, 83.0, 67.0, 50.0, 28.0, 47.0, 37.0, 32.0, 27.0, 18.0, 16.0, 18.0, 11.0, 7.0, 10.0, 7.0, 7.0, 11.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.0625, -14.6053466796875, -14.148193359375, -13.6910400390625, -13.23388671875, -12.7767333984375, -12.319580078125, -11.8624267578125, -11.4052734375, -10.9481201171875, -10.490966796875, -10.0338134765625, -9.57666015625, -9.1195068359375, -8.662353515625, -8.2052001953125, -7.748046875, -7.2908935546875, -6.833740234375, -6.3765869140625, -5.91943359375, -5.4622802734375, -5.005126953125, -4.5479736328125, -4.0908203125, -3.6336669921875, -3.176513671875, -2.7193603515625, -2.26220703125, -1.8050537109375, -1.347900390625, -0.8907470703125, -0.43359375, 0.0235595703125, 0.480712890625, 0.9378662109375, 1.39501953125, 1.8521728515625, 2.309326171875, 2.7664794921875, 3.2236328125, 3.6807861328125, 4.137939453125, 4.5950927734375, 5.05224609375, 5.5093994140625, 5.966552734375, 6.4237060546875, 6.880859375, 7.3380126953125, 7.795166015625, 8.2523193359375, 8.70947265625, 9.1666259765625, 9.623779296875, 10.0809326171875, 10.5380859375, 10.9952392578125, 11.452392578125, 11.9095458984375, 12.36669921875, 12.8238525390625, 13.281005859375, 13.7381591796875, 14.1953125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 7.0, 12.0, 16.0, 10.0, 9.0, 16.0, 32.0, 37.0, 49.0, 56.0, 85.0, 99.0, 159.0, 207.0, 316.0, 647.0, 1972.0, 24391.0, 2689277.0, 417275.0, 8298.0, 1177.0, 510.0, 264.0, 190.0, 135.0, 110.0, 78.0, 55.0, 45.0, 36.0, 25.0, 28.0, 25.0, 11.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -28.92919921875, -27.8896484375, -26.85009765625, -25.810546875, -24.77099609375, -23.7314453125, -22.69189453125, -21.65234375, -20.61279296875, -19.5732421875, -18.53369140625, -17.494140625, -16.45458984375, -15.4150390625, -14.37548828125, -13.3359375, -12.29638671875, -11.2568359375, -10.21728515625, -9.177734375, -8.13818359375, -7.0986328125, -6.05908203125, -5.01953125, -3.97998046875, -2.9404296875, -1.90087890625, -0.861328125, 0.17822265625, 1.2177734375, 2.25732421875, 3.296875, 4.33642578125, 5.3759765625, 6.41552734375, 7.455078125, 8.49462890625, 9.5341796875, 10.57373046875, 11.61328125, 12.65283203125, 13.6923828125, 14.73193359375, 15.771484375, 16.81103515625, 17.8505859375, 18.89013671875, 19.9296875, 20.96923828125, 22.0087890625, 23.04833984375, 24.087890625, 25.12744140625, 26.1669921875, 27.20654296875, 28.24609375, 29.28564453125, 30.3251953125, 31.36474609375, 32.404296875, 33.44384765625, 34.4833984375, 35.52294921875, 36.5625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [4.0, 299.0, 713.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.30411720275879, -11.967141151428223, -1.6301651000976562, 8.706811904907227, 19.043787002563477, 29.380762100219727, 39.717742919921875, 50.054718017578125, 60.391693115234375, 70.72866821289062, 81.06564331054688, 91.40261840820312, 101.73959350585938, 112.07656860351562, 122.4135513305664, 132.75051879882812, 143.08749389648438, 153.42446899414062, 163.76144409179688, 174.09841918945312, 184.43539428710938, 194.77236938476562, 205.10934448242188, 215.44631958007812, 225.78330993652344, 236.1202850341797, 246.45726013183594, 256.79425048828125, 267.1312255859375, 277.46820068359375, 287.80517578125, 298.14215087890625, 308.4790954589844, 318.8160705566406, 329.1530456542969, 339.4900207519531, 349.8269958496094, 360.1639709472656, 370.5009460449219, 380.8379211425781, 391.1748962402344, 401.5118713378906, 411.8488464355469, 422.1858215332031, 432.5227966308594, 442.8597717285156, 453.1967468261719, 463.5337219238281, 473.8707275390625, 484.20770263671875, 494.544677734375, 504.88165283203125, 515.2186279296875, 525.5556030273438, 535.892578125, 546.2295532226562, 556.5665283203125, 566.9035034179688, 577.240478515625, 587.5774536132812, 597.9144287109375, 608.2514038085938, 618.58837890625, 628.9253540039062, 639.2623291015625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 4.0, 2.0, 6.0, 9.0, 10.0, 12.0, 14.0, 11.0, 19.0, 17.0, 26.0, 36.0, 32.0, 33.0, 34.0, 37.0, 37.0, 33.0, 55.0, 44.0, 51.0, 40.0, 42.0, 46.0, 42.0, 41.0, 32.0, 31.0, 32.0, 21.0, 28.0, 23.0, 20.0, 25.0, 8.0, 6.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.68959045410156, -44.201534271240234, -42.71348190307617, -41.225425720214844, -39.737369537353516, -38.24931335449219, -36.761260986328125, -35.2732048034668, -33.78514862060547, -32.29709243774414, -30.809038162231445, -29.32098388671875, -27.832927703857422, -26.344873428344727, -24.85681915283203, -23.368762969970703, -21.88071060180664, -20.392656326293945, -18.904600143432617, -17.416545867919922, -15.92849063873291, -14.440435409545898, -12.952381134033203, -11.464325904846191, -9.97627067565918, -8.488215446472168, -7.0001606941223145, -5.512105941772461, -4.024050712585449, -2.5359954833984375, -1.0479412078857422, 0.44011402130126953, 1.9281692504882812, 3.416224241256714, 4.9042792320251465, 6.392333984375, 7.880389213562012, 9.368444442749023, 10.856498718261719, 12.34455394744873, 13.832609176635742, 15.320664405822754, 16.808719635009766, 18.29677391052246, 19.784828186035156, 21.272884368896484, 22.76093864440918, 24.248992919921875, 25.737049102783203, 27.2251033782959, 28.713159561157227, 30.201213836669922, 31.68927001953125, 33.17732238769531, 34.66537857055664, 36.15343475341797, 37.64148712158203, 39.12954330444336, 40.61759567260742, 42.10565185546875, 43.59370803833008, 45.081764221191406, 46.56981658935547, 48.0578727722168, 49.545928955078125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 4.0, 9.0, 11.0, 11.0, 10.0, 18.0, 8.0, 18.0, 21.0, 25.0, 25.0, 22.0, 35.0, 24.0, 27.0, 36.0, 41.0, 36.0, 38.0, 45.0, 26.0, 38.0, 41.0, 36.0, 37.0, 38.0, 35.0, 37.0, 27.0, 32.0, 28.0, 21.0, 21.0, 19.0, 17.0, 18.0, 11.0, 9.0, 6.0, 7.0, 5.0, 4.0, 7.0, 4.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.10546875, -3.96295166015625, -3.8204345703125, -3.67791748046875, -3.535400390625, -3.39288330078125, -3.2503662109375, -3.10784912109375, -2.96533203125, -2.82281494140625, -2.6802978515625, -2.53778076171875, -2.395263671875, -2.25274658203125, -2.1102294921875, -1.96771240234375, -1.8251953125, -1.68267822265625, -1.5401611328125, -1.39764404296875, -1.255126953125, -1.11260986328125, -0.9700927734375, -0.82757568359375, -0.68505859375, -0.54254150390625, -0.4000244140625, -0.25750732421875, -0.114990234375, 0.02752685546875, 0.1700439453125, 0.31256103515625, 0.455078125, 0.59759521484375, 0.7401123046875, 0.88262939453125, 1.025146484375, 1.16766357421875, 1.3101806640625, 1.45269775390625, 1.59521484375, 1.73773193359375, 1.8802490234375, 2.02276611328125, 2.165283203125, 2.30780029296875, 2.4503173828125, 2.59283447265625, 2.7353515625, 2.87786865234375, 3.0203857421875, 3.16290283203125, 3.305419921875, 3.44793701171875, 3.5904541015625, 3.73297119140625, 3.87548828125, 4.01800537109375, 4.1605224609375, 4.30303955078125, 4.445556640625, 4.58807373046875, 4.7305908203125, 4.87310791015625, 5.015625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 5.0, 2.0, 1.0, 6.0, 3.0, 0.0, 9.0, 7.0, 7.0, 10.0, 14.0, 13.0, 16.0, 20.0, 23.0, 38.0, 55.0, 86.0, 191.0, 397.0, 832.0, 2197.0, 7355.0, 30984.0, 181240.0, 1502780.0, 2107851.0, 300746.0, 44779.0, 9989.0, 2708.0, 984.0, 402.0, 196.0, 105.0, 50.0, 43.0, 25.0, 20.0, 16.0, 17.0, 11.0, 13.0, 6.0, 7.0, 5.0, 4.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.8984375, -10.524169921875, -10.14990234375, -9.775634765625, -9.4013671875, -9.027099609375, -8.65283203125, -8.278564453125, -7.904296875, -7.530029296875, -7.15576171875, -6.781494140625, -6.4072265625, -6.032958984375, -5.65869140625, -5.284423828125, -4.91015625, -4.535888671875, -4.16162109375, -3.787353515625, -3.4130859375, -3.038818359375, -2.66455078125, -2.290283203125, -1.916015625, -1.541748046875, -1.16748046875, -0.793212890625, -0.4189453125, -0.044677734375, 0.32958984375, 0.703857421875, 1.078125, 1.452392578125, 1.82666015625, 2.200927734375, 2.5751953125, 2.949462890625, 3.32373046875, 3.697998046875, 4.072265625, 4.446533203125, 4.82080078125, 5.195068359375, 5.5693359375, 5.943603515625, 6.31787109375, 6.692138671875, 7.06640625, 7.440673828125, 7.81494140625, 8.189208984375, 8.5634765625, 8.937744140625, 9.31201171875, 9.686279296875, 10.060546875, 10.434814453125, 10.80908203125, 11.183349609375, 11.5576171875, 11.931884765625, 12.30615234375, 12.680419921875, 13.0546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 12.0, 13.0, 18.0, 21.0, 25.0, 34.0, 47.0, 66.0, 100.0, 123.0, 162.0, 244.0, 310.0, 407.0, 485.0, 448.0, 367.0, 291.0, 228.0, 162.0, 126.0, 102.0, 77.0, 47.0, 36.0, 31.0, 22.0, 12.0, 11.0, 7.0, 12.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.9140625, -10.5909423828125, -10.267822265625, -9.9447021484375, -9.62158203125, -9.2984619140625, -8.975341796875, -8.6522216796875, -8.3291015625, -8.0059814453125, -7.682861328125, -7.3597412109375, -7.03662109375, -6.7135009765625, -6.390380859375, -6.0672607421875, -5.744140625, -5.4210205078125, -5.097900390625, -4.7747802734375, -4.45166015625, -4.1285400390625, -3.805419921875, -3.4822998046875, -3.1591796875, -2.8360595703125, -2.512939453125, -2.1898193359375, -1.86669921875, -1.5435791015625, -1.220458984375, -0.8973388671875, -0.57421875, -0.2510986328125, 0.072021484375, 0.3951416015625, 0.71826171875, 1.0413818359375, 1.364501953125, 1.6876220703125, 2.0107421875, 2.3338623046875, 2.656982421875, 2.9801025390625, 3.30322265625, 3.6263427734375, 3.949462890625, 4.2725830078125, 4.595703125, 4.9188232421875, 5.241943359375, 5.5650634765625, 5.88818359375, 6.2113037109375, 6.534423828125, 6.8575439453125, 7.1806640625, 7.5037841796875, 7.826904296875, 8.1500244140625, 8.47314453125, 8.7962646484375, 9.119384765625, 9.4425048828125, 9.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 7.0, 10.0, 12.0, 18.0, 26.0, 38.0, 45.0, 71.0, 105.0, 165.0, 197.0, 330.0, 700.0, 2609.0, 28763.0, 1100179.0, 2979400.0, 74972.0, 4602.0, 913.0, 392.0, 227.0, 145.0, 96.0, 66.0, 49.0, 30.0, 23.0, 25.0, 20.0, 13.0, 8.0, 4.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.078125, -29.046142578125, -28.01416015625, -26.982177734375, -25.9501953125, -24.918212890625, -23.88623046875, -22.854248046875, -21.822265625, -20.790283203125, -19.75830078125, -18.726318359375, -17.6943359375, -16.662353515625, -15.63037109375, -14.598388671875, -13.56640625, -12.534423828125, -11.50244140625, -10.470458984375, -9.4384765625, -8.406494140625, -7.37451171875, -6.342529296875, -5.310546875, -4.278564453125, -3.24658203125, -2.214599609375, -1.1826171875, -0.150634765625, 0.88134765625, 1.913330078125, 2.9453125, 3.977294921875, 5.00927734375, 6.041259765625, 7.0732421875, 8.105224609375, 9.13720703125, 10.169189453125, 11.201171875, 12.233154296875, 13.26513671875, 14.297119140625, 15.3291015625, 16.361083984375, 17.39306640625, 18.425048828125, 19.45703125, 20.489013671875, 21.52099609375, 22.552978515625, 23.5849609375, 24.616943359375, 25.64892578125, 26.680908203125, 27.712890625, 28.744873046875, 29.77685546875, 30.808837890625, 31.8408203125, 32.872802734375, 33.90478515625, 34.936767578125, 35.96875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 12.0, 31.0, 46.0, 68.0, 72.0, 79.0, 95.0, 93.0, 92.0, 90.0, 78.0, 74.0, 55.0, 28.0, 28.0, 19.0, 12.0, 8.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.54754066467285, -24.93934440612793, -23.331148147583008, -21.72295379638672, -20.114757537841797, -18.506561279296875, -16.898365020751953, -15.290169715881348, -13.681973457336426, -12.073777198791504, -10.465581893920898, -8.857385635375977, -7.249189853668213, -5.640994071960449, -4.032797813415527, -2.424602508544922, -0.81640625, 0.7917896509170532, 2.3999855518341064, 4.008181571960449, 5.616377353668213, 7.224573135375977, 8.832769393920898, 10.440964698791504, 12.049160957336426, 13.657357215881348, 15.265552520751953, 16.873748779296875, 18.481945037841797, 20.09014129638672, 21.69833755493164, 23.30653190612793, 24.914730072021484, 26.522926330566406, 28.131122589111328, 29.73931884765625, 31.34751319885254, 32.955711364746094, 34.56390380859375, 36.17210006713867, 37.780296325683594, 39.388492584228516, 40.99668884277344, 42.60488510131836, 44.21308135986328, 45.82127380371094, 47.429473876953125, 49.03766632080078, 50.64586639404297, 52.25406265258789, 53.86225891113281, 55.470455169677734, 57.078651428222656, 58.68684387207031, 60.2950439453125, 61.903236389160156, 63.51143264770508, 65.11962890625, 66.72782135009766, 68.33602142333984, 69.9442138671875, 71.55241394042969, 73.16060638427734, 74.76880645751953, 76.37699890136719]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 12.0, 8.0, 12.0, 13.0, 12.0, 10.0, 17.0, 19.0, 22.0, 19.0, 32.0, 31.0, 35.0, 41.0, 39.0, 38.0, 38.0, 51.0, 48.0, 40.0, 33.0, 38.0, 31.0, 45.0, 43.0, 44.0, 28.0, 21.0, 25.0, 27.0, 15.0, 14.0, 13.0, 12.0, 14.0, 9.0, 5.0, 8.0, 9.0, 9.0, 5.0, 4.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-36.012786865234375, -34.96269607543945, -33.91260528564453, -32.862518310546875, -31.812427520751953, -30.76233673095703, -29.712247848510742, -28.662158966064453, -27.61206817626953, -26.56197738647461, -25.51188850402832, -24.46179962158203, -23.41170883178711, -22.361618041992188, -21.3115291595459, -20.26144027709961, -19.211349487304688, -18.161258697509766, -17.111169815063477, -16.061080932617188, -15.010990142822266, -13.96090030670166, -12.910810470581055, -11.86072063446045, -10.810630798339844, -9.760540962219238, -8.710451126098633, -7.660361289978027, -6.610271453857422, -5.560181617736816, -4.510091781616211, -3.4600019454956055, -2.409912109375, -1.3598222732543945, -0.30973243713378906, 0.7403573989868164, 1.7904472351074219, 2.8405370712280273, 3.890626907348633, 4.940716743469238, 5.990806579589844, 7.040896415710449, 8.090986251831055, 9.14107608795166, 10.191165924072266, 11.241255760192871, 12.291345596313477, 13.341435432434082, 14.391525268554688, 15.441615104675293, 16.4917049407959, 17.541793823242188, 18.59188461303711, 19.64197540283203, 20.69206428527832, 21.74215316772461, 22.79224395751953, 23.842334747314453, 24.892423629760742, 25.94251251220703, 26.992603302001953, 28.042694091796875, 29.092782974243164, 30.142871856689453, 31.192962646484375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 6.0, 0.0, 5.0, 2.0, 3.0, 7.0, 11.0, 7.0, 12.0, 14.0, 19.0, 18.0, 23.0, 34.0, 21.0, 28.0, 34.0, 29.0, 40.0, 43.0, 49.0, 44.0, 37.0, 41.0, 41.0, 41.0, 38.0, 42.0, 25.0, 31.0, 31.0, 40.0, 30.0, 30.0, 22.0, 14.0, 13.0, 13.0, 12.0, 9.0, 13.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.94140625, -3.793701171875, -3.64599609375, -3.498291015625, -3.3505859375, -3.202880859375, -3.05517578125, -2.907470703125, -2.759765625, -2.612060546875, -2.46435546875, -2.316650390625, -2.1689453125, -2.021240234375, -1.87353515625, -1.725830078125, -1.578125, -1.430419921875, -1.28271484375, -1.135009765625, -0.9873046875, -0.839599609375, -0.69189453125, -0.544189453125, -0.396484375, -0.248779296875, -0.10107421875, 0.046630859375, 0.1943359375, 0.342041015625, 0.48974609375, 0.637451171875, 0.78515625, 0.932861328125, 1.08056640625, 1.228271484375, 1.3759765625, 1.523681640625, 1.67138671875, 1.819091796875, 1.966796875, 2.114501953125, 2.26220703125, 2.409912109375, 2.5576171875, 2.705322265625, 2.85302734375, 3.000732421875, 3.1484375, 3.296142578125, 3.44384765625, 3.591552734375, 3.7392578125, 3.886962890625, 4.03466796875, 4.182373046875, 4.330078125, 4.477783203125, 4.62548828125, 4.773193359375, 4.9208984375, 5.068603515625, 5.21630859375, 5.364013671875, 5.51171875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 6.0, 10.0, 16.0, 28.0, 54.0, 62.0, 91.0, 133.0, 174.0, 271.0, 447.0, 796.0, 1165.0, 1849.0, 2892.0, 4680.0, 7043.0, 11161.0, 18035.0, 28881.0, 48616.0, 89890.0, 180769.0, 275518.0, 170328.0, 84403.0, 46265.0, 27611.0, 17248.0, 11088.0, 7032.0, 4420.0, 2629.0, 1709.0, 1100.0, 760.0, 488.0, 296.0, 205.0, 134.0, 93.0, 60.0, 36.0, 20.0, 10.0, 12.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54931640625, -0.531280517578125, -0.51324462890625, -0.495208740234375, -0.4771728515625, -0.459136962890625, -0.44110107421875, -0.423065185546875, -0.405029296875, -0.386993408203125, -0.36895751953125, -0.350921630859375, -0.3328857421875, -0.314849853515625, -0.29681396484375, -0.278778076171875, -0.2607421875, -0.242706298828125, -0.22467041015625, -0.206634521484375, -0.1885986328125, -0.170562744140625, -0.15252685546875, -0.134490966796875, -0.116455078125, -0.098419189453125, -0.08038330078125, -0.062347412109375, -0.0443115234375, -0.026275634765625, -0.00823974609375, 0.009796142578125, 0.02783203125, 0.045867919921875, 0.06390380859375, 0.081939697265625, 0.0999755859375, 0.118011474609375, 0.13604736328125, 0.154083251953125, 0.172119140625, 0.190155029296875, 0.20819091796875, 0.226226806640625, 0.2442626953125, 0.262298583984375, 0.28033447265625, 0.298370361328125, 0.31640625, 0.334442138671875, 0.35247802734375, 0.370513916015625, 0.3885498046875, 0.406585693359375, 0.42462158203125, 0.442657470703125, 0.460693359375, 0.478729248046875, 0.49676513671875, 0.514801025390625, 0.5328369140625, 0.550872802734375, 0.56890869140625, 0.586944580078125, 0.60498046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 10.0, 14.0, 14.0, 16.0, 9.0, 20.0, 26.0, 28.0, 14.0, 42.0, 36.0, 22.0, 31.0, 37.0, 32.0, 38.0, 41.0, 1066.0, 49.0, 35.0, 38.0, 33.0, 48.0, 30.0, 34.0, 35.0, 24.0, 24.0, 21.0, 21.0, 21.0, 16.0, 16.0, 16.0, 9.0, 11.0, 6.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.009765625, -2.914215087890625, -2.81866455078125, -2.723114013671875, -2.6275634765625, -2.532012939453125, -2.43646240234375, -2.340911865234375, -2.245361328125, -2.149810791015625, -2.05426025390625, -1.958709716796875, -1.8631591796875, -1.767608642578125, -1.67205810546875, -1.576507568359375, -1.48095703125, -1.385406494140625, -1.28985595703125, -1.194305419921875, -1.0987548828125, -1.003204345703125, -0.90765380859375, -0.812103271484375, -0.716552734375, -0.621002197265625, -0.52545166015625, -0.429901123046875, -0.3343505859375, -0.238800048828125, -0.14324951171875, -0.047698974609375, 0.0478515625, 0.143402099609375, 0.23895263671875, 0.334503173828125, 0.4300537109375, 0.525604248046875, 0.62115478515625, 0.716705322265625, 0.812255859375, 0.907806396484375, 1.00335693359375, 1.098907470703125, 1.1944580078125, 1.290008544921875, 1.38555908203125, 1.481109619140625, 1.57666015625, 1.672210693359375, 1.76776123046875, 1.863311767578125, 1.9588623046875, 2.054412841796875, 2.14996337890625, 2.245513916015625, 2.341064453125, 2.436614990234375, 2.53216552734375, 2.627716064453125, 2.7232666015625, 2.818817138671875, 2.91436767578125, 3.009918212890625, 3.10546875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 6.0, 4.0, 6.0, 7.0, 12.0, 22.0, 25.0, 42.0, 59.0, 71.0, 108.0, 180.0, 290.0, 476.0, 724.0, 1224.0, 1948.0, 3336.0, 5637.0, 9925.0, 17245.0, 30630.0, 56335.0, 103875.0, 179898.0, 1279039.0, 177929.0, 102157.0, 55205.0, 30239.0, 16793.0, 9605.0, 5564.0, 3345.0, 1935.0, 1230.0, 720.0, 423.0, 286.0, 184.0, 111.0, 84.0, 60.0, 41.0, 29.0, 25.0, 12.0, 15.0, 8.0, 9.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28173828125, -0.2721824645996094, -0.26262664794921875, -0.2530708312988281, -0.2435150146484375, -0.23395919799804688, -0.22440338134765625, -0.21484756469726562, -0.205291748046875, -0.19573593139648438, -0.18618011474609375, -0.17662429809570312, -0.1670684814453125, -0.15751266479492188, -0.14795684814453125, -0.13840103149414062, -0.12884521484375, -0.11928939819335938, -0.10973358154296875, -0.10017776489257812, -0.0906219482421875, -0.08106613159179688, -0.07151031494140625, -0.061954498291015625, -0.052398681640625, -0.042842864990234375, -0.03328704833984375, -0.023731231689453125, -0.0141754150390625, -0.004619598388671875, 0.00493621826171875, 0.014492034912109375, 0.0240478515625, 0.033603668212890625, 0.04315948486328125, 0.052715301513671875, 0.0622711181640625, 0.07182693481445312, 0.08138275146484375, 0.09093856811523438, 0.100494384765625, 0.11005020141601562, 0.11960601806640625, 0.12916183471679688, 0.1387176513671875, 0.14827346801757812, 0.15782928466796875, 0.16738510131835938, 0.17694091796875, 0.18649673461914062, 0.19605255126953125, 0.20560836791992188, 0.2151641845703125, 0.22472000122070312, 0.23427581787109375, 0.24383163452148438, 0.253387451171875, 0.2629432678222656, 0.27249908447265625, 0.2820549011230469, 0.2916107177734375, 0.3011665344238281, 0.31072235107421875, 0.3202781677246094, 0.329833984375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 1.0, 7.0, 10.0, 15.0, 15.0, 14.0, 18.0, 14.0, 15.0, 18.0, 29.0, 31.0, 30.0, 29.0, 64.0, 63.0, 72.0, 97.0, 93.0, 73.0, 50.0, 39.0, 20.0, 25.0, 18.0, 28.0, 18.0, 18.0, 14.0, 13.0, 4.0, 9.0, 5.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0070648193359375, -0.0068454742431640625, -0.006626129150390625, -0.0064067840576171875, -0.00618743896484375, -0.0059680938720703125, -0.005748748779296875, -0.0055294036865234375, -0.00531005859375, -0.0050907135009765625, -0.004871368408203125, -0.0046520233154296875, -0.00443267822265625, -0.0042133331298828125, -0.003993988037109375, -0.0037746429443359375, -0.0035552978515625, -0.0033359527587890625, -0.003116607666015625, -0.0028972625732421875, -0.00267791748046875, -0.0024585723876953125, -0.002239227294921875, -0.0020198822021484375, -0.001800537109375, -0.0015811920166015625, -0.001361846923828125, -0.0011425018310546875, -0.00092315673828125, -0.0007038116455078125, -0.000484466552734375, -0.0002651214599609375, -4.57763671875e-05, 0.0001735687255859375, 0.000392913818359375, 0.0006122589111328125, 0.00083160400390625, 0.0010509490966796875, 0.001270294189453125, 0.0014896392822265625, 0.001708984375, 0.0019283294677734375, 0.002147674560546875, 0.0023670196533203125, 0.00258636474609375, 0.0028057098388671875, 0.003025054931640625, 0.0032444000244140625, 0.0034637451171875, 0.0036830902099609375, 0.003902435302734375, 0.0041217803955078125, 0.00434112548828125, 0.0045604705810546875, 0.004779815673828125, 0.0049991607666015625, 0.005218505859375, 0.0054378509521484375, 0.005657196044921875, 0.0058765411376953125, 0.00609588623046875, 0.0063152313232421875, 0.006534576416015625, 0.0067539215087890625, 0.0069732666015625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 8.0, 8.0, 17.0, 20.0, 26.0, 40.0, 41.0, 63.0, 84.0, 163.0, 326.0, 1463.0, 22051.0, 917009.0, 102391.0, 3769.0, 458.0, 194.0, 84.0, 68.0, 63.0, 33.0, 23.0, 24.0, 30.0, 15.0, 17.0, 10.0, 8.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.143310546875, -0.13879013061523438, -0.13426971435546875, -0.12974929809570312, -0.1252288818359375, -0.12070846557617188, -0.11618804931640625, -0.11166763305664062, -0.107147216796875, -0.10262680053710938, -0.09810638427734375, -0.09358596801757812, -0.0890655517578125, -0.08454513549804688, -0.08002471923828125, -0.07550430297851562, -0.07098388671875, -0.06646347045898438, -0.06194305419921875, -0.057422637939453125, -0.0529022216796875, -0.048381805419921875, -0.04386138916015625, -0.039340972900390625, -0.034820556640625, -0.030300140380859375, -0.02577972412109375, -0.021259307861328125, -0.0167388916015625, -0.012218475341796875, -0.00769805908203125, -0.003177642822265625, 0.0013427734375, 0.005863189697265625, 0.01038360595703125, 0.014904022216796875, 0.0194244384765625, 0.023944854736328125, 0.02846527099609375, 0.032985687255859375, 0.037506103515625, 0.042026519775390625, 0.04654693603515625, 0.051067352294921875, 0.0555877685546875, 0.060108184814453125, 0.06462860107421875, 0.06914901733398438, 0.07366943359375, 0.07818984985351562, 0.08271026611328125, 0.08723068237304688, 0.0917510986328125, 0.09627151489257812, 0.10079193115234375, 0.10531234741210938, 0.109832763671875, 0.11435317993164062, 0.11887359619140625, 0.12339401245117188, 0.1279144287109375, 0.13243484497070312, 0.13695526123046875, 0.14147567749023438, 0.14599609375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [39.0, 386.0, 549.0, 34.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009780713357031345, -0.004994294606149197, -0.00020787585526704788, 0.004578542895615101, 0.00936496164649725, 0.014151380397379398, 0.01893780007958412, 0.02372422069311142, 0.02851063758134842, 0.03329705446958542, 0.03808347508311272, 0.042869895696640015, 0.047656312584877014, 0.052442729473114014, 0.05722915008664131, 0.06201557070016861, 0.06680198758840561, 0.07158840447664261, 0.0763748288154602, 0.0811612457036972, 0.0859476625919342, 0.0907340794801712, 0.0955204963684082, 0.1003069207072258, 0.1050933375954628, 0.1098797544836998, 0.1146661788225174, 0.1194525957107544, 0.1242390125989914, 0.1290254294872284, 0.1338118463754654, 0.1385982632637024, 0.14338469505310059, 0.14817111194133759, 0.15295752882957458, 0.15774394571781158, 0.16253036260604858, 0.16731679439544678, 0.17210321128368378, 0.17688962817192078, 0.18167604506015778, 0.18646246194839478, 0.19124887883663177, 0.19603529572486877, 0.20082172751426697, 0.20560814440250397, 0.21039456129074097, 0.21518097817897797, 0.21996739506721497, 0.22475381195545197, 0.22954022884368896, 0.23432664573192596, 0.23911306262016296, 0.24389949440956116, 0.24868591129779816, 0.25347232818603516, 0.25825875997543335, 0.26304519176483154, 0.26783159375190735, 0.27261802554130554, 0.27740442752838135, 0.28219085931777954, 0.28697726130485535, 0.29176369309425354, 0.29655009508132935]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 12.0, 12.0, 14.0, 13.0, 23.0, 18.0, 29.0, 32.0, 40.0, 41.0, 45.0, 55.0, 61.0, 47.0, 50.0, 47.0, 59.0, 53.0, 47.0, 48.0, 42.0, 34.0, 41.0, 29.0, 22.0, 21.0, 11.0, 10.0, 11.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.015636742115020752, -0.015188802033662796, -0.01474086195230484, -0.014292921870946884, -0.013844981789588928, -0.013397041708230972, -0.012949101626873016, -0.01250116154551506, -0.012053221464157104, -0.011605281382799149, -0.011157341301441193, -0.010709401220083237, -0.01026146113872528, -0.009813521057367325, -0.009365580976009369, -0.008917640894651413, -0.008469700813293457, -0.008021760731935501, -0.007573820650577545, -0.007125880569219589, -0.006677940487861633, -0.006230000406503677, -0.0057820603251457214, -0.0053341202437877655, -0.00488618016242981, -0.004438240081071854, -0.003990299999713898, -0.0035423599183559418, -0.003094419836997986, -0.00264647975564003, -0.002198539674282074, -0.001750599592924118, -0.0013026595115661621, -0.0008547194302082062, -0.00040677934885025024, 4.116073250770569e-05, 0.0004891008138656616, 0.0009370408952236176, 0.0013849809765815735, 0.0018329210579395294, 0.0022808611392974854, 0.0027288012206554413, 0.003176741302013397, 0.003624681383371353, 0.004072621464729309, 0.004520561546087265, 0.004968501627445221, 0.005416441708803177, 0.005864381790161133, 0.006312321871519089, 0.006760261952877045, 0.007208202034235001, 0.0076561421155929565, 0.008104082196950912, 0.008552022278308868, 0.008999962359666824, 0.00944790244102478, 0.009895842522382736, 0.010343782603740692, 0.010791722685098648, 0.011239662766456604, 0.01168760284781456, 0.012135542929172516, 0.012583483010530472, 0.013031423091888428]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 6.0, 0.0, 5.0, 2.0, 3.0, 7.0, 11.0, 7.0, 12.0, 14.0, 19.0, 19.0, 22.0, 34.0, 23.0, 26.0, 34.0, 29.0, 40.0, 45.0, 48.0, 43.0, 39.0, 39.0, 41.0, 41.0, 38.0, 42.0, 25.0, 31.0, 31.0, 40.0, 30.0, 30.0, 22.0, 14.0, 13.0, 13.0, 12.0, 9.0, 13.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.939453125, -3.791778564453125, -3.64410400390625, -3.496429443359375, -3.3487548828125, -3.201080322265625, -3.05340576171875, -2.905731201171875, -2.758056640625, -2.610382080078125, -2.46270751953125, -2.315032958984375, -2.1673583984375, -2.019683837890625, -1.87200927734375, -1.724334716796875, -1.57666015625, -1.428985595703125, -1.28131103515625, -1.133636474609375, -0.9859619140625, -0.838287353515625, -0.69061279296875, -0.542938232421875, -0.395263671875, -0.247589111328125, -0.09991455078125, 0.047760009765625, 0.1954345703125, 0.343109130859375, 0.49078369140625, 0.638458251953125, 0.7861328125, 0.933807373046875, 1.08148193359375, 1.229156494140625, 1.3768310546875, 1.524505615234375, 1.67218017578125, 1.819854736328125, 1.967529296875, 2.115203857421875, 2.26287841796875, 2.410552978515625, 2.5582275390625, 2.705902099609375, 2.85357666015625, 3.001251220703125, 3.14892578125, 3.296600341796875, 3.44427490234375, 3.591949462890625, 3.7396240234375, 3.887298583984375, 4.03497314453125, 4.182647705078125, 4.330322265625, 4.477996826171875, 4.62567138671875, 4.773345947265625, 4.9210205078125, 5.068695068359375, 5.21636962890625, 5.364044189453125, 5.51171875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 7.0, 15.0, 24.0, 31.0, 45.0, 72.0, 120.0, 200.0, 299.0, 478.0, 778.0, 1201.0, 2034.0, 3472.0, 5655.0, 10090.0, 19593.0, 43978.0, 126056.0, 408618.0, 276056.0, 83148.0, 31650.0, 14805.0, 8185.0, 4698.0, 2685.0, 1699.0, 1020.0, 670.0, 416.0, 284.0, 167.0, 100.0, 71.0, 46.0, 32.0, 17.0, 15.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.07806396484375, -3.9412841796875, -3.80450439453125, -3.667724609375, -3.53094482421875, -3.3941650390625, -3.25738525390625, -3.12060546875, -2.98382568359375, -2.8470458984375, -2.71026611328125, -2.573486328125, -2.43670654296875, -2.2999267578125, -2.16314697265625, -2.0263671875, -1.88958740234375, -1.7528076171875, -1.61602783203125, -1.479248046875, -1.34246826171875, -1.2056884765625, -1.06890869140625, -0.93212890625, -0.79534912109375, -0.6585693359375, -0.52178955078125, -0.385009765625, -0.24822998046875, -0.1114501953125, 0.02532958984375, 0.162109375, 0.29888916015625, 0.4356689453125, 0.57244873046875, 0.709228515625, 0.84600830078125, 0.9827880859375, 1.11956787109375, 1.25634765625, 1.39312744140625, 1.5299072265625, 1.66668701171875, 1.803466796875, 1.94024658203125, 2.0770263671875, 2.21380615234375, 2.3505859375, 2.48736572265625, 2.6241455078125, 2.76092529296875, 2.897705078125, 3.03448486328125, 3.1712646484375, 3.30804443359375, 3.44482421875, 3.58160400390625, 3.7183837890625, 3.85516357421875, 3.991943359375, 4.12872314453125, 4.2655029296875, 4.40228271484375, 4.5390625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 10.0, 4.0, 4.0, 13.0, 10.0, 9.0, 13.0, 20.0, 24.0, 27.0, 33.0, 34.0, 39.0, 41.0, 28.0, 54.0, 62.0, 101.0, 249.0, 1627.0, 172.0, 90.0, 71.0, 38.0, 30.0, 38.0, 31.0, 22.0, 35.0, 25.0, 19.0, 17.0, 14.0, 10.0, 9.0, 6.0, 6.0, 8.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7109375, -14.1300048828125, -13.549072265625, -12.9681396484375, -12.38720703125, -11.8062744140625, -11.225341796875, -10.6444091796875, -10.0634765625, -9.4825439453125, -8.901611328125, -8.3206787109375, -7.73974609375, -7.1588134765625, -6.577880859375, -5.9969482421875, -5.416015625, -4.8350830078125, -4.254150390625, -3.6732177734375, -3.09228515625, -2.5113525390625, -1.930419921875, -1.3494873046875, -0.7685546875, -0.1876220703125, 0.393310546875, 0.9742431640625, 1.55517578125, 2.1361083984375, 2.717041015625, 3.2979736328125, 3.87890625, 4.4598388671875, 5.040771484375, 5.6217041015625, 6.20263671875, 6.7835693359375, 7.364501953125, 7.9454345703125, 8.5263671875, 9.1072998046875, 9.688232421875, 10.2691650390625, 10.85009765625, 11.4310302734375, 12.011962890625, 12.5928955078125, 13.173828125, 13.7547607421875, 14.335693359375, 14.9166259765625, 15.49755859375, 16.0784912109375, 16.659423828125, 17.2403564453125, 17.8212890625, 18.4022216796875, 18.983154296875, 19.5640869140625, 20.14501953125, 20.7259521484375, 21.306884765625, 21.8878173828125, 22.46875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 13.0, 11.0, 29.0, 32.0, 51.0, 79.0, 130.0, 192.0, 311.0, 673.0, 6388.0, 3105877.0, 29852.0, 1053.0, 374.0, 228.0, 149.0, 104.0, 53.0, 42.0, 22.0, 13.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.15625, -57.01708984375, -54.8779296875, -52.73876953125, -50.599609375, -48.46044921875, -46.3212890625, -44.18212890625, -42.04296875, -39.90380859375, -37.7646484375, -35.62548828125, -33.486328125, -31.34716796875, -29.2080078125, -27.06884765625, -24.9296875, -22.79052734375, -20.6513671875, -18.51220703125, -16.373046875, -14.23388671875, -12.0947265625, -9.95556640625, -7.81640625, -5.67724609375, -3.5380859375, -1.39892578125, 0.740234375, 2.87939453125, 5.0185546875, 7.15771484375, 9.296875, 11.43603515625, 13.5751953125, 15.71435546875, 17.853515625, 19.99267578125, 22.1318359375, 24.27099609375, 26.41015625, 28.54931640625, 30.6884765625, 32.82763671875, 34.966796875, 37.10595703125, 39.2451171875, 41.38427734375, 43.5234375, 45.66259765625, 47.8017578125, 49.94091796875, 52.080078125, 54.21923828125, 56.3583984375, 58.49755859375, 60.63671875, 62.77587890625, 64.9150390625, 67.05419921875, 69.193359375, 71.33251953125, 73.4716796875, 75.61083984375, 77.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 30.0, 229.0, 498.0, 220.0, 35.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.8447723388672, -180.52789306640625, -177.2110137939453, -173.89413452148438, -170.57725524902344, -167.2603759765625, -163.94351196289062, -160.6266326904297, -157.30975341796875, -153.9928741455078, -150.67599487304688, -147.35911560058594, -144.042236328125, -140.72537231445312, -137.40847778320312, -134.09161376953125, -130.77471923828125, -127.45783996582031, -124.14096069335938, -120.82408142089844, -117.50720977783203, -114.1903305053711, -110.87345123291016, -107.55657196044922, -104.23970031738281, -100.92282104492188, -97.60594177246094, -94.2890625, -90.9721908569336, -87.65531158447266, -84.33843231201172, -81.02155303955078, -77.70468139648438, -74.38780212402344, -71.0709228515625, -67.75404357910156, -64.43717193603516, -61.12029266357422, -57.80341339111328, -54.486534118652344, -51.16966247558594, -47.852783203125, -44.53590774536133, -41.21902847290039, -37.90215301513672, -34.58527374267578, -31.268394470214844, -27.95151710510254, -24.634639739990234, -21.31776237487793, -18.000885009765625, -14.684005737304688, -11.367128372192383, -8.050251007080078, -4.733371734619141, -1.416494369506836, 1.9003829956054688, 5.217260837554932, 8.534138679504395, 11.851016998291016, 15.16789436340332, 18.484771728515625, 21.801651000976562, 25.118528366088867, 28.435405731201172]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 8.0, 5.0, 11.0, 12.0, 17.0, 11.0, 19.0, 14.0, 14.0, 25.0, 33.0, 35.0, 30.0, 41.0, 42.0, 46.0, 32.0, 41.0, 39.0, 47.0, 47.0, 52.0, 46.0, 37.0, 43.0, 17.0, 28.0, 36.0, 33.0, 21.0, 13.0, 16.0, 12.0, 14.0, 13.0, 10.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.849639892578125, -46.30297088623047, -44.75630187988281, -43.20963668823242, -41.662967681884766, -40.11629867553711, -38.56962966918945, -37.02296447753906, -35.476295471191406, -33.92962646484375, -32.382957458496094, -30.83629035949707, -29.289623260498047, -27.74295425415039, -26.196285247802734, -24.64961814880371, -23.102949142456055, -21.5562801361084, -20.009613037109375, -18.46294403076172, -16.916276931762695, -15.369607925415039, -13.8229398727417, -12.27627182006836, -10.72960376739502, -9.18293571472168, -7.63626766204834, -6.089599132537842, -4.542931079864502, -2.996263027191162, -1.449594497680664, 0.09707355499267578, 1.6437416076660156, 3.1904096603393555, 4.737077713012695, 6.283746242523193, 7.830414295196533, 9.377082824707031, 10.923750877380371, 12.470418930053711, 14.01708698272705, 15.56375503540039, 17.110424041748047, 18.65709114074707, 20.203760147094727, 21.75042724609375, 23.297096252441406, 24.843765258789062, 26.390432357788086, 27.937101364135742, 29.483768463134766, 31.030437469482422, 32.57710647583008, 34.12377166748047, 35.670440673828125, 37.21710968017578, 38.76377868652344, 40.310447692871094, 41.85711669921875, 43.40378189086914, 44.9504508972168, 46.49711990356445, 48.04378890991211, 49.5904541015625, 51.137123107910156]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 6.0, 12.0, 10.0, 15.0, 18.0, 16.0, 10.0, 19.0, 31.0, 23.0, 23.0, 33.0, 43.0, 32.0, 45.0, 33.0, 49.0, 50.0, 37.0, 52.0, 36.0, 41.0, 30.0, 31.0, 37.0, 36.0, 28.0, 31.0, 20.0, 27.0, 23.0, 15.0, 10.0, 9.0, 13.0, 9.0, 7.0, 6.0, 4.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1484375, -3.9935302734375, -3.838623046875, -3.6837158203125, -3.52880859375, -3.3739013671875, -3.218994140625, -3.0640869140625, -2.9091796875, -2.7542724609375, -2.599365234375, -2.4444580078125, -2.28955078125, -2.1346435546875, -1.979736328125, -1.8248291015625, -1.669921875, -1.5150146484375, -1.360107421875, -1.2052001953125, -1.05029296875, -0.8953857421875, -0.740478515625, -0.5855712890625, -0.4306640625, -0.2757568359375, -0.120849609375, 0.0340576171875, 0.18896484375, 0.3438720703125, 0.498779296875, 0.6536865234375, 0.80859375, 0.9635009765625, 1.118408203125, 1.2733154296875, 1.42822265625, 1.5831298828125, 1.738037109375, 1.8929443359375, 2.0478515625, 2.2027587890625, 2.357666015625, 2.5125732421875, 2.66748046875, 2.8223876953125, 2.977294921875, 3.1322021484375, 3.287109375, 3.4420166015625, 3.596923828125, 3.7518310546875, 3.90673828125, 4.0616455078125, 4.216552734375, 4.3714599609375, 4.5263671875, 4.6812744140625, 4.836181640625, 4.9910888671875, 5.14599609375, 5.3009033203125, 5.455810546875, 5.6107177734375, 5.765625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 9.0, 4.0, 6.0, 9.0, 16.0, 14.0, 10.0, 23.0, 64.0, 89.0, 176.0, 288.0, 530.0, 1008.0, 2180.0, 5209.0, 14152.0, 46654.0, 197926.0, 996643.0, 2091443.0, 658204.0, 128972.0, 33067.0, 10253.0, 3873.0, 1656.0, 800.0, 447.0, 206.0, 116.0, 72.0, 49.0, 33.0, 22.0, 11.0, 7.0, 12.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.59100341796875, -7.3031005859375, -7.01519775390625, -6.727294921875, -6.43939208984375, -6.1514892578125, -5.86358642578125, -5.57568359375, -5.28778076171875, -4.9998779296875, -4.71197509765625, -4.424072265625, -4.13616943359375, -3.8482666015625, -3.56036376953125, -3.2724609375, -2.98455810546875, -2.6966552734375, -2.40875244140625, -2.120849609375, -1.83294677734375, -1.5450439453125, -1.25714111328125, -0.96923828125, -0.68133544921875, -0.3934326171875, -0.10552978515625, 0.182373046875, 0.47027587890625, 0.7581787109375, 1.04608154296875, 1.333984375, 1.62188720703125, 1.9097900390625, 2.19769287109375, 2.485595703125, 2.77349853515625, 3.0614013671875, 3.34930419921875, 3.63720703125, 3.92510986328125, 4.2130126953125, 4.50091552734375, 4.788818359375, 5.07672119140625, 5.3646240234375, 5.65252685546875, 5.9404296875, 6.22833251953125, 6.5162353515625, 6.80413818359375, 7.092041015625, 7.37994384765625, 7.6678466796875, 7.95574951171875, 8.24365234375, 8.53155517578125, 8.8194580078125, 9.10736083984375, 9.395263671875, 9.68316650390625, 9.9710693359375, 10.25897216796875, 10.546875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 11.0, 6.0, 14.0, 28.0, 40.0, 44.0, 54.0, 78.0, 87.0, 150.0, 257.0, 314.0, 410.0, 518.0, 510.0, 415.0, 303.0, 231.0, 174.0, 113.0, 89.0, 77.0, 42.0, 31.0, 21.0, 13.0, 13.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.421142578125, -10.06103515625, -9.700927734375, -9.3408203125, -8.980712890625, -8.62060546875, -8.260498046875, -7.900390625, -7.540283203125, -7.18017578125, -6.820068359375, -6.4599609375, -6.099853515625, -5.73974609375, -5.379638671875, -5.01953125, -4.659423828125, -4.29931640625, -3.939208984375, -3.5791015625, -3.218994140625, -2.85888671875, -2.498779296875, -2.138671875, -1.778564453125, -1.41845703125, -1.058349609375, -0.6982421875, -0.338134765625, 0.02197265625, 0.382080078125, 0.7421875, 1.102294921875, 1.46240234375, 1.822509765625, 2.1826171875, 2.542724609375, 2.90283203125, 3.262939453125, 3.623046875, 3.983154296875, 4.34326171875, 4.703369140625, 5.0634765625, 5.423583984375, 5.78369140625, 6.143798828125, 6.50390625, 6.864013671875, 7.22412109375, 7.584228515625, 7.9443359375, 8.304443359375, 8.66455078125, 9.024658203125, 9.384765625, 9.744873046875, 10.10498046875, 10.465087890625, 10.8251953125, 11.185302734375, 11.54541015625, 11.905517578125, 12.265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 9.0, 18.0, 15.0, 27.0, 39.0, 72.0, 92.0, 140.0, 187.0, 261.0, 520.0, 1849.0, 21131.0, 815561.0, 3264411.0, 83875.0, 4304.0, 769.0, 318.0, 170.0, 120.0, 104.0, 75.0, 60.0, 47.0, 23.0, 28.0, 8.0, 11.0, 10.0, 3.0, 6.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.03125, -35.94873046875, -34.8662109375, -33.78369140625, -32.701171875, -31.61865234375, -30.5361328125, -29.45361328125, -28.37109375, -27.28857421875, -26.2060546875, -25.12353515625, -24.041015625, -22.95849609375, -21.8759765625, -20.79345703125, -19.7109375, -18.62841796875, -17.5458984375, -16.46337890625, -15.380859375, -14.29833984375, -13.2158203125, -12.13330078125, -11.05078125, -9.96826171875, -8.8857421875, -7.80322265625, -6.720703125, -5.63818359375, -4.5556640625, -3.47314453125, -2.390625, -1.30810546875, -0.2255859375, 0.85693359375, 1.939453125, 3.02197265625, 4.1044921875, 5.18701171875, 6.26953125, 7.35205078125, 8.4345703125, 9.51708984375, 10.599609375, 11.68212890625, 12.7646484375, 13.84716796875, 14.9296875, 16.01220703125, 17.0947265625, 18.17724609375, 19.259765625, 20.34228515625, 21.4248046875, 22.50732421875, 23.58984375, 24.67236328125, 25.7548828125, 26.83740234375, 27.919921875, 29.00244140625, 30.0849609375, 31.16748046875, 32.25]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 17.0, 54.0, 160.0, 266.0, 269.0, 151.0, 72.0, 13.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.6472625732422, -201.53433227539062, -197.42138671875, -193.30845642089844, -189.19552612304688, -185.08258056640625, -180.9696502685547, -176.85671997070312, -172.7437744140625, -168.63084411621094, -164.5178985595703, -160.40496826171875, -156.2920379638672, -152.17909240722656, -148.066162109375, -143.95323181152344, -139.84030151367188, -135.7273712158203, -131.6144256591797, -127.50149536132812, -123.38855743408203, -119.27561950683594, -115.16268920898438, -111.04975128173828, -106.93681335449219, -102.8238754272461, -98.71094512939453, -94.59800720214844, -90.48506927490234, -86.37213134765625, -82.25920104980469, -78.1462631225586, -74.03333282470703, -69.92039489746094, -65.80746459960938, -61.69452667236328, -57.58158874511719, -53.46865463256836, -49.35572052001953, -45.24278259277344, -41.12984848022461, -37.01691436767578, -32.90397644042969, -28.79104232788086, -24.6781063079834, -20.565170288085938, -16.45223617553711, -12.339300155639648, -8.226364135742188, -4.113428592681885, -0.0004930496215820312, 4.1124420166015625, 8.225378036499023, 12.338314056396484, 16.451248168945312, 20.564184188842773, 24.677120208740234, 28.790056228637695, 32.902992248535156, 37.015926361083984, 41.12886047363281, 45.241798400878906, 49.354732513427734, 53.46766662597656, 57.580604553222656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 5.0, 6.0, 6.0, 12.0, 9.0, 15.0, 16.0, 19.0, 18.0, 22.0, 28.0, 34.0, 40.0, 37.0, 36.0, 36.0, 33.0, 39.0, 40.0, 44.0, 46.0, 50.0, 33.0, 47.0, 54.0, 29.0, 40.0, 26.0, 29.0, 19.0, 27.0, 12.0, 24.0, 15.0, 4.0, 14.0, 7.0, 9.0, 3.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-40.830482482910156, -39.719764709472656, -38.609046936035156, -37.498329162597656, -36.38760757446289, -35.27688980102539, -34.16617202758789, -33.05545425415039, -31.94473648071289, -30.83401870727539, -29.723299026489258, -28.612581253051758, -27.501863479614258, -26.391143798828125, -25.280426025390625, -24.169708251953125, -23.058988571166992, -21.948270797729492, -20.83755111694336, -19.72683334350586, -18.61611557006836, -17.50539779663086, -16.394678115844727, -15.283960342407227, -14.17324161529541, -13.062522888183594, -11.951805114746094, -10.841086387634277, -9.730367660522461, -8.619649887084961, -7.5089311599731445, -6.398212909698486, -5.287494659423828, -4.17677640914917, -3.0660579204559326, -1.9553394317626953, -0.8446211814880371, 0.2660970687866211, 1.3768157958984375, 2.4875340461730957, 3.598252296447754, 4.708970546722412, 5.81968879699707, 6.930407524108887, 8.041126251220703, 9.151844024658203, 10.26256275177002, 11.373281478881836, 12.483999252319336, 13.594717979431152, 14.705435752868652, 15.816154479980469, 16.92687225341797, 18.03759002685547, 19.1483097076416, 20.2590274810791, 21.369747161865234, 22.480464935302734, 23.591184616088867, 24.701902389526367, 25.812620162963867, 26.92333984375, 28.0340576171875, 29.144775390625, 30.2554931640625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 8.0, 9.0, 6.0, 8.0, 9.0, 8.0, 10.0, 15.0, 17.0, 16.0, 25.0, 25.0, 32.0, 22.0, 39.0, 37.0, 37.0, 36.0, 56.0, 37.0, 44.0, 39.0, 41.0, 34.0, 41.0, 39.0, 32.0, 25.0, 28.0, 30.0, 27.0, 19.0, 21.0, 12.0, 20.0, 19.0, 15.0, 10.0, 6.0, 9.0, 5.0, 6.0, 1.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9453125, -3.80010986328125, -3.6549072265625, -3.50970458984375, -3.364501953125, -3.21929931640625, -3.0740966796875, -2.92889404296875, -2.78369140625, -2.63848876953125, -2.4932861328125, -2.34808349609375, -2.202880859375, -2.05767822265625, -1.9124755859375, -1.76727294921875, -1.6220703125, -1.47686767578125, -1.3316650390625, -1.18646240234375, -1.041259765625, -0.89605712890625, -0.7508544921875, -0.60565185546875, -0.46044921875, -0.31524658203125, -0.1700439453125, -0.02484130859375, 0.120361328125, 0.26556396484375, 0.4107666015625, 0.55596923828125, 0.701171875, 0.84637451171875, 0.9915771484375, 1.13677978515625, 1.281982421875, 1.42718505859375, 1.5723876953125, 1.71759033203125, 1.86279296875, 2.00799560546875, 2.1531982421875, 2.29840087890625, 2.443603515625, 2.58880615234375, 2.7340087890625, 2.87921142578125, 3.0244140625, 3.16961669921875, 3.3148193359375, 3.46002197265625, 3.605224609375, 3.75042724609375, 3.8956298828125, 4.04083251953125, 4.18603515625, 4.33123779296875, 4.4764404296875, 4.62164306640625, 4.766845703125, 4.91204833984375, 5.0572509765625, 5.20245361328125, 5.34765625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 5.0, 3.0, 7.0, 8.0, 9.0, 13.0, 18.0, 27.0, 57.0, 64.0, 82.0, 120.0, 188.0, 290.0, 428.0, 595.0, 1065.0, 1545.0, 2316.0, 3620.0, 5457.0, 8705.0, 13838.0, 21984.0, 37191.0, 66709.0, 130342.0, 239501.0, 232399.0, 124186.0, 63367.0, 35642.0, 21670.0, 13131.0, 8385.0, 5423.0, 3490.0, 2346.0, 1449.0, 936.0, 655.0, 416.0, 304.0, 202.0, 123.0, 69.0, 63.0, 39.0, 26.0, 18.0, 12.0, 11.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.53271484375, -0.5155105590820312, -0.4983062744140625, -0.48110198974609375, -0.463897705078125, -0.44669342041015625, -0.4294891357421875, -0.41228485107421875, -0.39508056640625, -0.37787628173828125, -0.3606719970703125, -0.34346771240234375, -0.326263427734375, -0.30905914306640625, -0.2918548583984375, -0.27465057373046875, -0.2574462890625, -0.24024200439453125, -0.2230377197265625, -0.20583343505859375, -0.188629150390625, -0.17142486572265625, -0.1542205810546875, -0.13701629638671875, -0.11981201171875, -0.10260772705078125, -0.0854034423828125, -0.06819915771484375, -0.050994873046875, -0.03379058837890625, -0.0165863037109375, 0.00061798095703125, 0.017822265625, 0.03502655029296875, 0.0522308349609375, 0.06943511962890625, 0.086639404296875, 0.10384368896484375, 0.1210479736328125, 0.13825225830078125, 0.15545654296875, 0.17266082763671875, 0.1898651123046875, 0.20706939697265625, 0.224273681640625, 0.24147796630859375, 0.2586822509765625, 0.27588653564453125, 0.2930908203125, 0.31029510498046875, 0.3274993896484375, 0.34470367431640625, 0.361907958984375, 0.37911224365234375, 0.3963165283203125, 0.41352081298828125, 0.43072509765625, 0.44792938232421875, 0.4651336669921875, 0.48233795166015625, 0.499542236328125, 0.5167465209960938, 0.5339508056640625, 0.5511550903320312, 0.568359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 2.0, 6.0, 5.0, 10.0, 8.0, 9.0, 9.0, 13.0, 10.0, 16.0, 19.0, 35.0, 24.0, 28.0, 42.0, 33.0, 46.0, 41.0, 39.0, 43.0, 57.0, 1069.0, 41.0, 39.0, 46.0, 39.0, 40.0, 44.0, 32.0, 20.0, 23.0, 30.0, 25.0, 19.0, 17.0, 6.0, 15.0, 10.0, 8.0, 10.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.48828125, -3.3814697265625, -3.274658203125, -3.1678466796875, -3.06103515625, -2.9542236328125, -2.847412109375, -2.7406005859375, -2.6337890625, -2.5269775390625, -2.420166015625, -2.3133544921875, -2.20654296875, -2.0997314453125, -1.992919921875, -1.8861083984375, -1.779296875, -1.6724853515625, -1.565673828125, -1.4588623046875, -1.35205078125, -1.2452392578125, -1.138427734375, -1.0316162109375, -0.9248046875, -0.8179931640625, -0.711181640625, -0.6043701171875, -0.49755859375, -0.3907470703125, -0.283935546875, -0.1771240234375, -0.0703125, 0.0364990234375, 0.143310546875, 0.2501220703125, 0.35693359375, 0.4637451171875, 0.570556640625, 0.6773681640625, 0.7841796875, 0.8909912109375, 0.997802734375, 1.1046142578125, 1.21142578125, 1.3182373046875, 1.425048828125, 1.5318603515625, 1.638671875, 1.7454833984375, 1.852294921875, 1.9591064453125, 2.06591796875, 2.1727294921875, 2.279541015625, 2.3863525390625, 2.4931640625, 2.5999755859375, 2.706787109375, 2.8135986328125, 2.92041015625, 3.0272216796875, 3.134033203125, 3.2408447265625, 3.34765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 6.0, 17.0, 15.0, 30.0, 32.0, 64.0, 77.0, 101.0, 171.0, 300.0, 451.0, 731.0, 1283.0, 2106.0, 3625.0, 6533.0, 11786.0, 21467.0, 39768.0, 74443.0, 137038.0, 581861.0, 911046.0, 139468.0, 75082.0, 40543.0, 21472.0, 11824.0, 6720.0, 3683.0, 2085.0, 1280.0, 743.0, 442.0, 280.0, 197.0, 112.0, 62.0, 60.0, 29.0, 31.0, 24.0, 10.0, 12.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.29833984375, -0.28839874267578125, -0.2784576416015625, -0.26851654052734375, -0.258575439453125, -0.24863433837890625, -0.2386932373046875, -0.22875213623046875, -0.21881103515625, -0.20886993408203125, -0.1989288330078125, -0.18898773193359375, -0.179046630859375, -0.16910552978515625, -0.1591644287109375, -0.14922332763671875, -0.1392822265625, -0.12934112548828125, -0.1194000244140625, -0.10945892333984375, -0.099517822265625, -0.08957672119140625, -0.0796356201171875, -0.06969451904296875, -0.05975341796875, -0.04981231689453125, -0.0398712158203125, -0.02993011474609375, -0.019989013671875, -0.01004791259765625, -0.0001068115234375, 0.00983428955078125, 0.019775390625, 0.02971649169921875, 0.0396575927734375, 0.04959869384765625, 0.059539794921875, 0.06948089599609375, 0.0794219970703125, 0.08936309814453125, 0.09930419921875, 0.10924530029296875, 0.1191864013671875, 0.12912750244140625, 0.139068603515625, 0.14900970458984375, 0.1589508056640625, 0.16889190673828125, 0.1788330078125, 0.18877410888671875, 0.1987152099609375, 0.20865631103515625, 0.218597412109375, 0.22853851318359375, 0.2384796142578125, 0.24842071533203125, 0.25836181640625, 0.26830291748046875, 0.2782440185546875, 0.28818511962890625, 0.298126220703125, 0.30806732177734375, 0.3180084228515625, 0.32794952392578125, 0.337890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 8.0, 9.0, 8.0, 7.0, 19.0, 15.0, 20.0, 35.0, 53.0, 52.0, 94.0, 160.0, 169.0, 114.0, 54.0, 42.0, 21.0, 19.0, 23.0, 11.0, 10.0, 10.0, 10.0, 8.0, 4.0, 10.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00865936279296875, -0.008419454097747803, -0.008179545402526855, -0.007939636707305908, -0.007699728012084961, -0.007459819316864014, -0.007219910621643066, -0.006980001926422119, -0.006740093231201172, -0.006500184535980225, -0.006260275840759277, -0.00602036714553833, -0.005780458450317383, -0.0055405497550964355, -0.005300641059875488, -0.005060732364654541, -0.004820823669433594, -0.0045809149742126465, -0.004341006278991699, -0.004101097583770752, -0.0038611888885498047, -0.0036212801933288574, -0.00338137149810791, -0.003141462802886963, -0.0029015541076660156, -0.0026616454124450684, -0.002421736717224121, -0.002181828022003174, -0.0019419193267822266, -0.0017020106315612793, -0.001462101936340332, -0.0012221932411193848, -0.0009822845458984375, -0.0007423758506774902, -0.000502467155456543, -0.0002625584602355957, -2.2649765014648438e-05, 0.00021725893020629883, 0.0004571676254272461, 0.0006970763206481934, 0.0009369850158691406, 0.0011768937110900879, 0.0014168024063110352, 0.0016567111015319824, 0.0018966197967529297, 0.002136528491973877, 0.0023764371871948242, 0.0026163458824157715, 0.0028562545776367188, 0.003096163272857666, 0.0033360719680786133, 0.0035759806632995605, 0.003815889358520508, 0.004055798053741455, 0.004295706748962402, 0.00453561544418335, 0.004775524139404297, 0.005015432834625244, 0.005255341529846191, 0.005495250225067139, 0.005735158920288086, 0.005975067615509033, 0.0062149763107299805, 0.006454885005950928, 0.006694793701171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 2.0, 4.0, 10.0, 5.0, 9.0, 9.0, 14.0, 14.0, 18.0, 32.0, 27.0, 51.0, 97.0, 309.0, 1641.0, 26381.0, 984864.0, 32554.0, 1897.0, 314.0, 98.0, 53.0, 43.0, 20.0, 28.0, 11.0, 15.0, 7.0, 7.0, 7.0, 3.0, 2.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1339111328125, -0.12921714782714844, -0.12452316284179688, -0.11982917785644531, -0.11513519287109375, -0.11044120788574219, -0.10574722290039062, -0.10105323791503906, -0.0963592529296875, -0.09166526794433594, -0.08697128295898438, -0.08227729797363281, -0.07758331298828125, -0.07288932800292969, -0.06819534301757812, -0.06350135803222656, -0.058807373046875, -0.05411338806152344, -0.049419403076171875, -0.04472541809082031, -0.04003143310546875, -0.03533744812011719, -0.030643463134765625, -0.025949478149414062, -0.0212554931640625, -0.016561508178710938, -0.011867523193359375, -0.0071735382080078125, -0.00247955322265625, 0.0022144317626953125, 0.006908416748046875, 0.011602401733398438, 0.01629638671875, 0.020990371704101562, 0.025684356689453125, 0.030378341674804688, 0.03507232666015625, 0.03976631164550781, 0.044460296630859375, 0.04915428161621094, 0.0538482666015625, 0.05854225158691406, 0.06323623657226562, 0.06793022155761719, 0.07262420654296875, 0.07731819152832031, 0.08201217651367188, 0.08670616149902344, 0.091400146484375, 0.09609413146972656, 0.10078811645507812, 0.10548210144042969, 0.11017608642578125, 0.11487007141113281, 0.11956405639648438, 0.12425804138183594, 0.1289520263671875, 0.13364601135253906, 0.13833999633789062, 0.1430339813232422, 0.14772796630859375, 0.1524219512939453, 0.15711593627929688, 0.16180992126464844, 0.16650390625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 13.0, 53.0, 227.0, 575.0, 103.0, 24.0, 9.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014282971620559692, -0.011988595128059387, -0.009694218635559082, -0.0073998430743813515, -0.005105466581881046, -0.002811090089380741, -0.0005167145282030106, 0.0017776619642972946, 0.0040720384567976, 0.006366414949297905, 0.00866079144179821, 0.01095516700297594, 0.013249543495476246, 0.015543919987976551, 0.01783829554915428, 0.020132672041654587, 0.022427048534154892, 0.024721425026655197, 0.027015801519155502, 0.029310178011655807, 0.03160455450415611, 0.03389893099665642, 0.036193303763866425, 0.03848768025636673, 0.040782056748867035, 0.04307643324136734, 0.045370809733867645, 0.04766518622636795, 0.049959562718868256, 0.05225393921136856, 0.054548315703868866, 0.05684269219636917, 0.059137068688869476, 0.06143144518136978, 0.06372582167387009, 0.06602019816637039, 0.0683145746588707, 0.070608951151371, 0.07290332764387131, 0.07519770413637161, 0.07749208062887192, 0.07978645712137222, 0.08208083361387253, 0.08437521010637283, 0.08666958659887314, 0.08896396309137344, 0.09125833958387375, 0.09355271607637405, 0.09584708511829376, 0.09814146161079407, 0.10043583810329437, 0.10273021459579468, 0.10502459108829498, 0.10731896758079529, 0.1096133440732956, 0.1119077205657959, 0.1142020970582962, 0.11649647355079651, 0.11879085004329681, 0.12108522653579712, 0.12337960302829742, 0.12567397952079773, 0.12796835601329803, 0.13026273250579834, 0.13255710899829865]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 9.0, 13.0, 8.0, 18.0, 20.0, 19.0, 20.0, 14.0, 30.0, 35.0, 39.0, 37.0, 24.0, 47.0, 43.0, 44.0, 44.0, 36.0, 47.0, 44.0, 42.0, 32.0, 42.0, 35.0, 39.0, 31.0, 24.0, 24.0, 16.0, 19.0, 20.0, 13.0, 14.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0], "bins": [-0.007064700126647949, -0.006859057582914829, -0.006653415039181709, -0.006447772495448589, -0.006242129951715469, -0.006036487407982349, -0.005830844864249229, -0.0056252023205161095, -0.0054195597767829895, -0.0052139172330498695, -0.00500827468931675, -0.00480263214558363, -0.00459698960185051, -0.00439134705811739, -0.00418570451438427, -0.00398006197065115, -0.00377441942691803, -0.00356877688318491, -0.00336313433945179, -0.00315749179571867, -0.00295184925198555, -0.00274620670825243, -0.00254056416451931, -0.00233492162078619, -0.00212927907705307, -0.00192363653331995, -0.0017179939895868301, -0.0015123514458537102, -0.0013067089021205902, -0.0011010663583874702, -0.0008954238146543503, -0.0006897812709212303, -0.00048413872718811035, -0.0002784961834549904, -7.285363972187042e-05, 0.00013278890401124954, 0.0003384314477443695, 0.0005440739914774895, 0.0007497165352106094, 0.0009553590789437294, 0.0011610016226768494, 0.0013666441664099693, 0.0015722867101430893, 0.0017779292538762093, 0.0019835717976093292, 0.002189214341342449, 0.002394856885075569, 0.002600499428808689, 0.002806141972541809, 0.003011784516274929, 0.003217427060008049, 0.003423069603741169, 0.003628712147474289, 0.003834354691207409, 0.004039997234940529, 0.004245639778673649, 0.004451282322406769, 0.004656924866139889, 0.004862567409873009, 0.005068209953606129, 0.005273852497339249, 0.005479495041072369, 0.005685137584805489, 0.0058907801285386086, 0.0060964226722717285]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 8.0, 9.0, 6.0, 8.0, 9.0, 8.0, 10.0, 15.0, 16.0, 17.0, 25.0, 25.0, 32.0, 22.0, 39.0, 37.0, 37.0, 36.0, 56.0, 38.0, 43.0, 39.0, 41.0, 34.0, 41.0, 39.0, 32.0, 25.0, 28.0, 30.0, 27.0, 19.0, 21.0, 12.0, 20.0, 19.0, 15.0, 10.0, 6.0, 9.0, 5.0, 6.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9453125, -3.80010986328125, -3.6549072265625, -3.50970458984375, -3.364501953125, -3.21929931640625, -3.0740966796875, -2.92889404296875, -2.78369140625, -2.63848876953125, -2.4932861328125, -2.34808349609375, -2.202880859375, -2.05767822265625, -1.9124755859375, -1.76727294921875, -1.6220703125, -1.47686767578125, -1.3316650390625, -1.18646240234375, -1.041259765625, -0.89605712890625, -0.7508544921875, -0.60565185546875, -0.46044921875, -0.31524658203125, -0.1700439453125, -0.02484130859375, 0.120361328125, 0.26556396484375, 0.4107666015625, 0.55596923828125, 0.701171875, 0.84637451171875, 0.9915771484375, 1.13677978515625, 1.281982421875, 1.42718505859375, 1.5723876953125, 1.71759033203125, 1.86279296875, 2.00799560546875, 2.1531982421875, 2.29840087890625, 2.443603515625, 2.58880615234375, 2.7340087890625, 2.87921142578125, 3.0244140625, 3.16961669921875, 3.3148193359375, 3.46002197265625, 3.605224609375, 3.75042724609375, 3.8956298828125, 4.04083251953125, 4.18603515625, 4.33123779296875, 4.4764404296875, 4.62164306640625, 4.766845703125, 4.91204833984375, 5.0572509765625, 5.20245361328125, 5.34765625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 7.0, 8.0, 8.0, 11.0, 9.0, 17.0, 23.0, 21.0, 43.0, 45.0, 68.0, 104.0, 188.0, 237.0, 393.0, 565.0, 857.0, 1271.0, 2234.0, 3210.0, 5277.0, 9680.0, 23020.0, 71670.0, 307985.0, 456935.0, 105137.0, 30736.0, 12312.0, 6042.0, 3502.0, 2374.0, 1489.0, 1076.0, 688.0, 435.0, 258.0, 197.0, 133.0, 83.0, 60.0, 43.0, 27.0, 21.0, 16.0, 6.0, 10.0, 11.0, 7.0, 4.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.75390625, -3.6156005859375, -3.477294921875, -3.3389892578125, -3.20068359375, -3.0623779296875, -2.924072265625, -2.7857666015625, -2.6474609375, -2.5091552734375, -2.370849609375, -2.2325439453125, -2.09423828125, -1.9559326171875, -1.817626953125, -1.6793212890625, -1.541015625, -1.4027099609375, -1.264404296875, -1.1260986328125, -0.98779296875, -0.8494873046875, -0.711181640625, -0.5728759765625, -0.4345703125, -0.2962646484375, -0.157958984375, -0.0196533203125, 0.11865234375, 0.2569580078125, 0.395263671875, 0.5335693359375, 0.671875, 0.8101806640625, 0.948486328125, 1.0867919921875, 1.22509765625, 1.3634033203125, 1.501708984375, 1.6400146484375, 1.7783203125, 1.9166259765625, 2.054931640625, 2.1932373046875, 2.33154296875, 2.4698486328125, 2.608154296875, 2.7464599609375, 2.884765625, 3.0230712890625, 3.161376953125, 3.2996826171875, 3.43798828125, 3.5762939453125, 3.714599609375, 3.8529052734375, 3.9912109375, 4.1295166015625, 4.267822265625, 4.4061279296875, 4.54443359375, 4.6827392578125, 4.821044921875, 4.9593505859375, 5.09765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 7.0, 4.0, 5.0, 6.0, 8.0, 10.0, 17.0, 19.0, 29.0, 27.0, 26.0, 23.0, 31.0, 32.0, 46.0, 47.0, 55.0, 92.0, 345.0, 1684.0, 102.0, 53.0, 45.0, 46.0, 40.0, 30.0, 24.0, 37.0, 21.0, 21.0, 21.0, 17.0, 13.0, 17.0, 14.0, 10.0, 2.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.859375, -19.260498046875, -18.66162109375, -18.062744140625, -17.4638671875, -16.864990234375, -16.26611328125, -15.667236328125, -15.068359375, -14.469482421875, -13.87060546875, -13.271728515625, -12.6728515625, -12.073974609375, -11.47509765625, -10.876220703125, -10.27734375, -9.678466796875, -9.07958984375, -8.480712890625, -7.8818359375, -7.282958984375, -6.68408203125, -6.085205078125, -5.486328125, -4.887451171875, -4.28857421875, -3.689697265625, -3.0908203125, -2.491943359375, -1.89306640625, -1.294189453125, -0.6953125, -0.096435546875, 0.50244140625, 1.101318359375, 1.7001953125, 2.299072265625, 2.89794921875, 3.496826171875, 4.095703125, 4.694580078125, 5.29345703125, 5.892333984375, 6.4912109375, 7.090087890625, 7.68896484375, 8.287841796875, 8.88671875, 9.485595703125, 10.08447265625, 10.683349609375, 11.2822265625, 11.881103515625, 12.47998046875, 13.078857421875, 13.677734375, 14.276611328125, 14.87548828125, 15.474365234375, 16.0732421875, 16.672119140625, 17.27099609375, 17.869873046875, 18.46875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 3.0, 5.0, 5.0, 9.0, 18.0, 19.0, 25.0, 39.0, 39.0, 56.0, 99.0, 115.0, 176.0, 302.0, 635.0, 7014.0, 3084124.0, 50182.0, 1695.0, 387.0, 236.0, 142.0, 107.0, 64.0, 53.0, 39.0, 23.0, 24.0, 15.0, 10.0, 7.0, 10.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.4736328125, -36.853515625, -35.2333984375, -33.61328125, -31.9931640625, -30.373046875, -28.7529296875, -27.1328125, -25.5126953125, -23.892578125, -22.2724609375, -20.65234375, -19.0322265625, -17.412109375, -15.7919921875, -14.171875, -12.5517578125, -10.931640625, -9.3115234375, -7.69140625, -6.0712890625, -4.451171875, -2.8310546875, -1.2109375, 0.4091796875, 2.029296875, 3.6494140625, 5.26953125, 6.8896484375, 8.509765625, 10.1298828125, 11.75, 13.3701171875, 14.990234375, 16.6103515625, 18.23046875, 19.8505859375, 21.470703125, 23.0908203125, 24.7109375, 26.3310546875, 27.951171875, 29.5712890625, 31.19140625, 32.8115234375, 34.431640625, 36.0517578125, 37.671875, 39.2919921875, 40.912109375, 42.5322265625, 44.15234375, 45.7724609375, 47.392578125, 49.0126953125, 50.6328125, 52.2529296875, 53.873046875, 55.4931640625, 57.11328125, 58.7333984375, 60.353515625, 61.9736328125, 63.59375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 21.0, 913.0, 82.0, 0.0, 1.0], "bins": [-436.9225158691406, -429.71136474609375, -422.5002136230469, -415.2890625, -408.0779113769531, -400.86676025390625, -393.65557861328125, -386.4444274902344, -379.2332763671875, -372.0221252441406, -364.81097412109375, -357.5998229980469, -350.388671875, -343.177490234375, -335.96636962890625, -328.75518798828125, -321.5440673828125, -314.3329162597656, -307.12176513671875, -299.9106140136719, -292.699462890625, -285.48828125, -278.27716064453125, -271.06597900390625, -263.8548278808594, -256.6436767578125, -249.43252563476562, -242.22137451171875, -235.0102081298828, -227.79905700683594, -220.58790588378906, -213.3767547607422, -206.16558837890625, -198.95443725585938, -191.7432861328125, -184.53213500976562, -177.3209686279297, -170.1098175048828, -162.89866638183594, -155.68751525878906, -148.4763641357422, -141.2652130126953, -134.05406188964844, -126.84290313720703, -119.63174438476562, -112.42059326171875, -105.20944213867188, -97.998291015625, -90.7871322631836, -83.57598114013672, -76.36482238769531, -69.15367126464844, -61.9425163269043, -54.731361389160156, -47.52021026611328, -40.30905532836914, -33.097900390625, -25.88674545288086, -18.67559242248535, -11.464439392089844, -4.253284454345703, 2.9578704833984375, 10.169021606445312, 17.380176544189453, 24.591333389282227]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 6.0, 2.0, 7.0, 8.0, 6.0, 6.0, 9.0, 10.0, 12.0, 9.0, 16.0, 25.0, 32.0, 36.0, 26.0, 39.0, 28.0, 31.0, 39.0, 29.0, 48.0, 43.0, 45.0, 48.0, 37.0, 35.0, 36.0, 35.0, 40.0, 36.0, 27.0, 29.0, 18.0, 22.0, 19.0, 13.0, 21.0, 19.0, 15.0, 14.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-52.799407958984375, -51.22303771972656, -49.64666748046875, -48.07029724121094, -46.49392318725586, -44.91755294799805, -43.341182708740234, -41.76481246948242, -40.188438415527344, -38.61206817626953, -37.03569793701172, -35.459327697753906, -33.88295364379883, -32.306583404541016, -30.730213165283203, -29.15384292602539, -27.577472686767578, -26.001102447509766, -24.42473030090332, -22.848360061645508, -21.271987915039062, -19.69561767578125, -18.119247436523438, -16.542877197265625, -14.96650505065918, -13.39013385772705, -11.813762664794922, -10.23739242553711, -8.66102123260498, -7.084650039672852, -5.508279800415039, -3.93190860748291, -2.3555374145507812, -0.7791664600372314, 0.7972044944763184, 2.373575210571289, 3.949946403503418, 5.526317596435547, 7.102687835693359, 8.679059028625488, 10.255430221557617, 11.831801414489746, 13.408172607421875, 14.984542846679688, 16.5609130859375, 18.137285232543945, 19.713655471801758, 21.290027618408203, 22.866397857666016, 24.442768096923828, 26.019140243530273, 27.595510482788086, 29.17188262939453, 30.748252868652344, 32.324623107910156, 33.90099334716797, 35.47736358642578, 37.053733825683594, 38.630104064941406, 40.20647430419922, 41.7828483581543, 43.35921859741211, 44.93558883666992, 46.511959075927734, 48.08833312988281]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 8.0, 7.0, 8.0, 7.0, 8.0, 11.0, 10.0, 12.0, 20.0, 17.0, 16.0, 22.0, 28.0, 35.0, 33.0, 36.0, 36.0, 50.0, 38.0, 45.0, 52.0, 31.0, 38.0, 44.0, 33.0, 40.0, 24.0, 37.0, 31.0, 31.0, 25.0, 21.0, 26.0, 11.0, 13.0, 21.0, 14.0, 6.0, 7.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.46484375, -4.3128662109375, -4.160888671875, -4.0089111328125, -3.85693359375, -3.7049560546875, -3.552978515625, -3.4010009765625, -3.2490234375, -3.0970458984375, -2.945068359375, -2.7930908203125, -2.64111328125, -2.4891357421875, -2.337158203125, -2.1851806640625, -2.033203125, -1.8812255859375, -1.729248046875, -1.5772705078125, -1.42529296875, -1.2733154296875, -1.121337890625, -0.9693603515625, -0.8173828125, -0.6654052734375, -0.513427734375, -0.3614501953125, -0.20947265625, -0.0574951171875, 0.094482421875, 0.2464599609375, 0.3984375, 0.5504150390625, 0.702392578125, 0.8543701171875, 1.00634765625, 1.1583251953125, 1.310302734375, 1.4622802734375, 1.6142578125, 1.7662353515625, 1.918212890625, 2.0701904296875, 2.22216796875, 2.3741455078125, 2.526123046875, 2.6781005859375, 2.830078125, 2.9820556640625, 3.134033203125, 3.2860107421875, 3.43798828125, 3.5899658203125, 3.741943359375, 3.8939208984375, 4.0458984375, 4.1978759765625, 4.349853515625, 4.5018310546875, 4.65380859375, 4.8057861328125, 4.957763671875, 5.1097412109375, 5.26171875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 7.0, 13.0, 11.0, 31.0, 25.0, 38.0, 46.0, 69.0, 77.0, 137.0, 154.0, 292.0, 430.0, 765.0, 1458.0, 3022.0, 7165.0, 19067.0, 58598.0, 222765.0, 981842.0, 1951869.0, 717148.0, 159627.0, 44012.0, 14623.0, 5610.0, 2449.0, 1089.0, 627.0, 388.0, 236.0, 150.0, 111.0, 78.0, 59.0, 51.0, 31.0, 23.0, 13.0, 12.0, 11.0, 12.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.48828125, -7.23345947265625, -6.9786376953125, -6.72381591796875, -6.468994140625, -6.21417236328125, -5.9593505859375, -5.70452880859375, -5.44970703125, -5.19488525390625, -4.9400634765625, -4.68524169921875, -4.430419921875, -4.17559814453125, -3.9207763671875, -3.66595458984375, -3.4111328125, -3.15631103515625, -2.9014892578125, -2.64666748046875, -2.391845703125, -2.13702392578125, -1.8822021484375, -1.62738037109375, -1.37255859375, -1.11773681640625, -0.8629150390625, -0.60809326171875, -0.353271484375, -0.09844970703125, 0.1563720703125, 0.41119384765625, 0.666015625, 0.92083740234375, 1.1756591796875, 1.43048095703125, 1.685302734375, 1.94012451171875, 2.1949462890625, 2.44976806640625, 2.70458984375, 2.95941162109375, 3.2142333984375, 3.46905517578125, 3.723876953125, 3.97869873046875, 4.2335205078125, 4.48834228515625, 4.7431640625, 4.99798583984375, 5.2528076171875, 5.50762939453125, 5.762451171875, 6.01727294921875, 6.2720947265625, 6.52691650390625, 6.78173828125, 7.03656005859375, 7.2913818359375, 7.54620361328125, 7.801025390625, 8.05584716796875, 8.3106689453125, 8.56549072265625, 8.8203125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 7.0, 6.0, 4.0, 5.0, 11.0, 14.0, 18.0, 19.0, 23.0, 29.0, 30.0, 52.0, 60.0, 95.0, 86.0, 99.0, 176.0, 181.0, 246.0, 310.0, 368.0, 410.0, 375.0, 262.0, 266.0, 211.0, 159.0, 110.0, 95.0, 71.0, 51.0, 50.0, 36.0, 20.0, 29.0, 18.0, 19.0, 4.0, 10.0, 10.0, 5.0, 5.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.265625, -8.0113525390625, -7.757080078125, -7.5028076171875, -7.24853515625, -6.9942626953125, -6.739990234375, -6.4857177734375, -6.2314453125, -5.9771728515625, -5.722900390625, -5.4686279296875, -5.21435546875, -4.9600830078125, -4.705810546875, -4.4515380859375, -4.197265625, -3.9429931640625, -3.688720703125, -3.4344482421875, -3.18017578125, -2.9259033203125, -2.671630859375, -2.4173583984375, -2.1630859375, -1.9088134765625, -1.654541015625, -1.4002685546875, -1.14599609375, -0.8917236328125, -0.637451171875, -0.3831787109375, -0.12890625, 0.1253662109375, 0.379638671875, 0.6339111328125, 0.88818359375, 1.1424560546875, 1.396728515625, 1.6510009765625, 1.9052734375, 2.1595458984375, 2.413818359375, 2.6680908203125, 2.92236328125, 3.1766357421875, 3.430908203125, 3.6851806640625, 3.939453125, 4.1937255859375, 4.447998046875, 4.7022705078125, 4.95654296875, 5.2108154296875, 5.465087890625, 5.7193603515625, 5.9736328125, 6.2279052734375, 6.482177734375, 6.7364501953125, 6.99072265625, 7.2449951171875, 7.499267578125, 7.7535400390625, 8.0078125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 7.0, 7.0, 15.0, 10.0, 24.0, 24.0, 22.0, 39.0, 47.0, 55.0, 83.0, 117.0, 133.0, 233.0, 303.0, 545.0, 3542.0, 76667.0, 3449569.0, 645576.0, 14630.0, 1268.0, 375.0, 222.0, 166.0, 142.0, 119.0, 73.0, 54.0, 39.0, 39.0, 22.0, 23.0, 18.0, 14.0, 11.0, 10.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.46875, -33.34814453125, -32.2275390625, -31.10693359375, -29.986328125, -28.86572265625, -27.7451171875, -26.62451171875, -25.50390625, -24.38330078125, -23.2626953125, -22.14208984375, -21.021484375, -19.90087890625, -18.7802734375, -17.65966796875, -16.5390625, -15.41845703125, -14.2978515625, -13.17724609375, -12.056640625, -10.93603515625, -9.8154296875, -8.69482421875, -7.57421875, -6.45361328125, -5.3330078125, -4.21240234375, -3.091796875, -1.97119140625, -0.8505859375, 0.27001953125, 1.390625, 2.51123046875, 3.6318359375, 4.75244140625, 5.873046875, 6.99365234375, 8.1142578125, 9.23486328125, 10.35546875, 11.47607421875, 12.5966796875, 13.71728515625, 14.837890625, 15.95849609375, 17.0791015625, 18.19970703125, 19.3203125, 20.44091796875, 21.5615234375, 22.68212890625, 23.802734375, 24.92333984375, 26.0439453125, 27.16455078125, 28.28515625, 29.40576171875, 30.5263671875, 31.64697265625, 32.767578125, 33.88818359375, 35.0087890625, 36.12939453125, 37.25]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 26.0, 144.0, 369.0, 376.0, 86.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.83567810058594, -237.72731018066406, -231.6189422607422, -225.5105743408203, -219.40220642089844, -213.2938232421875, -207.18545532226562, -201.07708740234375, -194.96871948242188, -188.8603515625, -182.75198364257812, -176.64361572265625, -170.53524780273438, -164.4268798828125, -158.31851196289062, -152.2101287841797, -146.10177612304688, -139.993408203125, -133.88504028320312, -127.77667236328125, -121.66829681396484, -115.55992889404297, -109.4515609741211, -103.34318542480469, -97.23481750488281, -91.12644958496094, -85.01808166503906, -78.90971374511719, -72.80133819580078, -66.6929702758789, -60.58460235595703, -54.47623062133789, -48.36785888671875, -42.259490966796875, -36.151119232177734, -30.04275131225586, -23.93438148498535, -17.826011657714844, -11.717643737792969, -5.609272003173828, 0.4990959167480469, 6.6074652671813965, 12.715834617614746, 18.824203491210938, 24.932573318481445, 31.040943145751953, 37.14931106567383, 43.25768280029297, 49.366050720214844, 55.47441864013672, 61.58279037475586, 67.691162109375, 73.79953002929688, 79.90789794921875, 86.01626586914062, 92.1246337890625, 98.23300170898438, 104.34136962890625, 110.44973754882812, 116.55810546875, 122.6664810180664, 128.77484130859375, 134.88320922851562, 140.99159240722656, 147.09996032714844]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 11.0, 10.0, 8.0, 12.0, 12.0, 23.0, 23.0, 16.0, 33.0, 19.0, 27.0, 36.0, 32.0, 29.0, 55.0, 28.0, 36.0, 46.0, 38.0, 43.0, 31.0, 37.0, 45.0, 35.0, 31.0, 46.0, 32.0, 22.0, 39.0, 27.0, 22.0, 22.0, 17.0, 19.0, 10.0, 12.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.22868347167969, -36.12742614746094, -35.02616500854492, -33.92490768432617, -32.823646545410156, -31.722389221191406, -30.621129989624023, -29.51987075805664, -28.418611526489258, -27.317352294921875, -26.216093063354492, -25.11483383178711, -24.01357650756836, -22.912315368652344, -21.811058044433594, -20.70979881286621, -19.608539581298828, -18.507280349731445, -17.406021118164062, -16.30476188659668, -15.203503608703613, -14.10224437713623, -13.000986099243164, -11.899726867675781, -10.798467636108398, -9.697208404541016, -8.595949172973633, -7.494690895080566, -6.393431663513184, -5.292172431945801, -4.190913677215576, -3.0896549224853516, -1.9883956909179688, -0.887136697769165, 0.21412229537963867, 1.3153812885284424, 2.416640281677246, 3.517899513244629, 4.6191582679748535, 5.720417022705078, 6.821676254272461, 7.922935485839844, 9.024194717407227, 10.125452995300293, 11.226712226867676, 12.327971458435059, 13.429229736328125, 14.530488967895508, 15.63174819946289, 16.733007431030273, 17.834266662597656, 18.93552589416504, 20.036785125732422, 21.138042449951172, 22.239301681518555, 23.340560913085938, 24.44182014465332, 25.543079376220703, 26.644338607788086, 27.74559783935547, 28.84685516357422, 29.948116302490234, 31.049373626708984, 32.150634765625, 33.25189208984375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 9.0, 5.0, 8.0, 6.0, 8.0, 15.0, 10.0, 12.0, 16.0, 18.0, 23.0, 24.0, 27.0, 42.0, 36.0, 47.0, 33.0, 37.0, 38.0, 43.0, 44.0, 47.0, 45.0, 54.0, 35.0, 31.0, 23.0, 36.0, 32.0, 34.0, 22.0, 21.0, 20.0, 21.0, 7.0, 12.0, 10.0, 6.0, 8.0, 3.0, 7.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.69921875, -4.5478515625, -4.396484375, -4.2451171875, -4.09375, -3.9423828125, -3.791015625, -3.6396484375, -3.48828125, -3.3369140625, -3.185546875, -3.0341796875, -2.8828125, -2.7314453125, -2.580078125, -2.4287109375, -2.27734375, -2.1259765625, -1.974609375, -1.8232421875, -1.671875, -1.5205078125, -1.369140625, -1.2177734375, -1.06640625, -0.9150390625, -0.763671875, -0.6123046875, -0.4609375, -0.3095703125, -0.158203125, -0.0068359375, 0.14453125, 0.2958984375, 0.447265625, 0.5986328125, 0.75, 0.9013671875, 1.052734375, 1.2041015625, 1.35546875, 1.5068359375, 1.658203125, 1.8095703125, 1.9609375, 2.1123046875, 2.263671875, 2.4150390625, 2.56640625, 2.7177734375, 2.869140625, 3.0205078125, 3.171875, 3.3232421875, 3.474609375, 3.6259765625, 3.77734375, 3.9287109375, 4.080078125, 4.2314453125, 4.3828125, 4.5341796875, 4.685546875, 4.8369140625, 4.98828125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 10.0, 17.0, 20.0, 27.0, 41.0, 73.0, 104.0, 125.0, 225.0, 340.0, 512.0, 883.0, 1451.0, 2314.0, 3748.0, 6314.0, 10368.0, 17028.0, 29061.0, 50796.0, 96579.0, 192563.0, 272566.0, 167986.0, 84544.0, 45271.0, 26035.0, 15476.0, 9356.0, 5628.0, 3498.0, 2095.0, 1304.0, 816.0, 466.0, 309.0, 202.0, 114.0, 88.0, 62.0, 47.0, 29.0, 13.0, 15.0, 6.0, 6.0, 6.0, 1.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.537109375, -0.5200042724609375, -0.502899169921875, -0.4857940673828125, -0.46868896484375, -0.4515838623046875, -0.434478759765625, -0.4173736572265625, -0.4002685546875, -0.3831634521484375, -0.366058349609375, -0.3489532470703125, -0.33184814453125, -0.3147430419921875, -0.297637939453125, -0.2805328369140625, -0.263427734375, -0.2463226318359375, -0.229217529296875, -0.2121124267578125, -0.19500732421875, -0.1779022216796875, -0.160797119140625, -0.1436920166015625, -0.1265869140625, -0.1094818115234375, -0.092376708984375, -0.0752716064453125, -0.05816650390625, -0.0410614013671875, -0.023956298828125, -0.0068511962890625, 0.01025390625, 0.0273590087890625, 0.044464111328125, 0.0615692138671875, 0.07867431640625, 0.0957794189453125, 0.112884521484375, 0.1299896240234375, 0.1470947265625, 0.1641998291015625, 0.181304931640625, 0.1984100341796875, 0.21551513671875, 0.2326202392578125, 0.249725341796875, 0.2668304443359375, 0.283935546875, 0.3010406494140625, 0.318145751953125, 0.3352508544921875, 0.35235595703125, 0.3694610595703125, 0.386566162109375, 0.4036712646484375, 0.4207763671875, 0.4378814697265625, 0.454986572265625, 0.4720916748046875, 0.48919677734375, 0.5063018798828125, 0.523406982421875, 0.5405120849609375, 0.5576171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 7.0, 9.0, 6.0, 14.0, 20.0, 18.0, 23.0, 21.0, 27.0, 28.0, 31.0, 42.0, 33.0, 40.0, 47.0, 38.0, 58.0, 1075.0, 50.0, 51.0, 39.0, 45.0, 40.0, 34.0, 32.0, 34.0, 24.0, 29.0, 21.0, 15.0, 17.0, 22.0, 10.0, 5.0, 7.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.12890625, -4.01544189453125, -3.9019775390625, -3.78851318359375, -3.675048828125, -3.56158447265625, -3.4481201171875, -3.33465576171875, -3.22119140625, -3.10772705078125, -2.9942626953125, -2.88079833984375, -2.767333984375, -2.65386962890625, -2.5404052734375, -2.42694091796875, -2.3134765625, -2.20001220703125, -2.0865478515625, -1.97308349609375, -1.859619140625, -1.74615478515625, -1.6326904296875, -1.51922607421875, -1.40576171875, -1.29229736328125, -1.1788330078125, -1.06536865234375, -0.951904296875, -0.83843994140625, -0.7249755859375, -0.61151123046875, -0.498046875, -0.38458251953125, -0.2711181640625, -0.15765380859375, -0.044189453125, 0.06927490234375, 0.1827392578125, 0.29620361328125, 0.40966796875, 0.52313232421875, 0.6365966796875, 0.75006103515625, 0.863525390625, 0.97698974609375, 1.0904541015625, 1.20391845703125, 1.3173828125, 1.43084716796875, 1.5443115234375, 1.65777587890625, 1.771240234375, 1.88470458984375, 1.9981689453125, 2.11163330078125, 2.22509765625, 2.33856201171875, 2.4520263671875, 2.56549072265625, 2.678955078125, 2.79241943359375, 2.9058837890625, 3.01934814453125, 3.1328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 9.0, 10.0, 22.0, 21.0, 32.0, 46.0, 57.0, 91.0, 138.0, 215.0, 324.0, 510.0, 860.0, 1306.0, 2297.0, 3941.0, 6942.0, 12409.0, 22473.0, 41637.0, 76670.0, 139345.0, 709682.0, 768124.0, 138883.0, 77608.0, 41630.0, 22430.0, 12406.0, 6953.0, 4015.0, 2363.0, 1357.0, 852.0, 534.0, 325.0, 207.0, 116.0, 83.0, 67.0, 49.0, 30.0, 15.0, 11.0, 7.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.28955078125, -0.27989959716796875, -0.2702484130859375, -0.26059722900390625, -0.250946044921875, -0.24129486083984375, -0.2316436767578125, -0.22199249267578125, -0.21234130859375, -0.20269012451171875, -0.1930389404296875, -0.18338775634765625, -0.173736572265625, -0.16408538818359375, -0.1544342041015625, -0.14478302001953125, -0.1351318359375, -0.12548065185546875, -0.1158294677734375, -0.10617828369140625, -0.096527099609375, -0.08687591552734375, -0.0772247314453125, -0.06757354736328125, -0.05792236328125, -0.04827117919921875, -0.0386199951171875, -0.02896881103515625, -0.019317626953125, -0.00966644287109375, -1.52587890625e-05, 0.00963592529296875, 0.019287109375, 0.02893829345703125, 0.0385894775390625, 0.04824066162109375, 0.057891845703125, 0.06754302978515625, 0.0771942138671875, 0.08684539794921875, 0.09649658203125, 0.10614776611328125, 0.1157989501953125, 0.12545013427734375, 0.135101318359375, 0.14475250244140625, 0.1544036865234375, 0.16405487060546875, 0.1737060546875, 0.18335723876953125, 0.1930084228515625, 0.20265960693359375, 0.212310791015625, 0.22196197509765625, 0.2316131591796875, 0.24126434326171875, 0.25091552734375, 0.26056671142578125, 0.2702178955078125, 0.27986907958984375, 0.289520263671875, 0.29917144775390625, 0.3088226318359375, 0.31847381591796875, 0.328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 9.0, 10.0, 21.0, 17.0, 24.0, 43.0, 89.0, 184.0, 212.0, 150.0, 79.0, 43.0, 28.0, 14.0, 16.0, 13.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00998687744140625, -0.00967860221862793, -0.00937032699584961, -0.009062051773071289, -0.008753776550292969, -0.008445501327514648, -0.008137226104736328, -0.007828950881958008, -0.0075206756591796875, -0.007212400436401367, -0.006904125213623047, -0.0065958499908447266, -0.006287574768066406, -0.005979299545288086, -0.005671024322509766, -0.005362749099731445, -0.005054473876953125, -0.004746198654174805, -0.004437923431396484, -0.004129648208618164, -0.0038213729858398438, -0.0035130977630615234, -0.003204822540283203, -0.002896547317504883, -0.0025882720947265625, -0.002279996871948242, -0.001971721649169922, -0.0016634464263916016, -0.0013551712036132812, -0.001046895980834961, -0.0007386207580566406, -0.0004303455352783203, -0.0001220703125, 0.0001862049102783203, 0.0004944801330566406, 0.0008027553558349609, 0.0011110305786132812, 0.0014193058013916016, 0.0017275810241699219, 0.002035856246948242, 0.0023441314697265625, 0.002652406692504883, 0.002960681915283203, 0.0032689571380615234, 0.0035772323608398438, 0.003885507583618164, 0.004193782806396484, 0.004502058029174805, 0.004810333251953125, 0.005118608474731445, 0.005426883697509766, 0.005735158920288086, 0.006043434143066406, 0.0063517093658447266, 0.006659984588623047, 0.006968259811401367, 0.0072765350341796875, 0.007584810256958008, 0.007893085479736328, 0.008201360702514648, 0.008509635925292969, 0.008817911148071289, 0.00912618637084961, 0.00943446159362793, 0.00974273681640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 7.0, 22.0, 24.0, 30.0, 53.0, 111.0, 280.0, 4736.0, 1027337.0, 15160.0, 477.0, 112.0, 55.0, 43.0, 29.0, 21.0, 13.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2080078125, -0.2014293670654297, -0.19485092163085938, -0.18827247619628906, -0.18169403076171875, -0.17511558532714844, -0.16853713989257812, -0.1619586944580078, -0.1553802490234375, -0.1488018035888672, -0.14222335815429688, -0.13564491271972656, -0.12906646728515625, -0.12248802185058594, -0.11590957641601562, -0.10933113098144531, -0.102752685546875, -0.09617424011230469, -0.08959579467773438, -0.08301734924316406, -0.07643890380859375, -0.06986045837402344, -0.06328201293945312, -0.05670356750488281, -0.0501251220703125, -0.04354667663574219, -0.036968231201171875, -0.030389785766601562, -0.02381134033203125, -0.017232894897460938, -0.010654449462890625, -0.0040760040283203125, 0.00250244140625, 0.009080886840820312, 0.015659332275390625, 0.022237777709960938, 0.02881622314453125, 0.03539466857910156, 0.041973114013671875, 0.04855155944824219, 0.0551300048828125, 0.06170845031738281, 0.06828689575195312, 0.07486534118652344, 0.08144378662109375, 0.08802223205566406, 0.09460067749023438, 0.10117912292480469, 0.107757568359375, 0.11433601379394531, 0.12091445922851562, 0.12749290466308594, 0.13407135009765625, 0.14064979553222656, 0.14722824096679688, 0.1538066864013672, 0.1603851318359375, 0.1669635772705078, 0.17354202270507812, 0.18012046813964844, 0.18669891357421875, 0.19327735900878906, 0.19985580444335938, 0.2064342498779297, 0.2130126953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 101.0, 779.0, 106.0, 21.0, 3.0], "bins": [-0.16950929164886475, -0.16670632362365723, -0.1639033555984497, -0.1611003875732422, -0.15829743444919586, -0.15549446642398834, -0.15269149839878082, -0.1498885303735733, -0.14708556234836578, -0.14428259432315826, -0.14147962629795074, -0.13867667317390442, -0.1358737051486969, -0.13307073712348938, -0.13026776909828186, -0.12746480107307434, -0.12466184794902802, -0.1218588799238205, -0.11905591934919357, -0.11625295132398605, -0.11344998329877853, -0.11064702272415161, -0.10784405469894409, -0.10504108667373657, -0.10223811864852905, -0.09943515062332153, -0.09663219004869461, -0.09382922202348709, -0.09102625399827957, -0.08822329342365265, -0.08542032539844513, -0.08261735737323761, -0.07981439679861069, -0.07701142877340317, -0.07420846819877625, -0.07140550017356873, -0.0686025321483612, -0.06579957157373428, -0.06299660354852676, -0.06019363924860954, -0.05739067494869232, -0.0545877106487751, -0.05178474262356758, -0.04898177832365036, -0.04617881402373314, -0.04337584972381592, -0.0405728816986084, -0.03776991739869118, -0.03496694937348366, -0.03216398507356644, -0.029361018911004066, -0.026558052748441696, -0.023755088448524475, -0.020952122285962105, -0.018149156123399734, -0.015346191823482513, -0.012543226592242718, -0.009740261361002922, -0.006937295664101839, -0.004134329967200756, -0.0013313647359609604, 0.0014716004952788353, 0.004274566657841206, 0.007077530957758427, 0.009880497120320797]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 4.0, 16.0, 12.0, 22.0, 18.0, 31.0, 24.0, 27.0, 28.0, 32.0, 36.0, 44.0, 39.0, 51.0, 40.0, 38.0, 49.0, 44.0, 66.0, 37.0, 44.0, 35.0, 40.0, 27.0, 37.0, 31.0, 22.0, 19.0, 19.0, 13.0, 19.0, 6.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004465281963348389, -0.0042829085141420364, -0.004100535064935684, -0.003918161615729332, -0.0037357881665229797, -0.0035534147173166275, -0.0033710412681102753, -0.003188667818903923, -0.003006294369697571, -0.0028239209204912186, -0.0026415474712848663, -0.002459174022078514, -0.002276800572872162, -0.0020944271236658096, -0.0019120536744594574, -0.0017296802252531052, -0.001547306776046753, -0.0013649333268404007, -0.0011825598776340485, -0.0010001864284276962, -0.000817812979221344, -0.0006354395300149918, -0.0004530660808086395, -0.0002706926316022873, -8.831918239593506e-05, 9.405426681041718e-05, 0.0002764277160167694, 0.00045880116522312164, 0.0006411746144294739, 0.0008235480636358261, 0.0010059215128421783, 0.0011882949620485306, 0.0013706684112548828, 0.001553041860461235, 0.0017354153096675873, 0.0019177887588739395, 0.0021001622080802917, 0.002282535657286644, 0.002464909106492996, 0.0026472825556993484, 0.0028296560049057007, 0.003012029454112053, 0.003194402903318405, 0.0033767763525247574, 0.0035591498017311096, 0.003741523250937462, 0.003923896700143814, 0.004106270149350166, 0.0042886435985565186, 0.004471017047762871, 0.004653390496969223, 0.004835763946175575, 0.0050181373953819275, 0.00520051084458828, 0.005382884293794632, 0.005565257743000984, 0.005747631192207336, 0.005930004641413689, 0.006112378090620041, 0.006294751539826393, 0.006477124989032745, 0.006659498438239098, 0.00684187188744545, 0.007024245336651802, 0.007206618785858154]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 9.0, 5.0, 8.0, 6.0, 8.0, 15.0, 10.0, 12.0, 16.0, 18.0, 23.0, 24.0, 27.0, 42.0, 36.0, 47.0, 33.0, 37.0, 38.0, 43.0, 44.0, 47.0, 46.0, 53.0, 35.0, 31.0, 23.0, 36.0, 32.0, 34.0, 22.0, 21.0, 20.0, 21.0, 7.0, 12.0, 10.0, 6.0, 8.0, 3.0, 7.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.69921875, -4.5478515625, -4.396484375, -4.2451171875, -4.09375, -3.9423828125, -3.791015625, -3.6396484375, -3.48828125, -3.3369140625, -3.185546875, -3.0341796875, -2.8828125, -2.7314453125, -2.580078125, -2.4287109375, -2.27734375, -2.1259765625, -1.974609375, -1.8232421875, -1.671875, -1.5205078125, -1.369140625, -1.2177734375, -1.06640625, -0.9150390625, -0.763671875, -0.6123046875, -0.4609375, -0.3095703125, -0.158203125, -0.0068359375, 0.14453125, 0.2958984375, 0.447265625, 0.5986328125, 0.75, 0.9013671875, 1.052734375, 1.2041015625, 1.35546875, 1.5068359375, 1.658203125, 1.8095703125, 1.9609375, 2.1123046875, 2.263671875, 2.4150390625, 2.56640625, 2.7177734375, 2.869140625, 3.0205078125, 3.171875, 3.3232421875, 3.474609375, 3.6259765625, 3.77734375, 3.9287109375, 4.080078125, 4.2314453125, 4.3828125, 4.5341796875, 4.685546875, 4.8369140625, 4.98828125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 25.0, 41.0, 40.0, 73.0, 104.0, 142.0, 252.0, 390.0, 627.0, 1129.0, 1779.0, 2976.0, 5261.0, 9023.0, 15970.0, 28465.0, 54731.0, 121842.0, 328029.0, 269576.0, 101425.0, 47256.0, 25292.0, 14274.0, 8182.0, 4770.0, 2701.0, 1660.0, 927.0, 555.0, 334.0, 248.0, 126.0, 81.0, 79.0, 44.0, 20.0, 23.0, 20.0, 15.0, 6.0, 3.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.6953125, -3.5863037109375, -3.477294921875, -3.3682861328125, -3.25927734375, -3.1502685546875, -3.041259765625, -2.9322509765625, -2.8232421875, -2.7142333984375, -2.605224609375, -2.4962158203125, -2.38720703125, -2.2781982421875, -2.169189453125, -2.0601806640625, -1.951171875, -1.8421630859375, -1.733154296875, -1.6241455078125, -1.51513671875, -1.4061279296875, -1.297119140625, -1.1881103515625, -1.0791015625, -0.9700927734375, -0.861083984375, -0.7520751953125, -0.64306640625, -0.5340576171875, -0.425048828125, -0.3160400390625, -0.20703125, -0.0980224609375, 0.010986328125, 0.1199951171875, 0.22900390625, 0.3380126953125, 0.447021484375, 0.5560302734375, 0.6650390625, 0.7740478515625, 0.883056640625, 0.9920654296875, 1.10107421875, 1.2100830078125, 1.319091796875, 1.4281005859375, 1.537109375, 1.6461181640625, 1.755126953125, 1.8641357421875, 1.97314453125, 2.0821533203125, 2.191162109375, 2.3001708984375, 2.4091796875, 2.5181884765625, 2.627197265625, 2.7362060546875, 2.84521484375, 2.9542236328125, 3.063232421875, 3.1722412109375, 3.28125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 4.0, 7.0, 5.0, 9.0, 16.0, 7.0, 14.0, 12.0, 17.0, 25.0, 33.0, 23.0, 28.0, 30.0, 30.0, 41.0, 57.0, 60.0, 77.0, 313.0, 1623.0, 128.0, 66.0, 40.0, 54.0, 45.0, 42.0, 26.0, 23.0, 26.0, 31.0, 25.0, 23.0, 16.0, 9.0, 12.0, 10.0, 5.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.21875, -16.68408203125, -16.1494140625, -15.61474609375, -15.080078125, -14.54541015625, -14.0107421875, -13.47607421875, -12.94140625, -12.40673828125, -11.8720703125, -11.33740234375, -10.802734375, -10.26806640625, -9.7333984375, -9.19873046875, -8.6640625, -8.12939453125, -7.5947265625, -7.06005859375, -6.525390625, -5.99072265625, -5.4560546875, -4.92138671875, -4.38671875, -3.85205078125, -3.3173828125, -2.78271484375, -2.248046875, -1.71337890625, -1.1787109375, -0.64404296875, -0.109375, 0.42529296875, 0.9599609375, 1.49462890625, 2.029296875, 2.56396484375, 3.0986328125, 3.63330078125, 4.16796875, 4.70263671875, 5.2373046875, 5.77197265625, 6.306640625, 6.84130859375, 7.3759765625, 7.91064453125, 8.4453125, 8.97998046875, 9.5146484375, 10.04931640625, 10.583984375, 11.11865234375, 11.6533203125, 12.18798828125, 12.72265625, 13.25732421875, 13.7919921875, 14.32666015625, 14.861328125, 15.39599609375, 15.9306640625, 16.46533203125, 17.0]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 16.0, 19.0, 35.0, 46.0, 64.0, 70.0, 99.0, 148.0, 244.0, 343.0, 767.0, 5424.0, 3064149.0, 71526.0, 1477.0, 399.0, 240.0, 157.0, 117.0, 93.0, 75.0, 38.0, 34.0, 23.0, 16.0, 19.0, 13.0, 8.0, 2.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-63.875, -62.22607421875, -60.5771484375, -58.92822265625, -57.279296875, -55.63037109375, -53.9814453125, -52.33251953125, -50.68359375, -49.03466796875, -47.3857421875, -45.73681640625, -44.087890625, -42.43896484375, -40.7900390625, -39.14111328125, -37.4921875, -35.84326171875, -34.1943359375, -32.54541015625, -30.896484375, -29.24755859375, -27.5986328125, -25.94970703125, -24.30078125, -22.65185546875, -21.0029296875, -19.35400390625, -17.705078125, -16.05615234375, -14.4072265625, -12.75830078125, -11.109375, -9.46044921875, -7.8115234375, -6.16259765625, -4.513671875, -2.86474609375, -1.2158203125, 0.43310546875, 2.08203125, 3.73095703125, 5.3798828125, 7.02880859375, 8.677734375, 10.32666015625, 11.9755859375, 13.62451171875, 15.2734375, 16.92236328125, 18.5712890625, 20.22021484375, 21.869140625, 23.51806640625, 25.1669921875, 26.81591796875, 28.46484375, 30.11376953125, 31.7626953125, 33.41162109375, 35.060546875, 36.70947265625, 38.3583984375, 40.00732421875, 41.65625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 92.0, 923.0, 5.0], "bins": [-575.4552612304688, -566.2109375, -556.9666748046875, -547.722412109375, -538.4780883789062, -529.2337646484375, -519.989501953125, -510.7452087402344, -501.50091552734375, -492.2566223144531, -483.0123291015625, -473.7680358886719, -464.52374267578125, -455.2794494628906, -446.03515625, -436.7908630371094, -427.54656982421875, -418.3022766113281, -409.0579833984375, -399.8136901855469, -390.56939697265625, -381.3251037597656, -372.080810546875, -362.8365173339844, -353.59222412109375, -344.3479309082031, -335.1036376953125, -325.8593444824219, -316.61505126953125, -307.3707580566406, -298.12646484375, -288.8821716308594, -279.6379089355469, -270.39361572265625, -261.1493225097656, -251.905029296875, -242.66073608398438, -233.41644287109375, -224.17214965820312, -214.9278564453125, -205.68356323242188, -196.43927001953125, -187.19497680664062, -177.95068359375, -168.70639038085938, -159.46209716796875, -150.21780395507812, -140.9735107421875, -131.72921752929688, -122.48492431640625, -113.24063110351562, -103.996337890625, -94.75204467773438, -85.50775146484375, -76.26345825195312, -67.0191650390625, -57.774871826171875, -48.53057861328125, -39.286285400390625, -30.0419921875, -20.797698974609375, -11.55340576171875, -2.309112548828125, 6.9351806640625, 16.179473876953125]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 5.0, 11.0, 11.0, 10.0, 7.0, 13.0, 18.0, 15.0, 16.0, 22.0, 14.0, 34.0, 28.0, 38.0, 31.0, 37.0, 35.0, 38.0, 38.0, 51.0, 36.0, 46.0, 44.0, 39.0, 25.0, 27.0, 35.0, 39.0, 38.0, 27.0, 14.0, 21.0, 17.0, 15.0, 11.0, 17.0, 13.0, 14.0, 12.0, 9.0, 7.0, 11.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.7457275390625, -37.449668884277344, -36.15361022949219, -34.85755157470703, -33.561492919921875, -32.26543045043945, -30.969371795654297, -29.67331314086914, -28.377254486083984, -27.081195831298828, -25.785137176513672, -24.489076614379883, -23.193017959594727, -21.89695930480957, -20.60089874267578, -19.304840087890625, -18.00878143310547, -16.712722778320312, -15.41666316986084, -14.120603561401367, -12.824544906616211, -11.528486251831055, -10.232426643371582, -8.93636703491211, -7.640308380126953, -6.344249248504639, -5.048190116882324, -3.7521309852600098, -2.4560718536376953, -1.1600127220153809, 0.1360464096069336, 1.4321060180664062, 2.728160858154297, 4.024219989776611, 5.320279121398926, 6.61633825302124, 7.912397384643555, 9.208456039428711, 10.504515647888184, 11.800575256347656, 13.096633911132812, 14.392692565917969, 15.688752174377441, 16.984811782836914, 18.28087043762207, 19.576929092407227, 20.872989654541016, 22.169048309326172, 23.465106964111328, 24.761165618896484, 26.05722427368164, 27.35328483581543, 28.649343490600586, 29.945402145385742, 31.24146270751953, 32.53752136230469, 33.833580017089844, 35.129638671875, 36.425697326660156, 37.72175598144531, 39.01781463623047, 40.31387710571289, 41.60993576049805, 42.9059944152832, 44.20205307006836]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 9.0, 8.0, 11.0, 14.0, 15.0, 18.0, 15.0, 23.0, 28.0, 35.0, 26.0, 39.0, 40.0, 36.0, 43.0, 35.0, 46.0, 46.0, 48.0, 39.0, 38.0, 47.0, 31.0, 31.0, 45.0, 34.0, 17.0, 26.0, 21.0, 18.0, 19.0, 14.0, 10.0, 9.0, 7.0, 5.0, 7.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.94140625, -4.78265380859375, -4.6239013671875, -4.46514892578125, -4.306396484375, -4.14764404296875, -3.9888916015625, -3.83013916015625, -3.67138671875, -3.51263427734375, -3.3538818359375, -3.19512939453125, -3.036376953125, -2.87762451171875, -2.7188720703125, -2.56011962890625, -2.4013671875, -2.24261474609375, -2.0838623046875, -1.92510986328125, -1.766357421875, -1.60760498046875, -1.4488525390625, -1.29010009765625, -1.13134765625, -0.97259521484375, -0.8138427734375, -0.65509033203125, -0.496337890625, -0.33758544921875, -0.1788330078125, -0.02008056640625, 0.138671875, 0.29742431640625, 0.4561767578125, 0.61492919921875, 0.773681640625, 0.93243408203125, 1.0911865234375, 1.24993896484375, 1.40869140625, 1.56744384765625, 1.7261962890625, 1.88494873046875, 2.043701171875, 2.20245361328125, 2.3612060546875, 2.51995849609375, 2.6787109375, 2.83746337890625, 2.9962158203125, 3.15496826171875, 3.313720703125, 3.47247314453125, 3.6312255859375, 3.78997802734375, 3.94873046875, 4.10748291015625, 4.2662353515625, 4.42498779296875, 4.583740234375, 4.74249267578125, 4.9012451171875, 5.05999755859375, 5.21875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 1.0, 11.0, 7.0, 7.0, 9.0, 22.0, 19.0, 24.0, 23.0, 47.0, 51.0, 64.0, 101.0, 187.0, 416.0, 960.0, 2905.0, 11036.0, 54520.0, 439509.0, 2696317.0, 872345.0, 92705.0, 16592.0, 4039.0, 1228.0, 487.0, 229.0, 95.0, 73.0, 44.0, 38.0, 39.0, 27.0, 18.0, 17.0, 12.0, 12.0, 7.0, 5.0, 5.0, 4.0, 8.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.7890625, -12.3848876953125, -11.980712890625, -11.5765380859375, -11.17236328125, -10.7681884765625, -10.364013671875, -9.9598388671875, -9.5556640625, -9.1514892578125, -8.747314453125, -8.3431396484375, -7.93896484375, -7.5347900390625, -7.130615234375, -6.7264404296875, -6.322265625, -5.9180908203125, -5.513916015625, -5.1097412109375, -4.70556640625, -4.3013916015625, -3.897216796875, -3.4930419921875, -3.0888671875, -2.6846923828125, -2.280517578125, -1.8763427734375, -1.47216796875, -1.0679931640625, -0.663818359375, -0.2596435546875, 0.14453125, 0.5487060546875, 0.952880859375, 1.3570556640625, 1.76123046875, 2.1654052734375, 2.569580078125, 2.9737548828125, 3.3779296875, 3.7821044921875, 4.186279296875, 4.5904541015625, 4.99462890625, 5.3988037109375, 5.802978515625, 6.2071533203125, 6.611328125, 7.0155029296875, 7.419677734375, 7.8238525390625, 8.22802734375, 8.6322021484375, 9.036376953125, 9.4405517578125, 9.8447265625, 10.2489013671875, 10.653076171875, 11.0572509765625, 11.46142578125, 11.8656005859375, 12.269775390625, 12.6739501953125, 13.078125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 9.0, 16.0, 13.0, 15.0, 28.0, 27.0, 40.0, 57.0, 76.0, 109.0, 129.0, 185.0, 247.0, 329.0, 419.0, 513.0, 444.0, 379.0, 261.0, 214.0, 148.0, 109.0, 64.0, 60.0, 37.0, 39.0, 21.0, 21.0, 13.0, 10.0, 10.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-12.0859375, -11.7808837890625, -11.475830078125, -11.1707763671875, -10.86572265625, -10.5606689453125, -10.255615234375, -9.9505615234375, -9.6455078125, -9.3404541015625, -9.035400390625, -8.7303466796875, -8.42529296875, -8.1202392578125, -7.815185546875, -7.5101318359375, -7.205078125, -6.9000244140625, -6.594970703125, -6.2899169921875, -5.98486328125, -5.6798095703125, -5.374755859375, -5.0697021484375, -4.7646484375, -4.4595947265625, -4.154541015625, -3.8494873046875, -3.54443359375, -3.2393798828125, -2.934326171875, -2.6292724609375, -2.32421875, -2.0191650390625, -1.714111328125, -1.4090576171875, -1.10400390625, -0.7989501953125, -0.493896484375, -0.1888427734375, 0.1162109375, 0.4212646484375, 0.726318359375, 1.0313720703125, 1.33642578125, 1.6414794921875, 1.946533203125, 2.2515869140625, 2.556640625, 2.8616943359375, 3.166748046875, 3.4718017578125, 3.77685546875, 4.0819091796875, 4.386962890625, 4.6920166015625, 4.9970703125, 5.3021240234375, 5.607177734375, 5.9122314453125, 6.21728515625, 6.5223388671875, 6.827392578125, 7.1324462890625, 7.4375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 7.0, 8.0, 9.0, 18.0, 16.0, 26.0, 41.0, 45.0, 57.0, 80.0, 126.0, 159.0, 223.0, 401.0, 824.0, 5301.0, 218500.0, 3841619.0, 121172.0, 3740.0, 738.0, 341.0, 232.0, 161.0, 110.0, 88.0, 66.0, 32.0, 36.0, 22.0, 17.0, 14.0, 15.0, 8.0, 4.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.53125, -29.28173828125, -28.0322265625, -26.78271484375, -25.533203125, -24.28369140625, -23.0341796875, -21.78466796875, -20.53515625, -19.28564453125, -18.0361328125, -16.78662109375, -15.537109375, -14.28759765625, -13.0380859375, -11.78857421875, -10.5390625, -9.28955078125, -8.0400390625, -6.79052734375, -5.541015625, -4.29150390625, -3.0419921875, -1.79248046875, -0.54296875, 0.70654296875, 1.9560546875, 3.20556640625, 4.455078125, 5.70458984375, 6.9541015625, 8.20361328125, 9.453125, 10.70263671875, 11.9521484375, 13.20166015625, 14.451171875, 15.70068359375, 16.9501953125, 18.19970703125, 19.44921875, 20.69873046875, 21.9482421875, 23.19775390625, 24.447265625, 25.69677734375, 26.9462890625, 28.19580078125, 29.4453125, 30.69482421875, 31.9443359375, 33.19384765625, 34.443359375, 35.69287109375, 36.9423828125, 38.19189453125, 39.44140625, 40.69091796875, 41.9404296875, 43.18994140625, 44.439453125, 45.68896484375, 46.9384765625, 48.18798828125, 49.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 13.0, 64.0, 200.0, 339.0, 263.0, 104.0, 25.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.46043395996094, -195.76461791992188, -191.06878662109375, -186.3729705810547, -181.67713928222656, -176.9813232421875, -172.28549194335938, -167.5896759033203, -162.89385986328125, -158.1980438232422, -153.50221252441406, -148.806396484375, -144.11056518554688, -139.4147491455078, -134.7189178466797, -130.02310180664062, -125.3272705078125, -120.6314468383789, -115.93562316894531, -111.23979949951172, -106.54397583007812, -101.84815979003906, -97.15233612060547, -92.45651245117188, -87.76068878173828, -83.06486511230469, -78.3690414428711, -73.6732177734375, -68.97740173339844, -64.28157043457031, -59.58575439453125, -54.889930725097656, -50.194091796875, -45.498268127441406, -40.80244445800781, -36.106624603271484, -31.41080093383789, -26.714977264404297, -22.019155502319336, -17.323333740234375, -12.627510070800781, -7.931687355041504, -3.2358646392822266, 1.4599580764770508, 6.155780792236328, 10.851604461669922, 15.547426223754883, 20.243247985839844, 24.939071655273438, 29.63489532470703, 34.330718994140625, 39.02653884887695, 43.72236251831055, 48.41818618774414, 53.11400604248047, 57.80982971191406, 62.505653381347656, 67.20147705078125, 71.89730072021484, 76.59312438964844, 81.2889404296875, 85.98477172851562, 90.68058776855469, 95.37641143798828, 100.07223510742188]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 4.0, 6.0, 7.0, 15.0, 17.0, 15.0, 18.0, 21.0, 20.0, 18.0, 19.0, 18.0, 27.0, 38.0, 40.0, 27.0, 34.0, 51.0, 39.0, 49.0, 40.0, 49.0, 44.0, 44.0, 40.0, 31.0, 32.0, 26.0, 29.0, 20.0, 29.0, 21.0, 21.0, 13.0, 14.0, 8.0, 13.0, 10.0, 9.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.38421630859375, -30.37917709350586, -29.374135971069336, -28.369096755981445, -27.364055633544922, -26.35901641845703, -25.35397720336914, -24.34893798828125, -23.343896865844727, -22.338857650756836, -21.333816528320312, -20.328777313232422, -19.32373809814453, -18.318696975708008, -17.313657760620117, -16.308616638183594, -15.303577423095703, -14.298537254333496, -13.293497085571289, -12.288457870483398, -11.283417701721191, -10.278377532958984, -9.273338317871094, -8.268298149108887, -7.26325798034668, -6.258217811584473, -5.253178119659424, -4.248138427734375, -3.243098258972168, -2.238058090209961, -1.233018398284912, -0.22797870635986328, 0.7770614624023438, 1.7821013927459717, 2.7871413230895996, 3.7921812534332275, 4.7972211837768555, 5.8022613525390625, 6.807301044464111, 7.81234073638916, 8.817380905151367, 9.822421073913574, 10.827461242675781, 11.832500457763672, 12.837540626525879, 13.842580795288086, 14.847620010375977, 15.852660179138184, 16.85770034790039, 17.86273956298828, 18.867780685424805, 19.872819900512695, 20.87786102294922, 21.88290023803711, 22.887939453125, 23.89297866821289, 24.898019790649414, 25.903059005737305, 26.908100128173828, 27.91313934326172, 28.91817855834961, 29.923219680786133, 30.928258895874023, 31.933300018310547, 32.93833923339844]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 9.0, 9.0, 15.0, 9.0, 19.0, 7.0, 18.0, 29.0, 21.0, 36.0, 37.0, 34.0, 37.0, 42.0, 44.0, 41.0, 40.0, 58.0, 55.0, 41.0, 50.0, 34.0, 41.0, 46.0, 38.0, 28.0, 36.0, 18.0, 17.0, 13.0, 13.0, 9.0, 10.0, 9.0, 5.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.375, -5.2054443359375, -5.035888671875, -4.8663330078125, -4.69677734375, -4.5272216796875, -4.357666015625, -4.1881103515625, -4.0185546875, -3.8489990234375, -3.679443359375, -3.5098876953125, -3.34033203125, -3.1707763671875, -3.001220703125, -2.8316650390625, -2.662109375, -2.4925537109375, -2.322998046875, -2.1534423828125, -1.98388671875, -1.8143310546875, -1.644775390625, -1.4752197265625, -1.3056640625, -1.1361083984375, -0.966552734375, -0.7969970703125, -0.62744140625, -0.4578857421875, -0.288330078125, -0.1187744140625, 0.05078125, 0.2203369140625, 0.389892578125, 0.5594482421875, 0.72900390625, 0.8985595703125, 1.068115234375, 1.2376708984375, 1.4072265625, 1.5767822265625, 1.746337890625, 1.9158935546875, 2.08544921875, 2.2550048828125, 2.424560546875, 2.5941162109375, 2.763671875, 2.9332275390625, 3.102783203125, 3.2723388671875, 3.44189453125, 3.6114501953125, 3.781005859375, 3.9505615234375, 4.1201171875, 4.2896728515625, 4.459228515625, 4.6287841796875, 4.79833984375, 4.9678955078125, 5.137451171875, 5.3070068359375, 5.4765625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 5.0, 13.0, 14.0, 20.0, 36.0, 39.0, 61.0, 99.0, 159.0, 254.0, 356.0, 592.0, 900.0, 1444.0, 2215.0, 3485.0, 5510.0, 8812.0, 14498.0, 24520.0, 44036.0, 83287.0, 163719.0, 261177.0, 200903.0, 103475.0, 53865.0, 29750.0, 17320.0, 10429.0, 6371.0, 4018.0, 2522.0, 1686.0, 1026.0, 686.0, 421.0, 300.0, 170.0, 124.0, 79.0, 39.0, 33.0, 24.0, 17.0, 18.0, 10.0, 2.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.5283203125, -0.51214599609375, -0.4959716796875, -0.47979736328125, -0.463623046875, -0.44744873046875, -0.4312744140625, -0.41510009765625, -0.39892578125, -0.38275146484375, -0.3665771484375, -0.35040283203125, -0.334228515625, -0.31805419921875, -0.3018798828125, -0.28570556640625, -0.26953125, -0.25335693359375, -0.2371826171875, -0.22100830078125, -0.204833984375, -0.18865966796875, -0.1724853515625, -0.15631103515625, -0.14013671875, -0.12396240234375, -0.1077880859375, -0.09161376953125, -0.075439453125, -0.05926513671875, -0.0430908203125, -0.02691650390625, -0.0107421875, 0.00543212890625, 0.0216064453125, 0.03778076171875, 0.053955078125, 0.07012939453125, 0.0863037109375, 0.10247802734375, 0.11865234375, 0.13482666015625, 0.1510009765625, 0.16717529296875, 0.183349609375, 0.19952392578125, 0.2156982421875, 0.23187255859375, 0.248046875, 0.26422119140625, 0.2803955078125, 0.29656982421875, 0.312744140625, 0.32891845703125, 0.3450927734375, 0.36126708984375, 0.37744140625, 0.39361572265625, 0.4097900390625, 0.42596435546875, 0.442138671875, 0.45831298828125, 0.4744873046875, 0.49066162109375, 0.5068359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 3.0, 8.0, 11.0, 6.0, 10.0, 8.0, 15.0, 19.0, 26.0, 26.0, 37.0, 27.0, 34.0, 29.0, 31.0, 55.0, 45.0, 49.0, 1071.0, 52.0, 39.0, 61.0, 38.0, 45.0, 40.0, 30.0, 25.0, 37.0, 30.0, 20.0, 25.0, 21.0, 7.0, 11.0, 10.0, 10.0, 2.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2890625, -3.17413330078125, -3.0592041015625, -2.94427490234375, -2.829345703125, -2.71441650390625, -2.5994873046875, -2.48455810546875, -2.36962890625, -2.25469970703125, -2.1397705078125, -2.02484130859375, -1.909912109375, -1.79498291015625, -1.6800537109375, -1.56512451171875, -1.4501953125, -1.33526611328125, -1.2203369140625, -1.10540771484375, -0.990478515625, -0.87554931640625, -0.7606201171875, -0.64569091796875, -0.53076171875, -0.41583251953125, -0.3009033203125, -0.18597412109375, -0.071044921875, 0.04388427734375, 0.1588134765625, 0.27374267578125, 0.388671875, 0.50360107421875, 0.6185302734375, 0.73345947265625, 0.848388671875, 0.96331787109375, 1.0782470703125, 1.19317626953125, 1.30810546875, 1.42303466796875, 1.5379638671875, 1.65289306640625, 1.767822265625, 1.88275146484375, 1.9976806640625, 2.11260986328125, 2.2275390625, 2.34246826171875, 2.4573974609375, 2.57232666015625, 2.687255859375, 2.80218505859375, 2.9171142578125, 3.03204345703125, 3.14697265625, 3.26190185546875, 3.3768310546875, 3.49176025390625, 3.606689453125, 3.72161865234375, 3.8365478515625, 3.95147705078125, 4.06640625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 13.0, 22.0, 26.0, 47.0, 68.0, 90.0, 119.0, 214.0, 339.0, 650.0, 1154.0, 1976.0, 3612.0, 6563.0, 12837.0, 25110.0, 51654.0, 106813.0, 205713.0, 1316263.0, 181923.0, 91783.0, 44213.0, 21691.0, 10880.0, 5882.0, 3190.0, 1745.0, 1048.0, 542.0, 339.0, 212.0, 112.0, 94.0, 69.0, 40.0, 28.0, 12.0, 10.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.359375, -0.3479270935058594, -0.33647918701171875, -0.3250312805175781, -0.3135833740234375, -0.3021354675292969, -0.29068756103515625, -0.2792396545410156, -0.267791748046875, -0.2563438415527344, -0.24489593505859375, -0.23344802856445312, -0.2220001220703125, -0.21055221557617188, -0.19910430908203125, -0.18765640258789062, -0.17620849609375, -0.16476058959960938, -0.15331268310546875, -0.14186477661132812, -0.1304168701171875, -0.11896896362304688, -0.10752105712890625, -0.09607315063476562, -0.084625244140625, -0.07317733764648438, -0.06172943115234375, -0.050281524658203125, -0.0388336181640625, -0.027385711669921875, -0.01593780517578125, -0.004489898681640625, 0.0069580078125, 0.018405914306640625, 0.02985382080078125, 0.041301727294921875, 0.0527496337890625, 0.06419754028320312, 0.07564544677734375, 0.08709335327148438, 0.098541259765625, 0.10998916625976562, 0.12143707275390625, 0.13288497924804688, 0.1443328857421875, 0.15578079223632812, 0.16722869873046875, 0.17867660522460938, 0.19012451171875, 0.20157241821289062, 0.21302032470703125, 0.22446823120117188, 0.2359161376953125, 0.24736404418945312, 0.25881195068359375, 0.2702598571777344, 0.281707763671875, 0.2931556701660156, 0.30460357666015625, 0.3160514831542969, 0.3274993896484375, 0.3389472961425781, 0.35039520263671875, 0.3618431091308594, 0.373291015625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 5.0, 4.0, 5.0, 8.0, 11.0, 9.0, 11.0, 9.0, 20.0, 28.0, 45.0, 33.0, 41.0, 60.0, 77.0, 96.0, 109.0, 78.0, 58.0, 54.0, 46.0, 31.0, 26.0, 26.0, 18.0, 10.0, 16.0, 5.0, 11.0, 10.0, 7.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004756927490234375, -0.004620730876922607, -0.00448453426361084, -0.004348337650299072, -0.004212141036987305, -0.004075944423675537, -0.0039397478103637695, -0.003803551197052002, -0.0036673545837402344, -0.003531157970428467, -0.0033949613571166992, -0.0032587647438049316, -0.003122568130493164, -0.0029863715171813965, -0.002850174903869629, -0.0027139782905578613, -0.0025777816772460938, -0.002441585063934326, -0.0023053884506225586, -0.002169191837310791, -0.0020329952239990234, -0.0018967986106872559, -0.0017606019973754883, -0.0016244053840637207, -0.0014882087707519531, -0.0013520121574401855, -0.001215815544128418, -0.0010796189308166504, -0.0009434223175048828, -0.0008072257041931152, -0.0006710290908813477, -0.0005348324775695801, -0.0003986358642578125, -0.0002624392509460449, -0.00012624263763427734, 9.953975677490234e-06, 0.0001461505889892578, 0.0002823472023010254, 0.00041854381561279297, 0.0005547404289245605, 0.0006909370422363281, 0.0008271336555480957, 0.0009633302688598633, 0.0010995268821716309, 0.0012357234954833984, 0.001371920108795166, 0.0015081167221069336, 0.0016443133354187012, 0.0017805099487304688, 0.0019167065620422363, 0.002052903175354004, 0.0021890997886657715, 0.002325296401977539, 0.0024614930152893066, 0.0025976896286010742, 0.002733886241912842, 0.0028700828552246094, 0.003006279468536377, 0.0031424760818481445, 0.003278672695159912, 0.0034148693084716797, 0.0035510659217834473, 0.003687262535095215, 0.0038234591484069824, 0.00395965576171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 7.0, 14.0, 20.0, 21.0, 28.0, 48.0, 62.0, 98.0, 190.0, 533.0, 9258.0, 953581.0, 82684.0, 1337.0, 260.0, 127.0, 71.0, 49.0, 27.0, 29.0, 16.0, 11.0, 10.0, 11.0, 8.0, 5.0, 4.0, 5.0, 1.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09539794921875, -0.09207725524902344, -0.08875656127929688, -0.08543586730957031, -0.08211517333984375, -0.07879447937011719, -0.07547378540039062, -0.07215309143066406, -0.0688323974609375, -0.06551170349121094, -0.062191009521484375, -0.05887031555175781, -0.05554962158203125, -0.05222892761230469, -0.048908233642578125, -0.04558753967285156, -0.042266845703125, -0.03894615173339844, -0.035625457763671875, -0.03230476379394531, -0.02898406982421875, -0.025663375854492188, -0.022342681884765625, -0.019021987915039062, -0.0157012939453125, -0.012380599975585938, -0.009059906005859375, -0.0057392120361328125, -0.00241851806640625, 0.0009021759033203125, 0.004222869873046875, 0.0075435638427734375, 0.0108642578125, 0.014184951782226562, 0.017505645751953125, 0.020826339721679688, 0.02414703369140625, 0.027467727661132812, 0.030788421630859375, 0.03410911560058594, 0.0374298095703125, 0.04075050354003906, 0.044071197509765625, 0.04739189147949219, 0.05071258544921875, 0.05403327941894531, 0.057353973388671875, 0.06067466735839844, 0.063995361328125, 0.06731605529785156, 0.07063674926757812, 0.07395744323730469, 0.07727813720703125, 0.08059883117675781, 0.08391952514648438, 0.08724021911621094, 0.0905609130859375, 0.09388160705566406, 0.09720230102539062, 0.10052299499511719, 0.10384368896484375, 0.10716438293457031, 0.11048507690429688, 0.11380577087402344, 0.11712646484375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 51.0, 606.0, 301.0, 38.0, 7.0, 1.0], "bins": [-0.10702475160360336, -0.10523727536201477, -0.10344980657100677, -0.10166233032941818, -0.09987485408782959, -0.098087377846241, -0.0962999016046524, -0.09451243281364441, -0.09272495657205582, -0.09093748033046722, -0.08915001153945923, -0.08736253529787064, -0.08557505905628204, -0.08378758281469345, -0.08200010657310486, -0.08021263778209686, -0.07842516154050827, -0.07663768529891968, -0.07485021650791168, -0.07306274026632309, -0.0712752640247345, -0.0694877877831459, -0.06770031154155731, -0.06591284275054932, -0.06412536650896072, -0.06233789026737213, -0.06055041775107384, -0.05876294523477554, -0.05697546899318695, -0.05518799275159836, -0.053400520235300064, -0.05161304771900177, -0.04982557147741318, -0.048038095235824585, -0.04625062271952629, -0.044463150203228, -0.042675673961639404, -0.04088819772005081, -0.03910072520375252, -0.037313252687454224, -0.03552577644586563, -0.03373830020427704, -0.031950827687978745, -0.0301633533090353, -0.028375878930091858, -0.026588404551148415, -0.02480093017220497, -0.023013455793261528, -0.021225979551672935, -0.019438505172729492, -0.01765103079378605, -0.015863556414842606, -0.014076082035899162, -0.012288607656955719, -0.010501133278012276, -0.008713658899068832, -0.006926184520125389, -0.005138710141181946, -0.0033512357622385025, -0.0015637613832950592, 0.0002237129956483841, 0.0020111873745918274, 0.0037986617535352707, 0.005586136132478714, 0.007373610511422157]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 13.0, 12.0, 19.0, 14.0, 15.0, 27.0, 27.0, 30.0, 32.0, 39.0, 66.0, 49.0, 41.0, 41.0, 46.0, 51.0, 57.0, 52.0, 53.0, 39.0, 31.0, 52.0, 33.0, 27.0, 27.0, 17.0, 12.0, 14.0, 16.0, 11.0, 7.0, 3.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027153491973876953, -0.0026110466569662094, -0.0025067441165447235, -0.0024024415761232376, -0.0022981390357017517, -0.002193836495280266, -0.00208953395485878, -0.001985231414437294, -0.001880928874015808, -0.0017766263335943222, -0.0016723237931728363, -0.0015680212527513504, -0.0014637187123298645, -0.0013594161719083786, -0.0012551136314868927, -0.0011508110910654068, -0.001046508550643921, -0.000942206010222435, -0.0008379034698009491, -0.0007336009293794632, -0.0006292983889579773, -0.0005249958485364914, -0.0004206933081150055, -0.0003163907676935196, -0.0002120882272720337, -0.00010778568685054779, -3.4831464290618896e-06, 0.00010081939399242401, 0.0002051219344139099, 0.0003094244748353958, 0.0004137270152568817, 0.0005180295556783676, 0.0006223320960998535, 0.0007266346365213394, 0.0008309371769428253, 0.0009352397173643112, 0.0010395422577857971, 0.001143844798207283, 0.001248147338628769, 0.0013524498790502548, 0.0014567524194717407, 0.0015610549598932266, 0.0016653575003147125, 0.0017696600407361984, 0.0018739625811576843, 0.0019782651215791702, 0.002082567662000656, 0.002186870202422142, 0.002291172742843628, 0.002395475283265114, 0.0024997778236865997, 0.0026040803641080856, 0.0027083829045295715, 0.0028126854449510574, 0.0029169879853725433, 0.0030212905257940292, 0.003125593066215515, 0.003229895606637001, 0.003334198147058487, 0.003438500687479973, 0.0035428032279014587, 0.0036471057683229446, 0.0037514083087444305, 0.0038557108491659164, 0.003960013389587402]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 9.0, 9.0, 15.0, 9.0, 19.0, 7.0, 18.0, 30.0, 20.0, 36.0, 37.0, 34.0, 37.0, 42.0, 44.0, 41.0, 40.0, 58.0, 55.0, 40.0, 51.0, 34.0, 41.0, 46.0, 38.0, 28.0, 36.0, 18.0, 17.0, 13.0, 13.0, 9.0, 10.0, 9.0, 5.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.375, -5.2054443359375, -5.035888671875, -4.8663330078125, -4.69677734375, -4.5272216796875, -4.357666015625, -4.1881103515625, -4.0185546875, -3.8489990234375, -3.679443359375, -3.5098876953125, -3.34033203125, -3.1707763671875, -3.001220703125, -2.8316650390625, -2.662109375, -2.4925537109375, -2.322998046875, -2.1534423828125, -1.98388671875, -1.8143310546875, -1.644775390625, -1.4752197265625, -1.3056640625, -1.1361083984375, -0.966552734375, -0.7969970703125, -0.62744140625, -0.4578857421875, -0.288330078125, -0.1187744140625, 0.05078125, 0.2203369140625, 0.389892578125, 0.5594482421875, 0.72900390625, 0.8985595703125, 1.068115234375, 1.2376708984375, 1.4072265625, 1.5767822265625, 1.746337890625, 1.9158935546875, 2.08544921875, 2.2550048828125, 2.424560546875, 2.5941162109375, 2.763671875, 2.9332275390625, 3.102783203125, 3.2723388671875, 3.44189453125, 3.6114501953125, 3.781005859375, 3.9505615234375, 4.1201171875, 4.2896728515625, 4.459228515625, 4.6287841796875, 4.79833984375, 4.9678955078125, 5.137451171875, 5.3070068359375, 5.4765625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 12.0, 19.0, 22.0, 33.0, 43.0, 68.0, 84.0, 145.0, 244.0, 446.0, 955.0, 1896.0, 4077.0, 9289.0, 22771.0, 57886.0, 167988.0, 476877.0, 195915.0, 65352.0, 25329.0, 10170.0, 4584.0, 2103.0, 961.0, 518.0, 262.0, 142.0, 96.0, 63.0, 49.0, 38.0, 22.0, 20.0, 12.0, 14.0, 7.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.3828125, -6.192626953125, -6.00244140625, -5.812255859375, -5.6220703125, -5.431884765625, -5.24169921875, -5.051513671875, -4.861328125, -4.671142578125, -4.48095703125, -4.290771484375, -4.1005859375, -3.910400390625, -3.72021484375, -3.530029296875, -3.33984375, -3.149658203125, -2.95947265625, -2.769287109375, -2.5791015625, -2.388916015625, -2.19873046875, -2.008544921875, -1.818359375, -1.628173828125, -1.43798828125, -1.247802734375, -1.0576171875, -0.867431640625, -0.67724609375, -0.487060546875, -0.296875, -0.106689453125, 0.08349609375, 0.273681640625, 0.4638671875, 0.654052734375, 0.84423828125, 1.034423828125, 1.224609375, 1.414794921875, 1.60498046875, 1.795166015625, 1.9853515625, 2.175537109375, 2.36572265625, 2.555908203125, 2.74609375, 2.936279296875, 3.12646484375, 3.316650390625, 3.5068359375, 3.697021484375, 3.88720703125, 4.077392578125, 4.267578125, 4.457763671875, 4.64794921875, 4.838134765625, 5.0283203125, 5.218505859375, 5.40869140625, 5.598876953125, 5.7890625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 7.0, 11.0, 3.0, 7.0, 9.0, 19.0, 14.0, 16.0, 15.0, 23.0, 25.0, 35.0, 27.0, 44.0, 53.0, 42.0, 66.0, 102.0, 272.0, 1581.0, 177.0, 70.0, 60.0, 46.0, 40.0, 38.0, 32.0, 36.0, 31.0, 17.0, 20.0, 18.0, 17.0, 20.0, 9.0, 11.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.328125, -15.8388671875, -15.349609375, -14.8603515625, -14.37109375, -13.8818359375, -13.392578125, -12.9033203125, -12.4140625, -11.9248046875, -11.435546875, -10.9462890625, -10.45703125, -9.9677734375, -9.478515625, -8.9892578125, -8.5, -8.0107421875, -7.521484375, -7.0322265625, -6.54296875, -6.0537109375, -5.564453125, -5.0751953125, -4.5859375, -4.0966796875, -3.607421875, -3.1181640625, -2.62890625, -2.1396484375, -1.650390625, -1.1611328125, -0.671875, -0.1826171875, 0.306640625, 0.7958984375, 1.28515625, 1.7744140625, 2.263671875, 2.7529296875, 3.2421875, 3.7314453125, 4.220703125, 4.7099609375, 5.19921875, 5.6884765625, 6.177734375, 6.6669921875, 7.15625, 7.6455078125, 8.134765625, 8.6240234375, 9.11328125, 9.6025390625, 10.091796875, 10.5810546875, 11.0703125, 11.5595703125, 12.048828125, 12.5380859375, 13.02734375, 13.5166015625, 14.005859375, 14.4951171875, 14.984375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 16.0, 15.0, 16.0, 10.0, 26.0, 32.0, 53.0, 47.0, 58.0, 79.0, 117.0, 132.0, 192.0, 288.0, 543.0, 1276.0, 7506.0, 434961.0, 2679070.0, 17439.0, 1967.0, 670.0, 318.0, 233.0, 142.0, 101.0, 84.0, 66.0, 40.0, 38.0, 21.0, 19.0, 24.0, 14.0, 14.0, 8.0, 13.0, 9.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-29.640625, -28.657470703125, -27.67431640625, -26.691162109375, -25.7080078125, -24.724853515625, -23.74169921875, -22.758544921875, -21.775390625, -20.792236328125, -19.80908203125, -18.825927734375, -17.8427734375, -16.859619140625, -15.87646484375, -14.893310546875, -13.91015625, -12.927001953125, -11.94384765625, -10.960693359375, -9.9775390625, -8.994384765625, -8.01123046875, -7.028076171875, -6.044921875, -5.061767578125, -4.07861328125, -3.095458984375, -2.1123046875, -1.129150390625, -0.14599609375, 0.837158203125, 1.8203125, 2.803466796875, 3.78662109375, 4.769775390625, 5.7529296875, 6.736083984375, 7.71923828125, 8.702392578125, 9.685546875, 10.668701171875, 11.65185546875, 12.635009765625, 13.6181640625, 14.601318359375, 15.58447265625, 16.567626953125, 17.55078125, 18.533935546875, 19.51708984375, 20.500244140625, 21.4833984375, 22.466552734375, 23.44970703125, 24.432861328125, 25.416015625, 26.399169921875, 27.38232421875, 28.365478515625, 29.3486328125, 30.331787109375, 31.31494140625, 32.298095703125, 33.28125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 20.0, 245.0, 525.0, 204.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.7985382080078, -147.7479705810547, -144.69740295410156, -141.64683532714844, -138.5962677001953, -135.5457000732422, -132.49513244628906, -129.44456481933594, -126.39399719238281, -123.34342956542969, -120.29286193847656, -117.24229431152344, -114.19172668457031, -111.14115905761719, -108.09059143066406, -105.04002380371094, -101.98945617675781, -98.93888854980469, -95.88832092285156, -92.83775329589844, -89.78718566894531, -86.73661804199219, -83.68605041503906, -80.63548278808594, -77.58490753173828, -74.53433990478516, -71.48377227783203, -68.4332046508789, -65.38263702392578, -62.332069396972656, -59.28150177001953, -56.230934143066406, -53.18036651611328, -50.129798889160156, -47.07923126220703, -44.028663635253906, -40.97809600830078, -37.927528381347656, -34.87696075439453, -31.826391220092773, -28.77582359313965, -25.725255966186523, -22.6746883392334, -19.62411880493164, -16.573551177978516, -13.522984504699707, -10.472415924072266, -7.421848297119141, -4.371280670166016, -1.3207128047943115, 1.7298550605773926, 4.780423164367676, 7.830990791320801, 10.881558418273926, 13.932126998901367, 16.982694625854492, 20.033262252807617, 23.083829879760742, 26.134397506713867, 29.184967041015625, 32.23553466796875, 35.286102294921875, 38.336669921875, 41.387237548828125, 44.43780517578125]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 3.0, 1.0, 3.0, 6.0, 6.0, 13.0, 11.0, 16.0, 18.0, 16.0, 23.0, 20.0, 20.0, 44.0, 31.0, 31.0, 26.0, 46.0, 45.0, 40.0, 39.0, 37.0, 49.0, 44.0, 38.0, 39.0, 29.0, 30.0, 34.0, 21.0, 32.0, 32.0, 26.0, 25.0, 17.0, 13.0, 9.0, 6.0, 10.0, 11.0, 10.0, 9.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-44.636993408203125, -43.29643630981445, -41.95587921142578, -40.61532211303711, -39.27476501464844, -37.934207916259766, -36.593650817871094, -35.25309753417969, -33.91253662109375, -32.57197952270508, -31.231422424316406, -29.890865325927734, -28.550308227539062, -27.20975112915039, -25.86919593811035, -24.52863883972168, -23.18808364868164, -21.84752655029297, -20.506969451904297, -19.166412353515625, -17.825855255126953, -16.48529815673828, -15.144742965698242, -13.80418586730957, -12.463628768920898, -11.123071670532227, -9.782514572143555, -8.4419584274292, -7.101401329040527, -5.7608442306518555, -4.4202880859375, -3.079730987548828, -1.7391700744628906, -0.39861321449279785, 0.9419436454772949, 2.2825002670288086, 3.6230573654174805, 4.963614463806152, 6.304170608520508, 7.64472770690918, 8.985284805297852, 10.325841903686523, 11.666399002075195, 13.00695514678955, 14.347512245178223, 15.688069343566895, 17.02862548828125, 18.369182586669922, 19.709739685058594, 21.050296783447266, 22.390853881835938, 23.73141098022461, 25.07196807861328, 26.412525177001953, 27.753080368041992, 29.093637466430664, 30.434194564819336, 31.774751663208008, 33.11530685424805, 34.45586395263672, 35.79642105102539, 37.13697814941406, 38.477535247802734, 39.818092346191406, 41.15864944458008]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 7.0, 13.0, 7.0, 11.0, 18.0, 11.0, 15.0, 30.0, 23.0, 29.0, 43.0, 40.0, 33.0, 38.0, 47.0, 36.0, 47.0, 57.0, 49.0, 50.0, 47.0, 38.0, 35.0, 43.0, 35.0, 30.0, 29.0, 28.0, 23.0, 10.0, 11.0, 13.0, 8.0, 8.0, 13.0, 5.0, 4.0, 1.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.70703125, -5.52752685546875, -5.3480224609375, -5.16851806640625, -4.989013671875, -4.80950927734375, -4.6300048828125, -4.45050048828125, -4.27099609375, -4.09149169921875, -3.9119873046875, -3.73248291015625, -3.552978515625, -3.37347412109375, -3.1939697265625, -3.01446533203125, -2.8349609375, -2.65545654296875, -2.4759521484375, -2.29644775390625, -2.116943359375, -1.93743896484375, -1.7579345703125, -1.57843017578125, -1.39892578125, -1.21942138671875, -1.0399169921875, -0.86041259765625, -0.680908203125, -0.50140380859375, -0.3218994140625, -0.14239501953125, 0.037109375, 0.21661376953125, 0.3961181640625, 0.57562255859375, 0.755126953125, 0.93463134765625, 1.1141357421875, 1.29364013671875, 1.47314453125, 1.65264892578125, 1.8321533203125, 2.01165771484375, 2.191162109375, 2.37066650390625, 2.5501708984375, 2.72967529296875, 2.9091796875, 3.08868408203125, 3.2681884765625, 3.44769287109375, 3.627197265625, 3.80670166015625, 3.9862060546875, 4.16571044921875, 4.34521484375, 4.52471923828125, 4.7042236328125, 4.88372802734375, 5.063232421875, 5.24273681640625, 5.4222412109375, 5.60174560546875, 5.78125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 7.0, 9.0, 18.0, 13.0, 31.0, 28.0, 30.0, 47.0, 81.0, 135.0, 238.0, 473.0, 1334.0, 4329.0, 19018.0, 122191.0, 1459939.0, 2340854.0, 208424.0, 28307.0, 5827.0, 1608.0, 612.0, 258.0, 153.0, 58.0, 55.0, 49.0, 24.0, 27.0, 19.0, 18.0, 8.0, 9.0, 11.0, 5.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-15.4921875, -15.0244140625, -14.556640625, -14.0888671875, -13.62109375, -13.1533203125, -12.685546875, -12.2177734375, -11.75, -11.2822265625, -10.814453125, -10.3466796875, -9.87890625, -9.4111328125, -8.943359375, -8.4755859375, -8.0078125, -7.5400390625, -7.072265625, -6.6044921875, -6.13671875, -5.6689453125, -5.201171875, -4.7333984375, -4.265625, -3.7978515625, -3.330078125, -2.8623046875, -2.39453125, -1.9267578125, -1.458984375, -0.9912109375, -0.5234375, -0.0556640625, 0.412109375, 0.8798828125, 1.34765625, 1.8154296875, 2.283203125, 2.7509765625, 3.21875, 3.6865234375, 4.154296875, 4.6220703125, 5.08984375, 5.5576171875, 6.025390625, 6.4931640625, 6.9609375, 7.4287109375, 7.896484375, 8.3642578125, 8.83203125, 9.2998046875, 9.767578125, 10.2353515625, 10.703125, 11.1708984375, 11.638671875, 12.1064453125, 12.57421875, 13.0419921875, 13.509765625, 13.9775390625, 14.4453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 8.0, 12.0, 10.0, 19.0, 33.0, 40.0, 47.0, 73.0, 108.0, 156.0, 225.0, 341.0, 434.0, 578.0, 580.0, 400.0, 296.0, 229.0, 138.0, 117.0, 61.0, 41.0, 44.0, 25.0, 15.0, 15.0, 8.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.7882080078125, -10.427978515625, -10.0677490234375, -9.70751953125, -9.3472900390625, -8.987060546875, -8.6268310546875, -8.2666015625, -7.9063720703125, -7.546142578125, -7.1859130859375, -6.82568359375, -6.4654541015625, -6.105224609375, -5.7449951171875, -5.384765625, -5.0245361328125, -4.664306640625, -4.3040771484375, -3.94384765625, -3.5836181640625, -3.223388671875, -2.8631591796875, -2.5029296875, -2.1427001953125, -1.782470703125, -1.4222412109375, -1.06201171875, -0.7017822265625, -0.341552734375, 0.0186767578125, 0.37890625, 0.7391357421875, 1.099365234375, 1.4595947265625, 1.81982421875, 2.1800537109375, 2.540283203125, 2.9005126953125, 3.2607421875, 3.6209716796875, 3.981201171875, 4.3414306640625, 4.70166015625, 5.0618896484375, 5.422119140625, 5.7823486328125, 6.142578125, 6.5028076171875, 6.863037109375, 7.2232666015625, 7.58349609375, 7.9437255859375, 8.303955078125, 8.6641845703125, 9.0244140625, 9.3846435546875, 9.744873046875, 10.1051025390625, 10.46533203125, 10.8255615234375, 11.185791015625, 11.5460205078125, 11.90625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 17.0, 15.0, 30.0, 31.0, 66.0, 86.0, 135.0, 239.0, 348.0, 831.0, 11861.0, 3295204.0, 878813.0, 5010.0, 653.0, 338.0, 193.0, 129.0, 81.0, 52.0, 47.0, 32.0, 17.0, 13.0, 5.0, 12.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.6875, -58.84228515625, -56.9970703125, -55.15185546875, -53.306640625, -51.46142578125, -49.6162109375, -47.77099609375, -45.92578125, -44.08056640625, -42.2353515625, -40.39013671875, -38.544921875, -36.69970703125, -34.8544921875, -33.00927734375, -31.1640625, -29.31884765625, -27.4736328125, -25.62841796875, -23.783203125, -21.93798828125, -20.0927734375, -18.24755859375, -16.40234375, -14.55712890625, -12.7119140625, -10.86669921875, -9.021484375, -7.17626953125, -5.3310546875, -3.48583984375, -1.640625, 0.20458984375, 2.0498046875, 3.89501953125, 5.740234375, 7.58544921875, 9.4306640625, 11.27587890625, 13.12109375, 14.96630859375, 16.8115234375, 18.65673828125, 20.501953125, 22.34716796875, 24.1923828125, 26.03759765625, 27.8828125, 29.72802734375, 31.5732421875, 33.41845703125, 35.263671875, 37.10888671875, 38.9541015625, 40.79931640625, 42.64453125, 44.48974609375, 46.3349609375, 48.18017578125, 50.025390625, 51.87060546875, 53.7158203125, 55.56103515625, 57.40625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 23.0, 39.0, 60.0, 121.0, 188.0, 191.0, 170.0, 118.0, 59.0, 22.0, 14.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-123.63871002197266, -120.97744750976562, -118.31619262695312, -115.6549301147461, -112.9936752319336, -110.33241271972656, -107.67115783691406, -105.00989532470703, -102.3486328125, -99.68737030029297, -97.02611541748047, -94.36485290527344, -91.70359802246094, -89.0423355102539, -86.38107299804688, -83.71981811523438, -81.05856323242188, -78.39730072021484, -75.73604583740234, -73.07478332519531, -70.41352844238281, -67.75226593017578, -65.09100341796875, -62.42974853515625, -59.76848602294922, -57.10722732543945, -54.44596862792969, -51.784706115722656, -49.12344741821289, -46.462188720703125, -43.80093002319336, -41.139671325683594, -38.47840881347656, -35.8171501159668, -33.15589141845703, -30.494630813598633, -27.833370208740234, -25.17211151123047, -22.510852813720703, -19.849592208862305, -17.18833351135254, -14.527073860168457, -11.865814208984375, -9.20455551147461, -6.543295860290527, -3.8820362091064453, -1.2207775115966797, 1.4404830932617188, 4.101741790771484, 6.763001441955566, 9.424261093139648, 12.085519790649414, 14.746779441833496, 17.408039093017578, 20.069297790527344, 22.730558395385742, 25.391817092895508, 28.053075790405273, 30.714336395263672, 33.37559509277344, 36.0368537902832, 38.69811248779297, 41.359375, 44.020633697509766, 46.68189239501953]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 1.0, 3.0, 7.0, 7.0, 6.0, 8.0, 13.0, 16.0, 21.0, 27.0, 21.0, 32.0, 39.0, 38.0, 33.0, 42.0, 38.0, 45.0, 34.0, 46.0, 50.0, 46.0, 52.0, 49.0, 45.0, 44.0, 32.0, 30.0, 38.0, 26.0, 12.0, 23.0, 14.0, 10.0, 15.0, 14.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.18115234375, -30.10691261291504, -29.032670974731445, -27.958431243896484, -26.88418960571289, -25.80994987487793, -24.73571014404297, -23.661468505859375, -22.587228775024414, -21.512989044189453, -20.43874740600586, -19.3645076751709, -18.290267944335938, -17.216026306152344, -16.141786575317383, -15.067545890808105, -13.993305206298828, -12.91906452178955, -11.844823837280273, -10.770584106445312, -9.696343421936035, -8.622102737426758, -7.547862529754639, -6.4736223220825195, -5.399381637573242, -4.325140953063965, -3.2509007453918457, -2.1766602993011475, -1.1024198532104492, -0.028179168701171875, 1.0460610389709473, 2.1203012466430664, 3.1945419311523438, 4.268782615661621, 5.34302282333374, 6.417263031005859, 7.491503715515137, 8.565744400024414, 9.639984130859375, 10.714224815368652, 11.78846549987793, 12.862706184387207, 13.936946868896484, 15.011186599731445, 16.085426330566406, 17.15966796875, 18.23390769958496, 19.308147430419922, 20.382389068603516, 21.456628799438477, 22.53087043762207, 23.60511016845703, 24.679351806640625, 25.753591537475586, 26.827831268310547, 27.90207290649414, 28.9763126373291, 30.050552368164062, 31.124794006347656, 32.19903564453125, 33.27327346801758, 34.34751510620117, 35.421756744384766, 36.495994567871094, 37.57023620605469]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 10.0, 5.0, 15.0, 14.0, 18.0, 21.0, 24.0, 32.0, 20.0, 38.0, 33.0, 35.0, 41.0, 47.0, 50.0, 56.0, 48.0, 52.0, 44.0, 40.0, 40.0, 31.0, 43.0, 29.0, 33.0, 24.0, 23.0, 22.0, 19.0, 16.0, 12.0, 14.0, 6.0, 3.0, 8.0, 7.0, 9.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.4349365234375, -5.252685546875, -5.0704345703125, -4.88818359375, -4.7059326171875, -4.523681640625, -4.3414306640625, -4.1591796875, -3.9769287109375, -3.794677734375, -3.6124267578125, -3.43017578125, -3.2479248046875, -3.065673828125, -2.8834228515625, -2.701171875, -2.5189208984375, -2.336669921875, -2.1544189453125, -1.97216796875, -1.7899169921875, -1.607666015625, -1.4254150390625, -1.2431640625, -1.0609130859375, -0.878662109375, -0.6964111328125, -0.51416015625, -0.3319091796875, -0.149658203125, 0.0325927734375, 0.21484375, 0.3970947265625, 0.579345703125, 0.7615966796875, 0.94384765625, 1.1260986328125, 1.308349609375, 1.4906005859375, 1.6728515625, 1.8551025390625, 2.037353515625, 2.2196044921875, 2.40185546875, 2.5841064453125, 2.766357421875, 2.9486083984375, 3.130859375, 3.3131103515625, 3.495361328125, 3.6776123046875, 3.85986328125, 4.0421142578125, 4.224365234375, 4.4066162109375, 4.5888671875, 4.7711181640625, 4.953369140625, 5.1356201171875, 5.31787109375, 5.5001220703125, 5.682373046875, 5.8646240234375, 6.046875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 12.0, 10.0, 12.0, 22.0, 40.0, 49.0, 78.0, 104.0, 181.0, 261.0, 347.0, 535.0, 820.0, 1171.0, 1796.0, 2699.0, 3904.0, 5908.0, 8984.0, 13538.0, 20739.0, 32709.0, 52860.0, 90127.0, 157020.0, 221748.0, 172254.0, 100024.0, 58294.0, 35771.0, 23070.0, 14519.0, 9485.0, 6444.0, 4199.0, 2912.0, 1911.0, 1354.0, 869.0, 590.0, 372.0, 255.0, 193.0, 117.0, 84.0, 53.0, 41.0, 24.0, 17.0, 13.0, 8.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.495361328125, -0.48016357421875, -0.4649658203125, -0.44976806640625, -0.4345703125, -0.41937255859375, -0.4041748046875, -0.38897705078125, -0.373779296875, -0.35858154296875, -0.3433837890625, -0.32818603515625, -0.31298828125, -0.29779052734375, -0.2825927734375, -0.26739501953125, -0.252197265625, -0.23699951171875, -0.2218017578125, -0.20660400390625, -0.19140625, -0.17620849609375, -0.1610107421875, -0.14581298828125, -0.130615234375, -0.11541748046875, -0.1002197265625, -0.08502197265625, -0.06982421875, -0.05462646484375, -0.0394287109375, -0.02423095703125, -0.009033203125, 0.00616455078125, 0.0213623046875, 0.03656005859375, 0.0517578125, 0.06695556640625, 0.0821533203125, 0.09735107421875, 0.112548828125, 0.12774658203125, 0.1429443359375, 0.15814208984375, 0.17333984375, 0.18853759765625, 0.2037353515625, 0.21893310546875, 0.234130859375, 0.24932861328125, 0.2645263671875, 0.27972412109375, 0.294921875, 0.31011962890625, 0.3253173828125, 0.34051513671875, 0.355712890625, 0.37091064453125, 0.3861083984375, 0.40130615234375, 0.41650390625, 0.43170166015625, 0.4468994140625, 0.46209716796875, 0.477294921875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 7.0, 7.0, 17.0, 18.0, 19.0, 12.0, 24.0, 25.0, 26.0, 31.0, 29.0, 33.0, 33.0, 40.0, 43.0, 46.0, 54.0, 1066.0, 55.0, 41.0, 39.0, 42.0, 40.0, 34.0, 37.0, 32.0, 25.0, 23.0, 22.0, 19.0, 19.0, 13.0, 15.0, 11.0, 3.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.841796875, -3.723876953125, -3.60595703125, -3.488037109375, -3.3701171875, -3.252197265625, -3.13427734375, -3.016357421875, -2.8984375, -2.780517578125, -2.66259765625, -2.544677734375, -2.4267578125, -2.308837890625, -2.19091796875, -2.072998046875, -1.955078125, -1.837158203125, -1.71923828125, -1.601318359375, -1.4833984375, -1.365478515625, -1.24755859375, -1.129638671875, -1.01171875, -0.893798828125, -0.77587890625, -0.657958984375, -0.5400390625, -0.422119140625, -0.30419921875, -0.186279296875, -0.068359375, 0.049560546875, 0.16748046875, 0.285400390625, 0.4033203125, 0.521240234375, 0.63916015625, 0.757080078125, 0.875, 0.992919921875, 1.11083984375, 1.228759765625, 1.3466796875, 1.464599609375, 1.58251953125, 1.700439453125, 1.818359375, 1.936279296875, 2.05419921875, 2.172119140625, 2.2900390625, 2.407958984375, 2.52587890625, 2.643798828125, 2.76171875, 2.879638671875, 2.99755859375, 3.115478515625, 3.2333984375, 3.351318359375, 3.46923828125, 3.587158203125, 3.705078125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 18.0, 16.0, 38.0, 44.0, 70.0, 83.0, 130.0, 193.0, 418.0, 630.0, 1093.0, 2260.0, 4481.0, 8613.0, 17498.0, 36975.0, 79593.0, 167928.0, 1325382.0, 230314.0, 116724.0, 54028.0, 25464.0, 12259.0, 6042.0, 3108.0, 1552.0, 875.0, 490.0, 298.0, 178.0, 117.0, 75.0, 43.0, 35.0, 24.0, 12.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.408935546875, -0.39563751220703125, -0.3823394775390625, -0.36904144287109375, -0.355743408203125, -0.34244537353515625, -0.3291473388671875, -0.31584930419921875, -0.30255126953125, -0.28925323486328125, -0.2759552001953125, -0.26265716552734375, -0.249359130859375, -0.23606109619140625, -0.2227630615234375, -0.20946502685546875, -0.1961669921875, -0.18286895751953125, -0.1695709228515625, -0.15627288818359375, -0.142974853515625, -0.12967681884765625, -0.1163787841796875, -0.10308074951171875, -0.08978271484375, -0.07648468017578125, -0.0631866455078125, -0.04988861083984375, -0.036590576171875, -0.02329254150390625, -0.0099945068359375, 0.00330352783203125, 0.0166015625, 0.02989959716796875, 0.0431976318359375, 0.05649566650390625, 0.069793701171875, 0.08309173583984375, 0.0963897705078125, 0.10968780517578125, 0.12298583984375, 0.13628387451171875, 0.1495819091796875, 0.16287994384765625, 0.176177978515625, 0.18947601318359375, 0.2027740478515625, 0.21607208251953125, 0.2293701171875, 0.24266815185546875, 0.2559661865234375, 0.26926422119140625, 0.282562255859375, 0.29586029052734375, 0.3091583251953125, 0.32245635986328125, 0.33575439453125, 0.34905242919921875, 0.3623504638671875, 0.37564849853515625, 0.388946533203125, 0.40224456787109375, 0.4155426025390625, 0.42884063720703125, 0.442138671875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 10.0, 10.0, 18.0, 16.0, 15.0, 18.0, 24.0, 31.0, 25.0, 25.0, 50.0, 63.0, 87.0, 93.0, 105.0, 76.0, 63.0, 41.0, 34.0, 22.0, 21.0, 22.0, 22.0, 16.0, 21.0, 10.0, 8.0, 9.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005695343017578125, -0.005505561828613281, -0.0053157806396484375, -0.005125999450683594, -0.00493621826171875, -0.004746437072753906, -0.0045566558837890625, -0.004366874694824219, -0.004177093505859375, -0.003987312316894531, -0.0037975311279296875, -0.0036077499389648438, -0.00341796875, -0.0032281875610351562, -0.0030384063720703125, -0.0028486251831054688, -0.002658843994140625, -0.0024690628051757812, -0.0022792816162109375, -0.0020895004272460938, -0.00189971923828125, -0.0017099380493164062, -0.0015201568603515625, -0.0013303756713867188, -0.001140594482421875, -0.0009508132934570312, -0.0007610321044921875, -0.0005712509155273438, -0.0003814697265625, -0.00019168853759765625, -1.9073486328125e-06, 0.00018787384033203125, 0.000377655029296875, 0.0005674362182617188, 0.0007572174072265625, 0.0009469985961914062, 0.00113677978515625, 0.0013265609741210938, 0.0015163421630859375, 0.0017061233520507812, 0.001895904541015625, 0.0020856857299804688, 0.0022754669189453125, 0.0024652481079101562, 0.002655029296875, 0.0028448104858398438, 0.0030345916748046875, 0.0032243728637695312, 0.003414154052734375, 0.0036039352416992188, 0.0037937164306640625, 0.003983497619628906, 0.00417327880859375, 0.004363059997558594, 0.0045528411865234375, 0.004742622375488281, 0.004932403564453125, 0.005122184753417969, 0.0053119659423828125, 0.005501747131347656, 0.0056915283203125, 0.005881309509277344, 0.0060710906982421875, 0.006260871887207031, 0.006450653076171875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 4.0, 12.0, 10.0, 8.0, 15.0, 26.0, 24.0, 27.0, 59.0, 57.0, 93.0, 130.0, 282.0, 1174.0, 33595.0, 979550.0, 31452.0, 1214.0, 291.0, 144.0, 82.0, 69.0, 61.0, 39.0, 26.0, 27.0, 21.0, 10.0, 12.0, 7.0, 6.0, 5.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.140625, -0.13654804229736328, -0.13247108459472656, -0.12839412689208984, -0.12431716918945312, -0.1202402114868164, -0.11616325378417969, -0.11208629608154297, -0.10800933837890625, -0.10393238067626953, -0.09985542297363281, -0.0957784652709961, -0.09170150756835938, -0.08762454986572266, -0.08354759216308594, -0.07947063446044922, -0.0753936767578125, -0.07131671905517578, -0.06723976135253906, -0.06316280364990234, -0.059085845947265625, -0.055008888244628906, -0.05093193054199219, -0.04685497283935547, -0.04277801513671875, -0.03870105743408203, -0.03462409973144531, -0.030547142028808594, -0.026470184326171875, -0.022393226623535156, -0.018316268920898438, -0.014239311218261719, -0.010162353515625, -0.006085395812988281, -0.0020084381103515625, 0.0020685195922851562, 0.006145477294921875, 0.010222434997558594, 0.014299392700195312, 0.01837635040283203, 0.02245330810546875, 0.02653026580810547, 0.030607223510742188, 0.034684181213378906, 0.038761138916015625, 0.042838096618652344, 0.04691505432128906, 0.05099201202392578, 0.0550689697265625, 0.05914592742919922, 0.06322288513183594, 0.06729984283447266, 0.07137680053710938, 0.0754537582397461, 0.07953071594238281, 0.08360767364501953, 0.08768463134765625, 0.09176158905029297, 0.09583854675292969, 0.0999155044555664, 0.10399246215820312, 0.10806941986083984, 0.11214637756347656, 0.11622333526611328, 0.12030029296875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 70.0, 673.0, 220.0, 25.0, 11.0, 5.0, 1.0], "bins": [-0.15723174810409546, -0.15455174446105957, -0.15187174081802368, -0.1491917371749878, -0.1465117335319519, -0.14383172988891602, -0.14115172624588013, -0.13847172260284424, -0.13579171895980835, -0.13311171531677246, -0.13043171167373657, -0.12775170803070068, -0.1250717043876648, -0.1223917007446289, -0.11971169710159302, -0.11703169345855713, -0.11435168236494064, -0.11167167872190475, -0.10899167507886887, -0.10631167143583298, -0.10363166779279709, -0.1009516641497612, -0.09827165305614471, -0.09559164941310883, -0.09291164577007294, -0.09023164212703705, -0.08755163848400116, -0.08487163484096527, -0.08219163119792938, -0.0795116275548935, -0.0768316239118576, -0.07415162026882172, -0.07147161662578583, -0.06879161298274994, -0.06611160933971405, -0.06343160569667816, -0.06075160205364227, -0.058071598410606384, -0.0553915910422802, -0.05271158739924431, -0.05003158003091812, -0.04735157638788223, -0.044671572744846344, -0.041991569101810455, -0.03931156545877457, -0.03663156181573868, -0.03395155444741249, -0.0312715508043766, -0.028591549023985863, -0.025911545380949974, -0.023231539875268936, -0.020551536232233047, -0.01787153258919716, -0.01519152894616127, -0.012511523440480232, -0.009831519797444344, -0.007151516154408455, -0.004471512045711279, -0.001791507937014103, 0.0008884966373443604, 0.003568500280380249, 0.006248503923416138, 0.008928509429097176, 0.011608513072133064, 0.014288516715168953]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 7.0, 15.0, 16.0, 20.0, 26.0, 25.0, 42.0, 23.0, 41.0, 52.0, 39.0, 53.0, 56.0, 53.0, 40.0, 51.0, 41.0, 59.0, 43.0, 46.0, 32.0, 39.0, 27.0, 28.0, 21.0, 18.0, 18.0, 15.0, 13.0, 6.0, 3.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005460023880004883, -0.005240678787231445, -0.005021333694458008, -0.00480198860168457, -0.004582643508911133, -0.004363298416137695, -0.004143953323364258, -0.00392460823059082, -0.003705263137817383, -0.0034859180450439453, -0.003266572952270508, -0.0030472278594970703, -0.002827882766723633, -0.0026085376739501953, -0.002389192581176758, -0.0021698474884033203, -0.0019505023956298828, -0.0017311573028564453, -0.0015118122100830078, -0.0012924671173095703, -0.0010731220245361328, -0.0008537769317626953, -0.0006344318389892578, -0.0004150867462158203, -0.0001957416534423828, 2.3603439331054688e-05, 0.0002429485321044922, 0.0004622936248779297, 0.0006816387176513672, 0.0009009838104248047, 0.0011203289031982422, 0.0013396739959716797, 0.0015590190887451172, 0.0017783641815185547, 0.001997709274291992, 0.0022170543670654297, 0.002436399459838867, 0.0026557445526123047, 0.002875089645385742, 0.0030944347381591797, 0.003313779830932617, 0.0035331249237060547, 0.003752470016479492, 0.00397181510925293, 0.004191160202026367, 0.004410505294799805, 0.004629850387573242, 0.00484919548034668, 0.005068540573120117, 0.005287885665893555, 0.005507230758666992, 0.00572657585144043, 0.005945920944213867, 0.006165266036987305, 0.006384611129760742, 0.00660395622253418, 0.006823301315307617, 0.007042646408081055, 0.007261991500854492, 0.00748133659362793, 0.007700681686401367, 0.007920026779174805, 0.008139371871948242, 0.00835871696472168, 0.008578062057495117]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 10.0, 5.0, 15.0, 14.0, 19.0, 20.0, 24.0, 32.0, 20.0, 38.0, 33.0, 35.0, 41.0, 47.0, 50.0, 56.0, 48.0, 52.0, 44.0, 40.0, 40.0, 31.0, 43.0, 29.0, 33.0, 24.0, 23.0, 22.0, 19.0, 16.0, 12.0, 14.0, 6.0, 3.0, 8.0, 7.0, 9.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.4349365234375, -5.252685546875, -5.0704345703125, -4.88818359375, -4.7059326171875, -4.523681640625, -4.3414306640625, -4.1591796875, -3.9769287109375, -3.794677734375, -3.6124267578125, -3.43017578125, -3.2479248046875, -3.065673828125, -2.8834228515625, -2.701171875, -2.5189208984375, -2.336669921875, -2.1544189453125, -1.97216796875, -1.7899169921875, -1.607666015625, -1.4254150390625, -1.2431640625, -1.0609130859375, -0.878662109375, -0.6964111328125, -0.51416015625, -0.3319091796875, -0.149658203125, 0.0325927734375, 0.21484375, 0.3970947265625, 0.579345703125, 0.7615966796875, 0.94384765625, 1.1260986328125, 1.308349609375, 1.4906005859375, 1.6728515625, 1.8551025390625, 2.037353515625, 2.2196044921875, 2.40185546875, 2.5841064453125, 2.766357421875, 2.9486083984375, 3.130859375, 3.3131103515625, 3.495361328125, 3.6776123046875, 3.85986328125, 4.0421142578125, 4.224365234375, 4.4066162109375, 4.5888671875, 4.7711181640625, 4.953369140625, 5.1356201171875, 5.31787109375, 5.5001220703125, 5.682373046875, 5.8646240234375, 6.046875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 8.0, 12.0, 12.0, 14.0, 18.0, 27.0, 50.0, 50.0, 72.0, 85.0, 146.0, 277.0, 478.0, 1110.0, 2906.0, 8051.0, 26944.0, 126476.0, 684413.0, 152259.0, 30378.0, 9119.0, 3106.0, 1215.0, 550.0, 272.0, 144.0, 96.0, 67.0, 53.0, 32.0, 22.0, 24.0, 17.0, 8.0, 6.0, 11.0, 11.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.370361328125, -9.05322265625, -8.736083984375, -8.4189453125, -8.101806640625, -7.78466796875, -7.467529296875, -7.150390625, -6.833251953125, -6.51611328125, -6.198974609375, -5.8818359375, -5.564697265625, -5.24755859375, -4.930419921875, -4.61328125, -4.296142578125, -3.97900390625, -3.661865234375, -3.3447265625, -3.027587890625, -2.71044921875, -2.393310546875, -2.076171875, -1.759033203125, -1.44189453125, -1.124755859375, -0.8076171875, -0.490478515625, -0.17333984375, 0.143798828125, 0.4609375, 0.778076171875, 1.09521484375, 1.412353515625, 1.7294921875, 2.046630859375, 2.36376953125, 2.680908203125, 2.998046875, 3.315185546875, 3.63232421875, 3.949462890625, 4.2666015625, 4.583740234375, 4.90087890625, 5.218017578125, 5.53515625, 5.852294921875, 6.16943359375, 6.486572265625, 6.8037109375, 7.120849609375, 7.43798828125, 7.755126953125, 8.072265625, 8.389404296875, 8.70654296875, 9.023681640625, 9.3408203125, 9.657958984375, 9.97509765625, 10.292236328125, 10.609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 7.0, 4.0, 11.0, 9.0, 16.0, 26.0, 18.0, 24.0, 30.0, 29.0, 45.0, 38.0, 48.0, 65.0, 96.0, 188.0, 1651.0, 189.0, 88.0, 67.0, 52.0, 42.0, 37.0, 36.0, 33.0, 35.0, 23.0, 26.0, 13.0, 21.0, 7.0, 8.0, 12.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.75, -18.190185546875, -17.63037109375, -17.070556640625, -16.5107421875, -15.950927734375, -15.39111328125, -14.831298828125, -14.271484375, -13.711669921875, -13.15185546875, -12.592041015625, -12.0322265625, -11.472412109375, -10.91259765625, -10.352783203125, -9.79296875, -9.233154296875, -8.67333984375, -8.113525390625, -7.5537109375, -6.993896484375, -6.43408203125, -5.874267578125, -5.314453125, -4.754638671875, -4.19482421875, -3.635009765625, -3.0751953125, -2.515380859375, -1.95556640625, -1.395751953125, -0.8359375, -0.276123046875, 0.28369140625, 0.843505859375, 1.4033203125, 1.963134765625, 2.52294921875, 3.082763671875, 3.642578125, 4.202392578125, 4.76220703125, 5.322021484375, 5.8818359375, 6.441650390625, 7.00146484375, 7.561279296875, 8.12109375, 8.680908203125, 9.24072265625, 9.800537109375, 10.3603515625, 10.920166015625, 11.47998046875, 12.039794921875, 12.599609375, 13.159423828125, 13.71923828125, 14.279052734375, 14.8388671875, 15.398681640625, 15.95849609375, 16.518310546875, 17.078125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 7.0, 7.0, 15.0, 8.0, 22.0, 10.0, 24.0, 40.0, 39.0, 54.0, 64.0, 79.0, 138.0, 211.0, 468.0, 1387.0, 22735.0, 3059357.0, 57808.0, 1949.0, 520.0, 213.0, 136.0, 101.0, 70.0, 44.0, 36.0, 27.0, 31.0, 18.0, 11.0, 12.0, 10.0, 3.0, 10.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.03125, -46.46142578125, -44.8916015625, -43.32177734375, -41.751953125, -40.18212890625, -38.6123046875, -37.04248046875, -35.47265625, -33.90283203125, -32.3330078125, -30.76318359375, -29.193359375, -27.62353515625, -26.0537109375, -24.48388671875, -22.9140625, -21.34423828125, -19.7744140625, -18.20458984375, -16.634765625, -15.06494140625, -13.4951171875, -11.92529296875, -10.35546875, -8.78564453125, -7.2158203125, -5.64599609375, -4.076171875, -2.50634765625, -0.9365234375, 0.63330078125, 2.203125, 3.77294921875, 5.3427734375, 6.91259765625, 8.482421875, 10.05224609375, 11.6220703125, 13.19189453125, 14.76171875, 16.33154296875, 17.9013671875, 19.47119140625, 21.041015625, 22.61083984375, 24.1806640625, 25.75048828125, 27.3203125, 28.89013671875, 30.4599609375, 32.02978515625, 33.599609375, 35.16943359375, 36.7392578125, 38.30908203125, 39.87890625, 41.44873046875, 43.0185546875, 44.58837890625, 46.158203125, 47.72802734375, 49.2978515625, 50.86767578125, 52.4375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 17.0, 17.0, 25.0, 39.0, 44.0, 79.0, 79.0, 111.0, 116.0, 104.0, 105.0, 80.0, 69.0, 45.0, 20.0, 18.0, 9.0, 13.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-31.195711135864258, -30.52763557434082, -29.859561920166016, -29.191486358642578, -28.523412704467773, -27.855337142944336, -27.18726348876953, -26.519187927246094, -25.851112365722656, -25.18303680419922, -24.514963150024414, -23.846887588500977, -23.178813934326172, -22.510738372802734, -21.842662811279297, -21.174589157104492, -20.506515502929688, -19.83843994140625, -19.170366287231445, -18.502290725708008, -17.834217071533203, -17.166141510009766, -16.498065948486328, -15.829992294311523, -15.161917686462402, -14.493843078613281, -13.82576847076416, -13.157693862915039, -12.489618301391602, -11.821544647216797, -11.15346908569336, -10.485394477844238, -9.817320823669434, -9.149246215820312, -8.481171607971191, -7.813096523284912, -7.145021915435791, -6.47694730758667, -5.808872222900391, -5.1407976150512695, -4.472723007202148, -3.8046483993530273, -3.136573553085327, -2.468498706817627, -1.8004240989685059, -1.1323494911193848, -0.46427440643310547, 0.20380020141601562, 0.8718748092651367, 1.5399495363235474, 2.208024263381958, 2.876099109649658, 3.5441737174987793, 4.2122483253479, 4.88032341003418, 5.548398017883301, 6.216472625732422, 6.884547233581543, 7.552621841430664, 8.220697402954102, 8.888771057128906, 9.556846618652344, 10.224921226501465, 10.892995834350586, 11.561070442199707]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 6.0, 3.0, 5.0, 11.0, 6.0, 15.0, 19.0, 24.0, 14.0, 24.0, 14.0, 24.0, 25.0, 32.0, 31.0, 52.0, 30.0, 36.0, 37.0, 37.0, 42.0, 43.0, 29.0, 28.0, 34.0, 38.0, 36.0, 39.0, 25.0, 32.0, 28.0, 19.0, 25.0, 17.0, 26.0, 14.0, 12.0, 11.0, 11.0, 8.0, 6.0, 5.0, 9.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-47.36326599121094, -45.93043899536133, -44.49761199951172, -43.06478500366211, -41.6319580078125, -40.199127197265625, -38.76630401611328, -37.333473205566406, -35.9006462097168, -34.46781921386719, -33.03499221801758, -31.60216522216797, -30.169336318969727, -28.736509323120117, -27.303682327270508, -25.870853424072266, -24.43802833557129, -23.00520133972168, -21.57237434387207, -20.139545440673828, -18.70671844482422, -17.27389144897461, -15.841064453125, -14.408236503601074, -12.975409507751465, -11.542582511901855, -10.10975456237793, -8.67692756652832, -7.244100093841553, -5.811272621154785, -4.378445625305176, -2.94561767578125, -1.5127906799316406, -0.0799633264541626, 1.3528640270233154, 2.785691261291504, 4.2185187339782715, 5.651346206665039, 7.084173202514648, 8.517001152038574, 9.949828147888184, 11.382655143737793, 12.815483093261719, 14.248310089111328, 15.681137084960938, 17.113964080810547, 18.546791076660156, 19.9796199798584, 21.412446975708008, 22.845273971557617, 24.278100967407227, 25.71092987060547, 27.143756866455078, 28.576583862304688, 30.009410858154297, 31.442237854003906, 32.875064849853516, 34.307891845703125, 35.740718841552734, 37.173545837402344, 38.60637283325195, 40.03919982910156, 41.47203063964844, 42.90485763549805, 44.337684631347656]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 9.0, 8.0, 23.0, 16.0, 13.0, 29.0, 24.0, 29.0, 23.0, 30.0, 33.0, 47.0, 48.0, 47.0, 56.0, 37.0, 44.0, 70.0, 33.0, 41.0, 32.0, 43.0, 30.0, 38.0, 26.0, 22.0, 15.0, 21.0, 20.0, 16.0, 11.0, 7.0, 14.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.00390625, -5.8128662109375, -5.621826171875, -5.4307861328125, -5.23974609375, -5.0487060546875, -4.857666015625, -4.6666259765625, -4.4755859375, -4.2845458984375, -4.093505859375, -3.9024658203125, -3.71142578125, -3.5203857421875, -3.329345703125, -3.1383056640625, -2.947265625, -2.7562255859375, -2.565185546875, -2.3741455078125, -2.18310546875, -1.9920654296875, -1.801025390625, -1.6099853515625, -1.4189453125, -1.2279052734375, -1.036865234375, -0.8458251953125, -0.65478515625, -0.4637451171875, -0.272705078125, -0.0816650390625, 0.109375, 0.3004150390625, 0.491455078125, 0.6824951171875, 0.87353515625, 1.0645751953125, 1.255615234375, 1.4466552734375, 1.6376953125, 1.8287353515625, 2.019775390625, 2.2108154296875, 2.40185546875, 2.5928955078125, 2.783935546875, 2.9749755859375, 3.166015625, 3.3570556640625, 3.548095703125, 3.7391357421875, 3.93017578125, 4.1212158203125, 4.312255859375, 4.5032958984375, 4.6943359375, 4.8853759765625, 5.076416015625, 5.2674560546875, 5.45849609375, 5.6495361328125, 5.840576171875, 6.0316162109375, 6.22265625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 9.0, 19.0, 21.0, 30.0, 37.0, 41.0, 75.0, 111.0, 161.0, 213.0, 327.0, 541.0, 910.0, 1547.0, 2906.0, 5378.0, 11112.0, 24246.0, 56672.0, 151914.0, 448534.0, 1159241.0, 1389108.0, 605563.0, 202481.0, 74455.0, 30417.0, 13763.0, 6519.0, 3419.0, 1767.0, 1024.0, 571.0, 372.0, 260.0, 160.0, 107.0, 78.0, 55.0, 42.0, 27.0, 23.0, 13.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.08984375, -6.87591552734375, -6.6619873046875, -6.44805908203125, -6.234130859375, -6.02020263671875, -5.8062744140625, -5.59234619140625, -5.37841796875, -5.16448974609375, -4.9505615234375, -4.73663330078125, -4.522705078125, -4.30877685546875, -4.0948486328125, -3.88092041015625, -3.6669921875, -3.45306396484375, -3.2391357421875, -3.02520751953125, -2.811279296875, -2.59735107421875, -2.3834228515625, -2.16949462890625, -1.95556640625, -1.74163818359375, -1.5277099609375, -1.31378173828125, -1.099853515625, -0.88592529296875, -0.6719970703125, -0.45806884765625, -0.244140625, -0.03021240234375, 0.1837158203125, 0.39764404296875, 0.611572265625, 0.82550048828125, 1.0394287109375, 1.25335693359375, 1.46728515625, 1.68121337890625, 1.8951416015625, 2.10906982421875, 2.322998046875, 2.53692626953125, 2.7508544921875, 2.96478271484375, 3.1787109375, 3.39263916015625, 3.6065673828125, 3.82049560546875, 4.034423828125, 4.24835205078125, 4.4622802734375, 4.67620849609375, 4.89013671875, 5.10406494140625, 5.3179931640625, 5.53192138671875, 5.745849609375, 5.95977783203125, 6.1737060546875, 6.38763427734375, 6.6015625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 11.0, 9.0, 16.0, 18.0, 22.0, 14.0, 28.0, 43.0, 47.0, 53.0, 72.0, 85.0, 125.0, 127.0, 171.0, 176.0, 271.0, 327.0, 347.0, 360.0, 347.0, 264.0, 232.0, 197.0, 138.0, 126.0, 93.0, 76.0, 76.0, 27.0, 42.0, 25.0, 27.0, 17.0, 16.0, 9.0, 8.0, 9.0, 5.0, 7.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-8.7265625, -8.46435546875, -8.2021484375, -7.93994140625, -7.677734375, -7.41552734375, -7.1533203125, -6.89111328125, -6.62890625, -6.36669921875, -6.1044921875, -5.84228515625, -5.580078125, -5.31787109375, -5.0556640625, -4.79345703125, -4.53125, -4.26904296875, -4.0068359375, -3.74462890625, -3.482421875, -3.22021484375, -2.9580078125, -2.69580078125, -2.43359375, -2.17138671875, -1.9091796875, -1.64697265625, -1.384765625, -1.12255859375, -0.8603515625, -0.59814453125, -0.3359375, -0.07373046875, 0.1884765625, 0.45068359375, 0.712890625, 0.97509765625, 1.2373046875, 1.49951171875, 1.76171875, 2.02392578125, 2.2861328125, 2.54833984375, 2.810546875, 3.07275390625, 3.3349609375, 3.59716796875, 3.859375, 4.12158203125, 4.3837890625, 4.64599609375, 4.908203125, 5.17041015625, 5.4326171875, 5.69482421875, 5.95703125, 6.21923828125, 6.4814453125, 6.74365234375, 7.005859375, 7.26806640625, 7.5302734375, 7.79248046875, 8.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 9.0, 11.0, 11.0, 16.0, 22.0, 36.0, 61.0, 70.0, 102.0, 141.0, 175.0, 270.0, 392.0, 776.0, 2340.0, 19647.0, 496443.0, 3490405.0, 170377.0, 9516.0, 1546.0, 599.0, 402.0, 248.0, 171.0, 147.0, 80.0, 69.0, 58.0, 35.0, 25.0, 23.0, 15.0, 13.0, 9.0, 7.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -32.04052734375, -31.0185546875, -29.99658203125, -28.974609375, -27.95263671875, -26.9306640625, -25.90869140625, -24.88671875, -23.86474609375, -22.8427734375, -21.82080078125, -20.798828125, -19.77685546875, -18.7548828125, -17.73291015625, -16.7109375, -15.68896484375, -14.6669921875, -13.64501953125, -12.623046875, -11.60107421875, -10.5791015625, -9.55712890625, -8.53515625, -7.51318359375, -6.4912109375, -5.46923828125, -4.447265625, -3.42529296875, -2.4033203125, -1.38134765625, -0.359375, 0.66259765625, 1.6845703125, 2.70654296875, 3.728515625, 4.75048828125, 5.7724609375, 6.79443359375, 7.81640625, 8.83837890625, 9.8603515625, 10.88232421875, 11.904296875, 12.92626953125, 13.9482421875, 14.97021484375, 15.9921875, 17.01416015625, 18.0361328125, 19.05810546875, 20.080078125, 21.10205078125, 22.1240234375, 23.14599609375, 24.16796875, 25.18994140625, 26.2119140625, 27.23388671875, 28.255859375, 29.27783203125, 30.2998046875, 31.32177734375, 32.34375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 56.0, 399.0, 449.0, 99.0, 11.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.3268280029297, -184.35580444335938, -176.38479614257812, -168.4137725830078, -160.4427490234375, -152.47174072265625, -144.50071716308594, -136.52969360351562, -128.55868530273438, -120.5876693725586, -112.61665344238281, -104.6456298828125, -96.67461395263672, -88.70359802246094, -80.73257446289062, -72.76155853271484, -64.79054260253906, -56.81952667236328, -48.848506927490234, -40.87748718261719, -32.906471252441406, -24.935455322265625, -16.964435577392578, -8.993415832519531, -1.02239990234375, 6.948617935180664, 14.919635772705078, 22.890653610229492, 30.861671447753906, 38.83268737792969, 46.803707122802734, 54.77472686767578, 62.745758056640625, 70.7167739868164, 78.68778991699219, 86.6588134765625, 94.62982940673828, 102.60084533691406, 110.57186889648438, 118.54288482666016, 126.51390075683594, 134.48492431640625, 142.4559326171875, 150.4269561767578, 158.39797973632812, 166.36898803710938, 174.3400115966797, 182.31103515625, 190.28204345703125, 198.25306701660156, 206.2240753173828, 214.19509887695312, 222.16610717773438, 230.1371307373047, 238.108154296875, 246.07916259765625, 254.05018615722656, 262.0212097167969, 269.9922180175781, 277.9632263183594, 285.93426513671875, 293.9052734375, 301.87628173828125, 309.8473205566406, 317.8183288574219]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 6.0, 9.0, 12.0, 12.0, 11.0, 18.0, 18.0, 20.0, 34.0, 25.0, 24.0, 32.0, 28.0, 41.0, 32.0, 42.0, 34.0, 43.0, 39.0, 36.0, 39.0, 41.0, 36.0, 28.0, 43.0, 26.0, 23.0, 26.0, 19.0, 26.0, 19.0, 25.0, 24.0, 11.0, 7.0, 12.0, 12.0, 12.0, 11.0, 10.0, 3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.395179748535156, -33.359039306640625, -32.32290267944336, -31.286762237548828, -30.25062370300293, -29.21448516845703, -28.1783447265625, -27.1422061920166, -26.106067657470703, -25.069929122924805, -24.033790588378906, -22.997650146484375, -21.961511611938477, -20.925373077392578, -19.889232635498047, -18.85309410095215, -17.81695556640625, -16.78081703186035, -15.744677543640137, -14.708538055419922, -13.672399520874023, -12.636260986328125, -11.60012149810791, -10.563982009887695, -9.527843475341797, -8.491704940795898, -7.455565452575684, -6.419426441192627, -5.38328742980957, -4.347148418426514, -3.311009407043457, -2.2748703956604004, -1.2387313842773438, -0.2025923728942871, 0.8335466384887695, 1.8696856498718262, 2.905824661254883, 3.9419636726379395, 4.978102684020996, 6.014241695404053, 7.050380706787109, 8.086519241333008, 9.122658729553223, 10.158798217773438, 11.194936752319336, 12.231075286865234, 13.26721477508545, 14.303354263305664, 15.339492797851562, 16.37563133239746, 17.41176986694336, 18.44791030883789, 19.48404884338379, 20.520187377929688, 21.55632781982422, 22.592466354370117, 23.628604888916016, 24.664743423461914, 25.700881958007812, 26.737022399902344, 27.773160934448242, 28.80929946899414, 29.845439910888672, 30.88157844543457, 31.91771697998047]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 11.0, 8.0, 11.0, 15.0, 14.0, 14.0, 17.0, 20.0, 23.0, 29.0, 24.0, 30.0, 38.0, 40.0, 45.0, 44.0, 42.0, 44.0, 53.0, 41.0, 44.0, 44.0, 34.0, 39.0, 39.0, 28.0, 27.0, 25.0, 21.0, 21.0, 15.0, 20.0, 14.0, 9.0, 5.0, 10.0, 5.0, 14.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.266845703125, -5.08837890625, -4.909912109375, -4.7314453125, -4.552978515625, -4.37451171875, -4.196044921875, -4.017578125, -3.839111328125, -3.66064453125, -3.482177734375, -3.3037109375, -3.125244140625, -2.94677734375, -2.768310546875, -2.58984375, -2.411376953125, -2.23291015625, -2.054443359375, -1.8759765625, -1.697509765625, -1.51904296875, -1.340576171875, -1.162109375, -0.983642578125, -0.80517578125, -0.626708984375, -0.4482421875, -0.269775390625, -0.09130859375, 0.087158203125, 0.265625, 0.444091796875, 0.62255859375, 0.801025390625, 0.9794921875, 1.157958984375, 1.33642578125, 1.514892578125, 1.693359375, 1.871826171875, 2.05029296875, 2.228759765625, 2.4072265625, 2.585693359375, 2.76416015625, 2.942626953125, 3.12109375, 3.299560546875, 3.47802734375, 3.656494140625, 3.8349609375, 4.013427734375, 4.19189453125, 4.370361328125, 4.548828125, 4.727294921875, 4.90576171875, 5.084228515625, 5.2626953125, 5.441162109375, 5.61962890625, 5.798095703125, 5.9765625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 9.0, 14.0, 14.0, 26.0, 30.0, 42.0, 75.0, 110.0, 181.0, 229.0, 329.0, 484.0, 735.0, 1036.0, 1508.0, 2149.0, 2986.0, 4349.0, 6396.0, 9645.0, 14179.0, 21789.0, 33871.0, 54819.0, 90386.0, 154794.0, 215472.0, 167359.0, 99133.0, 59049.0, 36700.0, 23209.0, 15344.0, 10172.0, 6833.0, 4470.0, 3218.0, 2273.0, 1576.0, 1159.0, 762.0, 493.0, 366.0, 254.0, 180.0, 122.0, 90.0, 36.0, 38.0, 24.0, 14.0, 16.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.468994140625, -0.4541435241699219, -0.43929290771484375, -0.4244422912597656, -0.4095916748046875, -0.3947410583496094, -0.37989044189453125, -0.3650398254394531, -0.350189208984375, -0.3353385925292969, -0.32048797607421875, -0.3056373596191406, -0.2907867431640625, -0.2759361267089844, -0.26108551025390625, -0.24623489379882812, -0.23138427734375, -0.21653366088867188, -0.20168304443359375, -0.18683242797851562, -0.1719818115234375, -0.15713119506835938, -0.14228057861328125, -0.12742996215820312, -0.112579345703125, -0.09772872924804688, -0.08287811279296875, -0.06802749633789062, -0.0531768798828125, -0.038326263427734375, -0.02347564697265625, -0.008625030517578125, 0.0062255859375, 0.021076202392578125, 0.03592681884765625, 0.050777435302734375, 0.0656280517578125, 0.08047866821289062, 0.09532928466796875, 0.11017990112304688, 0.125030517578125, 0.13988113403320312, 0.15473175048828125, 0.16958236694335938, 0.1844329833984375, 0.19928359985351562, 0.21413421630859375, 0.22898483276367188, 0.24383544921875, 0.2586860656738281, 0.27353668212890625, 0.2883872985839844, 0.3032379150390625, 0.3180885314941406, 0.33293914794921875, 0.3477897644042969, 0.362640380859375, 0.3774909973144531, 0.39234161376953125, 0.4071922302246094, 0.4220428466796875, 0.4368934631347656, 0.45174407958984375, 0.4665946960449219, 0.4814453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 2.0, 4.0, 10.0, 8.0, 8.0, 11.0, 16.0, 16.0, 19.0, 19.0, 15.0, 22.0, 30.0, 19.0, 38.0, 31.0, 38.0, 41.0, 41.0, 42.0, 45.0, 1065.0, 49.0, 43.0, 51.0, 40.0, 36.0, 36.0, 37.0, 31.0, 29.0, 16.0, 14.0, 13.0, 14.0, 18.0, 7.0, 7.0, 15.0, 7.0, 4.0, 6.0, 4.0, 1.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.359375, -3.24566650390625, -3.1319580078125, -3.01824951171875, -2.904541015625, -2.79083251953125, -2.6771240234375, -2.56341552734375, -2.44970703125, -2.33599853515625, -2.2222900390625, -2.10858154296875, -1.994873046875, -1.88116455078125, -1.7674560546875, -1.65374755859375, -1.5400390625, -1.42633056640625, -1.3126220703125, -1.19891357421875, -1.085205078125, -0.97149658203125, -0.8577880859375, -0.74407958984375, -0.63037109375, -0.51666259765625, -0.4029541015625, -0.28924560546875, -0.175537109375, -0.06182861328125, 0.0518798828125, 0.16558837890625, 0.279296875, 0.39300537109375, 0.5067138671875, 0.62042236328125, 0.734130859375, 0.84783935546875, 0.9615478515625, 1.07525634765625, 1.18896484375, 1.30267333984375, 1.4163818359375, 1.53009033203125, 1.643798828125, 1.75750732421875, 1.8712158203125, 1.98492431640625, 2.0986328125, 2.21234130859375, 2.3260498046875, 2.43975830078125, 2.553466796875, 2.66717529296875, 2.7808837890625, 2.89459228515625, 3.00830078125, 3.12200927734375, 3.2357177734375, 3.34942626953125, 3.463134765625, 3.57684326171875, 3.6905517578125, 3.80426025390625, 3.91796875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 10.0, 14.0, 11.0, 37.0, 35.0, 54.0, 70.0, 122.0, 210.0, 310.0, 433.0, 745.0, 1235.0, 2200.0, 3757.0, 6756.0, 11640.0, 20353.0, 36418.0, 65354.0, 116384.0, 188471.0, 1268017.0, 160945.0, 93838.0, 52113.0, 28771.0, 16385.0, 9337.0, 5361.0, 3106.0, 1884.0, 1065.0, 623.0, 382.0, 237.0, 139.0, 92.0, 66.0, 47.0, 33.0, 16.0, 15.0, 18.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.32470703125, -0.3143348693847656, -0.30396270751953125, -0.2935905456542969, -0.2832183837890625, -0.2728462219238281, -0.26247406005859375, -0.2521018981933594, -0.241729736328125, -0.23135757446289062, -0.22098541259765625, -0.21061325073242188, -0.2002410888671875, -0.18986892700195312, -0.17949676513671875, -0.16912460327148438, -0.15875244140625, -0.14838027954101562, -0.13800811767578125, -0.12763595581054688, -0.1172637939453125, -0.10689163208007812, -0.09651947021484375, -0.08614730834960938, -0.075775146484375, -0.06540298461914062, -0.05503082275390625, -0.044658660888671875, -0.0342864990234375, -0.023914337158203125, -0.01354217529296875, -0.003170013427734375, 0.0072021484375, 0.017574310302734375, 0.02794647216796875, 0.038318634033203125, 0.0486907958984375, 0.059062957763671875, 0.06943511962890625, 0.07980728149414062, 0.090179443359375, 0.10055160522460938, 0.11092376708984375, 0.12129592895507812, 0.1316680908203125, 0.14204025268554688, 0.15241241455078125, 0.16278457641601562, 0.17315673828125, 0.18352890014648438, 0.19390106201171875, 0.20427322387695312, 0.2146453857421875, 0.22501754760742188, 0.23538970947265625, 0.24576187133789062, 0.256134033203125, 0.2665061950683594, 0.27687835693359375, 0.2872505187988281, 0.2976226806640625, 0.3079948425292969, 0.31836700439453125, 0.3287391662597656, 0.339111328125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 2.0, 2.0, 4.0, 12.0, 10.0, 13.0, 14.0, 15.0, 21.0, 29.0, 34.0, 42.0, 40.0, 53.0, 78.0, 66.0, 53.0, 54.0, 71.0, 67.0, 60.0, 40.0, 37.0, 33.0, 23.0, 20.0, 18.0, 16.0, 10.0, 9.0, 5.0, 6.0, 9.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002994537353515625, -0.002900153398513794, -0.002805769443511963, -0.002711385488510132, -0.0026170015335083008, -0.0025226175785064697, -0.0024282336235046387, -0.0023338496685028076, -0.0022394657135009766, -0.0021450817584991455, -0.0020506978034973145, -0.0019563138484954834, -0.0018619298934936523, -0.0017675459384918213, -0.0016731619834899902, -0.0015787780284881592, -0.0014843940734863281, -0.001390010118484497, -0.001295626163482666, -0.001201242208480835, -0.001106858253479004, -0.0010124742984771729, -0.0009180903434753418, -0.0008237063884735107, -0.0007293224334716797, -0.0006349384784698486, -0.0005405545234680176, -0.0004461705684661865, -0.00035178661346435547, -0.0002574026584625244, -0.00016301870346069336, -6.86347484588623e-05, 2.574920654296875e-05, 0.0001201331615447998, 0.00021451711654663086, 0.0003089010715484619, 0.00040328502655029297, 0.000497668981552124, 0.0005920529365539551, 0.0006864368915557861, 0.0007808208465576172, 0.0008752048015594482, 0.0009695887565612793, 0.0010639727115631104, 0.0011583566665649414, 0.0012527406215667725, 0.0013471245765686035, 0.0014415085315704346, 0.0015358924865722656, 0.0016302764415740967, 0.0017246603965759277, 0.0018190443515777588, 0.0019134283065795898, 0.002007812261581421, 0.002102196216583252, 0.002196580171585083, 0.002290964126586914, 0.002385348081588745, 0.002479732036590576, 0.0025741159915924072, 0.0026684999465942383, 0.0027628839015960693, 0.0028572678565979004, 0.0029516518115997314, 0.0030460357666015625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 9.0, 13.0, 9.0, 17.0, 27.0, 27.0, 48.0, 39.0, 61.0, 90.0, 137.0, 378.0, 1507.0, 8731.0, 78756.0, 836480.0, 108573.0, 10879.0, 1786.0, 450.0, 163.0, 94.0, 57.0, 40.0, 33.0, 25.0, 21.0, 11.0, 14.0, 13.0, 8.0, 5.0, 12.0, 5.0, 1.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.05902099609375, -0.057150840759277344, -0.05528068542480469, -0.05341053009033203, -0.051540374755859375, -0.04967021942138672, -0.04780006408691406, -0.045929908752441406, -0.04405975341796875, -0.042189598083496094, -0.04031944274902344, -0.03844928741455078, -0.036579132080078125, -0.03470897674560547, -0.03283882141113281, -0.030968666076660156, -0.0290985107421875, -0.027228355407714844, -0.025358200073242188, -0.02348804473876953, -0.021617889404296875, -0.01974773406982422, -0.017877578735351562, -0.016007423400878906, -0.01413726806640625, -0.012267112731933594, -0.010396957397460938, -0.008526802062988281, -0.006656646728515625, -0.004786491394042969, -0.0029163360595703125, -0.0010461807250976562, 0.000823974609375, 0.0026941299438476562, 0.0045642852783203125, 0.006434440612792969, 0.008304595947265625, 0.010174751281738281, 0.012044906616210938, 0.013915061950683594, 0.01578521728515625, 0.017655372619628906, 0.019525527954101562, 0.02139568328857422, 0.023265838623046875, 0.02513599395751953, 0.027006149291992188, 0.028876304626464844, 0.0307464599609375, 0.032616615295410156, 0.03448677062988281, 0.03635692596435547, 0.038227081298828125, 0.04009723663330078, 0.04196739196777344, 0.043837547302246094, 0.04570770263671875, 0.047577857971191406, 0.04944801330566406, 0.05131816864013672, 0.053188323974609375, 0.05505847930908203, 0.05692863464355469, 0.058798789978027344, 0.0606689453125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 8.0, 6.0, 11.0, 16.0, 20.0, 46.0, 55.0, 88.0, 133.0, 185.0, 160.0, 79.0, 53.0, 47.0, 24.0, 17.0, 18.0, 11.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0161150936037302, -0.015685705468058586, -0.015256316401064396, -0.01482692826539278, -0.01439753919839859, -0.013968151062726974, -0.013538762927055359, -0.013109373860061169, -0.012679984793066978, -0.012250596657395363, -0.011821207590401173, -0.011391819454729557, -0.010962430387735367, -0.010533042252063751, -0.010103654116392136, -0.009674265049397945, -0.00924487691372633, -0.008815488778054714, -0.008386099711060524, -0.007956711575388908, -0.007527322508394718, -0.007097934372723103, -0.0066685457713902, -0.006239157170057297, -0.005809768568724394, -0.005380379967391491, -0.004950991366058588, -0.004521602764725685, -0.0040922146290540695, -0.003662825794890523, -0.0032334374263882637, -0.002804048825055361, -0.0023746592923998833, -0.0019452706910669804, -0.0015158822061493993, -0.0010864937212318182, -0.0006571051198989153, -0.00022771651856601238, 0.00020167184993624687, 0.0006310604512691498, 0.0010604490526020527, 0.0014898376539349556, 0.0019192261388525367, 0.0023486146237701178, 0.0027780032251030207, 0.0032073918264359236, 0.003636780194938183, 0.004066168796271086, 0.004495557397603989, 0.0049249459989368916, 0.0053543346002697945, 0.00578372273594141, 0.0062131118029356, 0.006642499938607216, 0.007071888539940119, 0.007501277141273022, 0.007930666208267212, 0.008360054343938828, 0.008789443410933018, 0.009218831546604633, 0.009648220613598824, 0.01007760874927044, 0.010506996884942055, 0.010936385951936245, 0.01136577408760786]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 6.0, 6.0, 6.0, 7.0, 13.0, 18.0, 14.0, 13.0, 23.0, 23.0, 18.0, 27.0, 20.0, 24.0, 45.0, 38.0, 36.0, 36.0, 41.0, 43.0, 45.0, 42.0, 37.0, 49.0, 23.0, 29.0, 43.0, 35.0, 33.0, 23.0, 31.0, 27.0, 21.0, 21.0, 11.0, 10.0, 8.0, 11.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0017390847206115723, -0.001688213087618351, -0.0016373414546251297, -0.0015864698216319084, -0.0015355981886386871, -0.0014847265556454659, -0.0014338549226522446, -0.0013829832896590233, -0.001332111656665802, -0.0012812400236725807, -0.0012303683906793594, -0.0011794967576861382, -0.0011286251246929169, -0.0010777534916996956, -0.0010268818587064743, -0.000976010225713253, -0.0009251385927200317, -0.0008742669597268105, -0.0008233953267335892, -0.0007725236937403679, -0.0007216520607471466, -0.0006707804277539253, -0.000619908794760704, -0.0005690371617674828, -0.0005181655287742615, -0.0004672938957810402, -0.0004164222627878189, -0.0003655506297945976, -0.00031467899680137634, -0.00026380736380815506, -0.00021293573081493378, -0.0001620640978217125, -0.00011119246482849121, -6.032083183526993e-05, -9.449198842048645e-06, 4.142243415117264e-05, 9.229406714439392e-05, 0.0001431657001376152, 0.0001940373331308365, 0.00024490896612405777, 0.00029578059911727905, 0.00034665223211050034, 0.0003975238651037216, 0.0004483954980969429, 0.0004992671310901642, 0.0005501387640833855, 0.0006010103970766068, 0.000651882030069828, 0.0007027536630630493, 0.0007536252960562706, 0.0008044969290494919, 0.0008553685620427132, 0.0009062401950359344, 0.0009571118280291557, 0.001007983461022377, 0.0010588550940155983, 0.0011097267270088196, 0.0011605983600020409, 0.0012114699929952621, 0.0012623416259884834, 0.0013132132589817047, 0.001364084891974926, 0.0014149565249681473, 0.0014658281579613686, 0.0015166997909545898]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 11.0, 8.0, 11.0, 15.0, 14.0, 14.0, 17.0, 20.0, 23.0, 29.0, 24.0, 30.0, 38.0, 40.0, 45.0, 44.0, 42.0, 44.0, 53.0, 41.0, 44.0, 44.0, 34.0, 39.0, 39.0, 28.0, 27.0, 25.0, 21.0, 21.0, 15.0, 20.0, 14.0, 9.0, 5.0, 10.0, 5.0, 14.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.266845703125, -5.08837890625, -4.909912109375, -4.7314453125, -4.552978515625, -4.37451171875, -4.196044921875, -4.017578125, -3.839111328125, -3.66064453125, -3.482177734375, -3.3037109375, -3.125244140625, -2.94677734375, -2.768310546875, -2.58984375, -2.411376953125, -2.23291015625, -2.054443359375, -1.8759765625, -1.697509765625, -1.51904296875, -1.340576171875, -1.162109375, -0.983642578125, -0.80517578125, -0.626708984375, -0.4482421875, -0.269775390625, -0.09130859375, 0.087158203125, 0.265625, 0.444091796875, 0.62255859375, 0.801025390625, 0.9794921875, 1.157958984375, 1.33642578125, 1.514892578125, 1.693359375, 1.871826171875, 2.05029296875, 2.228759765625, 2.4072265625, 2.585693359375, 2.76416015625, 2.942626953125, 3.12109375, 3.299560546875, 3.47802734375, 3.656494140625, 3.8349609375, 4.013427734375, 4.19189453125, 4.370361328125, 4.548828125, 4.727294921875, 4.90576171875, 5.084228515625, 5.2626953125, 5.441162109375, 5.61962890625, 5.798095703125, 5.9765625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 16.0, 29.0, 41.0, 54.0, 93.0, 111.0, 222.0, 386.0, 651.0, 1140.0, 2035.0, 3667.0, 6769.0, 12357.0, 23396.0, 45216.0, 99328.0, 265118.0, 337564.0, 132291.0, 56663.0, 28257.0, 14899.0, 8019.0, 4473.0, 2507.0, 1331.0, 787.0, 442.0, 247.0, 146.0, 95.0, 61.0, 38.0, 32.0, 21.0, 10.0, 10.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.4140625, -6.22625732421875, -6.0384521484375, -5.85064697265625, -5.662841796875, -5.47503662109375, -5.2872314453125, -5.09942626953125, -4.91162109375, -4.72381591796875, -4.5360107421875, -4.34820556640625, -4.160400390625, -3.97259521484375, -3.7847900390625, -3.59698486328125, -3.4091796875, -3.22137451171875, -3.0335693359375, -2.84576416015625, -2.657958984375, -2.47015380859375, -2.2823486328125, -2.09454345703125, -1.90673828125, -1.71893310546875, -1.5311279296875, -1.34332275390625, -1.155517578125, -0.96771240234375, -0.7799072265625, -0.59210205078125, -0.404296875, -0.21649169921875, -0.0286865234375, 0.15911865234375, 0.346923828125, 0.53472900390625, 0.7225341796875, 0.91033935546875, 1.09814453125, 1.28594970703125, 1.4737548828125, 1.66156005859375, 1.849365234375, 2.03717041015625, 2.2249755859375, 2.41278076171875, 2.6005859375, 2.78839111328125, 2.9761962890625, 3.16400146484375, 3.351806640625, 3.53961181640625, 3.7274169921875, 3.91522216796875, 4.10302734375, 4.29083251953125, 4.4786376953125, 4.66644287109375, 4.854248046875, 5.04205322265625, 5.2298583984375, 5.41766357421875, 5.60546875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 5.0, 6.0, 6.0, 14.0, 12.0, 10.0, 22.0, 23.0, 23.0, 23.0, 25.0, 29.0, 24.0, 39.0, 44.0, 46.0, 66.0, 81.0, 160.0, 290.0, 1359.0, 194.0, 87.0, 62.0, 56.0, 41.0, 33.0, 39.0, 33.0, 18.0, 16.0, 21.0, 25.0, 26.0, 21.0, 12.0, 8.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-16.859375, -16.351318359375, -15.84326171875, -15.335205078125, -14.8271484375, -14.319091796875, -13.81103515625, -13.302978515625, -12.794921875, -12.286865234375, -11.77880859375, -11.270751953125, -10.7626953125, -10.254638671875, -9.74658203125, -9.238525390625, -8.73046875, -8.222412109375, -7.71435546875, -7.206298828125, -6.6982421875, -6.190185546875, -5.68212890625, -5.174072265625, -4.666015625, -4.157958984375, -3.64990234375, -3.141845703125, -2.6337890625, -2.125732421875, -1.61767578125, -1.109619140625, -0.6015625, -0.093505859375, 0.41455078125, 0.922607421875, 1.4306640625, 1.938720703125, 2.44677734375, 2.954833984375, 3.462890625, 3.970947265625, 4.47900390625, 4.987060546875, 5.4951171875, 6.003173828125, 6.51123046875, 7.019287109375, 7.52734375, 8.035400390625, 8.54345703125, 9.051513671875, 9.5595703125, 10.067626953125, 10.57568359375, 11.083740234375, 11.591796875, 12.099853515625, 12.60791015625, 13.115966796875, 13.6240234375, 14.132080078125, 14.64013671875, 15.148193359375, 15.65625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 3.0, 9.0, 6.0, 9.0, 12.0, 14.0, 14.0, 31.0, 47.0, 40.0, 65.0, 66.0, 82.0, 147.0, 159.0, 250.0, 500.0, 1540.0, 11243.0, 229240.0, 2812931.0, 81185.0, 5785.0, 1035.0, 383.0, 218.0, 133.0, 126.0, 95.0, 75.0, 58.0, 43.0, 34.0, 28.0, 19.0, 13.0, 20.0, 8.0, 7.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.9375, -29.01220703125, -28.0869140625, -27.16162109375, -26.236328125, -25.31103515625, -24.3857421875, -23.46044921875, -22.53515625, -21.60986328125, -20.6845703125, -19.75927734375, -18.833984375, -17.90869140625, -16.9833984375, -16.05810546875, -15.1328125, -14.20751953125, -13.2822265625, -12.35693359375, -11.431640625, -10.50634765625, -9.5810546875, -8.65576171875, -7.73046875, -6.80517578125, -5.8798828125, -4.95458984375, -4.029296875, -3.10400390625, -2.1787109375, -1.25341796875, -0.328125, 0.59716796875, 1.5224609375, 2.44775390625, 3.373046875, 4.29833984375, 5.2236328125, 6.14892578125, 7.07421875, 7.99951171875, 8.9248046875, 9.85009765625, 10.775390625, 11.70068359375, 12.6259765625, 13.55126953125, 14.4765625, 15.40185546875, 16.3271484375, 17.25244140625, 18.177734375, 19.10302734375, 20.0283203125, 20.95361328125, 21.87890625, 22.80419921875, 23.7294921875, 24.65478515625, 25.580078125, 26.50537109375, 27.4306640625, 28.35595703125, 29.28125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 56.0, 197.0, 361.0, 272.0, 106.0, 12.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.19447898864746, -24.408601760864258, -21.622724533081055, -18.83684730529785, -16.05097007751465, -13.265092849731445, -10.479215621948242, -7.693338394165039, -4.907461166381836, -2.121583938598633, 0.6642932891845703, 3.4501705169677734, 6.236047744750977, 9.02192497253418, 11.807802200317383, 14.593679428100586, 17.37955665588379, 20.165433883666992, 22.951311111450195, 25.7371883392334, 28.5230655670166, 31.308942794799805, 34.094818115234375, 36.880699157714844, 39.66657257080078, 42.452449798583984, 45.23832702636719, 48.02420425415039, 50.810081481933594, 53.5959587097168, 56.3818359375, 59.1677131652832, 61.95359802246094, 64.73947143554688, 67.52535247802734, 70.31123352050781, 73.09710693359375, 75.88298034667969, 78.66886138916016, 81.45474243164062, 84.24061584472656, 87.0264892578125, 89.81237030029297, 92.59825134277344, 95.38412475585938, 98.16999816894531, 100.95587921142578, 103.74176025390625, 106.52763366699219, 109.31350708007812, 112.0993881225586, 114.88526916503906, 117.671142578125, 120.45701599121094, 123.2428970336914, 126.02877807617188, 128.8146514892578, 131.60052490234375, 134.38641357421875, 137.1722869873047, 139.95816040039062, 142.74403381347656, 145.5299072265625, 148.3157958984375, 151.10166931152344]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 8.0, 6.0, 15.0, 20.0, 20.0, 14.0, 16.0, 21.0, 16.0, 20.0, 27.0, 29.0, 39.0, 34.0, 37.0, 30.0, 37.0, 44.0, 53.0, 39.0, 33.0, 52.0, 36.0, 39.0, 37.0, 37.0, 26.0, 19.0, 25.0, 23.0, 22.0, 23.0, 30.0, 10.0, 9.0, 8.0, 7.0, 10.0, 7.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.20503234863281, -41.78216552734375, -40.35929489135742, -38.93642807006836, -37.5135612487793, -36.09069061279297, -34.667823791503906, -33.244956970214844, -31.82208824157715, -30.399219512939453, -28.97635269165039, -27.553483963012695, -26.130615234375, -24.707748413085938, -23.284879684448242, -21.862010955810547, -20.439144134521484, -19.01627540588379, -17.593408584594727, -16.17053985595703, -14.747672080993652, -13.324804306030273, -11.901935577392578, -10.4790678024292, -9.05620002746582, -7.633332252502441, -6.210464000701904, -4.787595748901367, -3.3647279739379883, -1.9418601989746094, -0.5189914703369141, 0.9038763046264648, 2.3267440795898438, 3.7496120929718018, 5.17248010635376, 6.595348358154297, 8.018216133117676, 9.441083908081055, 10.86395263671875, 12.286820411682129, 13.709688186645508, 15.132555961608887, 16.555423736572266, 17.97829246520996, 19.401161193847656, 20.82402801513672, 22.246896743774414, 23.66976547241211, 25.092632293701172, 26.515501022338867, 27.93836784362793, 29.361236572265625, 30.784103393554688, 32.20697021484375, 33.62984085083008, 35.05270767211914, 36.47557830810547, 37.89844512939453, 39.32131576538086, 40.74418258666992, 42.167049407958984, 43.58992004394531, 45.012786865234375, 46.43565368652344, 47.8585205078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 7.0, 5.0, 13.0, 14.0, 12.0, 12.0, 10.0, 19.0, 30.0, 23.0, 26.0, 23.0, 27.0, 28.0, 38.0, 33.0, 44.0, 47.0, 39.0, 36.0, 45.0, 41.0, 47.0, 39.0, 28.0, 29.0, 32.0, 29.0, 32.0, 30.0, 20.0, 17.0, 14.0, 18.0, 11.0, 10.0, 14.0, 14.0, 9.0, 4.0, 5.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-5.3046875, -5.135009765625, -4.96533203125, -4.795654296875, -4.6259765625, -4.456298828125, -4.28662109375, -4.116943359375, -3.947265625, -3.777587890625, -3.60791015625, -3.438232421875, -3.2685546875, -3.098876953125, -2.92919921875, -2.759521484375, -2.58984375, -2.420166015625, -2.25048828125, -2.080810546875, -1.9111328125, -1.741455078125, -1.57177734375, -1.402099609375, -1.232421875, -1.062744140625, -0.89306640625, -0.723388671875, -0.5537109375, -0.384033203125, -0.21435546875, -0.044677734375, 0.125, 0.294677734375, 0.46435546875, 0.634033203125, 0.8037109375, 0.973388671875, 1.14306640625, 1.312744140625, 1.482421875, 1.652099609375, 1.82177734375, 1.991455078125, 2.1611328125, 2.330810546875, 2.50048828125, 2.670166015625, 2.83984375, 3.009521484375, 3.17919921875, 3.348876953125, 3.5185546875, 3.688232421875, 3.85791015625, 4.027587890625, 4.197265625, 4.366943359375, 4.53662109375, 4.706298828125, 4.8759765625, 5.045654296875, 5.21533203125, 5.385009765625, 5.5546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 5.0, 4.0, 3.0, 6.0, 11.0, 17.0, 18.0, 21.0, 22.0, 29.0, 35.0, 70.0, 133.0, 237.0, 501.0, 1486.0, 4381.0, 15848.0, 65850.0, 402493.0, 2469447.0, 1054254.0, 138195.0, 29221.0, 7964.0, 2405.0, 768.0, 360.0, 165.0, 86.0, 67.0, 40.0, 26.0, 19.0, 22.0, 7.0, 15.0, 10.0, 11.0, 7.0, 4.0, 6.0, 0.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.1953125, -13.7864990234375, -13.377685546875, -12.9688720703125, -12.56005859375, -12.1512451171875, -11.742431640625, -11.3336181640625, -10.9248046875, -10.5159912109375, -10.107177734375, -9.6983642578125, -9.28955078125, -8.8807373046875, -8.471923828125, -8.0631103515625, -7.654296875, -7.2454833984375, -6.836669921875, -6.4278564453125, -6.01904296875, -5.6102294921875, -5.201416015625, -4.7926025390625, -4.3837890625, -3.9749755859375, -3.566162109375, -3.1573486328125, -2.74853515625, -2.3397216796875, -1.930908203125, -1.5220947265625, -1.11328125, -0.7044677734375, -0.295654296875, 0.1131591796875, 0.52197265625, 0.9307861328125, 1.339599609375, 1.7484130859375, 2.1572265625, 2.5660400390625, 2.974853515625, 3.3836669921875, 3.79248046875, 4.2012939453125, 4.610107421875, 5.0189208984375, 5.427734375, 5.8365478515625, 6.245361328125, 6.6541748046875, 7.06298828125, 7.4718017578125, 7.880615234375, 8.2894287109375, 8.6982421875, 9.1070556640625, 9.515869140625, 9.9246826171875, 10.33349609375, 10.7423095703125, 11.151123046875, 11.5599365234375, 11.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 12.0, 11.0, 17.0, 28.0, 31.0, 32.0, 47.0, 88.0, 94.0, 132.0, 180.0, 267.0, 319.0, 433.0, 449.0, 475.0, 381.0, 239.0, 209.0, 140.0, 109.0, 93.0, 52.0, 59.0, 40.0, 35.0, 26.0, 13.0, 14.0, 10.0, 7.0, 5.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6015625, -7.2818603515625, -6.962158203125, -6.6424560546875, -6.32275390625, -6.0030517578125, -5.683349609375, -5.3636474609375, -5.0439453125, -4.7242431640625, -4.404541015625, -4.0848388671875, -3.76513671875, -3.4454345703125, -3.125732421875, -2.8060302734375, -2.486328125, -2.1666259765625, -1.846923828125, -1.5272216796875, -1.20751953125, -0.8878173828125, -0.568115234375, -0.2484130859375, 0.0712890625, 0.3909912109375, 0.710693359375, 1.0303955078125, 1.35009765625, 1.6697998046875, 1.989501953125, 2.3092041015625, 2.62890625, 2.9486083984375, 3.268310546875, 3.5880126953125, 3.90771484375, 4.2274169921875, 4.547119140625, 4.8668212890625, 5.1865234375, 5.5062255859375, 5.825927734375, 6.1456298828125, 6.46533203125, 6.7850341796875, 7.104736328125, 7.4244384765625, 7.744140625, 8.0638427734375, 8.383544921875, 8.7032470703125, 9.02294921875, 9.3426513671875, 9.662353515625, 9.9820556640625, 10.3017578125, 10.6214599609375, 10.941162109375, 11.2608642578125, 11.58056640625, 11.9002685546875, 12.219970703125, 12.5396728515625, 12.859375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 8.0, 21.0, 36.0, 27.0, 30.0, 48.0, 61.0, 98.0, 108.0, 177.0, 200.0, 319.0, 727.0, 3727.0, 37358.0, 938763.0, 3099937.0, 101979.0, 7994.0, 1294.0, 449.0, 261.0, 164.0, 119.0, 100.0, 69.0, 50.0, 38.0, 31.0, 29.0, 15.0, 10.0, 6.0, 4.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.09375, -40.017333984375, -38.94091796875, -37.864501953125, -36.7880859375, -35.711669921875, -34.63525390625, -33.558837890625, -32.482421875, -31.406005859375, -30.32958984375, -29.253173828125, -28.1767578125, -27.100341796875, -26.02392578125, -24.947509765625, -23.87109375, -22.794677734375, -21.71826171875, -20.641845703125, -19.5654296875, -18.489013671875, -17.41259765625, -16.336181640625, -15.259765625, -14.183349609375, -13.10693359375, -12.030517578125, -10.9541015625, -9.877685546875, -8.80126953125, -7.724853515625, -6.6484375, -5.572021484375, -4.49560546875, -3.419189453125, -2.3427734375, -1.266357421875, -0.18994140625, 0.886474609375, 1.962890625, 3.039306640625, 4.11572265625, 5.192138671875, 6.2685546875, 7.344970703125, 8.42138671875, 9.497802734375, 10.57421875, 11.650634765625, 12.72705078125, 13.803466796875, 14.8798828125, 15.956298828125, 17.03271484375, 18.109130859375, 19.185546875, 20.261962890625, 21.33837890625, 22.414794921875, 23.4912109375, 24.567626953125, 25.64404296875, 26.720458984375, 27.796875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 45.0, 221.0, 412.0, 260.0, 68.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.3444595336914, -118.566650390625, -112.7888412475586, -107.01103210449219, -101.23323059082031, -95.4554214477539, -89.6776123046875, -83.89981079101562, -78.12199401855469, -72.34418487548828, -66.56637573242188, -60.788570404052734, -55.010765075683594, -49.23295593261719, -43.45514678955078, -37.67734146118164, -31.8995361328125, -26.121728897094727, -20.343921661376953, -14.566112518310547, -8.788305282592773, -3.010498046875, 2.7673110961914062, 8.545116424560547, 14.322925567626953, 20.100732803344727, 25.8785400390625, 31.656349182128906, 37.43415832519531, 43.21196365356445, 48.98977279663086, 54.767578125, 60.545379638671875, 66.32318878173828, 72.10099792480469, 77.87879943847656, 83.65660858154297, 89.43441772460938, 95.21222686767578, 100.99003601074219, 106.76783752441406, 112.54564666748047, 118.32345581054688, 124.10125732421875, 129.8790740966797, 135.65687561035156, 141.4346923828125, 147.21249389648438, 152.99029541015625, 158.76809692382812, 164.54591369628906, 170.32371520996094, 176.10153198242188, 181.87933349609375, 187.65713500976562, 193.43495178222656, 199.2127685546875, 204.99057006835938, 210.7683868408203, 216.5461883544922, 222.32400512695312, 228.101806640625, 233.87960815429688, 239.6574249267578, 245.4352264404297]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 9.0, 7.0, 11.0, 11.0, 13.0, 11.0, 14.0, 16.0, 27.0, 19.0, 37.0, 32.0, 38.0, 36.0, 36.0, 38.0, 48.0, 40.0, 43.0, 34.0, 38.0, 35.0, 45.0, 50.0, 26.0, 34.0, 39.0, 29.0, 29.0, 24.0, 20.0, 18.0, 15.0, 23.0, 8.0, 8.0, 6.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.95263671875, -31.8546142578125, -30.756591796875, -29.6585693359375, -28.560546875, -27.4625244140625, -26.364503860473633, -25.266481399536133, -24.168458938598633, -23.070436477661133, -21.972414016723633, -20.874391555786133, -19.776371002197266, -18.678348541259766, -17.580326080322266, -16.482303619384766, -15.384281158447266, -14.286258697509766, -13.188236236572266, -12.090214729309082, -10.992192268371582, -9.894169807434082, -8.796148300170898, -7.698125839233398, -6.600103378295898, -5.502080917358398, -4.404058933258057, -3.3060367107391357, -2.208014488220215, -1.1099920272827148, -0.011970043182373047, 1.0860519409179688, 2.1840744018554688, 3.2820966243743896, 4.3801188468933105, 5.478140830993652, 6.576163291931152, 7.674185752868652, 8.772207260131836, 9.870229721069336, 10.968252182006836, 12.066274642944336, 13.164297103881836, 14.26231861114502, 15.36034107208252, 16.458362579345703, 17.556385040283203, 18.654407501220703, 19.752429962158203, 20.850452423095703, 21.948474884033203, 23.046497344970703, 24.144519805908203, 25.242542266845703, 26.34056282043457, 27.43858528137207, 28.53660774230957, 29.63463020324707, 30.73265266418457, 31.83067512512207, 32.92869567871094, 34.02671813964844, 35.12474060058594, 36.22276306152344, 37.32078552246094]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 8.0, 5.0, 9.0, 13.0, 14.0, 14.0, 12.0, 20.0, 16.0, 24.0, 27.0, 34.0, 38.0, 36.0, 42.0, 41.0, 26.0, 39.0, 43.0, 48.0, 45.0, 38.0, 27.0, 40.0, 34.0, 32.0, 38.0, 32.0, 27.0, 25.0, 29.0, 15.0, 18.0, 12.0, 10.0, 10.0, 11.0, 7.0, 10.0, 6.0, 4.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.1168212890625, -4.940673828125, -4.7645263671875, -4.58837890625, -4.4122314453125, -4.236083984375, -4.0599365234375, -3.8837890625, -3.7076416015625, -3.531494140625, -3.3553466796875, -3.17919921875, -3.0030517578125, -2.826904296875, -2.6507568359375, -2.474609375, -2.2984619140625, -2.122314453125, -1.9461669921875, -1.77001953125, -1.5938720703125, -1.417724609375, -1.2415771484375, -1.0654296875, -0.8892822265625, -0.713134765625, -0.5369873046875, -0.36083984375, -0.1846923828125, -0.008544921875, 0.1676025390625, 0.34375, 0.5198974609375, 0.696044921875, 0.8721923828125, 1.04833984375, 1.2244873046875, 1.400634765625, 1.5767822265625, 1.7529296875, 1.9290771484375, 2.105224609375, 2.2813720703125, 2.45751953125, 2.6336669921875, 2.809814453125, 2.9859619140625, 3.162109375, 3.3382568359375, 3.514404296875, 3.6905517578125, 3.86669921875, 4.0428466796875, 4.218994140625, 4.3951416015625, 4.5712890625, 4.7474365234375, 4.923583984375, 5.0997314453125, 5.27587890625, 5.4520263671875, 5.628173828125, 5.8043212890625, 5.98046875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 7.0, 9.0, 7.0, 14.0, 27.0, 28.0, 45.0, 81.0, 122.0, 173.0, 239.0, 448.0, 644.0, 1090.0, 1750.0, 2917.0, 4902.0, 8327.0, 13831.0, 23790.0, 42932.0, 79968.0, 158585.0, 262641.0, 208138.0, 107752.0, 55784.0, 30747.0, 17696.0, 10200.0, 6110.0, 3735.0, 2187.0, 1342.0, 839.0, 496.0, 355.0, 202.0, 130.0, 92.0, 59.0, 35.0, 28.0, 18.0, 14.0, 1.0, 11.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6035308837890625, -0.584503173828125, -0.5654754638671875, -0.54644775390625, -0.5274200439453125, -0.508392333984375, -0.4893646240234375, -0.4703369140625, -0.4513092041015625, -0.432281494140625, -0.4132537841796875, -0.39422607421875, -0.3751983642578125, -0.356170654296875, -0.3371429443359375, -0.318115234375, -0.2990875244140625, -0.280059814453125, -0.2610321044921875, -0.24200439453125, -0.2229766845703125, -0.203948974609375, -0.1849212646484375, -0.1658935546875, -0.1468658447265625, -0.127838134765625, -0.1088104248046875, -0.08978271484375, -0.0707550048828125, -0.051727294921875, -0.0326995849609375, -0.013671875, 0.0053558349609375, 0.024383544921875, 0.0434112548828125, 0.06243896484375, 0.0814666748046875, 0.100494384765625, 0.1195220947265625, 0.1385498046875, 0.1575775146484375, 0.176605224609375, 0.1956329345703125, 0.21466064453125, 0.2336883544921875, 0.252716064453125, 0.2717437744140625, 0.290771484375, 0.3097991943359375, 0.328826904296875, 0.3478546142578125, 0.36688232421875, 0.3859100341796875, 0.404937744140625, 0.4239654541015625, 0.4429931640625, 0.4620208740234375, 0.481048583984375, 0.5000762939453125, 0.51910400390625, 0.5381317138671875, 0.557159423828125, 0.5761871337890625, 0.59521484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 8.0, 18.0, 6.0, 20.0, 15.0, 16.0, 26.0, 28.0, 20.0, 26.0, 26.0, 32.0, 31.0, 36.0, 28.0, 32.0, 41.0, 37.0, 54.0, 1054.0, 36.0, 39.0, 35.0, 39.0, 31.0, 36.0, 29.0, 38.0, 23.0, 19.0, 20.0, 19.0, 14.0, 20.0, 8.0, 15.0, 11.0, 8.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-4.0234375, -3.907012939453125, -3.79058837890625, -3.674163818359375, -3.5577392578125, -3.441314697265625, -3.32489013671875, -3.208465576171875, -3.092041015625, -2.975616455078125, -2.85919189453125, -2.742767333984375, -2.6263427734375, -2.509918212890625, -2.39349365234375, -2.277069091796875, -2.16064453125, -2.044219970703125, -1.92779541015625, -1.811370849609375, -1.6949462890625, -1.578521728515625, -1.46209716796875, -1.345672607421875, -1.229248046875, -1.112823486328125, -0.99639892578125, -0.879974365234375, -0.7635498046875, -0.647125244140625, -0.53070068359375, -0.414276123046875, -0.2978515625, -0.181427001953125, -0.06500244140625, 0.051422119140625, 0.1678466796875, 0.284271240234375, 0.40069580078125, 0.517120361328125, 0.633544921875, 0.749969482421875, 0.86639404296875, 0.982818603515625, 1.0992431640625, 1.215667724609375, 1.33209228515625, 1.448516845703125, 1.56494140625, 1.681365966796875, 1.79779052734375, 1.914215087890625, 2.0306396484375, 2.147064208984375, 2.26348876953125, 2.379913330078125, 2.496337890625, 2.612762451171875, 2.72918701171875, 2.845611572265625, 2.9620361328125, 3.078460693359375, 3.19488525390625, 3.311309814453125, 3.427734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 2.0, 9.0, 12.0, 21.0, 21.0, 37.0, 38.0, 63.0, 77.0, 129.0, 215.0, 327.0, 522.0, 794.0, 1375.0, 2253.0, 3784.0, 6184.0, 10562.0, 17663.0, 30737.0, 53792.0, 92458.0, 149900.0, 1247823.0, 183972.0, 121693.0, 72048.0, 41722.0, 24020.0, 14028.0, 8221.0, 4842.0, 3005.0, 1775.0, 1085.0, 670.0, 436.0, 272.0, 155.0, 124.0, 77.0, 54.0, 35.0, 33.0, 23.0, 13.0, 9.0, 12.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.31396484375, -0.3037605285644531, -0.29355621337890625, -0.2833518981933594, -0.2731475830078125, -0.2629432678222656, -0.25273895263671875, -0.24253463745117188, -0.232330322265625, -0.22212600708007812, -0.21192169189453125, -0.20171737670898438, -0.1915130615234375, -0.18130874633789062, -0.17110443115234375, -0.16090011596679688, -0.15069580078125, -0.14049148559570312, -0.13028717041015625, -0.12008285522460938, -0.1098785400390625, -0.09967422485351562, -0.08946990966796875, -0.07926559448242188, -0.069061279296875, -0.058856964111328125, -0.04865264892578125, -0.038448333740234375, -0.0282440185546875, -0.018039703369140625, -0.00783538818359375, 0.002368927001953125, 0.0125732421875, 0.022777557373046875, 0.03298187255859375, 0.043186187744140625, 0.0533905029296875, 0.06359481811523438, 0.07379913330078125, 0.08400344848632812, 0.094207763671875, 0.10441207885742188, 0.11461639404296875, 0.12482070922851562, 0.1350250244140625, 0.14522933959960938, 0.15543365478515625, 0.16563796997070312, 0.17584228515625, 0.18604660034179688, 0.19625091552734375, 0.20645523071289062, 0.2166595458984375, 0.22686386108398438, 0.23706817626953125, 0.24727249145507812, 0.257476806640625, 0.2676811218261719, 0.27788543701171875, 0.2880897521972656, 0.2982940673828125, 0.3084983825683594, 0.31870269775390625, 0.3289070129394531, 0.339111328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 14.0, 12.0, 21.0, 28.0, 34.0, 64.0, 100.0, 153.0, 154.0, 112.0, 80.0, 53.0, 34.0, 28.0, 15.0, 17.0, 10.0, 9.0, 3.0, 5.0, 4.0, 3.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00548553466796875, -0.005334198474884033, -0.005182862281799316, -0.0050315260887146, -0.004880189895629883, -0.004728853702545166, -0.004577517509460449, -0.004426181316375732, -0.004274845123291016, -0.004123508930206299, -0.003972172737121582, -0.0038208365440368652, -0.0036695003509521484, -0.0035181641578674316, -0.003366827964782715, -0.003215491771697998, -0.0030641555786132812, -0.0029128193855285645, -0.0027614831924438477, -0.002610146999359131, -0.002458810806274414, -0.0023074746131896973, -0.0021561384201049805, -0.0020048022270202637, -0.0018534660339355469, -0.00170212984085083, -0.0015507936477661133, -0.0013994574546813965, -0.0012481212615966797, -0.0010967850685119629, -0.0009454488754272461, -0.0007941126823425293, -0.0006427764892578125, -0.0004914402961730957, -0.0003401041030883789, -0.0001887679100036621, -3.743171691894531e-05, 0.00011390447616577148, 0.0002652406692504883, 0.0004165768623352051, 0.0005679130554199219, 0.0007192492485046387, 0.0008705854415893555, 0.0010219216346740723, 0.001173257827758789, 0.0013245940208435059, 0.0014759302139282227, 0.0016272664070129395, 0.0017786026000976562, 0.001929938793182373, 0.00208127498626709, 0.0022326111793518066, 0.0023839473724365234, 0.0025352835655212402, 0.002686619758605957, 0.002837955951690674, 0.0029892921447753906, 0.0031406283378601074, 0.0032919645309448242, 0.003443300724029541, 0.003594636917114258, 0.0037459731101989746, 0.0038973093032836914, 0.004048645496368408, 0.004199981689453125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 4.0, 9.0, 10.0, 7.0, 8.0, 13.0, 14.0, 26.0, 30.0, 50.0, 81.0, 115.0, 263.0, 1179.0, 36338.0, 992698.0, 16432.0, 733.0, 177.0, 104.0, 67.0, 50.0, 25.0, 24.0, 14.0, 16.0, 7.0, 8.0, 3.0, 5.0, 5.0, 3.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08282470703125, -0.08000850677490234, -0.07719230651855469, -0.07437610626220703, -0.07155990600585938, -0.06874370574951172, -0.06592750549316406, -0.0631113052368164, -0.06029510498046875, -0.057478904724121094, -0.05466270446777344, -0.05184650421142578, -0.049030303955078125, -0.04621410369873047, -0.04339790344238281, -0.040581703186035156, -0.0377655029296875, -0.034949302673339844, -0.03213310241699219, -0.02931690216064453, -0.026500701904296875, -0.02368450164794922, -0.020868301391601562, -0.018052101135253906, -0.01523590087890625, -0.012419700622558594, -0.009603500366210938, -0.006787300109863281, -0.003971099853515625, -0.0011548995971679688, 0.0016613006591796875, 0.004477500915527344, 0.007293701171875, 0.010109901428222656, 0.012926101684570312, 0.01574230194091797, 0.018558502197265625, 0.02137470245361328, 0.024190902709960938, 0.027007102966308594, 0.02982330322265625, 0.032639503479003906, 0.03545570373535156, 0.03827190399169922, 0.041088104248046875, 0.04390430450439453, 0.04672050476074219, 0.049536705017089844, 0.0523529052734375, 0.055169105529785156, 0.05798530578613281, 0.06080150604248047, 0.06361770629882812, 0.06643390655517578, 0.06925010681152344, 0.0720663070678711, 0.07488250732421875, 0.0776987075805664, 0.08051490783691406, 0.08333110809326172, 0.08614730834960938, 0.08896350860595703, 0.09177970886230469, 0.09459590911865234, 0.097412109375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 16.0, 85.0, 662.0, 217.0, 33.0, 2.0], "bins": [-0.08191760629415512, -0.08056759834289551, -0.0792175903916359, -0.07786757498979568, -0.07651756703853607, -0.07516755908727646, -0.07381755113601685, -0.07246753573417664, -0.07111752778291702, -0.06976751983165741, -0.0684175118803978, -0.06706749647855759, -0.06571748852729797, -0.06436748057603836, -0.06301747262477875, -0.061667460948228836, -0.060317449271678925, -0.05896744132041931, -0.0576174296438694, -0.05626742169260979, -0.054917410016059875, -0.05356740206480026, -0.05221739038825035, -0.05086738243699074, -0.049517374485731125, -0.04816736653447151, -0.0468173548579216, -0.04546734690666199, -0.044117335230112076, -0.04276732727885246, -0.04141731560230255, -0.04006730765104294, -0.038717299699783325, -0.03736729174852371, -0.0360172800719738, -0.03466727212071419, -0.033317260444164276, -0.03196725249290466, -0.03061724081635475, -0.02926723286509514, -0.027917221188545227, -0.026567211374640465, -0.025217201560735703, -0.02386719174683094, -0.022517181932926178, -0.021167172119021416, -0.019817162305116653, -0.01846715435385704, -0.017117144539952278, -0.015767134726047516, -0.014417124912142754, -0.013067115098237991, -0.011717105284333229, -0.010367095470428467, -0.00901708658784628, -0.007667076773941517, -0.006317066494375467, -0.004967056680470705, -0.0036170470993965864, -0.002267037518322468, -0.0009170277044177055, 0.00043298210948705673, 0.0017829914577305317, 0.003133001271635294, 0.004483011085540056]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 9.0, 14.0, 15.0, 20.0, 26.0, 24.0, 31.0, 31.0, 36.0, 35.0, 51.0, 52.0, 40.0, 55.0, 57.0, 49.0, 60.0, 35.0, 55.0, 40.0, 32.0, 37.0, 33.0, 30.0, 27.0, 20.0, 12.0, 16.0, 13.0, 6.0, 12.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002838134765625, -0.0027212779968976974, -0.002604421228170395, -0.0024875644594430923, -0.00237070769071579, -0.0022538509219884872, -0.0021369941532611847, -0.002020137384533882, -0.0019032806158065796, -0.001786423847079277, -0.0016695670783519745, -0.001552710309624672, -0.0014358535408973694, -0.0013189967721700668, -0.0012021400034427643, -0.0010852832347154617, -0.0009684264659881592, -0.0008515696972608566, -0.0007347129285335541, -0.0006178561598062515, -0.000500999391078949, -0.0003841426223516464, -0.00026728585362434387, -0.00015042908489704132, -3.357231616973877e-05, 8.328445255756378e-05, 0.00020014122128486633, 0.0003169979900121689, 0.00043385475873947144, 0.000550711527466774, 0.0006675682961940765, 0.0007844250649213791, 0.0009012818336486816, 0.0010181386023759842, 0.0011349953711032867, 0.0012518521398305893, 0.0013687089085578918, 0.0014855656772851944, 0.001602422446012497, 0.0017192792147397995, 0.001836135983467102, 0.0019529927521944046, 0.002069849520921707, 0.0021867062896490097, 0.0023035630583763123, 0.002420419827103615, 0.0025372765958309174, 0.00265413336455822, 0.0027709901332855225, 0.002887846902012825, 0.0030047036707401276, 0.00312156043946743, 0.0032384172081947327, 0.0033552739769220352, 0.0034721307456493378, 0.0035889875143766403, 0.003705844283103943, 0.0038227010518312454, 0.003939557820558548, 0.0040564145892858505, 0.004173271358013153, 0.004290128126740456, 0.004406984895467758, 0.004523841664195061, 0.004640698432922363]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 8.0, 5.0, 9.0, 13.0, 14.0, 14.0, 12.0, 20.0, 16.0, 24.0, 27.0, 34.0, 38.0, 36.0, 42.0, 41.0, 26.0, 39.0, 43.0, 49.0, 44.0, 38.0, 27.0, 40.0, 34.0, 32.0, 38.0, 32.0, 27.0, 24.0, 30.0, 15.0, 18.0, 12.0, 10.0, 10.0, 11.0, 7.0, 10.0, 6.0, 4.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.1168212890625, -4.940673828125, -4.7645263671875, -4.58837890625, -4.4122314453125, -4.236083984375, -4.0599365234375, -3.8837890625, -3.7076416015625, -3.531494140625, -3.3553466796875, -3.17919921875, -3.0030517578125, -2.826904296875, -2.6507568359375, -2.474609375, -2.2984619140625, -2.122314453125, -1.9461669921875, -1.77001953125, -1.5938720703125, -1.417724609375, -1.2415771484375, -1.0654296875, -0.8892822265625, -0.713134765625, -0.5369873046875, -0.36083984375, -0.1846923828125, -0.008544921875, 0.1676025390625, 0.34375, 0.5198974609375, 0.696044921875, 0.8721923828125, 1.04833984375, 1.2244873046875, 1.400634765625, 1.5767822265625, 1.7529296875, 1.9290771484375, 2.105224609375, 2.2813720703125, 2.45751953125, 2.6336669921875, 2.809814453125, 2.9859619140625, 3.162109375, 3.3382568359375, 3.514404296875, 3.6905517578125, 3.86669921875, 4.0428466796875, 4.218994140625, 4.3951416015625, 4.5712890625, 4.7474365234375, 4.923583984375, 5.0997314453125, 5.27587890625, 5.4520263671875, 5.628173828125, 5.8043212890625, 5.98046875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 1.0, 3.0, 11.0, 10.0, 17.0, 20.0, 25.0, 25.0, 28.0, 50.0, 58.0, 101.0, 102.0, 211.0, 355.0, 601.0, 1226.0, 2682.0, 6222.0, 16718.0, 61682.0, 477197.0, 400720.0, 54140.0, 15272.0, 5799.0, 2547.0, 1160.0, 575.0, 334.0, 173.0, 124.0, 96.0, 58.0, 46.0, 40.0, 23.0, 22.0, 19.0, 12.0, 12.0, 7.0, 8.0, 6.0, 6.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -9.975830078125, -9.63134765625, -9.286865234375, -8.9423828125, -8.597900390625, -8.25341796875, -7.908935546875, -7.564453125, -7.219970703125, -6.87548828125, -6.531005859375, -6.1865234375, -5.842041015625, -5.49755859375, -5.153076171875, -4.80859375, -4.464111328125, -4.11962890625, -3.775146484375, -3.4306640625, -3.086181640625, -2.74169921875, -2.397216796875, -2.052734375, -1.708251953125, -1.36376953125, -1.019287109375, -0.6748046875, -0.330322265625, 0.01416015625, 0.358642578125, 0.703125, 1.047607421875, 1.39208984375, 1.736572265625, 2.0810546875, 2.425537109375, 2.77001953125, 3.114501953125, 3.458984375, 3.803466796875, 4.14794921875, 4.492431640625, 4.8369140625, 5.181396484375, 5.52587890625, 5.870361328125, 6.21484375, 6.559326171875, 6.90380859375, 7.248291015625, 7.5927734375, 7.937255859375, 8.28173828125, 8.626220703125, 8.970703125, 9.315185546875, 9.65966796875, 10.004150390625, 10.3486328125, 10.693115234375, 11.03759765625, 11.382080078125, 11.7265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 14.0, 9.0, 9.0, 18.0, 17.0, 19.0, 22.0, 37.0, 26.0, 37.0, 36.0, 41.0, 42.0, 55.0, 57.0, 87.0, 188.0, 1533.0, 258.0, 122.0, 72.0, 51.0, 34.0, 48.0, 36.0, 19.0, 38.0, 16.0, 15.0, 11.0, 15.0, 18.0, 12.0, 10.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-19.59375, -19.029052734375, -18.46435546875, -17.899658203125, -17.3349609375, -16.770263671875, -16.20556640625, -15.640869140625, -15.076171875, -14.511474609375, -13.94677734375, -13.382080078125, -12.8173828125, -12.252685546875, -11.68798828125, -11.123291015625, -10.55859375, -9.993896484375, -9.42919921875, -8.864501953125, -8.2998046875, -7.735107421875, -7.17041015625, -6.605712890625, -6.041015625, -5.476318359375, -4.91162109375, -4.346923828125, -3.7822265625, -3.217529296875, -2.65283203125, -2.088134765625, -1.5234375, -0.958740234375, -0.39404296875, 0.170654296875, 0.7353515625, 1.300048828125, 1.86474609375, 2.429443359375, 2.994140625, 3.558837890625, 4.12353515625, 4.688232421875, 5.2529296875, 5.817626953125, 6.38232421875, 6.947021484375, 7.51171875, 8.076416015625, 8.64111328125, 9.205810546875, 9.7705078125, 10.335205078125, 10.89990234375, 11.464599609375, 12.029296875, 12.593994140625, 13.15869140625, 13.723388671875, 14.2880859375, 14.852783203125, 15.41748046875, 15.982177734375, 16.546875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 15.0, 11.0, 20.0, 13.0, 20.0, 31.0, 43.0, 35.0, 53.0, 94.0, 119.0, 227.0, 471.0, 1758.0, 17757.0, 2818940.0, 297316.0, 6709.0, 982.0, 351.0, 182.0, 112.0, 96.0, 69.0, 61.0, 38.0, 29.0, 31.0, 23.0, 16.0, 14.0, 13.0, 9.0, 12.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.40625, -35.14306640625, -33.8798828125, -32.61669921875, -31.353515625, -30.09033203125, -28.8271484375, -27.56396484375, -26.30078125, -25.03759765625, -23.7744140625, -22.51123046875, -21.248046875, -19.98486328125, -18.7216796875, -17.45849609375, -16.1953125, -14.93212890625, -13.6689453125, -12.40576171875, -11.142578125, -9.87939453125, -8.6162109375, -7.35302734375, -6.08984375, -4.82666015625, -3.5634765625, -2.30029296875, -1.037109375, 0.22607421875, 1.4892578125, 2.75244140625, 4.015625, 5.27880859375, 6.5419921875, 7.80517578125, 9.068359375, 10.33154296875, 11.5947265625, 12.85791015625, 14.12109375, 15.38427734375, 16.6474609375, 17.91064453125, 19.173828125, 20.43701171875, 21.7001953125, 22.96337890625, 24.2265625, 25.48974609375, 26.7529296875, 28.01611328125, 29.279296875, 30.54248046875, 31.8056640625, 33.06884765625, 34.33203125, 35.59521484375, 36.8583984375, 38.12158203125, 39.384765625, 40.64794921875, 41.9111328125, 43.17431640625, 44.4375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 12.0, 173.0, 484.0, 303.0, 45.0], "bins": [-208.68045043945312, -205.2956085205078, -201.9107666015625, -198.52593994140625, -195.14109802246094, -191.75625610351562, -188.37142944335938, -184.98658752441406, -181.60174560546875, -178.21690368652344, -174.83206176757812, -171.44723510742188, -168.06239318847656, -164.67755126953125, -161.292724609375, -157.9078826904297, -154.52304077148438, -151.13819885253906, -147.75335693359375, -144.3685302734375, -140.9836883544922, -137.59884643554688, -134.21401977539062, -130.8291778564453, -127.4443359375, -124.05949401855469, -120.6746597290039, -117.28982543945312, -113.90498352050781, -110.5201416015625, -107.13530731201172, -103.75047302246094, -100.36563873291016, -96.98080444335938, -93.59596252441406, -90.21112060546875, -86.82628631591797, -83.44145202636719, -80.05661010742188, -76.67176818847656, -73.28693389892578, -69.902099609375, -66.51725769042969, -63.13241958618164, -59.747581481933594, -56.36274337768555, -52.9779052734375, -49.59306716918945, -46.20822525024414, -42.823387145996094, -39.43854904174805, -36.0537109375, -32.66887283325195, -29.284034729003906, -25.89919662475586, -22.514358520507812, -19.129520416259766, -15.744682312011719, -12.359844207763672, -8.975006103515625, -5.590167999267578, -2.2053298950195312, 1.1795082092285156, 4.5643463134765625, 7.949183464050293]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 8.0, 12.0, 14.0, 20.0, 22.0, 13.0, 23.0, 19.0, 37.0, 30.0, 31.0, 28.0, 35.0, 34.0, 45.0, 44.0, 38.0, 29.0, 49.0, 30.0, 38.0, 33.0, 39.0, 49.0, 30.0, 35.0, 26.0, 27.0, 25.0, 12.0, 29.0, 15.0, 11.0, 7.0, 9.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-44.03089141845703, -42.72881317138672, -41.42673873901367, -40.124664306640625, -38.82258605957031, -37.5205078125, -36.21843338012695, -34.916358947753906, -33.614280700683594, -32.31220245361328, -31.010128021240234, -29.708051681518555, -28.405975341796875, -27.103899002075195, -25.801822662353516, -24.499746322631836, -23.197669982910156, -21.895593643188477, -20.593517303466797, -19.291440963745117, -17.989364624023438, -16.687288284301758, -15.385211944580078, -14.083135604858398, -12.781059265136719, -11.478982925415039, -10.17690658569336, -8.87483024597168, -7.57275390625, -6.27067756652832, -4.968601226806641, -3.666524887084961, -2.3644485473632812, -1.0623722076416016, 0.23970413208007812, 1.5417804718017578, 2.8438568115234375, 4.145933151245117, 5.448009490966797, 6.750085830688477, 8.052162170410156, 9.354238510131836, 10.656314849853516, 11.958391189575195, 13.260467529296875, 14.562543869018555, 15.864620208740234, 17.166696548461914, 18.468772888183594, 19.770849227905273, 21.072925567626953, 22.375001907348633, 23.677078247070312, 24.979154586791992, 26.281230926513672, 27.58330726623535, 28.88538360595703, 30.18745994567871, 31.48953628540039, 32.79161071777344, 34.09368896484375, 35.39576721191406, 36.69784164428711, 37.999916076660156, 39.30199432373047]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 6.0, 9.0, 6.0, 14.0, 13.0, 24.0, 16.0, 18.0, 21.0, 27.0, 37.0, 26.0, 40.0, 41.0, 38.0, 33.0, 37.0, 46.0, 35.0, 47.0, 40.0, 32.0, 32.0, 38.0, 35.0, 33.0, 29.0, 32.0, 21.0, 31.0, 16.0, 15.0, 20.0, 19.0, 10.0, 15.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.43359375, -5.25335693359375, -5.0731201171875, -4.89288330078125, -4.712646484375, -4.53240966796875, -4.3521728515625, -4.17193603515625, -3.99169921875, -3.81146240234375, -3.6312255859375, -3.45098876953125, -3.270751953125, -3.09051513671875, -2.9102783203125, -2.73004150390625, -2.5498046875, -2.36956787109375, -2.1893310546875, -2.00909423828125, -1.828857421875, -1.64862060546875, -1.4683837890625, -1.28814697265625, -1.10791015625, -0.92767333984375, -0.7474365234375, -0.56719970703125, -0.386962890625, -0.20672607421875, -0.0264892578125, 0.15374755859375, 0.333984375, 0.51422119140625, 0.6944580078125, 0.87469482421875, 1.054931640625, 1.23516845703125, 1.4154052734375, 1.59564208984375, 1.77587890625, 1.95611572265625, 2.1363525390625, 2.31658935546875, 2.496826171875, 2.67706298828125, 2.8572998046875, 3.03753662109375, 3.2177734375, 3.39801025390625, 3.5782470703125, 3.75848388671875, 3.938720703125, 4.11895751953125, 4.2991943359375, 4.47943115234375, 4.65966796875, 4.83990478515625, 5.0201416015625, 5.20037841796875, 5.380615234375, 5.56085205078125, 5.7410888671875, 5.92132568359375, 6.1015625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 11.0, 15.0, 16.0, 26.0, 44.0, 63.0, 74.0, 138.0, 250.0, 407.0, 719.0, 1430.0, 2832.0, 6433.0, 15504.0, 42223.0, 142416.0, 646029.0, 2124106.0, 930745.0, 191097.0, 54841.0, 19373.0, 7920.0, 3475.0, 1803.0, 967.0, 498.0, 305.0, 160.0, 115.0, 67.0, 41.0, 36.0, 17.0, 12.0, 13.0, 13.0, 8.0, 6.0, 2.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.4921875, -10.1602783203125, -9.828369140625, -9.4964599609375, -9.16455078125, -8.8326416015625, -8.500732421875, -8.1688232421875, -7.8369140625, -7.5050048828125, -7.173095703125, -6.8411865234375, -6.50927734375, -6.1773681640625, -5.845458984375, -5.5135498046875, -5.181640625, -4.8497314453125, -4.517822265625, -4.1859130859375, -3.85400390625, -3.5220947265625, -3.190185546875, -2.8582763671875, -2.5263671875, -2.1944580078125, -1.862548828125, -1.5306396484375, -1.19873046875, -0.8668212890625, -0.534912109375, -0.2030029296875, 0.12890625, 0.4608154296875, 0.792724609375, 1.1246337890625, 1.45654296875, 1.7884521484375, 2.120361328125, 2.4522705078125, 2.7841796875, 3.1160888671875, 3.447998046875, 3.7799072265625, 4.11181640625, 4.4437255859375, 4.775634765625, 5.1075439453125, 5.439453125, 5.7713623046875, 6.103271484375, 6.4351806640625, 6.76708984375, 7.0989990234375, 7.430908203125, 7.7628173828125, 8.0947265625, 8.4266357421875, 8.758544921875, 9.0904541015625, 9.42236328125, 9.7542724609375, 10.086181640625, 10.4180908203125, 10.75]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 8.0, 14.0, 15.0, 16.0, 15.0, 25.0, 41.0, 46.0, 55.0, 91.0, 131.0, 123.0, 195.0, 241.0, 276.0, 379.0, 438.0, 448.0, 337.0, 292.0, 189.0, 169.0, 116.0, 87.0, 66.0, 60.0, 60.0, 28.0, 22.0, 27.0, 7.0, 13.0, 3.0, 7.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.984375, -9.6795654296875, -9.374755859375, -9.0699462890625, -8.76513671875, -8.4603271484375, -8.155517578125, -7.8507080078125, -7.5458984375, -7.2410888671875, -6.936279296875, -6.6314697265625, -6.32666015625, -6.0218505859375, -5.717041015625, -5.4122314453125, -5.107421875, -4.8026123046875, -4.497802734375, -4.1929931640625, -3.88818359375, -3.5833740234375, -3.278564453125, -2.9737548828125, -2.6689453125, -2.3641357421875, -2.059326171875, -1.7545166015625, -1.44970703125, -1.1448974609375, -0.840087890625, -0.5352783203125, -0.23046875, 0.0743408203125, 0.379150390625, 0.6839599609375, 0.98876953125, 1.2935791015625, 1.598388671875, 1.9031982421875, 2.2080078125, 2.5128173828125, 2.817626953125, 3.1224365234375, 3.42724609375, 3.7320556640625, 4.036865234375, 4.3416748046875, 4.646484375, 4.9512939453125, 5.256103515625, 5.5609130859375, 5.86572265625, 6.1705322265625, 6.475341796875, 6.7801513671875, 7.0849609375, 7.3897705078125, 7.694580078125, 7.9993896484375, 8.30419921875, 8.6090087890625, 8.913818359375, 9.2186279296875, 9.5234375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 18.0, 19.0, 27.0, 30.0, 43.0, 74.0, 64.0, 110.0, 165.0, 230.0, 385.0, 776.0, 2105.0, 7221.0, 35322.0, 278807.0, 2964943.0, 807468.0, 77412.0, 13038.0, 3300.0, 1180.0, 525.0, 285.0, 152.0, 130.0, 98.0, 81.0, 57.0, 52.0, 33.0, 20.0, 17.0, 15.0, 11.0, 6.0, 9.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.546875, -22.80419921875, -22.0615234375, -21.31884765625, -20.576171875, -19.83349609375, -19.0908203125, -18.34814453125, -17.60546875, -16.86279296875, -16.1201171875, -15.37744140625, -14.634765625, -13.89208984375, -13.1494140625, -12.40673828125, -11.6640625, -10.92138671875, -10.1787109375, -9.43603515625, -8.693359375, -7.95068359375, -7.2080078125, -6.46533203125, -5.72265625, -4.97998046875, -4.2373046875, -3.49462890625, -2.751953125, -2.00927734375, -1.2666015625, -0.52392578125, 0.21875, 0.96142578125, 1.7041015625, 2.44677734375, 3.189453125, 3.93212890625, 4.6748046875, 5.41748046875, 6.16015625, 6.90283203125, 7.6455078125, 8.38818359375, 9.130859375, 9.87353515625, 10.6162109375, 11.35888671875, 12.1015625, 12.84423828125, 13.5869140625, 14.32958984375, 15.072265625, 15.81494140625, 16.5576171875, 17.30029296875, 18.04296875, 18.78564453125, 19.5283203125, 20.27099609375, 21.013671875, 21.75634765625, 22.4990234375, 23.24169921875, 23.984375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 24.0, 44.0, 62.0, 112.0, 143.0, 155.0, 131.0, 122.0, 90.0, 60.0, 30.0, 10.0, 4.0, 10.0], "bins": [-120.45821380615234, -118.29277038574219, -116.12733459472656, -113.9618911743164, -111.79645538330078, -109.63101196289062, -107.465576171875, -105.30013275146484, -103.13468933105469, -100.96924591064453, -98.8038101196289, -96.63836669921875, -94.47293090820312, -92.30748748779297, -90.14204406738281, -87.97660827636719, -85.81117248535156, -83.6457290649414, -81.48029327392578, -79.31484985351562, -77.1494140625, -74.98397064208984, -72.81852722167969, -70.65309143066406, -68.4876480102539, -66.32220458984375, -64.15676879882812, -61.99132537841797, -59.82588577270508, -57.66044616699219, -55.4950065612793, -53.329566955566406, -51.164127349853516, -48.998687744140625, -46.833248138427734, -44.667808532714844, -42.50236511230469, -40.3369255065918, -38.171485900878906, -36.006046295166016, -33.840606689453125, -31.675167083740234, -29.50972557067871, -27.34428596496582, -25.178844451904297, -23.013404846191406, -20.847965240478516, -18.682525634765625, -16.51708221435547, -14.351641654968262, -12.186201095581055, -10.020761489868164, -7.855320930480957, -5.68988037109375, -3.5244407653808594, -1.3590002059936523, 0.8064403533935547, 2.9718806743621826, 5.1373209953308105, 7.302761077880859, 9.468201637268066, 11.633642196655273, 13.799081802368164, 15.964522361755371, 18.129962921142578]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 13.0, 10.0, 12.0, 18.0, 21.0, 14.0, 23.0, 28.0, 29.0, 28.0, 26.0, 38.0, 52.0, 37.0, 46.0, 41.0, 39.0, 39.0, 36.0, 35.0, 29.0, 42.0, 35.0, 30.0, 26.0, 35.0, 24.0, 29.0, 26.0, 23.0, 25.0, 11.0, 16.0, 7.0, 9.0, 8.0, 13.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.973297119140625, -34.8250846862793, -33.67687225341797, -32.52865982055664, -31.380447387695312, -30.232234954833984, -29.084020614624023, -27.935808181762695, -26.787595748901367, -25.63938331604004, -24.49117088317871, -23.342958450317383, -22.194744110107422, -21.046531677246094, -19.898319244384766, -18.750106811523438, -17.60189437866211, -16.45368194580078, -15.305469512939453, -14.157256126403809, -13.00904369354248, -11.860831260681152, -10.712617874145508, -9.56440544128418, -8.416193008422852, -7.267980575561523, -6.119767665863037, -4.971554756164551, -3.8233423233032227, -2.6751298904418945, -1.5269169807434082, -0.3787040710449219, 0.7695083618164062, 1.9177210330963135, 3.0659337043762207, 4.214146614074707, 5.362359046936035, 6.510571479797363, 7.65878438949585, 8.806997299194336, 9.955209732055664, 11.103422164916992, 12.25163459777832, 13.399847984313965, 14.548060417175293, 15.696272850036621, 16.844486236572266, 17.992698669433594, 19.140911102294922, 20.28912353515625, 21.437335968017578, 22.585548400878906, 23.733760833740234, 24.881973266601562, 26.030187606811523, 27.17840003967285, 28.32661247253418, 29.474824905395508, 30.623037338256836, 31.771249771118164, 32.919464111328125, 34.06767654418945, 35.21588897705078, 36.36410140991211, 37.51231384277344]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 3.0, 7.0, 19.0, 7.0, 9.0, 20.0, 13.0, 26.0, 29.0, 35.0, 38.0, 20.0, 18.0, 37.0, 42.0, 37.0, 36.0, 41.0, 48.0, 41.0, 47.0, 32.0, 36.0, 39.0, 25.0, 35.0, 21.0, 36.0, 32.0, 23.0, 25.0, 18.0, 16.0, 8.0, 10.0, 12.0, 9.0, 5.0, 5.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.91796875, -5.722900390625, -5.52783203125, -5.332763671875, -5.1376953125, -4.942626953125, -4.74755859375, -4.552490234375, -4.357421875, -4.162353515625, -3.96728515625, -3.772216796875, -3.5771484375, -3.382080078125, -3.18701171875, -2.991943359375, -2.796875, -2.601806640625, -2.40673828125, -2.211669921875, -2.0166015625, -1.821533203125, -1.62646484375, -1.431396484375, -1.236328125, -1.041259765625, -0.84619140625, -0.651123046875, -0.4560546875, -0.260986328125, -0.06591796875, 0.129150390625, 0.32421875, 0.519287109375, 0.71435546875, 0.909423828125, 1.1044921875, 1.299560546875, 1.49462890625, 1.689697265625, 1.884765625, 2.079833984375, 2.27490234375, 2.469970703125, 2.6650390625, 2.860107421875, 3.05517578125, 3.250244140625, 3.4453125, 3.640380859375, 3.83544921875, 4.030517578125, 4.2255859375, 4.420654296875, 4.61572265625, 4.810791015625, 5.005859375, 5.200927734375, 5.39599609375, 5.591064453125, 5.7861328125, 5.981201171875, 6.17626953125, 6.371337890625, 6.56640625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 9.0, 8.0, 13.0, 14.0, 37.0, 40.0, 57.0, 109.0, 128.0, 182.0, 279.0, 381.0, 578.0, 847.0, 1338.0, 1896.0, 2869.0, 4280.0, 6435.0, 10201.0, 15981.0, 24661.0, 39513.0, 64938.0, 108434.0, 172546.0, 204069.0, 148777.0, 90386.0, 54850.0, 33927.0, 21226.0, 13529.0, 8784.0, 5720.0, 3854.0, 2503.0, 1656.0, 1098.0, 745.0, 531.0, 371.0, 232.0, 167.0, 112.0, 82.0, 59.0, 37.0, 26.0, 17.0, 11.0, 9.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.5009765625, -0.48548126220703125, -0.4699859619140625, -0.45449066162109375, -0.438995361328125, -0.42350006103515625, -0.4080047607421875, -0.39250946044921875, -0.37701416015625, -0.36151885986328125, -0.3460235595703125, -0.33052825927734375, -0.315032958984375, -0.29953765869140625, -0.2840423583984375, -0.26854705810546875, -0.2530517578125, -0.23755645751953125, -0.2220611572265625, -0.20656585693359375, -0.191070556640625, -0.17557525634765625, -0.1600799560546875, -0.14458465576171875, -0.12908935546875, -0.11359405517578125, -0.0980987548828125, -0.08260345458984375, -0.067108154296875, -0.05161285400390625, -0.0361175537109375, -0.02062225341796875, -0.005126953125, 0.01036834716796875, 0.0258636474609375, 0.04135894775390625, 0.056854248046875, 0.07234954833984375, 0.0878448486328125, 0.10334014892578125, 0.11883544921875, 0.13433074951171875, 0.1498260498046875, 0.16532135009765625, 0.180816650390625, 0.19631195068359375, 0.2118072509765625, 0.22730255126953125, 0.2427978515625, 0.25829315185546875, 0.2737884521484375, 0.28928375244140625, 0.304779052734375, 0.32027435302734375, 0.3357696533203125, 0.35126495361328125, 0.36676025390625, 0.38225555419921875, 0.3977508544921875, 0.41324615478515625, 0.428741455078125, 0.44423675537109375, 0.4597320556640625, 0.47522735595703125, 0.49072265625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 7.0, 7.0, 13.0, 13.0, 15.0, 14.0, 22.0, 18.0, 16.0, 24.0, 36.0, 33.0, 24.0, 24.0, 42.0, 41.0, 33.0, 38.0, 35.0, 1064.0, 44.0, 49.0, 29.0, 38.0, 40.0, 30.0, 32.0, 37.0, 24.0, 28.0, 21.0, 16.0, 12.0, 14.0, 9.0, 12.0, 12.0, 13.0, 12.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-4.12109375, -4.000091552734375, -3.87908935546875, -3.758087158203125, -3.6370849609375, -3.516082763671875, -3.39508056640625, -3.274078369140625, -3.153076171875, -3.032073974609375, -2.91107177734375, -2.790069580078125, -2.6690673828125, -2.548065185546875, -2.42706298828125, -2.306060791015625, -2.18505859375, -2.064056396484375, -1.94305419921875, -1.822052001953125, -1.7010498046875, -1.580047607421875, -1.45904541015625, -1.338043212890625, -1.217041015625, -1.096038818359375, -0.97503662109375, -0.854034423828125, -0.7330322265625, -0.612030029296875, -0.49102783203125, -0.370025634765625, -0.2490234375, -0.128021240234375, -0.00701904296875, 0.113983154296875, 0.2349853515625, 0.355987548828125, 0.47698974609375, 0.597991943359375, 0.718994140625, 0.839996337890625, 0.96099853515625, 1.082000732421875, 1.2030029296875, 1.324005126953125, 1.44500732421875, 1.566009521484375, 1.68701171875, 1.808013916015625, 1.92901611328125, 2.050018310546875, 2.1710205078125, 2.292022705078125, 2.41302490234375, 2.534027099609375, 2.655029296875, 2.776031494140625, 2.89703369140625, 3.018035888671875, 3.1390380859375, 3.260040283203125, 3.38104248046875, 3.502044677734375, 3.623046875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 12.0, 15.0, 20.0, 31.0, 43.0, 56.0, 96.0, 128.0, 201.0, 323.0, 505.0, 829.0, 1286.0, 2144.0, 3560.0, 6076.0, 10316.0, 18484.0, 32449.0, 57893.0, 100368.0, 163881.0, 1257243.0, 177571.0, 112274.0, 64952.0, 36650.0, 20933.0, 11628.0, 6978.0, 3883.0, 2361.0, 1478.0, 884.0, 531.0, 341.0, 237.0, 134.0, 100.0, 74.0, 53.0, 25.0, 24.0, 10.0, 11.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.3505859375, -0.3394927978515625, -0.328399658203125, -0.3173065185546875, -0.30621337890625, -0.2951202392578125, -0.284027099609375, -0.2729339599609375, -0.2618408203125, -0.2507476806640625, -0.239654541015625, -0.2285614013671875, -0.21746826171875, -0.2063751220703125, -0.195281982421875, -0.1841888427734375, -0.173095703125, -0.1620025634765625, -0.150909423828125, -0.1398162841796875, -0.12872314453125, -0.1176300048828125, -0.106536865234375, -0.0954437255859375, -0.0843505859375, -0.0732574462890625, -0.062164306640625, -0.0510711669921875, -0.03997802734375, -0.0288848876953125, -0.017791748046875, -0.0066986083984375, 0.00439453125, 0.0154876708984375, 0.026580810546875, 0.0376739501953125, 0.04876708984375, 0.0598602294921875, 0.070953369140625, 0.0820465087890625, 0.0931396484375, 0.1042327880859375, 0.115325927734375, 0.1264190673828125, 0.13751220703125, 0.1486053466796875, 0.159698486328125, 0.1707916259765625, 0.181884765625, 0.1929779052734375, 0.204071044921875, 0.2151641845703125, 0.22625732421875, 0.2373504638671875, 0.248443603515625, 0.2595367431640625, 0.2706298828125, 0.2817230224609375, 0.292816162109375, 0.3039093017578125, 0.31500244140625, 0.3260955810546875, 0.337188720703125, 0.3482818603515625, 0.359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 8.0, 3.0, 10.0, 11.0, 13.0, 15.0, 13.0, 12.0, 18.0, 28.0, 23.0, 35.0, 64.0, 70.0, 125.0, 124.0, 89.0, 56.0, 51.0, 46.0, 26.0, 22.0, 27.0, 16.0, 12.0, 14.0, 6.0, 5.0, 5.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00536346435546875, -0.005196571350097656, -0.0050296783447265625, -0.004862785339355469, -0.004695892333984375, -0.004528999328613281, -0.0043621063232421875, -0.004195213317871094, -0.0040283203125, -0.0038614273071289062, -0.0036945343017578125, -0.0035276412963867188, -0.003360748291015625, -0.0031938552856445312, -0.0030269622802734375, -0.0028600692749023438, -0.00269317626953125, -0.0025262832641601562, -0.0023593902587890625, -0.0021924972534179688, -0.002025604248046875, -0.0018587112426757812, -0.0016918182373046875, -0.0015249252319335938, -0.0013580322265625, -0.0011911392211914062, -0.0010242462158203125, -0.0008573532104492188, -0.000690460205078125, -0.0005235671997070312, -0.0003566741943359375, -0.00018978118896484375, -2.288818359375e-05, 0.00014400482177734375, 0.0003108978271484375, 0.00047779083251953125, 0.000644683837890625, 0.0008115768432617188, 0.0009784698486328125, 0.0011453628540039062, 0.001312255859375, 0.0014791488647460938, 0.0016460418701171875, 0.0018129348754882812, 0.001979827880859375, 0.0021467208862304688, 0.0023136138916015625, 0.0024805068969726562, 0.00264739990234375, 0.0028142929077148438, 0.0029811859130859375, 0.0031480789184570312, 0.003314971923828125, 0.0034818649291992188, 0.0036487579345703125, 0.0038156509399414062, 0.0039825439453125, 0.004149436950683594, 0.0043163299560546875, 0.004483222961425781, 0.004650115966796875, 0.004817008972167969, 0.0049839019775390625, 0.005150794982910156, 0.00531768798828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 11.0, 9.0, 6.0, 6.0, 14.0, 21.0, 24.0, 24.0, 40.0, 65.0, 111.0, 151.0, 271.0, 893.0, 116627.0, 927815.0, 1577.0, 341.0, 165.0, 93.0, 64.0, 46.0, 32.0, 19.0, 27.0, 17.0, 11.0, 11.0, 11.0, 5.0, 4.0, 5.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12164306640625, -0.11785697937011719, -0.11407089233398438, -0.11028480529785156, -0.10649871826171875, -0.10271263122558594, -0.09892654418945312, -0.09514045715332031, -0.0913543701171875, -0.08756828308105469, -0.08378219604492188, -0.07999610900878906, -0.07621002197265625, -0.07242393493652344, -0.06863784790039062, -0.06485176086425781, -0.061065673828125, -0.05727958679199219, -0.053493499755859375, -0.04970741271972656, -0.04592132568359375, -0.04213523864746094, -0.038349151611328125, -0.03456306457519531, -0.0307769775390625, -0.026990890502929688, -0.023204803466796875, -0.019418716430664062, -0.01563262939453125, -0.011846542358398438, -0.008060455322265625, -0.0042743682861328125, -0.00048828125, 0.0032978057861328125, 0.007083892822265625, 0.010869979858398438, 0.01465606689453125, 0.018442153930664062, 0.022228240966796875, 0.026014328002929688, 0.0298004150390625, 0.03358650207519531, 0.037372589111328125, 0.04115867614746094, 0.04494476318359375, 0.04873085021972656, 0.052516937255859375, 0.05630302429199219, 0.060089111328125, 0.06387519836425781, 0.06766128540039062, 0.07144737243652344, 0.07523345947265625, 0.07901954650878906, 0.08280563354492188, 0.08659172058105469, 0.0903778076171875, 0.09416389465332031, 0.09794998168945312, 0.10173606872558594, 0.10552215576171875, 0.10930824279785156, 0.11309432983398438, 0.11688041687011719, 0.12066650390625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 70.0, 949.0], "bins": [-0.19887615740299225, -0.19573211669921875, -0.19258809089660645, -0.18944405019283295, -0.18630002439022064, -0.18315598368644714, -0.18001195788383484, -0.17686791718006134, -0.17372387647628784, -0.17057983577251434, -0.16743580996990204, -0.16429176926612854, -0.16114774346351624, -0.15800370275974274, -0.15485966205596924, -0.15171563625335693, -0.14857161045074463, -0.14542756974697113, -0.14228354394435883, -0.13913950324058533, -0.13599547743797302, -0.13285143673419952, -0.12970739603042603, -0.12656337022781372, -0.12341932952404022, -0.12027529627084732, -0.11713126301765442, -0.11398722231388092, -0.11084318906068802, -0.10769915580749512, -0.10455512255430222, -0.10141108930110931, -0.09826704859733582, -0.09512301534414291, -0.09197898209095001, -0.08883494138717651, -0.08569090813398361, -0.08254687488079071, -0.07940284162759781, -0.07625880837440491, -0.073114775121212, -0.0699707418680191, -0.0668267086148262, -0.0636826753616333, -0.0605386346578598, -0.0573946014046669, -0.054250568151474, -0.0511065348982811, -0.0479624979197979, -0.044818464666604996, -0.041674427688121796, -0.038530394434928894, -0.03538636118173599, -0.03224232420325279, -0.02909829095005989, -0.02595425583422184, -0.02281021885573864, -0.01966618373990059, -0.016522150486707687, -0.013378115370869637, -0.010234080255031586, -0.007090045139193535, -0.003946011886000633, -0.0008019767701625824, 0.0023420576471835375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 10.0, 10.0, 17.0, 13.0, 23.0, 40.0, 35.0, 44.0, 46.0, 37.0, 59.0, 72.0, 73.0, 62.0, 77.0, 70.0, 47.0, 51.0, 47.0, 30.0, 36.0, 24.0, 21.0, 15.0, 9.0, 9.0, 3.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004844188690185547, -0.004624322988092899, -0.004404457286000252, -0.004184591583907604, -0.003964725881814957, -0.003744860179722309, -0.0035249944776296616, -0.003305128775537014, -0.0030852630734443665, -0.002865397371351719, -0.0026455316692590714, -0.002425665967166424, -0.0022058002650737762, -0.0019859345629811287, -0.0017660688608884811, -0.0015462031587958336, -0.001326337456703186, -0.0011064717546105385, -0.0008866060525178909, -0.0006667403504252434, -0.0004468746483325958, -0.00022700894623994827, -7.14324414730072e-06, 0.00021272245794534683, 0.0004325881600379944, 0.0006524538621306419, 0.0008723195642232895, 0.001092185266315937, 0.0013120509684085846, 0.0015319166705012321, 0.0017517823725938797, 0.0019716480746865273, 0.002191513776779175, 0.0024113794788718224, 0.00263124518096447, 0.0028511108830571175, 0.003070976585149765, 0.0032908422872424126, 0.00351070798933506, 0.0037305736914277077, 0.003950439393520355, 0.004170305095613003, 0.00439017079770565, 0.004610036499798298, 0.0048299022018909454, 0.005049767903983593, 0.0052696336060762405, 0.005489499308168888, 0.005709365010261536, 0.005929230712354183, 0.006149096414446831, 0.006368962116539478, 0.006588827818632126, 0.006808693520724773, 0.007028559222817421, 0.0072484249249100685, 0.007468290627002716, 0.007688156329095364, 0.007908022031188011, 0.008127887733280659, 0.008347753435373306, 0.008567619137465954, 0.008787484839558601, 0.009007350541651249, 0.009227216243743896]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 7.0, 19.0, 7.0, 9.0, 20.0, 13.0, 26.0, 29.0, 35.0, 38.0, 20.0, 18.0, 37.0, 42.0, 37.0, 36.0, 41.0, 48.0, 41.0, 46.0, 33.0, 36.0, 38.0, 26.0, 35.0, 21.0, 36.0, 32.0, 23.0, 25.0, 18.0, 16.0, 8.0, 10.0, 12.0, 9.0, 5.0, 5.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.9140625, -5.7191162109375, -5.524169921875, -5.3292236328125, -5.13427734375, -4.9393310546875, -4.744384765625, -4.5494384765625, -4.3544921875, -4.1595458984375, -3.964599609375, -3.7696533203125, -3.57470703125, -3.3797607421875, -3.184814453125, -2.9898681640625, -2.794921875, -2.5999755859375, -2.405029296875, -2.2100830078125, -2.01513671875, -1.8201904296875, -1.625244140625, -1.4302978515625, -1.2353515625, -1.0404052734375, -0.845458984375, -0.6505126953125, -0.45556640625, -0.2606201171875, -0.065673828125, 0.1292724609375, 0.32421875, 0.5191650390625, 0.714111328125, 0.9090576171875, 1.10400390625, 1.2989501953125, 1.493896484375, 1.6888427734375, 1.8837890625, 2.0787353515625, 2.273681640625, 2.4686279296875, 2.66357421875, 2.8585205078125, 3.053466796875, 3.2484130859375, 3.443359375, 3.6383056640625, 3.833251953125, 4.0281982421875, 4.22314453125, 4.4180908203125, 4.613037109375, 4.8079833984375, 5.0029296875, 5.1978759765625, 5.392822265625, 5.5877685546875, 5.78271484375, 5.9776611328125, 6.172607421875, 6.3675537109375, 6.5625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 8.0, 12.0, 13.0, 12.0, 33.0, 36.0, 41.0, 59.0, 59.0, 101.0, 112.0, 185.0, 219.0, 354.0, 533.0, 1066.0, 2213.0, 5238.0, 13308.0, 40178.0, 177117.0, 649792.0, 109848.0, 29465.0, 10194.0, 4075.0, 1792.0, 852.0, 514.0, 323.0, 196.0, 141.0, 114.0, 72.0, 59.0, 40.0, 42.0, 26.0, 26.0, 14.0, 14.0, 12.0, 13.0, 10.0, 4.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.140625, -13.6749267578125, -13.209228515625, -12.7435302734375, -12.27783203125, -11.8121337890625, -11.346435546875, -10.8807373046875, -10.4150390625, -9.9493408203125, -9.483642578125, -9.0179443359375, -8.55224609375, -8.0865478515625, -7.620849609375, -7.1551513671875, -6.689453125, -6.2237548828125, -5.758056640625, -5.2923583984375, -4.82666015625, -4.3609619140625, -3.895263671875, -3.4295654296875, -2.9638671875, -2.4981689453125, -2.032470703125, -1.5667724609375, -1.10107421875, -0.6353759765625, -0.169677734375, 0.2960205078125, 0.76171875, 1.2274169921875, 1.693115234375, 2.1588134765625, 2.62451171875, 3.0902099609375, 3.555908203125, 4.0216064453125, 4.4873046875, 4.9530029296875, 5.418701171875, 5.8843994140625, 6.35009765625, 6.8157958984375, 7.281494140625, 7.7471923828125, 8.212890625, 8.6785888671875, 9.144287109375, 9.6099853515625, 10.07568359375, 10.5413818359375, 11.007080078125, 11.4727783203125, 11.9384765625, 12.4041748046875, 12.869873046875, 13.3355712890625, 13.80126953125, 14.2669677734375, 14.732666015625, 15.1983642578125, 15.6640625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 8.0, 1.0, 5.0, 9.0, 6.0, 8.0, 10.0, 15.0, 20.0, 9.0, 20.0, 21.0, 24.0, 24.0, 32.0, 33.0, 43.0, 38.0, 48.0, 67.0, 78.0, 145.0, 323.0, 1385.0, 158.0, 65.0, 62.0, 46.0, 43.0, 41.0, 47.0, 34.0, 25.0, 26.0, 22.0, 18.0, 10.0, 17.0, 15.0, 10.0, 9.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.375, -17.8359375, -17.296875, -16.7578125, -16.21875, -15.6796875, -15.140625, -14.6015625, -14.0625, -13.5234375, -12.984375, -12.4453125, -11.90625, -11.3671875, -10.828125, -10.2890625, -9.75, -9.2109375, -8.671875, -8.1328125, -7.59375, -7.0546875, -6.515625, -5.9765625, -5.4375, -4.8984375, -4.359375, -3.8203125, -3.28125, -2.7421875, -2.203125, -1.6640625, -1.125, -0.5859375, -0.046875, 0.4921875, 1.03125, 1.5703125, 2.109375, 2.6484375, 3.1875, 3.7265625, 4.265625, 4.8046875, 5.34375, 5.8828125, 6.421875, 6.9609375, 7.5, 8.0390625, 8.578125, 9.1171875, 9.65625, 10.1953125, 10.734375, 11.2734375, 11.8125, 12.3515625, 12.890625, 13.4296875, 13.96875, 14.5078125, 15.046875, 15.5859375, 16.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 3.0, 8.0, 16.0, 18.0, 11.0, 25.0, 25.0, 36.0, 32.0, 45.0, 58.0, 123.0, 194.0, 305.0, 612.0, 2484.0, 27322.0, 2914072.0, 191090.0, 6885.0, 1150.0, 431.0, 258.0, 133.0, 84.0, 59.0, 40.0, 30.0, 29.0, 29.0, 24.0, 16.0, 14.0, 12.0, 3.0, 7.0, 11.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.125, -54.4111328125, -52.697265625, -50.9833984375, -49.26953125, -47.5556640625, -45.841796875, -44.1279296875, -42.4140625, -40.7001953125, -38.986328125, -37.2724609375, -35.55859375, -33.8447265625, -32.130859375, -30.4169921875, -28.703125, -26.9892578125, -25.275390625, -23.5615234375, -21.84765625, -20.1337890625, -18.419921875, -16.7060546875, -14.9921875, -13.2783203125, -11.564453125, -9.8505859375, -8.13671875, -6.4228515625, -4.708984375, -2.9951171875, -1.28125, 0.4326171875, 2.146484375, 3.8603515625, 5.57421875, 7.2880859375, 9.001953125, 10.7158203125, 12.4296875, 14.1435546875, 15.857421875, 17.5712890625, 19.28515625, 20.9990234375, 22.712890625, 24.4267578125, 26.140625, 27.8544921875, 29.568359375, 31.2822265625, 32.99609375, 34.7099609375, 36.423828125, 38.1376953125, 39.8515625, 41.5654296875, 43.279296875, 44.9931640625, 46.70703125, 48.4208984375, 50.134765625, 51.8486328125, 53.5625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 41.0, 252.0, 494.0, 186.0, 37.0, 5.0, 0.0, 1.0], "bins": [-270.9718017578125, -266.3309631347656, -261.69012451171875, -257.0492858886719, -252.40843200683594, -247.76759338378906, -243.1267547607422, -238.4859161376953, -233.84507751464844, -229.20423889160156, -224.5634002685547, -219.92254638671875, -215.28170776367188, -210.640869140625, -206.00003051757812, -201.35919189453125, -196.71835327148438, -192.0775146484375, -187.43667602539062, -182.79583740234375, -178.1549835205078, -173.51414489746094, -168.87330627441406, -164.2324676513672, -159.59161376953125, -154.95077514648438, -150.3099365234375, -145.66909790039062, -141.0282440185547, -136.3874053955078, -131.74656677246094, -127.10572814941406, -122.46490478515625, -117.82406616210938, -113.18321990966797, -108.5423812866211, -103.90154266357422, -99.26069641113281, -94.61985778808594, -89.97901916503906, -85.33817291259766, -80.69733428955078, -76.05648803710938, -71.4156494140625, -66.77481079101562, -62.133968353271484, -57.493125915527344, -52.85228729248047, -48.21144485473633, -43.57060241699219, -38.92976379394531, -34.28892135620117, -29.648080825805664, -25.007240295410156, -20.366397857666016, -15.72555923461914, -11.084716796875, -6.443875789642334, -1.803034782409668, 2.8378067016601562, 7.478647232055664, 12.119487762451172, 16.760330200195312, 21.401168823242188, 26.042011260986328]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 9.0, 12.0, 8.0, 11.0, 12.0, 12.0, 16.0, 25.0, 15.0, 22.0, 27.0, 31.0, 13.0, 32.0, 27.0, 41.0, 41.0, 42.0, 37.0, 43.0, 42.0, 39.0, 44.0, 49.0, 33.0, 40.0, 39.0, 33.0, 29.0, 36.0, 17.0, 20.0, 18.0, 14.0, 15.0, 11.0, 4.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-44.105506896972656, -42.67094421386719, -41.23638153076172, -39.80181884765625, -38.36725997924805, -36.93269729614258, -35.49813461303711, -34.06357192993164, -32.62901306152344, -31.19445037841797, -29.759889602661133, -28.325326919555664, -26.890766143798828, -25.45620346069336, -24.02164077758789, -22.587078094482422, -21.152515411376953, -19.717952728271484, -18.28339195251465, -16.84882926940918, -15.414267539978027, -13.979705810546875, -12.545143127441406, -11.110581398010254, -9.676019668579102, -8.24145793914795, -6.806895732879639, -5.372333526611328, -3.937771797180176, -2.5032100677490234, -1.0686473846435547, 0.36591434478759766, 1.80047607421875, 3.2350380420684814, 4.669600009918213, 6.104162216186523, 7.538723945617676, 8.973285675048828, 10.407848358154297, 11.84241008758545, 13.276971817016602, 14.711533546447754, 16.146095275878906, 17.580657958984375, 19.015220642089844, 20.44978141784668, 21.88434410095215, 23.318904876708984, 24.753467559814453, 26.188030242919922, 27.622591018676758, 29.057153701782227, 30.491714477539062, 31.92627716064453, 33.36083984375, 34.79540252685547, 36.22996520996094, 37.664527893066406, 39.099090576171875, 40.533653259277344, 41.96821212768555, 43.402774810791016, 44.837337493896484, 46.27190017700195, 47.706459045410156]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 7.0, 7.0, 10.0, 13.0, 8.0, 25.0, 26.0, 21.0, 32.0, 28.0, 33.0, 42.0, 36.0, 56.0, 45.0, 50.0, 41.0, 53.0, 48.0, 46.0, 39.0, 41.0, 49.0, 40.0, 24.0, 30.0, 21.0, 30.0, 11.0, 12.0, 12.0, 15.0, 11.0, 7.0, 8.0, 11.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.10076904296875, -7.8499755859375, -7.59918212890625, -7.348388671875, -7.09759521484375, -6.8468017578125, -6.59600830078125, -6.34521484375, -6.09442138671875, -5.8436279296875, -5.59283447265625, -5.342041015625, -5.09124755859375, -4.8404541015625, -4.58966064453125, -4.3388671875, -4.08807373046875, -3.8372802734375, -3.58648681640625, -3.335693359375, -3.08489990234375, -2.8341064453125, -2.58331298828125, -2.33251953125, -2.08172607421875, -1.8309326171875, -1.58013916015625, -1.329345703125, -1.07855224609375, -0.8277587890625, -0.57696533203125, -0.326171875, -0.07537841796875, 0.1754150390625, 0.42620849609375, 0.677001953125, 0.92779541015625, 1.1785888671875, 1.42938232421875, 1.68017578125, 1.93096923828125, 2.1817626953125, 2.43255615234375, 2.683349609375, 2.93414306640625, 3.1849365234375, 3.43572998046875, 3.6865234375, 3.93731689453125, 4.1881103515625, 4.43890380859375, 4.689697265625, 4.94049072265625, 5.1912841796875, 5.44207763671875, 5.69287109375, 5.94366455078125, 6.1944580078125, 6.44525146484375, 6.696044921875, 6.94683837890625, 7.1976318359375, 7.44842529296875, 7.69921875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 13.0, 12.0, 24.0, 28.0, 34.0, 76.0, 79.0, 129.0, 198.0, 314.0, 561.0, 983.0, 1860.0, 3734.0, 8119.0, 19377.0, 54807.0, 200214.0, 1005478.0, 2099040.0, 603158.0, 129157.0, 39164.0, 14743.0, 6262.0, 2992.0, 1567.0, 844.0, 462.0, 287.0, 176.0, 123.0, 85.0, 63.0, 30.0, 22.0, 19.0, 14.0, 14.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.8037109375, -10.435546875, -10.0673828125, -9.69921875, -9.3310546875, -8.962890625, -8.5947265625, -8.2265625, -7.8583984375, -7.490234375, -7.1220703125, -6.75390625, -6.3857421875, -6.017578125, -5.6494140625, -5.28125, -4.9130859375, -4.544921875, -4.1767578125, -3.80859375, -3.4404296875, -3.072265625, -2.7041015625, -2.3359375, -1.9677734375, -1.599609375, -1.2314453125, -0.86328125, -0.4951171875, -0.126953125, 0.2412109375, 0.609375, 0.9775390625, 1.345703125, 1.7138671875, 2.08203125, 2.4501953125, 2.818359375, 3.1865234375, 3.5546875, 3.9228515625, 4.291015625, 4.6591796875, 5.02734375, 5.3955078125, 5.763671875, 6.1318359375, 6.5, 6.8681640625, 7.236328125, 7.6044921875, 7.97265625, 8.3408203125, 8.708984375, 9.0771484375, 9.4453125, 9.8134765625, 10.181640625, 10.5498046875, 10.91796875, 11.2861328125, 11.654296875, 12.0224609375, 12.390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 11.0, 9.0, 8.0, 20.0, 19.0, 26.0, 50.0, 81.0, 101.0, 137.0, 212.0, 390.0, 570.0, 707.0, 631.0, 389.0, 269.0, 142.0, 101.0, 63.0, 45.0, 27.0, 22.0, 14.0, 6.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.671875, -15.142822265625, -14.61376953125, -14.084716796875, -13.5556640625, -13.026611328125, -12.49755859375, -11.968505859375, -11.439453125, -10.910400390625, -10.38134765625, -9.852294921875, -9.3232421875, -8.794189453125, -8.26513671875, -7.736083984375, -7.20703125, -6.677978515625, -6.14892578125, -5.619873046875, -5.0908203125, -4.561767578125, -4.03271484375, -3.503662109375, -2.974609375, -2.445556640625, -1.91650390625, -1.387451171875, -0.8583984375, -0.329345703125, 0.19970703125, 0.728759765625, 1.2578125, 1.786865234375, 2.31591796875, 2.844970703125, 3.3740234375, 3.903076171875, 4.43212890625, 4.961181640625, 5.490234375, 6.019287109375, 6.54833984375, 7.077392578125, 7.6064453125, 8.135498046875, 8.66455078125, 9.193603515625, 9.72265625, 10.251708984375, 10.78076171875, 11.309814453125, 11.8388671875, 12.367919921875, 12.89697265625, 13.426025390625, 13.955078125, 14.484130859375, 15.01318359375, 15.542236328125, 16.0712890625, 16.600341796875, 17.12939453125, 17.658447265625, 18.1875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 8.0, 18.0, 26.0, 35.0, 74.0, 107.0, 153.0, 282.0, 585.0, 1486.0, 5374.0, 35678.0, 698798.0, 3308864.0, 126092.0, 11983.0, 2599.0, 953.0, 462.0, 295.0, 141.0, 79.0, 52.0, 33.0, 29.0, 14.0, 20.0, 3.0, 12.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.75, -40.5654296875, -39.380859375, -38.1962890625, -37.01171875, -35.8271484375, -34.642578125, -33.4580078125, -32.2734375, -31.0888671875, -29.904296875, -28.7197265625, -27.53515625, -26.3505859375, -25.166015625, -23.9814453125, -22.796875, -21.6123046875, -20.427734375, -19.2431640625, -18.05859375, -16.8740234375, -15.689453125, -14.5048828125, -13.3203125, -12.1357421875, -10.951171875, -9.7666015625, -8.58203125, -7.3974609375, -6.212890625, -5.0283203125, -3.84375, -2.6591796875, -1.474609375, -0.2900390625, 0.89453125, 2.0791015625, 3.263671875, 4.4482421875, 5.6328125, 6.8173828125, 8.001953125, 9.1865234375, 10.37109375, 11.5556640625, 12.740234375, 13.9248046875, 15.109375, 16.2939453125, 17.478515625, 18.6630859375, 19.84765625, 21.0322265625, 22.216796875, 23.4013671875, 24.5859375, 25.7705078125, 26.955078125, 28.1396484375, 29.32421875, 30.5087890625, 31.693359375, 32.8779296875, 34.0625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 29.0, 154.0, 328.0, 342.0, 131.0, 17.0, 5.0, 1.0, 1.0], "bins": [-337.9951477050781, -332.1595458984375, -326.3239440917969, -320.4883117675781, -314.6527099609375, -308.8171081542969, -302.98150634765625, -297.1459045410156, -291.310302734375, -285.4747009277344, -279.63909912109375, -273.803466796875, -267.9678649902344, -262.13226318359375, -256.2966613769531, -250.4610595703125, -244.62542724609375, -238.78982543945312, -232.95420837402344, -227.1186065673828, -221.28298950195312, -215.4473876953125, -209.61178588867188, -203.77618408203125, -197.94056701660156, -192.10496520996094, -186.26934814453125, -180.43374633789062, -174.59814453125, -168.7625274658203, -162.9269256591797, -157.09130859375, -151.25570678710938, -145.42010498046875, -139.58448791503906, -133.74888610839844, -127.91327667236328, -122.07766723632812, -116.2420654296875, -110.40645599365234, -104.57083892822266, -98.7352294921875, -92.89962768554688, -87.06401824951172, -81.22840881347656, -75.3927993774414, -69.55718994140625, -63.721588134765625, -57.88597869873047, -52.05036926269531, -46.21476364135742, -40.37915802001953, -34.543548583984375, -28.70794105529785, -22.872333526611328, -17.036727905273438, -11.201118469238281, -5.365510940551758, 0.4700965881347656, 6.305704116821289, 12.141311645507812, 17.976919174194336, 23.81252670288086, 29.64813232421875, 35.483741760253906]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 8.0, 7.0, 11.0, 7.0, 11.0, 4.0, 22.0, 19.0, 19.0, 34.0, 22.0, 23.0, 28.0, 21.0, 32.0, 46.0, 25.0, 40.0, 37.0, 36.0, 38.0, 43.0, 45.0, 34.0, 42.0, 34.0, 22.0, 32.0, 29.0, 24.0, 29.0, 25.0, 16.0, 17.0, 24.0, 13.0, 20.0, 10.0, 10.0, 8.0, 10.0, 5.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.4891357421875, -37.3023796081543, -36.115623474121094, -34.92886734008789, -33.74211120605469, -32.555355072021484, -31.36859893798828, -30.181842803955078, -28.995086669921875, -27.808330535888672, -26.62157440185547, -25.434818267822266, -24.248062133789062, -23.06130599975586, -21.874549865722656, -20.687793731689453, -19.50103759765625, -18.314281463623047, -17.127525329589844, -15.94076919555664, -14.754013061523438, -13.567256927490234, -12.380500793457031, -11.193744659423828, -10.006988525390625, -8.820232391357422, -7.633476257324219, -6.446720123291016, -5.2599639892578125, -4.073207855224609, -2.8864517211914062, -1.6996955871582031, -0.512939453125, 0.6738166809082031, 1.8605728149414062, 3.0473289489746094, 4.2340850830078125, 5.420841217041016, 6.607597351074219, 7.794353485107422, 8.981109619140625, 10.167865753173828, 11.354621887207031, 12.541378021240234, 13.728134155273438, 14.91489028930664, 16.101646423339844, 17.288402557373047, 18.47515869140625, 19.661914825439453, 20.848670959472656, 22.03542709350586, 23.222183227539062, 24.408939361572266, 25.59569549560547, 26.782451629638672, 27.969207763671875, 29.155963897705078, 30.34272003173828, 31.529476165771484, 32.71623229980469, 33.90298843383789, 35.089744567871094, 36.2765007019043, 37.4632568359375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 8.0, 6.0, 8.0, 9.0, 16.0, 21.0, 23.0, 24.0, 26.0, 33.0, 28.0, 41.0, 43.0, 36.0, 46.0, 46.0, 44.0, 49.0, 59.0, 43.0, 35.0, 27.0, 38.0, 34.0, 35.0, 42.0, 30.0, 24.0, 23.0, 17.0, 13.0, 9.0, 13.0, 11.0, 6.0, 9.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.328125, -9.0736083984375, -8.819091796875, -8.5645751953125, -8.31005859375, -8.0555419921875, -7.801025390625, -7.5465087890625, -7.2919921875, -7.0374755859375, -6.782958984375, -6.5284423828125, -6.27392578125, -6.0194091796875, -5.764892578125, -5.5103759765625, -5.255859375, -5.0013427734375, -4.746826171875, -4.4923095703125, -4.23779296875, -3.9832763671875, -3.728759765625, -3.4742431640625, -3.2197265625, -2.9652099609375, -2.710693359375, -2.4561767578125, -2.20166015625, -1.9471435546875, -1.692626953125, -1.4381103515625, -1.18359375, -0.9290771484375, -0.674560546875, -0.4200439453125, -0.16552734375, 0.0889892578125, 0.343505859375, 0.5980224609375, 0.8525390625, 1.1070556640625, 1.361572265625, 1.6160888671875, 1.87060546875, 2.1251220703125, 2.379638671875, 2.6341552734375, 2.888671875, 3.1431884765625, 3.397705078125, 3.6522216796875, 3.90673828125, 4.1612548828125, 4.415771484375, 4.6702880859375, 4.9248046875, 5.1793212890625, 5.433837890625, 5.6883544921875, 5.94287109375, 6.1973876953125, 6.451904296875, 6.7064208984375, 6.9609375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 9.0, 16.0, 33.0, 42.0, 57.0, 91.0, 126.0, 196.0, 298.0, 425.0, 689.0, 954.0, 1507.0, 2325.0, 3472.0, 5712.0, 8868.0, 14208.0, 23205.0, 38196.0, 65254.0, 112732.0, 181887.0, 210937.0, 152721.0, 90363.0, 51922.0, 30846.0, 18862.0, 11727.0, 7375.0, 4628.0, 3051.0, 1999.0, 1253.0, 850.0, 571.0, 368.0, 221.0, 186.0, 120.0, 85.0, 41.0, 33.0, 24.0, 24.0, 6.0, 4.0, 10.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5160751342773438, -0.4984588623046875, -0.48084259033203125, -0.463226318359375, -0.44561004638671875, -0.4279937744140625, -0.41037750244140625, -0.39276123046875, -0.37514495849609375, -0.3575286865234375, -0.33991241455078125, -0.322296142578125, -0.30467987060546875, -0.2870635986328125, -0.26944732666015625, -0.2518310546875, -0.23421478271484375, -0.2165985107421875, -0.19898223876953125, -0.181365966796875, -0.16374969482421875, -0.1461334228515625, -0.12851715087890625, -0.11090087890625, -0.09328460693359375, -0.0756683349609375, -0.05805206298828125, -0.040435791015625, -0.02281951904296875, -0.0052032470703125, 0.01241302490234375, 0.030029296875, 0.04764556884765625, 0.0652618408203125, 0.08287811279296875, 0.100494384765625, 0.11811065673828125, 0.1357269287109375, 0.15334320068359375, 0.17095947265625, 0.18857574462890625, 0.2061920166015625, 0.22380828857421875, 0.241424560546875, 0.25904083251953125, 0.2766571044921875, 0.29427337646484375, 0.3118896484375, 0.32950592041015625, 0.3471221923828125, 0.36473846435546875, 0.382354736328125, 0.39997100830078125, 0.4175872802734375, 0.43520355224609375, 0.45281982421875, 0.47043609619140625, 0.4880523681640625, 0.5056686401367188, 0.523284912109375, 0.5409011840820312, 0.5585174560546875, 0.5761337280273438, 0.59375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 10.0, 8.0, 10.0, 8.0, 19.0, 23.0, 25.0, 27.0, 35.0, 39.0, 40.0, 32.0, 43.0, 54.0, 44.0, 48.0, 1074.0, 53.0, 54.0, 46.0, 35.0, 37.0, 32.0, 31.0, 35.0, 20.0, 25.0, 16.0, 17.0, 14.0, 14.0, 12.0, 15.0, 6.0, 4.0, 3.0, 6.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.42230224609375, -5.2469482421875, -5.07159423828125, -4.896240234375, -4.72088623046875, -4.5455322265625, -4.37017822265625, -4.19482421875, -4.01947021484375, -3.8441162109375, -3.66876220703125, -3.493408203125, -3.31805419921875, -3.1427001953125, -2.96734619140625, -2.7919921875, -2.61663818359375, -2.4412841796875, -2.26593017578125, -2.090576171875, -1.91522216796875, -1.7398681640625, -1.56451416015625, -1.38916015625, -1.21380615234375, -1.0384521484375, -0.86309814453125, -0.687744140625, -0.51239013671875, -0.3370361328125, -0.16168212890625, 0.013671875, 0.18902587890625, 0.3643798828125, 0.53973388671875, 0.715087890625, 0.89044189453125, 1.0657958984375, 1.24114990234375, 1.41650390625, 1.59185791015625, 1.7672119140625, 1.94256591796875, 2.117919921875, 2.29327392578125, 2.4686279296875, 2.64398193359375, 2.8193359375, 2.99468994140625, 3.1700439453125, 3.34539794921875, 3.520751953125, 3.69610595703125, 3.8714599609375, 4.04681396484375, 4.22216796875, 4.39752197265625, 4.5728759765625, 4.74822998046875, 4.923583984375, 5.09893798828125, 5.2742919921875, 5.44964599609375, 5.625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 15.0, 12.0, 23.0, 29.0, 36.0, 53.0, 104.0, 153.0, 227.0, 380.0, 566.0, 1043.0, 1715.0, 2833.0, 4989.0, 8383.0, 14497.0, 25480.0, 43886.0, 74517.0, 123115.0, 180808.0, 1243233.0, 147389.0, 92798.0, 54837.0, 31996.0, 18599.0, 10450.0, 6089.0, 3594.0, 2079.0, 1172.0, 798.0, 437.0, 283.0, 161.0, 122.0, 67.0, 48.0, 39.0, 25.0, 23.0, 12.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.3857421875, -0.3741264343261719, -0.36251068115234375, -0.3508949279785156, -0.3392791748046875, -0.3276634216308594, -0.31604766845703125, -0.3044319152832031, -0.292816162109375, -0.2812004089355469, -0.26958465576171875, -0.2579689025878906, -0.2463531494140625, -0.23473739624023438, -0.22312164306640625, -0.21150588989257812, -0.19989013671875, -0.18827438354492188, -0.17665863037109375, -0.16504287719726562, -0.1534271240234375, -0.14181137084960938, -0.13019561767578125, -0.11857986450195312, -0.106964111328125, -0.09534835815429688, -0.08373260498046875, -0.07211685180664062, -0.0605010986328125, -0.048885345458984375, -0.03726959228515625, -0.025653839111328125, -0.0140380859375, -0.002422332763671875, 0.00919342041015625, 0.020809173583984375, 0.0324249267578125, 0.044040679931640625, 0.05565643310546875, 0.06727218627929688, 0.078887939453125, 0.09050369262695312, 0.10211944580078125, 0.11373519897460938, 0.1253509521484375, 0.13696670532226562, 0.14858245849609375, 0.16019821166992188, 0.17181396484375, 0.18342971801757812, 0.19504547119140625, 0.20666122436523438, 0.2182769775390625, 0.22989273071289062, 0.24150848388671875, 0.2531242370605469, 0.264739990234375, 0.2763557434082031, 0.28797149658203125, 0.2995872497558594, 0.3112030029296875, 0.3228187561035156, 0.33443450927734375, 0.3460502624511719, 0.357666015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 10.0, 18.0, 21.0, 35.0, 57.0, 85.0, 107.0, 127.0, 135.0, 129.0, 70.0, 53.0, 32.0, 29.0, 10.0, 15.0, 10.0, 6.0, 5.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052032470703125, -0.005035340785980225, -0.004867434501647949, -0.004699528217315674, -0.0045316219329833984, -0.004363715648651123, -0.004195809364318848, -0.004027903079986572, -0.003859996795654297, -0.0036920905113220215, -0.003524184226989746, -0.0033562779426574707, -0.0031883716583251953, -0.00302046537399292, -0.0028525590896606445, -0.002684652805328369, -0.0025167465209960938, -0.0023488402366638184, -0.002180933952331543, -0.0020130276679992676, -0.0018451213836669922, -0.0016772150993347168, -0.0015093088150024414, -0.001341402530670166, -0.0011734962463378906, -0.0010055899620056152, -0.0008376836776733398, -0.0006697773933410645, -0.0005018711090087891, -0.00033396482467651367, -0.00016605854034423828, 1.8477439880371094e-06, 0.0001697540283203125, 0.0003376603126525879, 0.0005055665969848633, 0.0006734728813171387, 0.0008413791656494141, 0.0010092854499816895, 0.0011771917343139648, 0.0013450980186462402, 0.0015130043029785156, 0.001680910587310791, 0.0018488168716430664, 0.002016723155975342, 0.002184629440307617, 0.0023525357246398926, 0.002520442008972168, 0.0026883482933044434, 0.0028562545776367188, 0.003024160861968994, 0.0031920671463012695, 0.003359973430633545, 0.0035278797149658203, 0.0036957859992980957, 0.003863692283630371, 0.0040315985679626465, 0.004199504852294922, 0.004367411136627197, 0.004535317420959473, 0.004703223705291748, 0.0048711299896240234, 0.005039036273956299, 0.005206942558288574, 0.00537484884262085, 0.005542755126953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 10.0, 18.0, 23.0, 47.0, 51.0, 78.0, 146.0, 299.0, 1394.0, 257237.0, 786436.0, 1977.0, 354.0, 161.0, 83.0, 66.0, 42.0, 22.0, 16.0, 9.0, 6.0, 3.0, 7.0, 7.0, 1.0, 3.0, 8.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.10693359375, -0.1036996841430664, -0.10046577453613281, -0.09723186492919922, -0.09399795532226562, -0.09076404571533203, -0.08753013610839844, -0.08429622650146484, -0.08106231689453125, -0.07782840728759766, -0.07459449768066406, -0.07136058807373047, -0.06812667846679688, -0.06489276885986328, -0.06165885925292969, -0.058424949645996094, -0.0551910400390625, -0.051957130432128906, -0.04872322082519531, -0.04548931121826172, -0.042255401611328125, -0.03902149200439453, -0.03578758239746094, -0.032553672790527344, -0.02931976318359375, -0.026085853576660156, -0.022851943969726562, -0.01961803436279297, -0.016384124755859375, -0.013150215148925781, -0.009916305541992188, -0.006682395935058594, -0.003448486328125, -0.00021457672119140625, 0.0030193328857421875, 0.006253242492675781, 0.009487152099609375, 0.012721061706542969, 0.015954971313476562, 0.019188880920410156, 0.02242279052734375, 0.025656700134277344, 0.028890609741210938, 0.03212451934814453, 0.035358428955078125, 0.03859233856201172, 0.04182624816894531, 0.045060157775878906, 0.0482940673828125, 0.051527976989746094, 0.05476188659667969, 0.05799579620361328, 0.061229705810546875, 0.06446361541748047, 0.06769752502441406, 0.07093143463134766, 0.07416534423828125, 0.07739925384521484, 0.08063316345214844, 0.08386707305908203, 0.08710098266601562, 0.09033489227294922, 0.09356880187988281, 0.0968027114868164, 0.10003662109375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 216.0, 765.0, 32.0], "bins": [-0.10660815984010696, -0.10489494353532791, -0.10318172723054886, -0.1014685109257698, -0.09975528717041016, -0.0980420708656311, -0.09632885456085205, -0.094615638256073, -0.09290242195129395, -0.09118920564651489, -0.08947598934173584, -0.08776277303695679, -0.08604955673217773, -0.08433633297681808, -0.08262311667203903, -0.08090990036725998, -0.07919668406248093, -0.07748346775770187, -0.07577025145292282, -0.07405703514814377, -0.07234381139278412, -0.07063059508800507, -0.06891737878322601, -0.06720416247844696, -0.06549094617366791, -0.06377772986888885, -0.0620645135641098, -0.06035129353404045, -0.0586380772292614, -0.056924860924482346, -0.055211640894412994, -0.05349842458963394, -0.05178520455956459, -0.05007198825478554, -0.048358768224716187, -0.046645551919937134, -0.04493233561515808, -0.04321911931037903, -0.041505903005599976, -0.039792682975530624, -0.03807946667075157, -0.03636625036597252, -0.03465303033590317, -0.032939814031124115, -0.031226597726345062, -0.02951338142156601, -0.027800163254141808, -0.026086945086717606, -0.024373730644583702, -0.0226605124771595, -0.020947296172380447, -0.019234079867601395, -0.017520861700177193, -0.01580764353275299, -0.014094427227973938, -0.01238120999187231, -0.010667992755770683, -0.008954775519669056, -0.007241558283567429, -0.005528341047465801, -0.003815123811364174, -0.0021019065752625465, -0.0003886893391609192, 0.0013245278969407082, 0.003037745365872979]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 16.0, 11.0, 20.0, 19.0, 24.0, 25.0, 33.0, 47.0, 37.0, 67.0, 59.0, 56.0, 75.0, 57.0, 82.0, 85.0, 47.0, 48.0, 46.0, 29.0, 39.0, 17.0, 26.0, 14.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031363368034362793, -0.0030001457780599594, -0.0028639547526836395, -0.0027277637273073196, -0.0025915727019309998, -0.00245538167655468, -0.00231919065117836, -0.00218299962580204, -0.00204680860042572, -0.0019106175750494003, -0.0017744265496730804, -0.0016382355242967606, -0.0015020444989204407, -0.0013658534735441208, -0.001229662448167801, -0.001093471422791481, -0.0009572803974151611, -0.0008210893720388412, -0.0006848983466625214, -0.0005487073212862015, -0.0004125162959098816, -0.0002763252705335617, -0.00014013424515724182, -3.943219780921936e-06, 0.00013224780559539795, 0.00026843883097171783, 0.0004046298563480377, 0.0005408208817243576, 0.0006770119071006775, 0.0008132029324769974, 0.0009493939578533173, 0.0010855849832296371, 0.001221776008605957, 0.001357967033982277, 0.0014941580593585968, 0.0016303490847349167, 0.0017665401101112366, 0.0019027311354875565, 0.0020389221608638763, 0.0021751131862401962, 0.002311304211616516, 0.002447495236992836, 0.002583686262369156, 0.0027198772877454758, 0.0028560683131217957, 0.0029922593384981155, 0.0031284503638744354, 0.0032646413892507553, 0.003400832414627075, 0.003537023440003395, 0.003673214465379715, 0.003809405490756035, 0.003945596516132355, 0.004081787541508675, 0.0042179785668849945, 0.004354169592261314, 0.004490360617637634, 0.004626551643013954, 0.004762742668390274, 0.004898933693766594, 0.005035124719142914, 0.005171315744519234, 0.005307506769895554, 0.0054436977952718735, 0.005579888820648193]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 6.0, 8.0, 9.0, 16.0, 20.0, 24.0, 24.0, 26.0, 33.0, 28.0, 41.0, 43.0, 36.0, 46.0, 46.0, 44.0, 49.0, 59.0, 43.0, 35.0, 27.0, 38.0, 34.0, 35.0, 42.0, 30.0, 23.0, 24.0, 17.0, 13.0, 9.0, 13.0, 11.0, 6.0, 9.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.328125, -9.0736083984375, -8.819091796875, -8.5645751953125, -8.31005859375, -8.0555419921875, -7.801025390625, -7.5465087890625, -7.2919921875, -7.0374755859375, -6.782958984375, -6.5284423828125, -6.27392578125, -6.0194091796875, -5.764892578125, -5.5103759765625, -5.255859375, -5.0013427734375, -4.746826171875, -4.4923095703125, -4.23779296875, -3.9832763671875, -3.728759765625, -3.4742431640625, -3.2197265625, -2.9652099609375, -2.710693359375, -2.4561767578125, -2.20166015625, -1.9471435546875, -1.692626953125, -1.4381103515625, -1.18359375, -0.9290771484375, -0.674560546875, -0.4200439453125, -0.16552734375, 0.0889892578125, 0.343505859375, 0.5980224609375, 0.8525390625, 1.1070556640625, 1.361572265625, 1.6160888671875, 1.87060546875, 2.1251220703125, 2.379638671875, 2.6341552734375, 2.888671875, 3.1431884765625, 3.397705078125, 3.6522216796875, 3.90673828125, 4.1612548828125, 4.415771484375, 4.6702880859375, 4.9248046875, 5.1793212890625, 5.433837890625, 5.6883544921875, 5.94287109375, 6.1973876953125, 6.451904296875, 6.7064208984375, 6.9609375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 20.0, 27.0, 36.0, 51.0, 89.0, 126.0, 182.0, 275.0, 444.0, 651.0, 1147.0, 1825.0, 3154.0, 5639.0, 10365.0, 19842.0, 41007.0, 86675.0, 203501.0, 381177.0, 153874.0, 68922.0, 32845.0, 16351.0, 8600.0, 4729.0, 2702.0, 1562.0, 1025.0, 580.0, 371.0, 235.0, 166.0, 104.0, 81.0, 47.0, 26.0, 31.0, 16.0, 19.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0], "bins": [-11.421875, -11.1160888671875, -10.810302734375, -10.5045166015625, -10.19873046875, -9.8929443359375, -9.587158203125, -9.2813720703125, -8.9755859375, -8.6697998046875, -8.364013671875, -8.0582275390625, -7.75244140625, -7.4466552734375, -7.140869140625, -6.8350830078125, -6.529296875, -6.2235107421875, -5.917724609375, -5.6119384765625, -5.30615234375, -5.0003662109375, -4.694580078125, -4.3887939453125, -4.0830078125, -3.7772216796875, -3.471435546875, -3.1656494140625, -2.85986328125, -2.5540771484375, -2.248291015625, -1.9425048828125, -1.63671875, -1.3309326171875, -1.025146484375, -0.7193603515625, -0.41357421875, -0.1077880859375, 0.197998046875, 0.5037841796875, 0.8095703125, 1.1153564453125, 1.421142578125, 1.7269287109375, 2.03271484375, 2.3385009765625, 2.644287109375, 2.9500732421875, 3.255859375, 3.5616455078125, 3.867431640625, 4.1732177734375, 4.47900390625, 4.7847900390625, 5.090576171875, 5.3963623046875, 5.7021484375, 6.0079345703125, 6.313720703125, 6.6195068359375, 6.92529296875, 7.2310791015625, 7.536865234375, 7.8426513671875, 8.1484375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 7.0, 13.0, 19.0, 11.0, 19.0, 24.0, 25.0, 31.0, 25.0, 27.0, 36.0, 43.0, 44.0, 55.0, 56.0, 97.0, 163.0, 1460.0, 302.0, 109.0, 78.0, 64.0, 66.0, 29.0, 30.0, 31.0, 24.0, 24.0, 20.0, 16.0, 21.0, 13.0, 13.0, 13.0, 4.0, 6.0, 8.0, 7.0, 2.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.828857421875, -21.14208984375, -20.455322265625, -19.7685546875, -19.081787109375, -18.39501953125, -17.708251953125, -17.021484375, -16.334716796875, -15.64794921875, -14.961181640625, -14.2744140625, -13.587646484375, -12.90087890625, -12.214111328125, -11.52734375, -10.840576171875, -10.15380859375, -9.467041015625, -8.7802734375, -8.093505859375, -7.40673828125, -6.719970703125, -6.033203125, -5.346435546875, -4.65966796875, -3.972900390625, -3.2861328125, -2.599365234375, -1.91259765625, -1.225830078125, -0.5390625, 0.147705078125, 0.83447265625, 1.521240234375, 2.2080078125, 2.894775390625, 3.58154296875, 4.268310546875, 4.955078125, 5.641845703125, 6.32861328125, 7.015380859375, 7.7021484375, 8.388916015625, 9.07568359375, 9.762451171875, 10.44921875, 11.135986328125, 11.82275390625, 12.509521484375, 13.1962890625, 13.883056640625, 14.56982421875, 15.256591796875, 15.943359375, 16.630126953125, 17.31689453125, 18.003662109375, 18.6904296875, 19.377197265625, 20.06396484375, 20.750732421875, 21.4375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 14.0, 12.0, 17.0, 21.0, 34.0, 41.0, 64.0, 88.0, 122.0, 237.0, 465.0, 1267.0, 4508.0, 32445.0, 977560.0, 2077706.0, 42794.0, 5577.0, 1366.0, 521.0, 299.0, 162.0, 123.0, 68.0, 42.0, 23.0, 15.0, 16.0, 19.0, 11.0, 8.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-32.0, -30.8173828125, -29.634765625, -28.4521484375, -27.26953125, -26.0869140625, -24.904296875, -23.7216796875, -22.5390625, -21.3564453125, -20.173828125, -18.9912109375, -17.80859375, -16.6259765625, -15.443359375, -14.2607421875, -13.078125, -11.8955078125, -10.712890625, -9.5302734375, -8.34765625, -7.1650390625, -5.982421875, -4.7998046875, -3.6171875, -2.4345703125, -1.251953125, -0.0693359375, 1.11328125, 2.2958984375, 3.478515625, 4.6611328125, 5.84375, 7.0263671875, 8.208984375, 9.3916015625, 10.57421875, 11.7568359375, 12.939453125, 14.1220703125, 15.3046875, 16.4873046875, 17.669921875, 18.8525390625, 20.03515625, 21.2177734375, 22.400390625, 23.5830078125, 24.765625, 25.9482421875, 27.130859375, 28.3134765625, 29.49609375, 30.6787109375, 31.861328125, 33.0439453125, 34.2265625, 35.4091796875, 36.591796875, 37.7744140625, 38.95703125, 40.1396484375, 41.322265625, 42.5048828125, 43.6875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 24.0, 100.0, 272.0, 409.0, 174.0, 34.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.796022415161133, -15.955615043640137, -12.11520767211914, -8.274801254272461, -4.434393882751465, -0.5939865112304688, 3.246419906616211, 7.086828231811523, 10.927234649658203, 14.7676420211792, 18.608049392700195, 22.448455810546875, 26.288864135742188, 30.129270553588867, 33.96967697143555, 37.81008529663086, 41.650489807128906, 45.49089813232422, 49.331302642822266, 53.17171096801758, 57.01211929321289, 60.85252380371094, 64.69293212890625, 68.53334045410156, 72.37374877929688, 76.21415710449219, 80.0545654296875, 83.89497375488281, 87.7353744506836, 91.5757827758789, 95.41619110107422, 99.25659942626953, 103.09700775146484, 106.93741607666016, 110.77782440185547, 114.61822509765625, 118.45863342285156, 122.29904174804688, 126.13945007324219, 129.9798583984375, 133.8202667236328, 137.66067504882812, 141.50108337402344, 145.34149169921875, 149.18190002441406, 153.02230834960938, 156.86270141601562, 160.703125, 164.54351806640625, 168.38392639160156, 172.22433471679688, 176.0647430419922, 179.9051513671875, 183.7455596923828, 187.58596801757812, 191.42636108398438, 195.26678466796875, 199.10719299316406, 202.94760131835938, 206.7880096435547, 210.62841796875, 214.4688262939453, 218.30923461914062, 222.14962768554688, 225.9900360107422]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 6.0, 4.0, 4.0, 6.0, 7.0, 9.0, 12.0, 14.0, 8.0, 24.0, 23.0, 23.0, 23.0, 24.0, 27.0, 30.0, 32.0, 29.0, 37.0, 44.0, 43.0, 48.0, 45.0, 29.0, 40.0, 44.0, 37.0, 39.0, 32.0, 32.0, 28.0, 34.0, 26.0, 23.0, 20.0, 15.0, 14.0, 17.0, 13.0, 8.0, 7.0, 3.0, 4.0, 4.0, 6.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.651824951171875, -37.23672866821289, -35.82162857055664, -34.406532287597656, -32.991432189941406, -31.576335906982422, -30.161239624023438, -28.74614143371582, -27.331043243408203, -25.915945053100586, -24.50084686279297, -23.085750579833984, -21.670652389526367, -20.25555419921875, -18.840457916259766, -17.42535972595215, -16.01026153564453, -14.595163345336914, -13.180066108703613, -11.764968872070312, -10.349870681762695, -8.934772491455078, -7.519675254821777, -6.104578018188477, -4.689479827880859, -3.2743821144104004, -1.8592844009399414, -0.4441866874694824, 0.9709110260009766, 2.3860087394714355, 3.8011064529418945, 5.216203689575195, 6.6313018798828125, 8.04640007019043, 9.46149730682373, 10.876594543457031, 12.291692733764648, 13.706790924072266, 15.121888160705566, 16.536985397338867, 17.952083587646484, 19.3671817779541, 20.78227996826172, 22.197376251220703, 23.61247444152832, 25.027572631835938, 26.442668914794922, 27.85776710510254, 29.272865295410156, 30.687963485717773, 32.10306167602539, 33.518157958984375, 34.933258056640625, 36.34835433959961, 37.763450622558594, 39.178550720214844, 40.59364700317383, 42.00874328613281, 43.42384338378906, 44.83893966674805, 46.25403594970703, 47.66913604736328, 49.084232330322266, 50.49932861328125, 51.9144287109375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 12.0, 10.0, 9.0, 16.0, 21.0, 22.0, 20.0, 33.0, 31.0, 30.0, 33.0, 35.0, 28.0, 49.0, 46.0, 48.0, 36.0, 47.0, 35.0, 44.0, 41.0, 39.0, 37.0, 44.0, 18.0, 34.0, 26.0, 22.0, 23.0, 12.0, 15.0, 14.0, 6.0, 5.0, 12.0, 9.0, 8.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.84375, -8.596923828125, -8.35009765625, -8.103271484375, -7.8564453125, -7.609619140625, -7.36279296875, -7.115966796875, -6.869140625, -6.622314453125, -6.37548828125, -6.128662109375, -5.8818359375, -5.635009765625, -5.38818359375, -5.141357421875, -4.89453125, -4.647705078125, -4.40087890625, -4.154052734375, -3.9072265625, -3.660400390625, -3.41357421875, -3.166748046875, -2.919921875, -2.673095703125, -2.42626953125, -2.179443359375, -1.9326171875, -1.685791015625, -1.43896484375, -1.192138671875, -0.9453125, -0.698486328125, -0.45166015625, -0.204833984375, 0.0419921875, 0.288818359375, 0.53564453125, 0.782470703125, 1.029296875, 1.276123046875, 1.52294921875, 1.769775390625, 2.0166015625, 2.263427734375, 2.51025390625, 2.757080078125, 3.00390625, 3.250732421875, 3.49755859375, 3.744384765625, 3.9912109375, 4.238037109375, 4.48486328125, 4.731689453125, 4.978515625, 5.225341796875, 5.47216796875, 5.718994140625, 5.9658203125, 6.212646484375, 6.45947265625, 6.706298828125, 6.953125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 4.0, 18.0, 33.0, 23.0, 40.0, 35.0, 75.0, 109.0, 177.0, 296.0, 535.0, 890.0, 1462.0, 2709.0, 5080.0, 10687.0, 25103.0, 71109.0, 264402.0, 1144898.0, 1882086.0, 574434.0, 135321.0, 42147.0, 16412.0, 7491.0, 3652.0, 2068.0, 1194.0, 684.0, 402.0, 270.0, 126.0, 101.0, 55.0, 39.0, 29.0, 23.0, 18.0, 11.0, 10.0, 9.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-10.234375, -9.906982421875, -9.57958984375, -9.252197265625, -8.9248046875, -8.597412109375, -8.27001953125, -7.942626953125, -7.615234375, -7.287841796875, -6.96044921875, -6.633056640625, -6.3056640625, -5.978271484375, -5.65087890625, -5.323486328125, -4.99609375, -4.668701171875, -4.34130859375, -4.013916015625, -3.6865234375, -3.359130859375, -3.03173828125, -2.704345703125, -2.376953125, -2.049560546875, -1.72216796875, -1.394775390625, -1.0673828125, -0.739990234375, -0.41259765625, -0.085205078125, 0.2421875, 0.569580078125, 0.89697265625, 1.224365234375, 1.5517578125, 1.879150390625, 2.20654296875, 2.533935546875, 2.861328125, 3.188720703125, 3.51611328125, 3.843505859375, 4.1708984375, 4.498291015625, 4.82568359375, 5.153076171875, 5.48046875, 5.807861328125, 6.13525390625, 6.462646484375, 6.7900390625, 7.117431640625, 7.44482421875, 7.772216796875, 8.099609375, 8.427001953125, 8.75439453125, 9.081787109375, 9.4091796875, 9.736572265625, 10.06396484375, 10.391357421875, 10.71875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 7.0, 13.0, 28.0, 23.0, 15.0, 29.0, 25.0, 56.0, 62.0, 75.0, 97.0, 173.0, 202.0, 300.0, 411.0, 526.0, 488.0, 413.0, 287.0, 228.0, 151.0, 112.0, 84.0, 56.0, 52.0, 30.0, 25.0, 21.0, 12.0, 14.0, 6.0, 3.0, 7.0, 5.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.203125, -9.863037109375, -9.52294921875, -9.182861328125, -8.8427734375, -8.502685546875, -8.16259765625, -7.822509765625, -7.482421875, -7.142333984375, -6.80224609375, -6.462158203125, -6.1220703125, -5.781982421875, -5.44189453125, -5.101806640625, -4.76171875, -4.421630859375, -4.08154296875, -3.741455078125, -3.4013671875, -3.061279296875, -2.72119140625, -2.381103515625, -2.041015625, -1.700927734375, -1.36083984375, -1.020751953125, -0.6806640625, -0.340576171875, -0.00048828125, 0.339599609375, 0.6796875, 1.019775390625, 1.35986328125, 1.699951171875, 2.0400390625, 2.380126953125, 2.72021484375, 3.060302734375, 3.400390625, 3.740478515625, 4.08056640625, 4.420654296875, 4.7607421875, 5.100830078125, 5.44091796875, 5.781005859375, 6.12109375, 6.461181640625, 6.80126953125, 7.141357421875, 7.4814453125, 7.821533203125, 8.16162109375, 8.501708984375, 8.841796875, 9.181884765625, 9.52197265625, 9.862060546875, 10.2021484375, 10.542236328125, 10.88232421875, 11.222412109375, 11.5625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 5.0, 15.0, 16.0, 16.0, 24.0, 28.0, 33.0, 67.0, 102.0, 181.0, 311.0, 556.0, 1080.0, 2065.0, 4531.0, 11439.0, 31915.0, 109290.0, 529277.0, 2592085.0, 714935.0, 135723.0, 37888.0, 12811.0, 4991.0, 2242.0, 1114.0, 598.0, 334.0, 193.0, 120.0, 88.0, 49.0, 39.0, 27.0, 18.0, 17.0, 11.0, 8.0, 8.0, 4.0, 10.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.6484375, -15.1680908203125, -14.687744140625, -14.2073974609375, -13.72705078125, -13.2467041015625, -12.766357421875, -12.2860107421875, -11.8056640625, -11.3253173828125, -10.844970703125, -10.3646240234375, -9.88427734375, -9.4039306640625, -8.923583984375, -8.4432373046875, -7.962890625, -7.4825439453125, -7.002197265625, -6.5218505859375, -6.04150390625, -5.5611572265625, -5.080810546875, -4.6004638671875, -4.1201171875, -3.6397705078125, -3.159423828125, -2.6790771484375, -2.19873046875, -1.7183837890625, -1.238037109375, -0.7576904296875, -0.27734375, 0.2030029296875, 0.683349609375, 1.1636962890625, 1.64404296875, 2.1243896484375, 2.604736328125, 3.0850830078125, 3.5654296875, 4.0457763671875, 4.526123046875, 5.0064697265625, 5.48681640625, 5.9671630859375, 6.447509765625, 6.9278564453125, 7.408203125, 7.8885498046875, 8.368896484375, 8.8492431640625, 9.32958984375, 9.8099365234375, 10.290283203125, 10.7706298828125, 11.2509765625, 11.7313232421875, 12.211669921875, 12.6920166015625, 13.17236328125, 13.6527099609375, 14.133056640625, 14.6134033203125, 15.09375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 13.0, 16.0, 20.0, 43.0, 80.0, 86.0, 119.0, 137.0, 138.0, 104.0, 91.0, 54.0, 38.0, 25.0, 22.0, 10.0, 2.0, 3.0, 2.0, 5.0], "bins": [-91.17721557617188, -89.42210388183594, -87.66699981689453, -85.9118881225586, -84.15677642822266, -82.40167236328125, -80.64656066894531, -78.89144897460938, -77.13634490966797, -75.38123321533203, -73.62612915039062, -71.87101745605469, -70.11590576171875, -68.36080169677734, -66.6056900024414, -64.85057830810547, -63.0954704284668, -61.340362548828125, -59.58525085449219, -57.830142974853516, -56.075035095214844, -54.319923400878906, -52.564815521240234, -50.80970764160156, -49.054595947265625, -47.29948806762695, -45.544376373291016, -43.789268493652344, -42.03416061401367, -40.279052734375, -38.52394104003906, -36.76883316040039, -35.013729095458984, -33.25862121582031, -31.503511428833008, -29.748401641845703, -27.99329376220703, -26.238183975219727, -24.483074188232422, -22.72796630859375, -20.972856521606445, -19.21774673461914, -17.46263885498047, -15.707529067993164, -13.952420234680176, -12.197311401367188, -10.442201614379883, -8.687092781066895, -6.931983947753906, -5.176875114440918, -3.4217658042907715, -1.666656494140625, 0.08845233917236328, 1.8435611724853516, 3.5986709594726562, 5.3537797927856445, 7.108888626098633, 8.863997459411621, 10.61910629272461, 12.374216079711914, 14.129324913024902, 15.88443374633789, 17.639543533325195, 19.3946533203125, 21.149761199951172]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 9.0, 16.0, 14.0, 19.0, 19.0, 23.0, 34.0, 23.0, 27.0, 32.0, 31.0, 45.0, 42.0, 35.0, 38.0, 34.0, 55.0, 50.0, 41.0, 40.0, 38.0, 30.0, 41.0, 36.0, 26.0, 26.0, 26.0, 16.0, 16.0, 20.0, 15.0, 15.0, 11.0, 11.0, 13.0, 7.0, 4.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.18719482421875, -38.95146179199219, -37.71573257446289, -36.47999954223633, -35.24427032470703, -34.00853729248047, -32.772804260253906, -31.53707504272461, -30.301342010498047, -29.065610885620117, -27.829879760742188, -26.594146728515625, -25.358415603637695, -24.122684478759766, -22.886953353881836, -21.651222229003906, -20.415491104125977, -19.179759979248047, -17.944028854370117, -16.708297729492188, -15.472564697265625, -14.236833572387695, -13.001102447509766, -11.76537036895752, -10.52963924407959, -9.29390811920166, -8.058176040649414, -6.822444915771484, -5.5867133140563965, -4.350981712341309, -3.115250587463379, -1.8795185089111328, -0.6437873840332031, 0.5919440984725952, 1.8276755809783936, 3.0634069442749023, 4.29913854598999, 5.534870147705078, 6.770601272583008, 8.006333351135254, 9.242064476013184, 10.477795600891113, 11.71352767944336, 12.949258804321289, 14.184989929199219, 15.420722007751465, 16.656452178955078, 17.89218521118164, 19.12791633605957, 20.3636474609375, 21.59937858581543, 22.83510971069336, 24.070842742919922, 25.30657386779785, 26.54230499267578, 27.778038024902344, 29.01376724243164, 30.24949836730957, 31.4852294921875, 32.72096252441406, 33.95669174194336, 35.19242477416992, 36.42815399169922, 37.66388702392578, 38.899620056152344]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 5.0, 11.0, 11.0, 4.0, 8.0, 11.0, 14.0, 19.0, 18.0, 13.0, 18.0, 27.0, 28.0, 30.0, 27.0, 28.0, 34.0, 39.0, 46.0, 26.0, 38.0, 33.0, 33.0, 31.0, 41.0, 39.0, 35.0, 33.0, 30.0, 29.0, 24.0, 31.0, 20.0, 24.0, 20.0, 16.0, 21.0, 18.0, 11.0, 8.0, 5.0, 10.0, 8.0, 9.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.421875, -6.20123291015625, -5.9805908203125, -5.75994873046875, -5.539306640625, -5.31866455078125, -5.0980224609375, -4.87738037109375, -4.65673828125, -4.43609619140625, -4.2154541015625, -3.99481201171875, -3.774169921875, -3.55352783203125, -3.3328857421875, -3.11224365234375, -2.8916015625, -2.67095947265625, -2.4503173828125, -2.22967529296875, -2.009033203125, -1.78839111328125, -1.5677490234375, -1.34710693359375, -1.12646484375, -0.90582275390625, -0.6851806640625, -0.46453857421875, -0.243896484375, -0.02325439453125, 0.1973876953125, 0.41802978515625, 0.638671875, 0.85931396484375, 1.0799560546875, 1.30059814453125, 1.521240234375, 1.74188232421875, 1.9625244140625, 2.18316650390625, 2.40380859375, 2.62445068359375, 2.8450927734375, 3.06573486328125, 3.286376953125, 3.50701904296875, 3.7276611328125, 3.94830322265625, 4.1689453125, 4.38958740234375, 4.6102294921875, 4.83087158203125, 5.051513671875, 5.27215576171875, 5.4927978515625, 5.71343994140625, 5.93408203125, 6.15472412109375, 6.3753662109375, 6.59600830078125, 6.816650390625, 7.03729248046875, 7.2579345703125, 7.47857666015625, 7.69921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 6.0, 7.0, 8.0, 20.0, 26.0, 22.0, 52.0, 72.0, 84.0, 150.0, 208.0, 249.0, 385.0, 594.0, 727.0, 1040.0, 1547.0, 2192.0, 3111.0, 4537.0, 6515.0, 9474.0, 13584.0, 20269.0, 30198.0, 46128.0, 70518.0, 108064.0, 155601.0, 173240.0, 134581.0, 89418.0, 58259.0, 37828.0, 25039.0, 16907.0, 11738.0, 7876.0, 5376.0, 3915.0, 2598.0, 1879.0, 1301.0, 976.0, 672.0, 517.0, 324.0, 208.0, 160.0, 132.0, 80.0, 54.0, 31.0, 27.0, 13.0, 14.0, 8.0, 4.0, 2.0, 6.0], "bins": [-0.51318359375, -0.4977607727050781, -0.48233795166015625, -0.4669151306152344, -0.4514923095703125, -0.4360694885253906, -0.42064666748046875, -0.4052238464355469, -0.389801025390625, -0.3743782043457031, -0.35895538330078125, -0.3435325622558594, -0.3281097412109375, -0.3126869201660156, -0.29726409912109375, -0.2818412780761719, -0.26641845703125, -0.2509956359863281, -0.23557281494140625, -0.22014999389648438, -0.2047271728515625, -0.18930435180664062, -0.17388153076171875, -0.15845870971679688, -0.143035888671875, -0.12761306762695312, -0.11219024658203125, -0.09676742553710938, -0.0813446044921875, -0.06592178344726562, -0.05049896240234375, -0.035076141357421875, -0.0196533203125, -0.004230499267578125, 0.01119232177734375, 0.026615142822265625, 0.0420379638671875, 0.057460784912109375, 0.07288360595703125, 0.08830642700195312, 0.103729248046875, 0.11915206909179688, 0.13457489013671875, 0.14999771118164062, 0.1654205322265625, 0.18084335327148438, 0.19626617431640625, 0.21168899536132812, 0.22711181640625, 0.24253463745117188, 0.25795745849609375, 0.2733802795410156, 0.2888031005859375, 0.3042259216308594, 0.31964874267578125, 0.3350715637207031, 0.350494384765625, 0.3659172058105469, 0.38134002685546875, 0.3967628479003906, 0.4121856689453125, 0.4276084899902344, 0.44303131103515625, 0.4584541320800781, 0.473876953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 7.0, 9.0, 9.0, 12.0, 15.0, 18.0, 15.0, 17.0, 27.0, 29.0, 30.0, 28.0, 39.0, 39.0, 31.0, 32.0, 46.0, 35.0, 36.0, 1065.0, 35.0, 41.0, 41.0, 39.0, 45.0, 33.0, 28.0, 38.0, 23.0, 14.0, 19.0, 22.0, 27.0, 15.0, 10.0, 8.0, 7.0, 9.0, 6.0, 3.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0], "bins": [-5.6875, -5.531005859375, -5.37451171875, -5.218017578125, -5.0615234375, -4.905029296875, -4.74853515625, -4.592041015625, -4.435546875, -4.279052734375, -4.12255859375, -3.966064453125, -3.8095703125, -3.653076171875, -3.49658203125, -3.340087890625, -3.18359375, -3.027099609375, -2.87060546875, -2.714111328125, -2.5576171875, -2.401123046875, -2.24462890625, -2.088134765625, -1.931640625, -1.775146484375, -1.61865234375, -1.462158203125, -1.3056640625, -1.149169921875, -0.99267578125, -0.836181640625, -0.6796875, -0.523193359375, -0.36669921875, -0.210205078125, -0.0537109375, 0.102783203125, 0.25927734375, 0.415771484375, 0.572265625, 0.728759765625, 0.88525390625, 1.041748046875, 1.1982421875, 1.354736328125, 1.51123046875, 1.667724609375, 1.82421875, 1.980712890625, 2.13720703125, 2.293701171875, 2.4501953125, 2.606689453125, 2.76318359375, 2.919677734375, 3.076171875, 3.232666015625, 3.38916015625, 3.545654296875, 3.7021484375, 3.858642578125, 4.01513671875, 4.171630859375, 4.328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 12.0, 11.0, 12.0, 14.0, 23.0, 25.0, 37.0, 47.0, 78.0, 141.0, 193.0, 311.0, 480.0, 779.0, 1245.0, 2071.0, 3387.0, 5333.0, 9013.0, 14653.0, 24180.0, 40468.0, 67264.0, 109804.0, 162716.0, 1237683.0, 155926.0, 102669.0, 62772.0, 37595.0, 23060.0, 13469.0, 8444.0, 4993.0, 3101.0, 1894.0, 1184.0, 711.0, 465.0, 307.0, 185.0, 119.0, 83.0, 49.0, 36.0, 26.0, 23.0, 9.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.37353515625, -0.3620185852050781, -0.35050201416015625, -0.3389854431152344, -0.3274688720703125, -0.3159523010253906, -0.30443572998046875, -0.2929191589355469, -0.281402587890625, -0.2698860168457031, -0.25836944580078125, -0.24685287475585938, -0.2353363037109375, -0.22381973266601562, -0.21230316162109375, -0.20078659057617188, -0.18927001953125, -0.17775344848632812, -0.16623687744140625, -0.15472030639648438, -0.1432037353515625, -0.13168716430664062, -0.12017059326171875, -0.10865402221679688, -0.097137451171875, -0.08562088012695312, -0.07410430908203125, -0.06258773803710938, -0.0510711669921875, -0.039554595947265625, -0.02803802490234375, -0.016521453857421875, -0.0050048828125, 0.006511688232421875, 0.01802825927734375, 0.029544830322265625, 0.0410614013671875, 0.052577972412109375, 0.06409454345703125, 0.07561111450195312, 0.087127685546875, 0.09864425659179688, 0.11016082763671875, 0.12167739868164062, 0.1331939697265625, 0.14471054077148438, 0.15622711181640625, 0.16774368286132812, 0.17926025390625, 0.19077682495117188, 0.20229339599609375, 0.21380996704101562, 0.2253265380859375, 0.23684310913085938, 0.24835968017578125, 0.2598762512207031, 0.271392822265625, 0.2829093933105469, 0.29442596435546875, 0.3059425354003906, 0.3174591064453125, 0.3289756774902344, 0.34049224853515625, 0.3520088195800781, 0.363525390625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 11.0, 7.0, 6.0, 18.0, 5.0, 19.0, 15.0, 28.0, 26.0, 51.0, 52.0, 60.0, 88.0, 108.0, 115.0, 72.0, 60.0, 62.0, 36.0, 31.0, 23.0, 13.0, 14.0, 12.0, 13.0, 6.0, 6.0, 4.0, 6.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005847930908203125, -0.005629479885101318, -0.005411028861999512, -0.005192577838897705, -0.0049741268157958984, -0.004755675792694092, -0.004537224769592285, -0.0043187737464904785, -0.004100322723388672, -0.0038818717002868652, -0.0036634206771850586, -0.003444969654083252, -0.0032265186309814453, -0.0030080676078796387, -0.002789616584777832, -0.0025711655616760254, -0.0023527145385742188, -0.002134263515472412, -0.0019158124923706055, -0.0016973614692687988, -0.0014789104461669922, -0.0012604594230651855, -0.001042008399963379, -0.0008235573768615723, -0.0006051063537597656, -0.000386655330657959, -0.00016820430755615234, 5.02467155456543e-05, 0.00026869773864746094, 0.0004871487617492676, 0.0007055997848510742, 0.0009240508079528809, 0.0011425018310546875, 0.0013609528541564941, 0.0015794038772583008, 0.0017978549003601074, 0.002016305923461914, 0.0022347569465637207, 0.0024532079696655273, 0.002671658992767334, 0.0028901100158691406, 0.0031085610389709473, 0.003327012062072754, 0.0035454630851745605, 0.003763914108276367, 0.003982365131378174, 0.0042008161544799805, 0.004419267177581787, 0.004637718200683594, 0.0048561692237854, 0.005074620246887207, 0.005293071269989014, 0.00551152229309082, 0.005729973316192627, 0.005948424339294434, 0.00616687536239624, 0.006385326385498047, 0.0066037774085998535, 0.00682222843170166, 0.007040679454803467, 0.0072591304779052734, 0.00747758150100708, 0.007696032524108887, 0.007914483547210693, 0.0081329345703125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 2.0, 7.0, 7.0, 7.0, 8.0, 6.0, 8.0, 11.0, 22.0, 24.0, 21.0, 26.0, 50.0, 56.0, 104.0, 163.0, 290.0, 662.0, 17858.0, 1025351.0, 2771.0, 440.0, 228.0, 131.0, 78.0, 51.0, 44.0, 27.0, 21.0, 14.0, 13.0, 16.0, 10.0, 6.0, 3.0, 3.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1771240234375, -0.1723785400390625, -0.167633056640625, -0.1628875732421875, -0.15814208984375, -0.1533966064453125, -0.148651123046875, -0.1439056396484375, -0.13916015625, -0.1344146728515625, -0.129669189453125, -0.1249237060546875, -0.12017822265625, -0.1154327392578125, -0.110687255859375, -0.1059417724609375, -0.1011962890625, -0.0964508056640625, -0.091705322265625, -0.0869598388671875, -0.08221435546875, -0.0774688720703125, -0.072723388671875, -0.0679779052734375, -0.063232421875, -0.0584869384765625, -0.053741455078125, -0.0489959716796875, -0.04425048828125, -0.0395050048828125, -0.034759521484375, -0.0300140380859375, -0.0252685546875, -0.0205230712890625, -0.015777587890625, -0.0110321044921875, -0.00628662109375, -0.0015411376953125, 0.003204345703125, 0.0079498291015625, 0.0126953125, 0.0174407958984375, 0.022186279296875, 0.0269317626953125, 0.03167724609375, 0.0364227294921875, 0.041168212890625, 0.0459136962890625, 0.0506591796875, 0.0554046630859375, 0.060150146484375, 0.0648956298828125, 0.06964111328125, 0.0743865966796875, 0.079132080078125, 0.0838775634765625, 0.088623046875, 0.0933685302734375, 0.098114013671875, 0.1028594970703125, 0.10760498046875, 0.1123504638671875, 0.117095947265625, 0.1218414306640625, 0.1265869140625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 10.0, 827.0, 174.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014397669583559036, -0.011411639861762524, -0.008425610139966011, -0.0054395804181694984, -0.002453550696372986, 0.0005324790254235268, 0.0035185087472200394, 0.006504539400339127, 0.009490568190813065, 0.012476597912609577, 0.01546262763440609, 0.018448658287525177, 0.021434687077999115, 0.024420715868473053, 0.02740674652159214, 0.030392777174711227, 0.033378805965185165, 0.0363648347556591, 0.03935086727142334, 0.04233689606189728, 0.045322924852371216, 0.048308953642845154, 0.05129498243331909, 0.05428101494908333, 0.057267043739557266, 0.060253072530031204, 0.06323910504579544, 0.06622513383626938, 0.06921116262674332, 0.07219719141721725, 0.07518322020769119, 0.07816925644874573, 0.08115528523921967, 0.0841413140296936, 0.08712734282016754, 0.09011337161064148, 0.09309940040111542, 0.09608543664216995, 0.09907146543264389, 0.10205749422311783, 0.10504352301359177, 0.1080295518040657, 0.11101558059453964, 0.11400160938501358, 0.11698764562606812, 0.11997367441654205, 0.12295970320701599, 0.12594573199748993, 0.12893176078796387, 0.1319177895784378, 0.13490381836891174, 0.13788984715938568, 0.14087587594985962, 0.14386190474033356, 0.1468479335308075, 0.14983397722244263, 0.15281999111175537, 0.1558060199022293, 0.15879204869270325, 0.16177807748317719, 0.16476410627365112, 0.16775013506412506, 0.170736163854599, 0.17372220754623413, 0.17670823633670807]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 10.0, 9.0, 14.0, 17.0, 21.0, 15.0, 18.0, 29.0, 34.0, 31.0, 40.0, 40.0, 32.0, 42.0, 55.0, 46.0, 65.0, 47.0, 42.0, 41.0, 43.0, 35.0, 27.0, 45.0, 24.0, 38.0, 20.0, 24.0, 17.0, 17.0, 13.0, 5.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.008141040802001953, -0.00790256354957819, -0.007664086297154427, -0.007425609044730663, -0.0071871317923069, -0.006948654539883137, -0.0067101772874593735, -0.00647170003503561, -0.006233222782611847, -0.005994745530188084, -0.00575626827776432, -0.005517791025340557, -0.005279313772916794, -0.0050408365204930305, -0.004802359268069267, -0.004563882015645504, -0.004325404763221741, -0.0040869275107979774, -0.003848450258374214, -0.003609973005950451, -0.0033714957535266876, -0.0031330185011029243, -0.002894541248679161, -0.002656063996255398, -0.0024175867438316345, -0.0021791094914078712, -0.001940632238984108, -0.0017021549865603447, -0.0014636777341365814, -0.0012252004817128181, -0.0009867232292890549, -0.0007482459768652916, -0.0005097687244415283, -0.00027129147201776505, -3.281421959400177e-05, 0.0002056630328297615, 0.0004441402852535248, 0.0006826175376772881, 0.0009210947901010513, 0.0011595720425248146, 0.0013980492949485779, 0.0016365265473723412, 0.0018750037997961044, 0.0021134810522198677, 0.002351958304643631, 0.0025904355570673943, 0.0028289128094911575, 0.003067390061914921, 0.003305867314338684, 0.0035443445667624474, 0.0037828218191862106, 0.004021299071609974, 0.004259776324033737, 0.0044982535764575005, 0.004736730828881264, 0.004975208081305027, 0.00521368533372879, 0.0054521625861525536, 0.005690639838576317, 0.00592911709100008, 0.006167594343423843, 0.006406071595847607, 0.00664454884827137, 0.006883026100695133, 0.0071215033531188965]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 5.0, 11.0, 11.0, 4.0, 8.0, 11.0, 14.0, 19.0, 18.0, 13.0, 18.0, 27.0, 28.0, 30.0, 27.0, 28.0, 34.0, 39.0, 46.0, 26.0, 38.0, 33.0, 33.0, 31.0, 41.0, 39.0, 35.0, 33.0, 30.0, 29.0, 24.0, 31.0, 20.0, 24.0, 20.0, 16.0, 21.0, 18.0, 11.0, 8.0, 5.0, 10.0, 8.0, 9.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.421875, -6.20123291015625, -5.9805908203125, -5.75994873046875, -5.539306640625, -5.31866455078125, -5.0980224609375, -4.87738037109375, -4.65673828125, -4.43609619140625, -4.2154541015625, -3.99481201171875, -3.774169921875, -3.55352783203125, -3.3328857421875, -3.11224365234375, -2.8916015625, -2.67095947265625, -2.4503173828125, -2.22967529296875, -2.009033203125, -1.78839111328125, -1.5677490234375, -1.34710693359375, -1.12646484375, -0.90582275390625, -0.6851806640625, -0.46453857421875, -0.243896484375, -0.02325439453125, 0.1973876953125, 0.41802978515625, 0.638671875, 0.85931396484375, 1.0799560546875, 1.30059814453125, 1.521240234375, 1.74188232421875, 1.9625244140625, 2.18316650390625, 2.40380859375, 2.62445068359375, 2.8450927734375, 3.06573486328125, 3.286376953125, 3.50701904296875, 3.7276611328125, 3.94830322265625, 4.1689453125, 4.38958740234375, 4.6102294921875, 4.83087158203125, 5.051513671875, 5.27215576171875, 5.4927978515625, 5.71343994140625, 5.93408203125, 6.15472412109375, 6.3753662109375, 6.59600830078125, 6.816650390625, 7.03729248046875, 7.2579345703125, 7.47857666015625, 7.69921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 8.0, 10.0, 11.0, 24.0, 26.0, 23.0, 39.0, 58.0, 106.0, 136.0, 215.0, 321.0, 520.0, 832.0, 1446.0, 2472.0, 4493.0, 7876.0, 14020.0, 25295.0, 47566.0, 97934.0, 269070.0, 334527.0, 119451.0, 55660.0, 29183.0, 16188.0, 8993.0, 4998.0, 2879.0, 1558.0, 999.0, 590.0, 322.0, 214.0, 142.0, 106.0, 74.0, 44.0, 27.0, 24.0, 19.0, 15.0, 16.0, 8.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.765625, -9.4615478515625, -9.157470703125, -8.8533935546875, -8.54931640625, -8.2452392578125, -7.941162109375, -7.6370849609375, -7.3330078125, -7.0289306640625, -6.724853515625, -6.4207763671875, -6.11669921875, -5.8126220703125, -5.508544921875, -5.2044677734375, -4.900390625, -4.5963134765625, -4.292236328125, -3.9881591796875, -3.68408203125, -3.3800048828125, -3.075927734375, -2.7718505859375, -2.4677734375, -2.1636962890625, -1.859619140625, -1.5555419921875, -1.25146484375, -0.9473876953125, -0.643310546875, -0.3392333984375, -0.03515625, 0.2689208984375, 0.572998046875, 0.8770751953125, 1.18115234375, 1.4852294921875, 1.789306640625, 2.0933837890625, 2.3974609375, 2.7015380859375, 3.005615234375, 3.3096923828125, 3.61376953125, 3.9178466796875, 4.221923828125, 4.5260009765625, 4.830078125, 5.1341552734375, 5.438232421875, 5.7423095703125, 6.04638671875, 6.3504638671875, 6.654541015625, 6.9586181640625, 7.2626953125, 7.5667724609375, 7.870849609375, 8.1749267578125, 8.47900390625, 8.7830810546875, 9.087158203125, 9.3912353515625, 9.6953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 4.0, 9.0, 13.0, 15.0, 10.0, 10.0, 20.0, 35.0, 26.0, 29.0, 45.0, 45.0, 79.0, 73.0, 118.0, 229.0, 1427.0, 285.0, 133.0, 95.0, 58.0, 49.0, 44.0, 45.0, 30.0, 20.0, 29.0, 17.0, 16.0, 12.0, 4.0, 7.0, 5.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.875, -28.08740234375, -27.2998046875, -26.51220703125, -25.724609375, -24.93701171875, -24.1494140625, -23.36181640625, -22.57421875, -21.78662109375, -20.9990234375, -20.21142578125, -19.423828125, -18.63623046875, -17.8486328125, -17.06103515625, -16.2734375, -15.48583984375, -14.6982421875, -13.91064453125, -13.123046875, -12.33544921875, -11.5478515625, -10.76025390625, -9.97265625, -9.18505859375, -8.3974609375, -7.60986328125, -6.822265625, -6.03466796875, -5.2470703125, -4.45947265625, -3.671875, -2.88427734375, -2.0966796875, -1.30908203125, -0.521484375, 0.26611328125, 1.0537109375, 1.84130859375, 2.62890625, 3.41650390625, 4.2041015625, 4.99169921875, 5.779296875, 6.56689453125, 7.3544921875, 8.14208984375, 8.9296875, 9.71728515625, 10.5048828125, 11.29248046875, 12.080078125, 12.86767578125, 13.6552734375, 14.44287109375, 15.23046875, 16.01806640625, 16.8056640625, 17.59326171875, 18.380859375, 19.16845703125, 19.9560546875, 20.74365234375, 21.53125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 10.0, 16.0, 13.0, 19.0, 38.0, 54.0, 81.0, 126.0, 264.0, 530.0, 2392.0, 45421.0, 2986647.0, 104784.0, 3847.0, 692.0, 282.0, 171.0, 91.0, 71.0, 38.0, 33.0, 15.0, 18.0, 9.0, 9.0, 6.0, 3.0, 4.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.84375, -45.01416015625, -43.1845703125, -41.35498046875, -39.525390625, -37.69580078125, -35.8662109375, -34.03662109375, -32.20703125, -30.37744140625, -28.5478515625, -26.71826171875, -24.888671875, -23.05908203125, -21.2294921875, -19.39990234375, -17.5703125, -15.74072265625, -13.9111328125, -12.08154296875, -10.251953125, -8.42236328125, -6.5927734375, -4.76318359375, -2.93359375, -1.10400390625, 0.7255859375, 2.55517578125, 4.384765625, 6.21435546875, 8.0439453125, 9.87353515625, 11.703125, 13.53271484375, 15.3623046875, 17.19189453125, 19.021484375, 20.85107421875, 22.6806640625, 24.51025390625, 26.33984375, 28.16943359375, 29.9990234375, 31.82861328125, 33.658203125, 35.48779296875, 37.3173828125, 39.14697265625, 40.9765625, 42.80615234375, 44.6357421875, 46.46533203125, 48.294921875, 50.12451171875, 51.9541015625, 53.78369140625, 55.61328125, 57.44287109375, 59.2724609375, 61.10205078125, 62.931640625, 64.76123046875, 66.5908203125, 68.42041015625, 70.25]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [2.0, 14.0, 128.0, 511.0, 313.0, 45.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.04140853881836, -16.901386260986328, -10.761363983154297, -4.621341705322266, 1.5186805725097656, 7.658702850341797, 13.798725128173828, 19.93874740600586, 26.07876968383789, 32.21879196166992, 38.35881423950195, 44.498836517333984, 50.638858795166016, 56.77888107299805, 62.91890335083008, 69.05892944335938, 75.19894409179688, 81.3389663696289, 87.47898864746094, 93.61901092529297, 99.759033203125, 105.89905548095703, 112.03907775878906, 118.1791000366211, 124.31912231445312, 130.45913696289062, 136.5991668701172, 142.73919677734375, 148.87921142578125, 155.01922607421875, 161.1592559814453, 167.29928588867188, 173.43930053710938, 179.57931518554688, 185.71934509277344, 191.859375, 197.9993896484375, 204.139404296875, 210.27943420410156, 216.41946411132812, 222.55947875976562, 228.69949340820312, 234.8395233154297, 240.97955322265625, 247.11956787109375, 253.25958251953125, 259.39959716796875, 265.5396423339844, 271.6796569824219, 277.8196716308594, 283.959716796875, 290.0997314453125, 296.23974609375, 302.3797607421875, 308.519775390625, 314.6598205566406, 320.7998352050781, 326.9398498535156, 333.07989501953125, 339.21990966796875, 345.35992431640625, 351.49993896484375, 357.63995361328125, 363.7799987792969, 369.9200134277344]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 10.0, 8.0, 3.0, 12.0, 13.0, 9.0, 19.0, 19.0, 25.0, 24.0, 27.0, 32.0, 31.0, 29.0, 31.0, 45.0, 42.0, 41.0, 47.0, 39.0, 46.0, 48.0, 41.0, 35.0, 40.0, 40.0, 28.0, 30.0, 15.0, 28.0, 20.0, 16.0, 18.0, 13.0, 14.0, 8.0, 10.0, 9.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.911376953125, -43.43986129760742, -41.96834182739258, -40.496826171875, -39.02531051635742, -37.553794860839844, -36.082275390625, -34.61075973510742, -33.139244079589844, -31.667726516723633, -30.196210861206055, -28.724693298339844, -27.253177642822266, -25.781660079956055, -24.310142517089844, -22.838626861572266, -21.367107391357422, -19.89558982849121, -18.424074172973633, -16.952556610107422, -15.481040000915527, -14.009523391723633, -12.538005828857422, -11.066489219665527, -9.594972610473633, -8.123456001281738, -6.6519389152526855, -5.180421829223633, -3.7089052200317383, -2.2373886108398438, -0.7658710479736328, 0.7056455612182617, 2.1771621704101562, 3.64867901802063, 5.1201958656311035, 6.591712951660156, 8.06322956085205, 9.534746170043945, 11.006263732910156, 12.47778034210205, 13.949296951293945, 15.42081356048584, 16.892330169677734, 18.363847732543945, 19.835365295410156, 21.306880950927734, 22.778398513793945, 24.249916076660156, 25.721431732177734, 27.192949295043945, 28.664464950561523, 30.135982513427734, 31.607498168945312, 33.079017639160156, 34.550533294677734, 36.02204895019531, 37.493568420410156, 38.965084075927734, 40.43660354614258, 41.908119201660156, 43.379634857177734, 44.85115051269531, 46.322669982910156, 47.794185638427734, 49.26570129394531]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 5.0, 6.0, 6.0, 7.0, 4.0, 9.0, 12.0, 9.0, 15.0, 13.0, 13.0, 12.0, 25.0, 23.0, 22.0, 18.0, 31.0, 30.0, 27.0, 35.0, 33.0, 40.0, 31.0, 35.0, 25.0, 36.0, 36.0, 38.0, 31.0, 41.0, 27.0, 42.0, 27.0, 26.0, 31.0, 24.0, 17.0, 27.0, 9.0, 19.0, 17.0, 12.0, 14.0, 16.0, 8.0, 6.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.765625, -5.5479736328125, -5.330322265625, -5.1126708984375, -4.89501953125, -4.6773681640625, -4.459716796875, -4.2420654296875, -4.0244140625, -3.8067626953125, -3.589111328125, -3.3714599609375, -3.15380859375, -2.9361572265625, -2.718505859375, -2.5008544921875, -2.283203125, -2.0655517578125, -1.847900390625, -1.6302490234375, -1.41259765625, -1.1949462890625, -0.977294921875, -0.7596435546875, -0.5419921875, -0.3243408203125, -0.106689453125, 0.1109619140625, 0.32861328125, 0.5462646484375, 0.763916015625, 0.9815673828125, 1.19921875, 1.4168701171875, 1.634521484375, 1.8521728515625, 2.06982421875, 2.2874755859375, 2.505126953125, 2.7227783203125, 2.9404296875, 3.1580810546875, 3.375732421875, 3.5933837890625, 3.81103515625, 4.0286865234375, 4.246337890625, 4.4639892578125, 4.681640625, 4.8992919921875, 5.116943359375, 5.3345947265625, 5.55224609375, 5.7698974609375, 5.987548828125, 6.2052001953125, 6.4228515625, 6.6405029296875, 6.858154296875, 7.0758056640625, 7.29345703125, 7.5111083984375, 7.728759765625, 7.9464111328125, 8.1640625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 5.0, 10.0, 14.0, 13.0, 13.0, 20.0, 28.0, 33.0, 47.0, 45.0, 65.0, 102.0, 145.0, 186.0, 250.0, 333.0, 566.0, 8345.0, 4132298.0, 49405.0, 894.0, 405.0, 275.0, 175.0, 152.0, 107.0, 75.0, 48.0, 59.0, 34.0, 17.0, 25.0, 11.0, 7.0, 14.0, 14.0, 9.0, 5.0, 4.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-88.5625, -85.763671875, -82.96484375, -80.166015625, -77.3671875, -74.568359375, -71.76953125, -68.970703125, -66.171875, -63.373046875, -60.57421875, -57.775390625, -54.9765625, -52.177734375, -49.37890625, -46.580078125, -43.78125, -40.982421875, -38.18359375, -35.384765625, -32.5859375, -29.787109375, -26.98828125, -24.189453125, -21.390625, -18.591796875, -15.79296875, -12.994140625, -10.1953125, -7.396484375, -4.59765625, -1.798828125, 1.0, 3.798828125, 6.59765625, 9.396484375, 12.1953125, 14.994140625, 17.79296875, 20.591796875, 23.390625, 26.189453125, 28.98828125, 31.787109375, 34.5859375, 37.384765625, 40.18359375, 42.982421875, 45.78125, 48.580078125, 51.37890625, 54.177734375, 56.9765625, 59.775390625, 62.57421875, 65.373046875, 68.171875, 70.970703125, 73.76953125, 76.568359375, 79.3671875, 82.166015625, 84.96484375, 87.763671875, 90.5625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 9.0, 6.0, 7.0, 22.0, 26.0, 25.0, 35.0, 52.0, 65.0, 89.0, 121.0, 156.0, 272.0, 429.0, 689.0, 703.0, 492.0, 303.0, 194.0, 113.0, 65.0, 57.0, 29.0, 44.0, 19.0, 14.0, 13.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5703125, -15.126708984375, -14.68310546875, -14.239501953125, -13.7958984375, -13.352294921875, -12.90869140625, -12.465087890625, -12.021484375, -11.577880859375, -11.13427734375, -10.690673828125, -10.2470703125, -9.803466796875, -9.35986328125, -8.916259765625, -8.47265625, -8.029052734375, -7.58544921875, -7.141845703125, -6.6982421875, -6.254638671875, -5.81103515625, -5.367431640625, -4.923828125, -4.480224609375, -4.03662109375, -3.593017578125, -3.1494140625, -2.705810546875, -2.26220703125, -1.818603515625, -1.375, -0.931396484375, -0.48779296875, -0.044189453125, 0.3994140625, 0.843017578125, 1.28662109375, 1.730224609375, 2.173828125, 2.617431640625, 3.06103515625, 3.504638671875, 3.9482421875, 4.391845703125, 4.83544921875, 5.279052734375, 5.72265625, 6.166259765625, 6.60986328125, 7.053466796875, 7.4970703125, 7.940673828125, 8.38427734375, 8.827880859375, 9.271484375, 9.715087890625, 10.15869140625, 10.602294921875, 11.0458984375, 11.489501953125, 11.93310546875, 12.376708984375, 12.8203125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 5.0, 7.0, 19.0, 16.0, 19.0, 18.0, 31.0, 42.0, 49.0, 92.0, 190.0, 665.0, 7058.0, 498898.0, 3657580.0, 27584.0, 1331.0, 303.0, 110.0, 63.0, 41.0, 36.0, 29.0, 23.0, 20.0, 11.0, 13.0, 7.0, 10.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.96875, -55.25244140625, -53.5361328125, -51.81982421875, -50.103515625, -48.38720703125, -46.6708984375, -44.95458984375, -43.23828125, -41.52197265625, -39.8056640625, -38.08935546875, -36.373046875, -34.65673828125, -32.9404296875, -31.22412109375, -29.5078125, -27.79150390625, -26.0751953125, -24.35888671875, -22.642578125, -20.92626953125, -19.2099609375, -17.49365234375, -15.77734375, -14.06103515625, -12.3447265625, -10.62841796875, -8.912109375, -7.19580078125, -5.4794921875, -3.76318359375, -2.046875, -0.33056640625, 1.3857421875, 3.10205078125, 4.818359375, 6.53466796875, 8.2509765625, 9.96728515625, 11.68359375, 13.39990234375, 15.1162109375, 16.83251953125, 18.548828125, 20.26513671875, 21.9814453125, 23.69775390625, 25.4140625, 27.13037109375, 28.8466796875, 30.56298828125, 32.279296875, 33.99560546875, 35.7119140625, 37.42822265625, 39.14453125, 40.86083984375, 42.5771484375, 44.29345703125, 46.009765625, 47.72607421875, 49.4423828125, 51.15869140625, 52.875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 14.0, 43.0, 83.0, 168.0, 211.0, 220.0, 128.0, 90.0, 29.0, 13.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.32117462158203, -70.61112976074219, -67.90109252929688, -65.19104766845703, -62.48100280761719, -59.77096176147461, -57.06092071533203, -54.35087585449219, -51.640830993652344, -48.930789947509766, -46.22074508666992, -43.510704040527344, -40.8006591796875, -38.09061813354492, -35.380577087402344, -32.6705322265625, -29.960491180419922, -27.25044822692871, -24.5404052734375, -21.830364227294922, -19.120319366455078, -16.4102783203125, -13.700235366821289, -10.990192413330078, -8.280149459838867, -5.570106506347656, -2.8600640296936035, -0.15002155303955078, 2.56002140045166, 5.270064353942871, 7.980106353759766, 10.690149307250977, 13.400192260742188, 16.1102352142334, 18.82027816772461, 21.530319213867188, 24.24036407470703, 26.95040512084961, 29.66044807434082, 32.37049102783203, 35.080535888671875, 37.79057693481445, 40.5006217956543, 43.210662841796875, 45.92070770263672, 48.6307487487793, 51.340789794921875, 54.05083465576172, 56.7608757019043, 59.470916748046875, 62.18096160888672, 64.89100646972656, 67.60104370117188, 70.31108856201172, 73.02113342285156, 75.73117065429688, 78.44121551513672, 81.15126037597656, 83.86129760742188, 86.57134246826172, 89.28138732910156, 91.9914321899414, 94.70146942138672, 97.41151428222656, 100.1215591430664]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 5.0, 6.0, 10.0, 5.0, 4.0, 9.0, 11.0, 24.0, 13.0, 27.0, 22.0, 20.0, 33.0, 25.0, 29.0, 36.0, 34.0, 29.0, 28.0, 33.0, 41.0, 25.0, 45.0, 39.0, 39.0, 36.0, 30.0, 27.0, 35.0, 25.0, 28.0, 12.0, 24.0, 32.0, 22.0, 23.0, 16.0, 14.0, 16.0, 9.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-35.45603942871094, -34.349205017089844, -33.24237060546875, -32.135536193847656, -31.028701782226562, -29.92186737060547, -28.815034866333008, -27.708200454711914, -26.60136604309082, -25.494531631469727, -24.387697219848633, -23.28086280822754, -22.174030303955078, -21.067195892333984, -19.96036148071289, -18.853527069091797, -17.746692657470703, -16.63985824584961, -15.533023834228516, -14.426190376281738, -13.319355964660645, -12.21252155303955, -11.105688095092773, -9.99885368347168, -8.892019271850586, -7.785184860229492, -6.678350925445557, -5.571516990661621, -4.464682579040527, -3.3578481674194336, -2.251014232635498, -1.1441802978515625, -0.03734588623046875, 1.069488286972046, 2.1763224601745605, 3.283156633377075, 4.38999080657959, 5.496825218200684, 6.603659152984619, 7.710493087768555, 8.817327499389648, 9.924161911010742, 11.030996322631836, 12.137829780578613, 13.244664192199707, 14.3514986038208, 15.458332061767578, 16.565166473388672, 17.672000885009766, 18.77883529663086, 19.885669708251953, 20.992504119873047, 22.09933853149414, 23.206172943115234, 24.313005447387695, 25.41983985900879, 26.526674270629883, 27.633508682250977, 28.74034309387207, 29.847177505493164, 30.954010009765625, 32.06084442138672, 33.16767883300781, 34.274513244628906, 35.38134765625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 2.0, 6.0, 4.0, 6.0, 7.0, 10.0, 10.0, 16.0, 16.0, 13.0, 17.0, 21.0, 28.0, 20.0, 32.0, 37.0, 29.0, 42.0, 31.0, 44.0, 31.0, 35.0, 41.0, 22.0, 43.0, 32.0, 31.0, 40.0, 27.0, 31.0, 35.0, 22.0, 28.0, 30.0, 38.0, 16.0, 19.0, 10.0, 17.0, 17.0, 9.0, 10.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.16796875, -5.95819091796875, -5.7484130859375, -5.53863525390625, -5.328857421875, -5.11907958984375, -4.9093017578125, -4.69952392578125, -4.48974609375, -4.27996826171875, -4.0701904296875, -3.86041259765625, -3.650634765625, -3.44085693359375, -3.2310791015625, -3.02130126953125, -2.8115234375, -2.60174560546875, -2.3919677734375, -2.18218994140625, -1.972412109375, -1.76263427734375, -1.5528564453125, -1.34307861328125, -1.13330078125, -0.92352294921875, -0.7137451171875, -0.50396728515625, -0.294189453125, -0.08441162109375, 0.1253662109375, 0.33514404296875, 0.544921875, 0.75469970703125, 0.9644775390625, 1.17425537109375, 1.384033203125, 1.59381103515625, 1.8035888671875, 2.01336669921875, 2.22314453125, 2.43292236328125, 2.6427001953125, 2.85247802734375, 3.062255859375, 3.27203369140625, 3.4818115234375, 3.69158935546875, 3.9013671875, 4.11114501953125, 4.3209228515625, 4.53070068359375, 4.740478515625, 4.95025634765625, 5.1600341796875, 5.36981201171875, 5.57958984375, 5.78936767578125, 5.9991455078125, 6.20892333984375, 6.418701171875, 6.62847900390625, 6.8382568359375, 7.04803466796875, 7.2578125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 6.0, 14.0, 17.0, 42.0, 51.0, 83.0, 109.0, 154.0, 216.0, 391.0, 557.0, 790.0, 1233.0, 1808.0, 2983.0, 4404.0, 6767.0, 10570.0, 17559.0, 28930.0, 50399.0, 88706.0, 156963.0, 227295.0, 186459.0, 109231.0, 61144.0, 35151.0, 20964.0, 12869.0, 7899.0, 5078.0, 3358.0, 2142.0, 1406.0, 960.0, 602.0, 389.0, 260.0, 176.0, 140.0, 101.0, 61.0, 39.0, 24.0, 16.0, 18.0, 7.0, 4.0, 9.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6142578125, -0.5935592651367188, -0.5728607177734375, -0.5521621704101562, -0.531463623046875, -0.5107650756835938, -0.4900665283203125, -0.46936798095703125, -0.44866943359375, -0.42797088623046875, -0.4072723388671875, -0.38657379150390625, -0.365875244140625, -0.34517669677734375, -0.3244781494140625, -0.30377960205078125, -0.2830810546875, -0.26238250732421875, -0.2416839599609375, -0.22098541259765625, -0.200286865234375, -0.17958831787109375, -0.1588897705078125, -0.13819122314453125, -0.11749267578125, -0.09679412841796875, -0.0760955810546875, -0.05539703369140625, -0.034698486328125, -0.01399993896484375, 0.0066986083984375, 0.02739715576171875, 0.048095703125, 0.06879425048828125, 0.0894927978515625, 0.11019134521484375, 0.130889892578125, 0.15158843994140625, 0.1722869873046875, 0.19298553466796875, 0.21368408203125, 0.23438262939453125, 0.2550811767578125, 0.27577972412109375, 0.296478271484375, 0.31717681884765625, 0.3378753662109375, 0.35857391357421875, 0.3792724609375, 0.39997100830078125, 0.4206695556640625, 0.44136810302734375, 0.462066650390625, 0.48276519775390625, 0.5034637451171875, 0.5241622924804688, 0.54486083984375, 0.5655593872070312, 0.5862579345703125, 0.6069564819335938, 0.627655029296875, 0.6483535766601562, 0.6690521240234375, 0.6897506713867188, 0.71044921875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 3.0, 18.0, 16.0, 17.0, 29.0, 23.0, 25.0, 23.0, 26.0, 37.0, 43.0, 29.0, 28.0, 42.0, 40.0, 42.0, 29.0, 1053.0, 41.0, 33.0, 36.0, 37.0, 35.0, 31.0, 40.0, 25.0, 27.0, 31.0, 23.0, 24.0, 16.0, 12.0, 13.0, 13.0, 10.0, 7.0, 8.0, 3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.3984375, -4.2576904296875, -4.116943359375, -3.9761962890625, -3.83544921875, -3.6947021484375, -3.553955078125, -3.4132080078125, -3.2724609375, -3.1317138671875, -2.990966796875, -2.8502197265625, -2.70947265625, -2.5687255859375, -2.427978515625, -2.2872314453125, -2.146484375, -2.0057373046875, -1.864990234375, -1.7242431640625, -1.58349609375, -1.4427490234375, -1.302001953125, -1.1612548828125, -1.0205078125, -0.8797607421875, -0.739013671875, -0.5982666015625, -0.45751953125, -0.3167724609375, -0.176025390625, -0.0352783203125, 0.10546875, 0.2462158203125, 0.386962890625, 0.5277099609375, 0.66845703125, 0.8092041015625, 0.949951171875, 1.0906982421875, 1.2314453125, 1.3721923828125, 1.512939453125, 1.6536865234375, 1.79443359375, 1.9351806640625, 2.075927734375, 2.2166748046875, 2.357421875, 2.4981689453125, 2.638916015625, 2.7796630859375, 2.92041015625, 3.0611572265625, 3.201904296875, 3.3426513671875, 3.4833984375, 3.6241455078125, 3.764892578125, 3.9056396484375, 4.04638671875, 4.1871337890625, 4.327880859375, 4.4686279296875, 4.609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 9.0, 14.0, 20.0, 29.0, 63.0, 62.0, 85.0, 139.0, 215.0, 360.0, 553.0, 836.0, 1428.0, 2558.0, 4196.0, 7021.0, 12440.0, 21670.0, 38746.0, 68984.0, 121362.0, 192787.0, 1260254.0, 154331.0, 91158.0, 50529.0, 28817.0, 15936.0, 9134.0, 5357.0, 3104.0, 1869.0, 1085.0, 713.0, 426.0, 270.0, 167.0, 141.0, 87.0, 49.0, 31.0, 23.0, 25.0, 14.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.4033203125, -0.3899803161621094, -0.37664031982421875, -0.3633003234863281, -0.3499603271484375, -0.3366203308105469, -0.32328033447265625, -0.3099403381347656, -0.296600341796875, -0.2832603454589844, -0.26992034912109375, -0.2565803527832031, -0.2432403564453125, -0.22990036010742188, -0.21656036376953125, -0.20322036743164062, -0.18988037109375, -0.17654037475585938, -0.16320037841796875, -0.14986038208007812, -0.1365203857421875, -0.12318038940429688, -0.10984039306640625, -0.09650039672851562, -0.083160400390625, -0.06982040405273438, -0.05648040771484375, -0.043140411376953125, -0.0298004150390625, -0.016460418701171875, -0.00312042236328125, 0.010219573974609375, 0.0235595703125, 0.036899566650390625, 0.05023956298828125, 0.06357955932617188, 0.0769195556640625, 0.09025955200195312, 0.10359954833984375, 0.11693954467773438, 0.130279541015625, 0.14361953735351562, 0.15695953369140625, 0.17029953002929688, 0.1836395263671875, 0.19697952270507812, 0.21031951904296875, 0.22365951538085938, 0.23699951171875, 0.2503395080566406, 0.26367950439453125, 0.2770195007324219, 0.2903594970703125, 0.3036994934082031, 0.31703948974609375, 0.3303794860839844, 0.343719482421875, 0.3570594787597656, 0.37039947509765625, 0.3837394714355469, 0.3970794677734375, 0.4104194641113281, 0.42375946044921875, 0.4370994567871094, 0.450439453125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 5.0, 4.0, 4.0, 6.0, 9.0, 15.0, 27.0, 28.0, 40.0, 59.0, 98.0, 129.0, 136.0, 117.0, 81.0, 49.0, 39.0, 33.0, 14.0, 17.0, 8.0, 10.0, 9.0, 5.0, 12.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00666046142578125, -0.006439864635467529, -0.006219267845153809, -0.005998671054840088, -0.005778074264526367, -0.0055574774742126465, -0.005336880683898926, -0.005116283893585205, -0.004895687103271484, -0.004675090312957764, -0.004454493522644043, -0.004233896732330322, -0.0040132999420166016, -0.003792703151702881, -0.00357210636138916, -0.0033515095710754395, -0.0031309127807617188, -0.002910315990447998, -0.0026897192001342773, -0.0024691224098205566, -0.002248525619506836, -0.0020279288291931152, -0.0018073320388793945, -0.0015867352485656738, -0.0013661384582519531, -0.0011455416679382324, -0.0009249448776245117, -0.000704348087310791, -0.0004837512969970703, -0.0002631545066833496, -4.2557716369628906e-05, 0.0001780390739440918, 0.0003986358642578125, 0.0006192326545715332, 0.0008398294448852539, 0.0010604262351989746, 0.0012810230255126953, 0.001501619815826416, 0.0017222166061401367, 0.0019428133964538574, 0.002163410186767578, 0.002384006977081299, 0.0026046037673950195, 0.0028252005577087402, 0.003045797348022461, 0.0032663941383361816, 0.0034869909286499023, 0.003707587718963623, 0.003928184509277344, 0.0041487812995910645, 0.004369378089904785, 0.004589974880218506, 0.0048105716705322266, 0.005031168460845947, 0.005251765251159668, 0.005472362041473389, 0.005692958831787109, 0.00591355562210083, 0.006134152412414551, 0.0063547492027282715, 0.006575345993041992, 0.006795942783355713, 0.007016539573669434, 0.007237136363983154, 0.007457733154296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 4.0, 9.0, 2.0, 5.0, 3.0, 10.0, 4.0, 9.0, 20.0, 16.0, 24.0, 29.0, 27.0, 42.0, 92.0, 119.0, 219.0, 420.0, 2119.0, 967344.0, 76282.0, 949.0, 256.0, 173.0, 122.0, 64.0, 37.0, 29.0, 23.0, 11.0, 13.0, 8.0, 18.0, 14.0, 2.0, 13.0, 5.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1387939453125, -0.13469219207763672, -0.13059043884277344, -0.12648868560791016, -0.12238693237304688, -0.1182851791381836, -0.11418342590332031, -0.11008167266845703, -0.10597991943359375, -0.10187816619873047, -0.09777641296386719, -0.0936746597290039, -0.08957290649414062, -0.08547115325927734, -0.08136940002441406, -0.07726764678955078, -0.0731658935546875, -0.06906414031982422, -0.06496238708496094, -0.060860633850097656, -0.056758880615234375, -0.052657127380371094, -0.04855537414550781, -0.04445362091064453, -0.04035186767578125, -0.03625011444091797, -0.03214836120605469, -0.028046607971191406, -0.023944854736328125, -0.019843101501464844, -0.015741348266601562, -0.011639595031738281, -0.007537841796875, -0.0034360885620117188, 0.0006656646728515625, 0.004767417907714844, 0.008869171142578125, 0.012970924377441406, 0.017072677612304688, 0.02117443084716797, 0.02527618408203125, 0.02937793731689453, 0.03347969055175781, 0.037581443786621094, 0.041683197021484375, 0.045784950256347656, 0.04988670349121094, 0.05398845672607422, 0.0580902099609375, 0.06219196319580078, 0.06629371643066406, 0.07039546966552734, 0.07449722290039062, 0.0785989761352539, 0.08270072937011719, 0.08680248260498047, 0.09090423583984375, 0.09500598907470703, 0.09910774230957031, 0.1032094955444336, 0.10731124877929688, 0.11141300201416016, 0.11551475524902344, 0.11961650848388672, 0.12371826171875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 9.0, 639.0, 369.0], "bins": [-0.16133931279182434, -0.15877553820610046, -0.15621177852153778, -0.1536480039358139, -0.15108422935009003, -0.14852046966552734, -0.14595669507980347, -0.1433929204940796, -0.1408291459083557, -0.13826537132263184, -0.13570161163806915, -0.13313783705234528, -0.1305740624666214, -0.12801030278205872, -0.12544652819633484, -0.12288275361061096, -0.12031899392604828, -0.117755226790905, -0.11519145220518112, -0.11262768507003784, -0.11006391048431396, -0.10750014334917068, -0.1049363762140274, -0.10237260162830353, -0.09980882704257965, -0.09724505990743637, -0.0946812853217125, -0.09211751818656921, -0.08955374360084534, -0.08698997646570206, -0.08442620933055878, -0.0818624347448349, -0.07929866015911102, -0.07673489302396774, -0.07417111843824387, -0.07160735130310059, -0.06904357671737671, -0.06647980958223343, -0.06391604244709015, -0.06135226786136627, -0.05878850072622299, -0.05622472986578941, -0.053660959005355835, -0.051097191870212555, -0.048533421009778976, -0.0459696501493454, -0.04340587928891182, -0.04084210842847824, -0.03827834129333496, -0.03571457043290138, -0.033150799572467804, -0.030587030574679375, -0.028023261576890945, -0.025459490716457367, -0.02289571985602379, -0.02033195085823536, -0.01776817999780178, -0.015204410068690777, -0.012640640139579773, -0.010076869279146194, -0.007513099350035191, -0.004949329420924187, -0.002385558560490608, 0.00017821043729782104, 0.002741981763392687]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 7.0, 5.0, 4.0, 7.0, 5.0, 12.0, 14.0, 18.0, 27.0, 28.0, 23.0, 35.0, 43.0, 36.0, 51.0, 41.0, 48.0, 44.0, 63.0, 49.0, 56.0, 54.0, 48.0, 45.0, 35.0, 48.0, 30.0, 29.0, 19.0, 25.0, 19.0, 11.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0043534040451049805, -0.004136873409152031, -0.003920342773199081, -0.003703812137246132, -0.0034872815012931824, -0.003270750865340233, -0.0030542202293872833, -0.002837689593434334, -0.0026211589574813843, -0.0024046283215284348, -0.0021880976855754852, -0.0019715670496225357, -0.0017550364136695862, -0.0015385057777166367, -0.0013219751417636871, -0.0011054445058107376, -0.0008889138698577881, -0.0006723832339048386, -0.00045585259795188904, -0.00023932196199893951, -2.279132604598999e-05, 0.00019373930990695953, 0.00041026994585990906, 0.0006268005818128586, 0.0008433312177658081, 0.0010598618537187576, 0.0012763924896717072, 0.0014929231256246567, 0.0017094537615776062, 0.0019259843975305557, 0.0021425150334835052, 0.0023590456694364548, 0.0025755763053894043, 0.002792106941342354, 0.0030086375772953033, 0.003225168213248253, 0.0034416988492012024, 0.003658229485154152, 0.0038747601211071014, 0.004091290757060051, 0.0043078213930130005, 0.00452435202896595, 0.0047408826649188995, 0.004957413300871849, 0.005173943936824799, 0.005390474572777748, 0.005607005208730698, 0.005823535844683647, 0.006040066480636597, 0.006256597116589546, 0.006473127752542496, 0.006689658388495445, 0.006906189024448395, 0.007122719660401344, 0.007339250296354294, 0.007555780932307243, 0.007772311568260193, 0.007988842204213142, 0.008205372840166092, 0.008421903476119041, 0.008638434112071991, 0.00885496474802494, 0.00907149538397789, 0.00928802601993084, 0.009504556655883789]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 2.0, 6.0, 4.0, 6.0, 7.0, 10.0, 10.0, 16.0, 16.0, 13.0, 17.0, 21.0, 28.0, 20.0, 32.0, 37.0, 29.0, 42.0, 31.0, 44.0, 31.0, 35.0, 41.0, 22.0, 43.0, 32.0, 31.0, 40.0, 27.0, 31.0, 35.0, 22.0, 28.0, 30.0, 38.0, 16.0, 19.0, 10.0, 17.0, 17.0, 9.0, 10.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.16796875, -5.95819091796875, -5.7484130859375, -5.53863525390625, -5.328857421875, -5.11907958984375, -4.9093017578125, -4.69952392578125, -4.48974609375, -4.27996826171875, -4.0701904296875, -3.86041259765625, -3.650634765625, -3.44085693359375, -3.2310791015625, -3.02130126953125, -2.8115234375, -2.60174560546875, -2.3919677734375, -2.18218994140625, -1.972412109375, -1.76263427734375, -1.5528564453125, -1.34307861328125, -1.13330078125, -0.92352294921875, -0.7137451171875, -0.50396728515625, -0.294189453125, -0.08441162109375, 0.1253662109375, 0.33514404296875, 0.544921875, 0.75469970703125, 0.9644775390625, 1.17425537109375, 1.384033203125, 1.59381103515625, 1.8035888671875, 2.01336669921875, 2.22314453125, 2.43292236328125, 2.6427001953125, 2.85247802734375, 3.062255859375, 3.27203369140625, 3.4818115234375, 3.69158935546875, 3.9013671875, 4.11114501953125, 4.3209228515625, 4.53070068359375, 4.740478515625, 4.95025634765625, 5.1600341796875, 5.36981201171875, 5.57958984375, 5.78936767578125, 5.9991455078125, 6.20892333984375, 6.418701171875, 6.62847900390625, 6.8382568359375, 7.04803466796875, 7.2578125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 3.0, 8.0, 9.0, 15.0, 14.0, 19.0, 22.0, 35.0, 38.0, 66.0, 67.0, 101.0, 132.0, 165.0, 224.0, 276.0, 378.0, 549.0, 718.0, 1145.0, 1855.0, 3342.0, 7058.0, 16014.0, 39882.0, 106195.0, 277568.0, 347094.0, 148032.0, 55233.0, 21858.0, 9311.0, 4417.0, 2229.0, 1315.0, 854.0, 581.0, 443.0, 315.0, 230.0, 180.0, 140.0, 109.0, 69.0, 67.0, 54.0, 34.0, 26.0, 19.0, 11.0, 11.0, 7.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-10.2578125, -9.9287109375, -9.599609375, -9.2705078125, -8.94140625, -8.6123046875, -8.283203125, -7.9541015625, -7.625, -7.2958984375, -6.966796875, -6.6376953125, -6.30859375, -5.9794921875, -5.650390625, -5.3212890625, -4.9921875, -4.6630859375, -4.333984375, -4.0048828125, -3.67578125, -3.3466796875, -3.017578125, -2.6884765625, -2.359375, -2.0302734375, -1.701171875, -1.3720703125, -1.04296875, -0.7138671875, -0.384765625, -0.0556640625, 0.2734375, 0.6025390625, 0.931640625, 1.2607421875, 1.58984375, 1.9189453125, 2.248046875, 2.5771484375, 2.90625, 3.2353515625, 3.564453125, 3.8935546875, 4.22265625, 4.5517578125, 4.880859375, 5.2099609375, 5.5390625, 5.8681640625, 6.197265625, 6.5263671875, 6.85546875, 7.1845703125, 7.513671875, 7.8427734375, 8.171875, 8.5009765625, 8.830078125, 9.1591796875, 9.48828125, 9.8173828125, 10.146484375, 10.4755859375, 10.8046875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 10.0, 4.0, 3.0, 6.0, 10.0, 8.0, 6.0, 16.0, 12.0, 16.0, 22.0, 21.0, 28.0, 37.0, 25.0, 49.0, 63.0, 65.0, 93.0, 198.0, 1378.0, 297.0, 152.0, 115.0, 70.0, 55.0, 49.0, 36.0, 33.0, 29.0, 18.0, 13.0, 25.0, 16.0, 10.0, 16.0, 9.0, 6.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.640625, -16.064453125, -15.48828125, -14.912109375, -14.3359375, -13.759765625, -13.18359375, -12.607421875, -12.03125, -11.455078125, -10.87890625, -10.302734375, -9.7265625, -9.150390625, -8.57421875, -7.998046875, -7.421875, -6.845703125, -6.26953125, -5.693359375, -5.1171875, -4.541015625, -3.96484375, -3.388671875, -2.8125, -2.236328125, -1.66015625, -1.083984375, -0.5078125, 0.068359375, 0.64453125, 1.220703125, 1.796875, 2.373046875, 2.94921875, 3.525390625, 4.1015625, 4.677734375, 5.25390625, 5.830078125, 6.40625, 6.982421875, 7.55859375, 8.134765625, 8.7109375, 9.287109375, 9.86328125, 10.439453125, 11.015625, 11.591796875, 12.16796875, 12.744140625, 13.3203125, 13.896484375, 14.47265625, 15.048828125, 15.625, 16.201171875, 16.77734375, 17.353515625, 17.9296875, 18.505859375, 19.08203125, 19.658203125, 20.234375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 4.0, 6.0, 4.0, 3.0, 9.0, 14.0, 12.0, 30.0, 27.0, 41.0, 51.0, 72.0, 140.0, 241.0, 550.0, 1411.0, 63136.0, 3074326.0, 3984.0, 799.0, 332.0, 172.0, 104.0, 61.0, 36.0, 27.0, 19.0, 18.0, 12.0, 12.0, 9.0, 8.0, 7.0, 10.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.0, -88.263671875, -85.52734375, -82.791015625, -80.0546875, -77.318359375, -74.58203125, -71.845703125, -69.109375, -66.373046875, -63.63671875, -60.900390625, -58.1640625, -55.427734375, -52.69140625, -49.955078125, -47.21875, -44.482421875, -41.74609375, -39.009765625, -36.2734375, -33.537109375, -30.80078125, -28.064453125, -25.328125, -22.591796875, -19.85546875, -17.119140625, -14.3828125, -11.646484375, -8.91015625, -6.173828125, -3.4375, -0.701171875, 2.03515625, 4.771484375, 7.5078125, 10.244140625, 12.98046875, 15.716796875, 18.453125, 21.189453125, 23.92578125, 26.662109375, 29.3984375, 32.134765625, 34.87109375, 37.607421875, 40.34375, 43.080078125, 45.81640625, 48.552734375, 51.2890625, 54.025390625, 56.76171875, 59.498046875, 62.234375, 64.970703125, 67.70703125, 70.443359375, 73.1796875, 75.916015625, 78.65234375, 81.388671875, 84.125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 73.0, 286.0, 397.0, 203.0, 38.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.26974487304688, -195.0447998046875, -189.81983947753906, -184.59487915039062, -179.36993408203125, -174.14498901367188, -168.92002868652344, -163.695068359375, -158.47012329101562, -153.24517822265625, -148.0202178955078, -142.79525756835938, -137.5703125, -132.34536743164062, -127.12040710449219, -121.89545440673828, -116.67050170898438, -111.44554901123047, -106.22059631347656, -100.99564361572266, -95.77069091796875, -90.54573822021484, -85.32078552246094, -80.09583282470703, -74.87088012695312, -69.64592742919922, -64.42097473144531, -59.196022033691406, -53.9710693359375, -48.746116638183594, -43.52116394042969, -38.29621124267578, -33.07124328613281, -27.846290588378906, -22.621337890625, -17.396385192871094, -12.171432495117188, -6.946479797363281, -1.721527099609375, 3.5034255981445312, 8.728378295898438, 13.953330993652344, 19.17828369140625, 24.403236389160156, 29.628189086914062, 34.85314178466797, 40.078094482421875, 45.30304718017578, 50.52799987792969, 55.752952575683594, 60.9779052734375, 66.2028579711914, 71.42781066894531, 76.65276336669922, 81.87771606445312, 87.10266876220703, 92.32762145996094, 97.55257415771484, 102.77752685546875, 108.00247955322266, 113.22743225097656, 118.45238494873047, 123.67733764648438, 128.90228271484375, 134.1272430419922]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 3.0, 13.0, 9.0, 13.0, 18.0, 13.0, 15.0, 17.0, 29.0, 24.0, 31.0, 41.0, 32.0, 32.0, 36.0, 40.0, 39.0, 38.0, 45.0, 44.0, 40.0, 35.0, 47.0, 35.0, 30.0, 33.0, 44.0, 35.0, 21.0, 25.0, 19.0, 11.0, 18.0, 11.0, 8.0, 8.0, 5.0, 8.0, 3.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.414398193359375, -51.74942398071289, -50.08444595336914, -48.419471740722656, -46.754493713378906, -45.08951950073242, -43.42454528808594, -41.75956726074219, -40.09458923339844, -38.42961502075195, -36.7646369934082, -35.09966278076172, -33.43468475341797, -31.769710540771484, -30.104734420776367, -28.43975830078125, -26.774784088134766, -25.10980796813965, -23.44483184814453, -21.779857635498047, -20.114879608154297, -18.449905395507812, -16.784929275512695, -15.119953155517578, -13.454977035522461, -11.790000915527344, -10.125024795532227, -8.460049629211426, -6.795073509216309, -5.130097389221191, -3.4651222229003906, -1.8001461029052734, -0.13516998291015625, 1.5298058986663818, 3.19478178024292, 4.859757423400879, 6.524733543395996, 8.189709663391113, 9.854684829711914, 11.519660949707031, 13.184637069702148, 14.849613189697266, 16.514589309692383, 18.1795654296875, 19.844539642333984, 21.509517669677734, 23.17449188232422, 24.839468002319336, 26.504444122314453, 28.16942024230957, 29.834396362304688, 31.499370574951172, 33.16434860229492, 34.829322814941406, 36.494300842285156, 38.15927505493164, 39.824249267578125, 41.48922348022461, 43.15420150756836, 44.819175720214844, 46.484153747558594, 48.14912796020508, 49.81410217285156, 51.47908020019531, 53.14405822753906]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 2.0, 4.0, 5.0, 2.0, 7.0, 3.0, 5.0, 11.0, 17.0, 13.0, 11.0, 22.0, 20.0, 21.0, 23.0, 34.0, 32.0, 29.0, 42.0, 47.0, 27.0, 42.0, 37.0, 36.0, 32.0, 41.0, 36.0, 41.0, 28.0, 39.0, 30.0, 28.0, 24.0, 28.0, 27.0, 25.0, 21.0, 20.0, 11.0, 21.0, 8.0, 6.0, 6.0, 10.0, 7.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.70703125, -6.498779296875, -6.29052734375, -6.082275390625, -5.8740234375, -5.665771484375, -5.45751953125, -5.249267578125, -5.041015625, -4.832763671875, -4.62451171875, -4.416259765625, -4.2080078125, -3.999755859375, -3.79150390625, -3.583251953125, -3.375, -3.166748046875, -2.95849609375, -2.750244140625, -2.5419921875, -2.333740234375, -2.12548828125, -1.917236328125, -1.708984375, -1.500732421875, -1.29248046875, -1.084228515625, -0.8759765625, -0.667724609375, -0.45947265625, -0.251220703125, -0.04296875, 0.165283203125, 0.37353515625, 0.581787109375, 0.7900390625, 0.998291015625, 1.20654296875, 1.414794921875, 1.623046875, 1.831298828125, 2.03955078125, 2.247802734375, 2.4560546875, 2.664306640625, 2.87255859375, 3.080810546875, 3.2890625, 3.497314453125, 3.70556640625, 3.913818359375, 4.1220703125, 4.330322265625, 4.53857421875, 4.746826171875, 4.955078125, 5.163330078125, 5.37158203125, 5.579833984375, 5.7880859375, 5.996337890625, 6.20458984375, 6.412841796875, 6.62109375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 5.0, 11.0, 14.0, 24.0, 22.0, 39.0, 60.0, 63.0, 118.0, 176.0, 259.0, 388.0, 584.0, 968.0, 1738.0, 3385.0, 8040.0, 23586.0, 105711.0, 654654.0, 2260834.0, 932213.0, 151539.0, 30861.0, 9758.0, 4184.0, 1950.0, 1089.0, 689.0, 428.0, 291.0, 175.0, 108.0, 105.0, 58.0, 41.0, 33.0, 25.0, 24.0, 11.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.171875, -13.7501220703125, -13.328369140625, -12.9066162109375, -12.48486328125, -12.0631103515625, -11.641357421875, -11.2196044921875, -10.7978515625, -10.3760986328125, -9.954345703125, -9.5325927734375, -9.11083984375, -8.6890869140625, -8.267333984375, -7.8455810546875, -7.423828125, -7.0020751953125, -6.580322265625, -6.1585693359375, -5.73681640625, -5.3150634765625, -4.893310546875, -4.4715576171875, -4.0498046875, -3.6280517578125, -3.206298828125, -2.7845458984375, -2.36279296875, -1.9410400390625, -1.519287109375, -1.0975341796875, -0.67578125, -0.2540283203125, 0.167724609375, 0.5894775390625, 1.01123046875, 1.4329833984375, 1.854736328125, 2.2764892578125, 2.6982421875, 3.1199951171875, 3.541748046875, 3.9635009765625, 4.38525390625, 4.8070068359375, 5.228759765625, 5.6505126953125, 6.072265625, 6.4940185546875, 6.915771484375, 7.3375244140625, 7.75927734375, 8.1810302734375, 8.602783203125, 9.0245361328125, 9.4462890625, 9.8680419921875, 10.289794921875, 10.7115478515625, 11.13330078125, 11.5550537109375, 11.976806640625, 12.3985595703125, 12.8203125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 5.0, 7.0, 14.0, 12.0, 15.0, 18.0, 17.0, 37.0, 47.0, 49.0, 80.0, 98.0, 115.0, 130.0, 132.0, 200.0, 295.0, 390.0, 486.0, 405.0, 342.0, 239.0, 185.0, 140.0, 115.0, 96.0, 79.0, 58.0, 50.0, 33.0, 35.0, 33.0, 18.0, 18.0, 14.0, 9.0, 13.0, 10.0, 8.0, 6.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.875, -10.54345703125, -10.2119140625, -9.88037109375, -9.548828125, -9.21728515625, -8.8857421875, -8.55419921875, -8.22265625, -7.89111328125, -7.5595703125, -7.22802734375, -6.896484375, -6.56494140625, -6.2333984375, -5.90185546875, -5.5703125, -5.23876953125, -4.9072265625, -4.57568359375, -4.244140625, -3.91259765625, -3.5810546875, -3.24951171875, -2.91796875, -2.58642578125, -2.2548828125, -1.92333984375, -1.591796875, -1.26025390625, -0.9287109375, -0.59716796875, -0.265625, 0.06591796875, 0.3974609375, 0.72900390625, 1.060546875, 1.39208984375, 1.7236328125, 2.05517578125, 2.38671875, 2.71826171875, 3.0498046875, 3.38134765625, 3.712890625, 4.04443359375, 4.3759765625, 4.70751953125, 5.0390625, 5.37060546875, 5.7021484375, 6.03369140625, 6.365234375, 6.69677734375, 7.0283203125, 7.35986328125, 7.69140625, 8.02294921875, 8.3544921875, 8.68603515625, 9.017578125, 9.34912109375, 9.6806640625, 10.01220703125, 10.34375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 7.0, 13.0, 17.0, 29.0, 32.0, 49.0, 80.0, 162.0, 202.0, 321.0, 605.0, 1006.0, 2054.0, 5953.0, 28126.0, 235036.0, 2785551.0, 1019674.0, 94348.0, 13965.0, 3672.0, 1503.0, 756.0, 452.0, 233.0, 171.0, 101.0, 56.0, 39.0, 20.0, 15.0, 12.0, 8.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.609375, -23.921875, -23.234375, -22.546875, -21.859375, -21.171875, -20.484375, -19.796875, -19.109375, -18.421875, -17.734375, -17.046875, -16.359375, -15.671875, -14.984375, -14.296875, -13.609375, -12.921875, -12.234375, -11.546875, -10.859375, -10.171875, -9.484375, -8.796875, -8.109375, -7.421875, -6.734375, -6.046875, -5.359375, -4.671875, -3.984375, -3.296875, -2.609375, -1.921875, -1.234375, -0.546875, 0.140625, 0.828125, 1.515625, 2.203125, 2.890625, 3.578125, 4.265625, 4.953125, 5.640625, 6.328125, 7.015625, 7.703125, 8.390625, 9.078125, 9.765625, 10.453125, 11.140625, 11.828125, 12.515625, 13.203125, 13.890625, 14.578125, 15.265625, 15.953125, 16.640625, 17.328125, 18.015625, 18.703125, 19.390625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 41.0, 349.0, 502.0, 112.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-443.3281555175781, -434.8367004394531, -426.3452453613281, -417.8537902832031, -409.3623352050781, -400.870849609375, -392.37939453125, -383.887939453125, -375.396484375, -366.905029296875, -358.41357421875, -349.922119140625, -341.4306640625, -332.939208984375, -324.44775390625, -315.9562683105469, -307.46484375, -298.973388671875, -290.48193359375, -281.990478515625, -273.4990234375, -265.007568359375, -256.51611328125, -248.02464294433594, -239.53317260742188, -231.04171752929688, -222.55026245117188, -214.05880737304688, -205.5673370361328, -197.0758819580078, -188.5844268798828, -180.0929718017578, -171.6014862060547, -163.1100311279297, -154.6185760498047, -146.12710571289062, -137.63565063476562, -129.14419555664062, -120.65274047851562, -112.16128540039062, -103.6698226928711, -95.1783676147461, -86.68690490722656, -78.19544982910156, -69.70399475097656, -61.21253204345703, -52.72107696533203, -44.229618072509766, -35.7381591796875, -27.246700286865234, -18.7552433013916, -10.263786315917969, -1.7723274230957031, 6.7191314697265625, 15.210586547851562, 23.702045440673828, 32.193504333496094, 40.68496322631836, 49.176422119140625, 57.667877197265625, 66.15933227539062, 74.65079498291016, 83.14225006103516, 91.63371276855469, 100.12516784667969]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 10.0, 11.0, 11.0, 10.0, 17.0, 24.0, 20.0, 31.0, 23.0, 38.0, 32.0, 34.0, 47.0, 42.0, 42.0, 43.0, 45.0, 41.0, 41.0, 34.0, 41.0, 38.0, 36.0, 27.0, 41.0, 29.0, 29.0, 25.0, 14.0, 19.0, 23.0, 7.0, 9.0, 7.0, 12.0, 10.0, 4.0, 2.0, 3.0, 4.0, 0.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.64564514160156, -40.18769073486328, -38.729732513427734, -37.27177810668945, -35.813819885253906, -34.355865478515625, -32.897911071777344, -31.439952850341797, -29.981996536254883, -28.52404022216797, -27.066083908081055, -25.60812759399414, -24.15017318725586, -22.692214965820312, -21.23426055908203, -19.776304244995117, -18.318347930908203, -16.86039161682129, -15.402435302734375, -13.944479942321777, -12.486523628234863, -11.02856731414795, -9.570611953735352, -8.112655639648438, -6.654699325561523, -5.196743011474609, -3.7387871742248535, -2.2808313369750977, -0.8228750228881836, 0.6350812911987305, 2.093036651611328, 3.550992965698242, 5.008949279785156, 6.46690559387207, 7.924861431121826, 9.382817268371582, 10.840773582458496, 12.29872989654541, 13.756685256958008, 15.214641571044922, 16.672597885131836, 18.13055419921875, 19.588510513305664, 21.046466827392578, 22.50442123413086, 23.962379455566406, 25.420333862304688, 26.8782901763916, 28.336246490478516, 29.79420280456543, 31.252159118652344, 32.710113525390625, 34.16807174682617, 35.62602615356445, 37.083984375, 38.54193878173828, 39.99989318847656, 41.457847595214844, 42.91580581665039, 44.37376022338867, 45.83171844482422, 47.2896728515625, 48.74762725830078, 50.20558547973633, 51.663543701171875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 6.0, 13.0, 7.0, 13.0, 13.0, 22.0, 19.0, 18.0, 19.0, 21.0, 35.0, 34.0, 29.0, 42.0, 34.0, 39.0, 49.0, 54.0, 53.0, 32.0, 50.0, 37.0, 45.0, 29.0, 34.0, 32.0, 36.0, 30.0, 27.0, 24.0, 14.0, 19.0, 8.0, 13.0, 13.0, 9.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.63671875, -5.4522705078125, -5.267822265625, -5.0833740234375, -4.89892578125, -4.7144775390625, -4.530029296875, -4.3455810546875, -4.1611328125, -3.9766845703125, -3.792236328125, -3.6077880859375, -3.42333984375, -3.2388916015625, -3.054443359375, -2.8699951171875, -2.685546875, -2.5010986328125, -2.316650390625, -2.1322021484375, -1.94775390625, -1.7633056640625, -1.578857421875, -1.3944091796875, -1.2099609375, -1.0255126953125, -0.841064453125, -0.6566162109375, -0.47216796875, -0.2877197265625, -0.103271484375, 0.0811767578125, 0.265625, 0.4500732421875, 0.634521484375, 0.8189697265625, 1.00341796875, 1.1878662109375, 1.372314453125, 1.5567626953125, 1.7412109375, 1.9256591796875, 2.110107421875, 2.2945556640625, 2.47900390625, 2.6634521484375, 2.847900390625, 3.0323486328125, 3.216796875, 3.4012451171875, 3.585693359375, 3.7701416015625, 3.95458984375, 4.1390380859375, 4.323486328125, 4.5079345703125, 4.6923828125, 4.8768310546875, 5.061279296875, 5.2457275390625, 5.43017578125, 5.6146240234375, 5.799072265625, 5.9835205078125, 6.16796875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 5.0, 6.0, 9.0, 16.0, 18.0, 29.0, 24.0, 35.0, 48.0, 76.0, 98.0, 131.0, 190.0, 264.0, 376.0, 589.0, 822.0, 1234.0, 1711.0, 2715.0, 3820.0, 5561.0, 8683.0, 13720.0, 21000.0, 33340.0, 53966.0, 90612.0, 153597.0, 216819.0, 171596.0, 102103.0, 60817.0, 37320.0, 23240.0, 14799.0, 9532.0, 6319.0, 4241.0, 2880.0, 1925.0, 1283.0, 861.0, 662.0, 444.0, 276.0, 208.0, 164.0, 100.0, 74.0, 53.0, 37.0, 33.0, 28.0, 11.0, 17.0, 16.0, 6.0, 4.0, 3.0, 2.0], "bins": [-0.492919921875, -0.47780609130859375, -0.4626922607421875, -0.44757843017578125, -0.432464599609375, -0.41735076904296875, -0.4022369384765625, -0.38712310791015625, -0.37200927734375, -0.35689544677734375, -0.3417816162109375, -0.32666778564453125, -0.311553955078125, -0.29644012451171875, -0.2813262939453125, -0.26621246337890625, -0.2510986328125, -0.23598480224609375, -0.2208709716796875, -0.20575714111328125, -0.190643310546875, -0.17552947998046875, -0.1604156494140625, -0.14530181884765625, -0.13018798828125, -0.11507415771484375, -0.0999603271484375, -0.08484649658203125, -0.069732666015625, -0.05461883544921875, -0.0395050048828125, -0.02439117431640625, -0.00927734375, 0.00583648681640625, 0.0209503173828125, 0.03606414794921875, 0.051177978515625, 0.06629180908203125, 0.0814056396484375, 0.09651947021484375, 0.11163330078125, 0.12674713134765625, 0.1418609619140625, 0.15697479248046875, 0.172088623046875, 0.18720245361328125, 0.2023162841796875, 0.21743011474609375, 0.2325439453125, 0.24765777587890625, 0.2627716064453125, 0.27788543701171875, 0.292999267578125, 0.30811309814453125, 0.3232269287109375, 0.33834075927734375, 0.35345458984375, 0.36856842041015625, 0.3836822509765625, 0.39879608154296875, 0.413909912109375, 0.42902374267578125, 0.4441375732421875, 0.45925140380859375, 0.474365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 5.0, 6.0, 3.0, 9.0, 9.0, 13.0, 10.0, 18.0, 20.0, 16.0, 26.0, 28.0, 28.0, 25.0, 37.0, 30.0, 35.0, 42.0, 35.0, 46.0, 26.0, 1064.0, 48.0, 43.0, 24.0, 45.0, 44.0, 28.0, 36.0, 26.0, 28.0, 23.0, 23.0, 23.0, 22.0, 20.0, 7.0, 16.0, 8.0, 8.0, 5.0, 2.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.5447998046875, -3.433349609375, -3.3218994140625, -3.21044921875, -3.0989990234375, -2.987548828125, -2.8760986328125, -2.7646484375, -2.6531982421875, -2.541748046875, -2.4302978515625, -2.31884765625, -2.2073974609375, -2.095947265625, -1.9844970703125, -1.873046875, -1.7615966796875, -1.650146484375, -1.5386962890625, -1.42724609375, -1.3157958984375, -1.204345703125, -1.0928955078125, -0.9814453125, -0.8699951171875, -0.758544921875, -0.6470947265625, -0.53564453125, -0.4241943359375, -0.312744140625, -0.2012939453125, -0.08984375, 0.0216064453125, 0.133056640625, 0.2445068359375, 0.35595703125, 0.4674072265625, 0.578857421875, 0.6903076171875, 0.8017578125, 0.9132080078125, 1.024658203125, 1.1361083984375, 1.24755859375, 1.3590087890625, 1.470458984375, 1.5819091796875, 1.693359375, 1.8048095703125, 1.916259765625, 2.0277099609375, 2.13916015625, 2.2506103515625, 2.362060546875, 2.4735107421875, 2.5849609375, 2.6964111328125, 2.807861328125, 2.9193115234375, 3.03076171875, 3.1422119140625, 3.253662109375, 3.3651123046875, 3.4765625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 11.0, 10.0, 33.0, 28.0, 57.0, 94.0, 127.0, 223.0, 362.0, 703.0, 1350.0, 2565.0, 5608.0, 12182.0, 27628.0, 62727.0, 143149.0, 1307199.0, 294830.0, 133319.0, 58217.0, 25019.0, 11262.0, 5144.0, 2479.0, 1218.0, 658.0, 382.0, 203.0, 134.0, 69.0, 52.0, 36.0, 12.0, 12.0, 7.0, 2.0, 1.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5373611450195312, -0.5219879150390625, -0.5066146850585938, -0.491241455078125, -0.47586822509765625, -0.4604949951171875, -0.44512176513671875, -0.42974853515625, -0.41437530517578125, -0.3990020751953125, -0.38362884521484375, -0.368255615234375, -0.35288238525390625, -0.3375091552734375, -0.32213592529296875, -0.3067626953125, -0.29138946533203125, -0.2760162353515625, -0.26064300537109375, -0.245269775390625, -0.22989654541015625, -0.2145233154296875, -0.19915008544921875, -0.18377685546875, -0.16840362548828125, -0.1530303955078125, -0.13765716552734375, -0.122283935546875, -0.10691070556640625, -0.0915374755859375, -0.07616424560546875, -0.060791015625, -0.04541778564453125, -0.0300445556640625, -0.01467132568359375, 0.000701904296875, 0.01607513427734375, 0.0314483642578125, 0.04682159423828125, 0.06219482421875, 0.07756805419921875, 0.0929412841796875, 0.10831451416015625, 0.123687744140625, 0.13906097412109375, 0.1544342041015625, 0.16980743408203125, 0.1851806640625, 0.20055389404296875, 0.2159271240234375, 0.23130035400390625, 0.246673583984375, 0.26204681396484375, 0.2774200439453125, 0.29279327392578125, 0.30816650390625, 0.32353973388671875, 0.3389129638671875, 0.35428619384765625, 0.369659423828125, 0.38503265380859375, 0.4004058837890625, 0.41577911376953125, 0.43115234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 14.0, 8.0, 15.0, 12.0, 23.0, 24.0, 38.0, 40.0, 47.0, 58.0, 71.0, 74.0, 82.0, 80.0, 85.0, 61.0, 39.0, 39.0, 38.0, 31.0, 31.0, 12.0, 14.0, 16.0, 8.0, 6.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002758026123046875, -0.0026808083057403564, -0.002603590488433838, -0.0025263726711273193, -0.0024491548538208008, -0.0023719370365142822, -0.0022947192192077637, -0.002217501401901245, -0.0021402835845947266, -0.002063065767288208, -0.0019858479499816895, -0.001908630132675171, -0.0018314123153686523, -0.0017541944980621338, -0.0016769766807556152, -0.0015997588634490967, -0.0015225410461425781, -0.0014453232288360596, -0.001368105411529541, -0.0012908875942230225, -0.001213669776916504, -0.0011364519596099854, -0.0010592341423034668, -0.0009820163249969482, -0.0009047985076904297, -0.0008275806903839111, -0.0007503628730773926, -0.000673145055770874, -0.0005959272384643555, -0.0005187094211578369, -0.00044149160385131836, -0.0003642737865447998, -0.00028705596923828125, -0.0002098381519317627, -0.00013262033462524414, -5.5402517318725586e-05, 2.181529998779297e-05, 9.903311729431152e-05, 0.00017625093460083008, 0.00025346875190734863, 0.0003306865692138672, 0.00040790438652038574, 0.0004851222038269043, 0.0005623400211334229, 0.0006395578384399414, 0.00071677565574646, 0.0007939934730529785, 0.0008712112903594971, 0.0009484291076660156, 0.0010256469249725342, 0.0011028647422790527, 0.0011800825595855713, 0.0012573003768920898, 0.0013345181941986084, 0.001411736011505127, 0.0014889538288116455, 0.001566171646118164, 0.0016433894634246826, 0.0017206072807312012, 0.0017978250980377197, 0.0018750429153442383, 0.0019522607326507568, 0.0020294785499572754, 0.002106696367263794, 0.0021839141845703125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 7.0, 8.0, 7.0, 14.0, 14.0, 19.0, 25.0, 37.0, 58.0, 52.0, 87.0, 116.0, 135.0, 245.0, 461.0, 1899.0, 42471.0, 968841.0, 31195.0, 1601.0, 413.0, 222.0, 160.0, 111.0, 77.0, 51.0, 56.0, 31.0, 27.0, 24.0, 22.0, 13.0, 10.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.036834716796875, -0.03554058074951172, -0.03424644470214844, -0.032952308654785156, -0.031658172607421875, -0.030364036560058594, -0.029069900512695312, -0.02777576446533203, -0.02648162841796875, -0.02518749237060547, -0.023893356323242188, -0.022599220275878906, -0.021305084228515625, -0.020010948181152344, -0.018716812133789062, -0.01742267608642578, -0.0161285400390625, -0.014834403991699219, -0.013540267944335938, -0.012246131896972656, -0.010951995849609375, -0.009657859802246094, -0.008363723754882812, -0.007069587707519531, -0.00577545166015625, -0.004481315612792969, -0.0031871795654296875, -0.0018930435180664062, -0.000598907470703125, 0.0006952285766601562, 0.0019893646240234375, 0.0032835006713867188, 0.00457763671875, 0.005871772766113281, 0.0071659088134765625, 0.008460044860839844, 0.009754180908203125, 0.011048316955566406, 0.012342453002929688, 0.013636589050292969, 0.01493072509765625, 0.01622486114501953, 0.017518997192382812, 0.018813133239746094, 0.020107269287109375, 0.021401405334472656, 0.022695541381835938, 0.02398967742919922, 0.0252838134765625, 0.02657794952392578, 0.027872085571289062, 0.029166221618652344, 0.030460357666015625, 0.031754493713378906, 0.03304862976074219, 0.03434276580810547, 0.03563690185546875, 0.03693103790283203, 0.03822517395019531, 0.039519309997558594, 0.040813446044921875, 0.042107582092285156, 0.04340171813964844, 0.04469585418701172, 0.045989990234375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 8.0, 27.0, 133.0, 548.0, 244.0, 42.0, 12.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008036607876420021, -0.007628250867128372, -0.007219893392175436, -0.0068115359172225, -0.006403178907930851, -0.005994821898639202, -0.005586464423686266, -0.00517810694873333, -0.004769749939441681, -0.004361392930150032, -0.003953035455197096, -0.0035446782130748034, -0.003136320970952511, -0.0027279637288302183, -0.002319606486707926, -0.0019112492445856333, -0.0015028920024633408, -0.0010945347603410482, -0.0006861775182187557, -0.0002778202760964632, 0.00013053696602582932, 0.0005388942081481218, 0.0009472514502704144, 0.0013556086923927069, 0.0017639659345149994, 0.002172323176637292, 0.0025806804187595844, 0.002989037660881877, 0.0033973949030041695, 0.003805752145126462, 0.0042141093872487545, 0.004622466862201691, 0.0050308238714933395, 0.005439180880784988, 0.005847538355737925, 0.006255895830690861, 0.00666425283998251, 0.0070726098492741585, 0.007480967324227095, 0.00788932479918003, 0.00829768180847168, 0.008706038817763329, 0.009114395827054977, 0.009522753767669201, 0.00993111077696085, 0.010339467786252499, 0.010747825726866722, 0.011156182736158371, 0.01156453974545002, 0.011972896754741669, 0.012381253764033318, 0.012789611704647541, 0.01319796871393919, 0.013606325723230839, 0.014014683663845062, 0.014423040673136711, 0.01483139768242836, 0.015239754691720009, 0.015648111701011658, 0.016056468710303307, 0.016464825719594955, 0.016873184591531754, 0.017281541600823402, 0.01768989861011505, 0.0180982556194067]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 12.0, 9.0, 14.0, 23.0, 21.0, 29.0, 29.0, 40.0, 34.0, 38.0, 49.0, 45.0, 56.0, 46.0, 45.0, 43.0, 59.0, 50.0, 52.0, 34.0, 34.0, 31.0, 32.0, 25.0, 21.0, 22.0, 18.0, 13.0, 12.0, 7.0, 9.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013741254806518555, -0.0013270238414406776, -0.0012799222022294998, -0.001232820563018322, -0.0011857189238071442, -0.0011386172845959663, -0.0010915156453847885, -0.0010444140061736107, -0.0009973123669624329, -0.000950210727751255, -0.0009031090885400772, -0.0008560074493288994, -0.0008089058101177216, -0.0007618041709065437, -0.0007147025316953659, -0.0006676008924841881, -0.0006204992532730103, -0.0005733976140618324, -0.0005262959748506546, -0.0004791943356394768, -0.00043209269642829895, -0.0003849910572171211, -0.0003378894180059433, -0.00029078777879476547, -0.00024368613958358765, -0.00019658450037240982, -0.000149482861161232, -0.00010238122195005417, -5.527958273887634e-05, -8.177943527698517e-06, 3.892369568347931e-05, 8.602533489465714e-05, 0.00013312697410583496, 0.0001802286133170128, 0.0002273302525281906, 0.00027443189173936844, 0.00032153353095054626, 0.0003686351701617241, 0.0004157368093729019, 0.00046283844858407974, 0.0005099400877952576, 0.0005570417270064354, 0.0006041433662176132, 0.000651245005428791, 0.0006983466446399689, 0.0007454482838511467, 0.0007925499230623245, 0.0008396515622735023, 0.0008867532014846802, 0.000933854840695858, 0.0009809564799070358, 0.0010280581191182137, 0.0010751597583293915, 0.0011222613975405693, 0.0011693630367517471, 0.001216464675962925, 0.0012635663151741028, 0.0013106679543852806, 0.0013577695935964584, 0.0014048712328076363, 0.001451972872018814, 0.001499074511229992, 0.0015461761504411697, 0.0015932777896523476, 0.0016403794288635254]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 6.0, 13.0, 7.0, 13.0, 13.0, 22.0, 19.0, 18.0, 19.0, 21.0, 35.0, 34.0, 29.0, 42.0, 34.0, 39.0, 49.0, 54.0, 53.0, 32.0, 50.0, 37.0, 44.0, 30.0, 34.0, 32.0, 36.0, 30.0, 27.0, 24.0, 14.0, 19.0, 8.0, 14.0, 12.0, 9.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.63671875, -5.4522705078125, -5.267822265625, -5.0833740234375, -4.89892578125, -4.7144775390625, -4.530029296875, -4.3455810546875, -4.1611328125, -3.9766845703125, -3.792236328125, -3.6077880859375, -3.42333984375, -3.2388916015625, -3.054443359375, -2.8699951171875, -2.685546875, -2.5010986328125, -2.316650390625, -2.1322021484375, -1.94775390625, -1.7633056640625, -1.578857421875, -1.3944091796875, -1.2099609375, -1.0255126953125, -0.841064453125, -0.6566162109375, -0.47216796875, -0.2877197265625, -0.103271484375, 0.0811767578125, 0.265625, 0.4500732421875, 0.634521484375, 0.8189697265625, 1.00341796875, 1.1878662109375, 1.372314453125, 1.5567626953125, 1.7412109375, 1.9256591796875, 2.110107421875, 2.2945556640625, 2.47900390625, 2.6634521484375, 2.847900390625, 3.0323486328125, 3.216796875, 3.4012451171875, 3.585693359375, 3.7701416015625, 3.95458984375, 4.1390380859375, 4.323486328125, 4.5079345703125, 4.6923828125, 4.8768310546875, 5.061279296875, 5.2457275390625, 5.43017578125, 5.6146240234375, 5.799072265625, 5.9835205078125, 6.16796875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 6.0, 5.0, 8.0, 10.0, 16.0, 29.0, 24.0, 51.0, 50.0, 63.0, 110.0, 157.0, 237.0, 306.0, 494.0, 722.0, 1174.0, 1929.0, 3918.0, 9680.0, 38327.0, 224194.0, 608634.0, 120740.0, 22940.0, 7001.0, 3046.0, 1624.0, 995.0, 657.0, 414.0, 302.0, 204.0, 137.0, 96.0, 73.0, 47.0, 36.0, 27.0, 21.0, 14.0, 14.0, 11.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-15.0234375, -14.57275390625, -14.1220703125, -13.67138671875, -13.220703125, -12.77001953125, -12.3193359375, -11.86865234375, -11.41796875, -10.96728515625, -10.5166015625, -10.06591796875, -9.615234375, -9.16455078125, -8.7138671875, -8.26318359375, -7.8125, -7.36181640625, -6.9111328125, -6.46044921875, -6.009765625, -5.55908203125, -5.1083984375, -4.65771484375, -4.20703125, -3.75634765625, -3.3056640625, -2.85498046875, -2.404296875, -1.95361328125, -1.5029296875, -1.05224609375, -0.6015625, -0.15087890625, 0.2998046875, 0.75048828125, 1.201171875, 1.65185546875, 2.1025390625, 2.55322265625, 3.00390625, 3.45458984375, 3.9052734375, 4.35595703125, 4.806640625, 5.25732421875, 5.7080078125, 6.15869140625, 6.609375, 7.06005859375, 7.5107421875, 7.96142578125, 8.412109375, 8.86279296875, 9.3134765625, 9.76416015625, 10.21484375, 10.66552734375, 11.1162109375, 11.56689453125, 12.017578125, 12.46826171875, 12.9189453125, 13.36962890625, 13.8203125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 10.0, 5.0, 7.0, 11.0, 14.0, 18.0, 14.0, 22.0, 34.0, 35.0, 31.0, 37.0, 39.0, 53.0, 67.0, 105.0, 169.0, 1381.0, 332.0, 162.0, 96.0, 66.0, 60.0, 45.0, 28.0, 29.0, 22.0, 31.0, 23.0, 17.0, 13.0, 6.0, 14.0, 13.0, 10.0, 5.0, 3.0, 6.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7890625, -12.3614501953125, -11.933837890625, -11.5062255859375, -11.07861328125, -10.6510009765625, -10.223388671875, -9.7957763671875, -9.3681640625, -8.9405517578125, -8.512939453125, -8.0853271484375, -7.65771484375, -7.2301025390625, -6.802490234375, -6.3748779296875, -5.947265625, -5.5196533203125, -5.092041015625, -4.6644287109375, -4.23681640625, -3.8092041015625, -3.381591796875, -2.9539794921875, -2.5263671875, -2.0987548828125, -1.671142578125, -1.2435302734375, -0.81591796875, -0.3883056640625, 0.039306640625, 0.4669189453125, 0.89453125, 1.3221435546875, 1.749755859375, 2.1773681640625, 2.60498046875, 3.0325927734375, 3.460205078125, 3.8878173828125, 4.3154296875, 4.7430419921875, 5.170654296875, 5.5982666015625, 6.02587890625, 6.4534912109375, 6.881103515625, 7.3087158203125, 7.736328125, 8.1639404296875, 8.591552734375, 9.0191650390625, 9.44677734375, 9.8743896484375, 10.302001953125, 10.7296142578125, 11.1572265625, 11.5848388671875, 12.012451171875, 12.4400634765625, 12.86767578125, 13.2952880859375, 13.722900390625, 14.1505126953125, 14.578125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 12.0, 21.0, 17.0, 31.0, 40.0, 52.0, 62.0, 77.0, 144.0, 216.0, 405.0, 925.0, 3883.0, 2859233.0, 276422.0, 2427.0, 754.0, 338.0, 200.0, 119.0, 90.0, 68.0, 38.0, 36.0, 20.0, 13.0, 13.0, 8.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.6875, -58.0693359375, -56.451171875, -54.8330078125, -53.21484375, -51.5966796875, -49.978515625, -48.3603515625, -46.7421875, -45.1240234375, -43.505859375, -41.8876953125, -40.26953125, -38.6513671875, -37.033203125, -35.4150390625, -33.796875, -32.1787109375, -30.560546875, -28.9423828125, -27.32421875, -25.7060546875, -24.087890625, -22.4697265625, -20.8515625, -19.2333984375, -17.615234375, -15.9970703125, -14.37890625, -12.7607421875, -11.142578125, -9.5244140625, -7.90625, -6.2880859375, -4.669921875, -3.0517578125, -1.43359375, 0.1845703125, 1.802734375, 3.4208984375, 5.0390625, 6.6572265625, 8.275390625, 9.8935546875, 11.51171875, 13.1298828125, 14.748046875, 16.3662109375, 17.984375, 19.6025390625, 21.220703125, 22.8388671875, 24.45703125, 26.0751953125, 27.693359375, 29.3115234375, 30.9296875, 32.5478515625, 34.166015625, 35.7841796875, 37.40234375, 39.0205078125, 40.638671875, 42.2568359375, 43.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 39.0, 218.0, 477.0, 225.0, 43.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.8482666015625, -253.8253936767578, -248.80250549316406, -243.77963256835938, -238.7567596435547, -233.73388671875, -228.71099853515625, -223.68812561035156, -218.66525268554688, -213.6423797607422, -208.61949157714844, -203.59661865234375, -198.57374572753906, -193.55087280273438, -188.52798461914062, -183.50511169433594, -178.4822235107422, -173.4593505859375, -168.43646240234375, -163.41358947753906, -158.39071655273438, -153.36782836914062, -148.34495544433594, -143.32208251953125, -138.2991943359375, -133.2763214111328, -128.25343322753906, -123.23056030273438, -118.20768737792969, -113.18480682373047, -108.16192626953125, -103.13905334472656, -98.11618041992188, -93.09329986572266, -88.07042694091797, -83.04754638671875, -78.02467346191406, -73.00179290771484, -67.97891235351562, -62.95603561401367, -57.93315887451172, -52.910282135009766, -47.88740539550781, -42.864524841308594, -37.84164810180664, -32.81877136230469, -27.7958927154541, -22.773014068603516, -17.750137329101562, -12.727259635925293, -7.704381942749023, -2.681504249572754, 2.3413734436035156, 7.364250183105469, 12.387128829956055, 17.41000747680664, 22.432884216308594, 27.455760955810547, 32.4786376953125, 37.50151824951172, 42.52439498901367, 47.547271728515625, 52.570152282714844, 57.5930290222168, 62.61590576171875]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 8.0, 4.0, 2.0, 5.0, 5.0, 10.0, 5.0, 3.0, 5.0, 9.0, 9.0, 17.0, 12.0, 26.0, 17.0, 19.0, 14.0, 26.0, 27.0, 32.0, 38.0, 34.0, 33.0, 40.0, 35.0, 40.0, 35.0, 41.0, 46.0, 46.0, 46.0, 34.0, 37.0, 21.0, 27.0, 21.0, 29.0, 14.0, 25.0, 21.0, 13.0, 9.0, 8.0, 13.0, 4.0, 9.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-37.03619384765625, -35.87750244140625, -34.71881103515625, -33.560115814208984, -32.401424407958984, -31.242733001708984, -30.08403968811035, -28.92534637451172, -27.76665496826172, -26.60796356201172, -25.449270248413086, -24.290576934814453, -23.131885528564453, -21.973194122314453, -20.81450080871582, -19.655807495117188, -18.497116088867188, -17.338424682617188, -16.179731369018555, -15.021039009094238, -13.862346649169922, -12.703654289245605, -11.544961929321289, -10.386269569396973, -9.227577209472656, -8.06888484954834, -6.910192489624023, -5.751500129699707, -4.592807769775391, -3.434115409851074, -2.275423049926758, -1.1167306900024414, 0.041961669921875, 1.2006540298461914, 2.359346389770508, 3.518038749694824, 4.676731109619141, 5.835423469543457, 6.994115829467773, 8.15280818939209, 9.311500549316406, 10.470192909240723, 11.628885269165039, 12.787577629089355, 13.946269989013672, 15.104962348937988, 16.263654708862305, 17.422348022460938, 18.581039428710938, 19.739730834960938, 20.89842414855957, 22.057117462158203, 23.215808868408203, 24.374500274658203, 25.533193588256836, 26.69188690185547, 27.85057830810547, 29.00926971435547, 30.1679630279541, 31.326656341552734, 32.485347747802734, 33.644039154052734, 34.802734375, 35.96142578125, 37.1201171875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 4.0, 10.0, 12.0, 5.0, 9.0, 14.0, 14.0, 20.0, 24.0, 19.0, 22.0, 27.0, 34.0, 42.0, 35.0, 40.0, 52.0, 44.0, 54.0, 61.0, 37.0, 38.0, 38.0, 35.0, 44.0, 24.0, 34.0, 30.0, 29.0, 27.0, 22.0, 18.0, 22.0, 5.0, 8.0, 10.0, 11.0, 4.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.92578125, -6.728271484375, -6.53076171875, -6.333251953125, -6.1357421875, -5.938232421875, -5.74072265625, -5.543212890625, -5.345703125, -5.148193359375, -4.95068359375, -4.753173828125, -4.5556640625, -4.358154296875, -4.16064453125, -3.963134765625, -3.765625, -3.568115234375, -3.37060546875, -3.173095703125, -2.9755859375, -2.778076171875, -2.58056640625, -2.383056640625, -2.185546875, -1.988037109375, -1.79052734375, -1.593017578125, -1.3955078125, -1.197998046875, -1.00048828125, -0.802978515625, -0.60546875, -0.407958984375, -0.21044921875, -0.012939453125, 0.1845703125, 0.382080078125, 0.57958984375, 0.777099609375, 0.974609375, 1.172119140625, 1.36962890625, 1.567138671875, 1.7646484375, 1.962158203125, 2.15966796875, 2.357177734375, 2.5546875, 2.752197265625, 2.94970703125, 3.147216796875, 3.3447265625, 3.542236328125, 3.73974609375, 3.937255859375, 4.134765625, 4.332275390625, 4.52978515625, 4.727294921875, 4.9248046875, 5.122314453125, 5.31982421875, 5.517333984375, 5.71484375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 13.0, 13.0, 27.0, 29.0, 36.0, 56.0, 93.0, 143.0, 195.0, 270.0, 395.0, 608.0, 931.0, 1448.0, 2266.0, 3744.0, 6823.0, 14182.0, 40318.0, 203914.0, 1156844.0, 2081859.0, 541772.0, 91458.0, 23656.0, 9811.0, 5031.0, 2903.0, 1892.0, 1136.0, 713.0, 518.0, 349.0, 269.0, 156.0, 106.0, 86.0, 60.0, 54.0, 25.0, 20.0, 14.0, 11.0, 6.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-11.34375, -11.0220947265625, -10.700439453125, -10.3787841796875, -10.05712890625, -9.7354736328125, -9.413818359375, -9.0921630859375, -8.7705078125, -8.4488525390625, -8.127197265625, -7.8055419921875, -7.48388671875, -7.1622314453125, -6.840576171875, -6.5189208984375, -6.197265625, -5.8756103515625, -5.553955078125, -5.2322998046875, -4.91064453125, -4.5889892578125, -4.267333984375, -3.9456787109375, -3.6240234375, -3.3023681640625, -2.980712890625, -2.6590576171875, -2.33740234375, -2.0157470703125, -1.694091796875, -1.3724365234375, -1.05078125, -0.7291259765625, -0.407470703125, -0.0858154296875, 0.23583984375, 0.5574951171875, 0.879150390625, 1.2008056640625, 1.5224609375, 1.8441162109375, 2.165771484375, 2.4874267578125, 2.80908203125, 3.1307373046875, 3.452392578125, 3.7740478515625, 4.095703125, 4.4173583984375, 4.739013671875, 5.0606689453125, 5.38232421875, 5.7039794921875, 6.025634765625, 6.3472900390625, 6.6689453125, 6.9906005859375, 7.312255859375, 7.6339111328125, 7.95556640625, 8.2772216796875, 8.598876953125, 8.9205322265625, 9.2421875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 17.0, 34.0, 119.0, 282.0, 667.0, 1503.0, 928.0, 333.0, 121.0, 49.0, 24.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.25, -32.2333984375, -31.216796875, -30.2001953125, -29.18359375, -28.1669921875, -27.150390625, -26.1337890625, -25.1171875, -24.1005859375, -23.083984375, -22.0673828125, -21.05078125, -20.0341796875, -19.017578125, -18.0009765625, -16.984375, -15.9677734375, -14.951171875, -13.9345703125, -12.91796875, -11.9013671875, -10.884765625, -9.8681640625, -8.8515625, -7.8349609375, -6.818359375, -5.8017578125, -4.78515625, -3.7685546875, -2.751953125, -1.7353515625, -0.71875, 0.2978515625, 1.314453125, 2.3310546875, 3.34765625, 4.3642578125, 5.380859375, 6.3974609375, 7.4140625, 8.4306640625, 9.447265625, 10.4638671875, 11.48046875, 12.4970703125, 13.513671875, 14.5302734375, 15.546875, 16.5634765625, 17.580078125, 18.5966796875, 19.61328125, 20.6298828125, 21.646484375, 22.6630859375, 23.6796875, 24.6962890625, 25.712890625, 26.7294921875, 27.74609375, 28.7626953125, 29.779296875, 30.7958984375, 31.8125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 16.0, 46.0, 187.0, 697.0, 9060.0, 4161436.0, 21450.0, 1029.0, 243.0, 80.0, 25.0, 11.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.1875, -73.7744140625, -71.361328125, -68.9482421875, -66.53515625, -64.1220703125, -61.708984375, -59.2958984375, -56.8828125, -54.4697265625, -52.056640625, -49.6435546875, -47.23046875, -44.8173828125, -42.404296875, -39.9912109375, -37.578125, -35.1650390625, -32.751953125, -30.3388671875, -27.92578125, -25.5126953125, -23.099609375, -20.6865234375, -18.2734375, -15.8603515625, -13.447265625, -11.0341796875, -8.62109375, -6.2080078125, -3.794921875, -1.3818359375, 1.03125, 3.4443359375, 5.857421875, 8.2705078125, 10.68359375, 13.0966796875, 15.509765625, 17.9228515625, 20.3359375, 22.7490234375, 25.162109375, 27.5751953125, 29.98828125, 32.4013671875, 34.814453125, 37.2275390625, 39.640625, 42.0537109375, 44.466796875, 46.8798828125, 49.29296875, 51.7060546875, 54.119140625, 56.5322265625, 58.9453125, 61.3583984375, 63.771484375, 66.1845703125, 68.59765625, 71.0107421875, 73.423828125, 75.8369140625, 78.25]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 12.0, 37.0, 150.0, 272.0, 280.0, 170.0, 65.0, 18.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-215.133056640625, -211.23463439941406, -207.33621215820312, -203.43777465820312, -199.5393524169922, -195.64093017578125, -191.7425079345703, -187.84408569335938, -183.94566345214844, -180.0472412109375, -176.14881896972656, -172.25039672851562, -168.35195922851562, -164.4535369873047, -160.55511474609375, -156.6566925048828, -152.75827026367188, -148.85984802246094, -144.96142578125, -141.06298828125, -137.16456604003906, -133.26614379882812, -129.3677215576172, -125.46929931640625, -121.57086181640625, -117.67243957519531, -113.77400970458984, -109.8755874633789, -105.97716522216797, -102.0787353515625, -98.18031311035156, -94.28189086914062, -90.38346862792969, -86.48504638671875, -82.58661651611328, -78.68819427490234, -74.7897720336914, -70.89134216308594, -66.992919921875, -63.09449768066406, -59.196075439453125, -55.29764938354492, -51.399227142333984, -47.50080108642578, -43.602378845214844, -39.70395278930664, -35.80552673339844, -31.907102584838867, -28.008678436279297, -24.110254287719727, -20.211830139160156, -16.313404083251953, -12.414979934692383, -8.516555786132812, -4.618129730224609, -0.7197055816650391, 3.1787185668945312, 7.07714319229126, 10.975567817687988, 14.873992919921875, 18.772417068481445, 22.670841217041016, 26.56926727294922, 30.46769142150879, 34.36611557006836]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 11.0, 10.0, 8.0, 13.0, 10.0, 19.0, 14.0, 21.0, 27.0, 19.0, 35.0, 26.0, 27.0, 25.0, 29.0, 44.0, 32.0, 51.0, 33.0, 47.0, 44.0, 40.0, 43.0, 37.0, 30.0, 24.0, 30.0, 28.0, 32.0, 22.0, 20.0, 25.0, 19.0, 17.0, 7.0, 16.0, 11.0, 8.0, 6.0, 3.0, 4.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.388275146484375, -38.188262939453125, -36.98825454711914, -35.788246154785156, -34.588233947753906, -33.388221740722656, -32.18821334838867, -30.988203048706055, -29.788192749023438, -28.58818244934082, -27.388172149658203, -26.188161849975586, -24.98815155029297, -23.78814125061035, -22.588130950927734, -21.388120651245117, -20.1881103515625, -18.988100051879883, -17.788089752197266, -16.58807945251465, -15.388069152832031, -14.188058853149414, -12.988048553466797, -11.78803825378418, -10.588027954101562, -9.388017654418945, -8.188007354736328, -6.987997055053711, -5.787986755371094, -4.587976455688477, -3.3879661560058594, -2.187955856323242, -0.987945556640625, 0.2120647430419922, 1.4120750427246094, 2.6120853424072266, 3.8120956420898438, 5.012105941772461, 6.212116241455078, 7.412126541137695, 8.612136840820312, 9.81214714050293, 11.012157440185547, 12.212167739868164, 13.412178039550781, 14.612188339233398, 15.812198638916016, 17.012208938598633, 18.21221923828125, 19.412229537963867, 20.612239837646484, 21.8122501373291, 23.01226043701172, 24.212270736694336, 25.412281036376953, 26.61229133605957, 27.812301635742188, 29.012311935424805, 30.212322235107422, 31.41233253479004, 32.612342834472656, 33.812355041503906, 35.01236343383789, 36.212371826171875, 37.412384033203125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 2.0, 5.0, 5.0, 5.0, 2.0, 16.0, 13.0, 15.0, 11.0, 17.0, 14.0, 26.0, 18.0, 22.0, 30.0, 42.0, 29.0, 34.0, 42.0, 45.0, 29.0, 46.0, 44.0, 33.0, 29.0, 36.0, 45.0, 43.0, 38.0, 33.0, 25.0, 38.0, 16.0, 24.0, 28.0, 25.0, 13.0, 14.0, 15.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.6328125, -5.48291015625, -5.3330078125, -5.18310546875, -5.033203125, -4.88330078125, -4.7333984375, -4.58349609375, -4.43359375, -4.28369140625, -4.1337890625, -3.98388671875, -3.833984375, -3.68408203125, -3.5341796875, -3.38427734375, -3.234375, -3.08447265625, -2.9345703125, -2.78466796875, -2.634765625, -2.48486328125, -2.3349609375, -2.18505859375, -2.03515625, -1.88525390625, -1.7353515625, -1.58544921875, -1.435546875, -1.28564453125, -1.1357421875, -0.98583984375, -0.8359375, -0.68603515625, -0.5361328125, -0.38623046875, -0.236328125, -0.08642578125, 0.0634765625, 0.21337890625, 0.36328125, 0.51318359375, 0.6630859375, 0.81298828125, 0.962890625, 1.11279296875, 1.2626953125, 1.41259765625, 1.5625, 1.71240234375, 1.8623046875, 2.01220703125, 2.162109375, 2.31201171875, 2.4619140625, 2.61181640625, 2.76171875, 2.91162109375, 3.0615234375, 3.21142578125, 3.361328125, 3.51123046875, 3.6611328125, 3.81103515625, 3.9609375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 10.0, 12.0, 28.0, 24.0, 47.0, 57.0, 107.0, 141.0, 196.0, 293.0, 436.0, 683.0, 1000.0, 1515.0, 2305.0, 3493.0, 5394.0, 8324.0, 12557.0, 20064.0, 32083.0, 52884.0, 89892.0, 151824.0, 213085.0, 177215.0, 107596.0, 62951.0, 37951.0, 23756.0, 14852.0, 9469.0, 6188.0, 4168.0, 2695.0, 1758.0, 1157.0, 787.0, 527.0, 329.0, 224.0, 126.0, 116.0, 55.0, 68.0, 44.0, 23.0, 16.0, 12.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.39208984375, -0.38008880615234375, -0.3680877685546875, -0.35608673095703125, -0.344085693359375, -0.33208465576171875, -0.3200836181640625, -0.30808258056640625, -0.29608154296875, -0.28408050537109375, -0.2720794677734375, -0.26007843017578125, -0.248077392578125, -0.23607635498046875, -0.2240753173828125, -0.21207427978515625, -0.2000732421875, -0.18807220458984375, -0.1760711669921875, -0.16407012939453125, -0.152069091796875, -0.14006805419921875, -0.1280670166015625, -0.11606597900390625, -0.10406494140625, -0.09206390380859375, -0.0800628662109375, -0.06806182861328125, -0.056060791015625, -0.04405975341796875, -0.0320587158203125, -0.02005767822265625, -0.008056640625, 0.00394439697265625, 0.0159454345703125, 0.02794647216796875, 0.039947509765625, 0.05194854736328125, 0.0639495849609375, 0.07595062255859375, 0.08795166015625, 0.09995269775390625, 0.1119537353515625, 0.12395477294921875, 0.135955810546875, 0.14795684814453125, 0.1599578857421875, 0.17195892333984375, 0.1839599609375, 0.19596099853515625, 0.2079620361328125, 0.21996307373046875, 0.231964111328125, 0.24396514892578125, 0.2559661865234375, 0.26796722412109375, 0.27996826171875, 0.29196929931640625, 0.3039703369140625, 0.31597137451171875, 0.327972412109375, 0.33997344970703125, 0.3519744873046875, 0.36397552490234375, 0.3759765625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 4.0, 10.0, 8.0, 11.0, 17.0, 18.0, 12.0, 23.0, 22.0, 22.0, 28.0, 39.0, 27.0, 33.0, 45.0, 47.0, 46.0, 38.0, 1066.0, 39.0, 32.0, 38.0, 39.0, 35.0, 52.0, 44.0, 40.0, 30.0, 24.0, 17.0, 21.0, 19.0, 17.0, 10.0, 9.0, 10.0, 9.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.185546875, -3.0780029296875, -2.970458984375, -2.8629150390625, -2.75537109375, -2.6478271484375, -2.540283203125, -2.4327392578125, -2.3251953125, -2.2176513671875, -2.110107421875, -2.0025634765625, -1.89501953125, -1.7874755859375, -1.679931640625, -1.5723876953125, -1.46484375, -1.3572998046875, -1.249755859375, -1.1422119140625, -1.03466796875, -0.9271240234375, -0.819580078125, -0.7120361328125, -0.6044921875, -0.4969482421875, -0.389404296875, -0.2818603515625, -0.17431640625, -0.0667724609375, 0.040771484375, 0.1483154296875, 0.255859375, 0.3634033203125, 0.470947265625, 0.5784912109375, 0.68603515625, 0.7935791015625, 0.901123046875, 1.0086669921875, 1.1162109375, 1.2237548828125, 1.331298828125, 1.4388427734375, 1.54638671875, 1.6539306640625, 1.761474609375, 1.8690185546875, 1.9765625, 2.0841064453125, 2.191650390625, 2.2991943359375, 2.40673828125, 2.5142822265625, 2.621826171875, 2.7293701171875, 2.8369140625, 2.9444580078125, 3.052001953125, 3.1595458984375, 3.26708984375, 3.3746337890625, 3.482177734375, 3.5897216796875, 3.697265625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 9.0, 15.0, 25.0, 24.0, 42.0, 48.0, 72.0, 114.0, 197.0, 290.0, 504.0, 834.0, 1309.0, 2339.0, 4208.0, 6792.0, 12025.0, 20475.0, 35578.0, 62589.0, 108526.0, 174667.0, 1260523.0, 165827.0, 101825.0, 58395.0, 33718.0, 19203.0, 11130.0, 6571.0, 3794.0, 2183.0, 1312.0, 729.0, 463.0, 260.0, 168.0, 102.0, 72.0, 52.0, 43.0, 28.0, 19.0, 8.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.296142578125, -0.2870140075683594, -0.27788543701171875, -0.2687568664550781, -0.2596282958984375, -0.2504997253417969, -0.24137115478515625, -0.23224258422851562, -0.223114013671875, -0.21398544311523438, -0.20485687255859375, -0.19572830200195312, -0.1865997314453125, -0.17747116088867188, -0.16834259033203125, -0.15921401977539062, -0.15008544921875, -0.14095687866210938, -0.13182830810546875, -0.12269973754882812, -0.1135711669921875, -0.10444259643554688, -0.09531402587890625, -0.08618545532226562, -0.077056884765625, -0.06792831420898438, -0.05879974365234375, -0.049671173095703125, -0.0405426025390625, -0.031414031982421875, -0.02228546142578125, -0.013156890869140625, -0.0040283203125, 0.005100250244140625, 0.01422882080078125, 0.023357391357421875, 0.0324859619140625, 0.041614532470703125, 0.05074310302734375, 0.059871673583984375, 0.069000244140625, 0.07812881469726562, 0.08725738525390625, 0.09638595581054688, 0.1055145263671875, 0.11464309692382812, 0.12377166748046875, 0.13290023803710938, 0.14202880859375, 0.15115737915039062, 0.16028594970703125, 0.16941452026367188, 0.1785430908203125, 0.18767166137695312, 0.19680023193359375, 0.20592880249023438, 0.215057373046875, 0.22418594360351562, 0.23331451416015625, 0.24244308471679688, 0.2515716552734375, 0.2607002258300781, 0.26982879638671875, 0.2789573669433594, 0.2880859375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 3.0, 5.0, 14.0, 11.0, 11.0, 13.0, 12.0, 13.0, 20.0, 23.0, 23.0, 33.0, 45.0, 36.0, 35.0, 35.0, 42.0, 34.0, 47.0, 57.0, 49.0, 40.0, 59.0, 48.0, 32.0, 33.0, 22.0, 32.0, 22.0, 18.0, 31.0, 14.0, 9.0, 12.0, 8.0, 9.0, 10.0, 3.0, 5.0, 6.0, 9.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.0021381378173828125, -0.002071678638458252, -0.0020052194595336914, -0.0019387602806091309, -0.0018723011016845703, -0.0018058419227600098, -0.0017393827438354492, -0.0016729235649108887, -0.0016064643859863281, -0.0015400052070617676, -0.001473546028137207, -0.0014070868492126465, -0.001340627670288086, -0.0012741684913635254, -0.0012077093124389648, -0.0011412501335144043, -0.0010747909545898438, -0.0010083317756652832, -0.0009418725967407227, -0.0008754134178161621, -0.0008089542388916016, -0.000742495059967041, -0.0006760358810424805, -0.0006095767021179199, -0.0005431175231933594, -0.00047665834426879883, -0.0004101991653442383, -0.00034373998641967773, -0.0002772808074951172, -0.00021082162857055664, -0.0001443624496459961, -7.790327072143555e-05, -1.1444091796875e-05, 5.501508712768555e-05, 0.0001214742660522461, 0.00018793344497680664, 0.0002543926239013672, 0.00032085180282592773, 0.0003873109817504883, 0.00045377016067504883, 0.0005202293395996094, 0.0005866885185241699, 0.0006531476974487305, 0.000719606876373291, 0.0007860660552978516, 0.0008525252342224121, 0.0009189844131469727, 0.0009854435920715332, 0.0010519027709960938, 0.0011183619499206543, 0.0011848211288452148, 0.0012512803077697754, 0.001317739486694336, 0.0013841986656188965, 0.001450657844543457, 0.0015171170234680176, 0.0015835762023925781, 0.0016500353813171387, 0.0017164945602416992, 0.0017829537391662598, 0.0018494129180908203, 0.0019158720970153809, 0.0019823312759399414, 0.002048790454864502, 0.0021152496337890625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 7.0, 10.0, 11.0, 8.0, 14.0, 9.0, 18.0, 22.0, 38.0, 23.0, 49.0, 53.0, 98.0, 87.0, 130.0, 171.0, 269.0, 437.0, 775.0, 5942.0, 955711.0, 81388.0, 1554.0, 556.0, 325.0, 202.0, 152.0, 109.0, 81.0, 62.0, 43.0, 40.0, 24.0, 25.0, 15.0, 19.0, 10.0, 10.0, 8.0, 10.0, 7.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.044464111328125, -0.043064117431640625, -0.04166412353515625, -0.040264129638671875, -0.0388641357421875, -0.037464141845703125, -0.03606414794921875, -0.034664154052734375, -0.03326416015625, -0.031864166259765625, -0.03046417236328125, -0.029064178466796875, -0.0276641845703125, -0.026264190673828125, -0.02486419677734375, -0.023464202880859375, -0.022064208984375, -0.020664215087890625, -0.01926422119140625, -0.017864227294921875, -0.0164642333984375, -0.015064239501953125, -0.01366424560546875, -0.012264251708984375, -0.0108642578125, -0.009464263916015625, -0.00806427001953125, -0.006664276123046875, -0.0052642822265625, -0.003864288330078125, -0.00246429443359375, -0.001064300537109375, 0.000335693359375, 0.001735687255859375, 0.00313568115234375, 0.004535675048828125, 0.0059356689453125, 0.007335662841796875, 0.00873565673828125, 0.010135650634765625, 0.01153564453125, 0.012935638427734375, 0.01433563232421875, 0.015735626220703125, 0.0171356201171875, 0.018535614013671875, 0.01993560791015625, 0.021335601806640625, 0.022735595703125, 0.024135589599609375, 0.02553558349609375, 0.026935577392578125, 0.0283355712890625, 0.029735565185546875, 0.03113555908203125, 0.032535552978515625, 0.033935546875, 0.035335540771484375, 0.03673553466796875, 0.038135528564453125, 0.0395355224609375, 0.040935516357421875, 0.04233551025390625, 0.043735504150390625, 0.045135498046875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 41.0, 935.0, 37.0, 1.0, 2.0], "bins": [-0.06643931567668915, -0.065340057015419, -0.06424079835414886, -0.06314153224229813, -0.062042273581027985, -0.06094301491975784, -0.0598437525331974, -0.05874449387192726, -0.05764523148536682, -0.05654597282409668, -0.05544671043753624, -0.0543474517762661, -0.05324818938970566, -0.052148930728435516, -0.051049668341875076, -0.049950409680604935, -0.048851147294044495, -0.04775188863277435, -0.04665262624621391, -0.04555336758494377, -0.04445410519838333, -0.04335484653711319, -0.04225558415055275, -0.04115632548928261, -0.040057066828012466, -0.038957808166742325, -0.037858545780181885, -0.03675928711891174, -0.0356600247323513, -0.03456076607108116, -0.03346150368452072, -0.03236224502325058, -0.03126298636198044, -0.030163725838065147, -0.029064465314149857, -0.027965204790234566, -0.026865944266319275, -0.025766683742403984, -0.024667423218488693, -0.02356816455721855, -0.02246890217065811, -0.02136964164674282, -0.02027038112282753, -0.01917112059891224, -0.018071860074996948, -0.016972599551081657, -0.015873339027166367, -0.01477407943457365, -0.013674817979335785, -0.012575557455420494, -0.011476296931505203, -0.010377036407589912, -0.009277775883674622, -0.00817851535975933, -0.0070792557671666145, -0.005979995243251324, -0.004880734719336033, -0.003781474195420742, -0.002682213904336095, -0.0015829536132514477, -0.00048369308933615685, 0.000615567434579134, 0.0017148274928331375, 0.0028140880167484283, 0.003913348540663719]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 10.0, 6.0, 12.0, 10.0, 8.0, 16.0, 19.0, 20.0, 27.0, 24.0, 28.0, 41.0, 37.0, 59.0, 42.0, 49.0, 59.0, 47.0, 39.0, 49.0, 39.0, 42.0, 43.0, 36.0, 45.0, 32.0, 28.0, 23.0, 28.0, 22.0, 9.0, 12.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022081732749938965, -0.0021206168457865715, -0.0020330604165792465, -0.0019455039873719215, -0.0018579475581645966, -0.0017703911289572716, -0.0016828346997499466, -0.0015952782705426216, -0.0015077218413352966, -0.0014201654121279716, -0.0013326089829206467, -0.0012450525537133217, -0.0011574961245059967, -0.0010699396952986717, -0.0009823832660913467, -0.0008948268368840218, -0.0008072704076766968, -0.0007197139784693718, -0.0006321575492620468, -0.0005446011200547218, -0.00045704469084739685, -0.00036948826164007187, -0.0002819318324327469, -0.0001943754032254219, -0.00010681897401809692, -1.9262544810771942e-05, 6.829388439655304e-05, 0.00015585031360387802, 0.000243406742811203, 0.000330963172018528, 0.00041851960122585297, 0.000506076030433178, 0.0005936324596405029, 0.0006811888888478279, 0.0007687453180551529, 0.0008563017472624779, 0.0009438581764698029, 0.0010314146056771278, 0.0011189710348844528, 0.0012065274640917778, 0.0012940838932991028, 0.0013816403225064278, 0.0014691967517137527, 0.0015567531809210777, 0.0016443096101284027, 0.0017318660393357277, 0.0018194224685430527, 0.0019069788977503777, 0.0019945353269577026, 0.0020820917561650276, 0.0021696481853723526, 0.0022572046145796776, 0.0023447610437870026, 0.0024323174729943275, 0.0025198739022016525, 0.0026074303314089775, 0.0026949867606163025, 0.0027825431898236275, 0.0028700996190309525, 0.0029576560482382774, 0.0030452124774456024, 0.0031327689066529274, 0.0032203253358602524, 0.0033078817650675774, 0.0033954381942749023]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 2.0, 5.0, 5.0, 5.0, 1.0, 17.0, 13.0, 15.0, 11.0, 17.0, 14.0, 26.0, 18.0, 22.0, 30.0, 42.0, 29.0, 34.0, 42.0, 44.0, 30.0, 46.0, 44.0, 33.0, 29.0, 36.0, 45.0, 43.0, 38.0, 33.0, 25.0, 38.0, 16.0, 24.0, 28.0, 25.0, 13.0, 14.0, 15.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.6328125, -5.48291015625, -5.3330078125, -5.18310546875, -5.033203125, -4.88330078125, -4.7333984375, -4.58349609375, -4.43359375, -4.28369140625, -4.1337890625, -3.98388671875, -3.833984375, -3.68408203125, -3.5341796875, -3.38427734375, -3.234375, -3.08447265625, -2.9345703125, -2.78466796875, -2.634765625, -2.48486328125, -2.3349609375, -2.18505859375, -2.03515625, -1.88525390625, -1.7353515625, -1.58544921875, -1.435546875, -1.28564453125, -1.1357421875, -0.98583984375, -0.8359375, -0.68603515625, -0.5361328125, -0.38623046875, -0.236328125, -0.08642578125, 0.0634765625, 0.21337890625, 0.36328125, 0.51318359375, 0.6630859375, 0.81298828125, 0.962890625, 1.11279296875, 1.2626953125, 1.41259765625, 1.5625, 1.71240234375, 1.8623046875, 2.01220703125, 2.162109375, 2.31201171875, 2.4619140625, 2.61181640625, 2.76171875, 2.91162109375, 3.0615234375, 3.21142578125, 3.361328125, 3.51123046875, 3.6611328125, 3.81103515625, 3.9609375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 9.0, 5.0, 5.0, 15.0, 14.0, 21.0, 31.0, 44.0, 48.0, 63.0, 81.0, 135.0, 185.0, 253.0, 441.0, 794.0, 1486.0, 3458.0, 8744.0, 27801.0, 122737.0, 514268.0, 286490.0, 55861.0, 15144.0, 5372.0, 2178.0, 1118.0, 622.0, 360.0, 239.0, 162.0, 104.0, 66.0, 53.0, 44.0, 37.0, 24.0, 16.0, 12.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.2265625, -9.94830322265625, -9.6700439453125, -9.39178466796875, -9.113525390625, -8.83526611328125, -8.5570068359375, -8.27874755859375, -8.00048828125, -7.72222900390625, -7.4439697265625, -7.16571044921875, -6.887451171875, -6.60919189453125, -6.3309326171875, -6.05267333984375, -5.7744140625, -5.49615478515625, -5.2178955078125, -4.93963623046875, -4.661376953125, -4.38311767578125, -4.1048583984375, -3.82659912109375, -3.54833984375, -3.27008056640625, -2.9918212890625, -2.71356201171875, -2.435302734375, -2.15704345703125, -1.8787841796875, -1.60052490234375, -1.322265625, -1.04400634765625, -0.7657470703125, -0.48748779296875, -0.209228515625, 0.06903076171875, 0.3472900390625, 0.62554931640625, 0.90380859375, 1.18206787109375, 1.4603271484375, 1.73858642578125, 2.016845703125, 2.29510498046875, 2.5733642578125, 2.85162353515625, 3.1298828125, 3.40814208984375, 3.6864013671875, 3.96466064453125, 4.242919921875, 4.52117919921875, 4.7994384765625, 5.07769775390625, 5.35595703125, 5.63421630859375, 5.9124755859375, 6.19073486328125, 6.468994140625, 6.74725341796875, 7.0255126953125, 7.30377197265625, 7.58203125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 6.0, 7.0, 10.0, 18.0, 22.0, 22.0, 31.0, 33.0, 37.0, 34.0, 44.0, 50.0, 81.0, 121.0, 237.0, 1463.0, 269.0, 100.0, 84.0, 53.0, 53.0, 45.0, 39.0, 35.0, 25.0, 14.0, 20.0, 18.0, 8.0, 7.0, 8.0, 11.0, 7.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.671875, -11.262451171875, -10.85302734375, -10.443603515625, -10.0341796875, -9.624755859375, -9.21533203125, -8.805908203125, -8.396484375, -7.987060546875, -7.57763671875, -7.168212890625, -6.7587890625, -6.349365234375, -5.93994140625, -5.530517578125, -5.12109375, -4.711669921875, -4.30224609375, -3.892822265625, -3.4833984375, -3.073974609375, -2.66455078125, -2.255126953125, -1.845703125, -1.436279296875, -1.02685546875, -0.617431640625, -0.2080078125, 0.201416015625, 0.61083984375, 1.020263671875, 1.4296875, 1.839111328125, 2.24853515625, 2.657958984375, 3.0673828125, 3.476806640625, 3.88623046875, 4.295654296875, 4.705078125, 5.114501953125, 5.52392578125, 5.933349609375, 6.3427734375, 6.752197265625, 7.16162109375, 7.571044921875, 7.98046875, 8.389892578125, 8.79931640625, 9.208740234375, 9.6181640625, 10.027587890625, 10.43701171875, 10.846435546875, 11.255859375, 11.665283203125, 12.07470703125, 12.484130859375, 12.8935546875, 13.302978515625, 13.71240234375, 14.121826171875, 14.53125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 7.0, 9.0, 13.0, 17.0, 27.0, 32.0, 46.0, 62.0, 116.0, 175.0, 278.0, 587.0, 1822.0, 59561.0, 3069805.0, 10937.0, 1026.0, 473.0, 231.0, 147.0, 88.0, 60.0, 43.0, 28.0, 16.0, 19.0, 16.0, 12.0, 7.0, 2.0, 10.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-44.53125, -43.427001953125, -42.32275390625, -41.218505859375, -40.1142578125, -39.010009765625, -37.90576171875, -36.801513671875, -35.697265625, -34.593017578125, -33.48876953125, -32.384521484375, -31.2802734375, -30.176025390625, -29.07177734375, -27.967529296875, -26.86328125, -25.759033203125, -24.65478515625, -23.550537109375, -22.4462890625, -21.342041015625, -20.23779296875, -19.133544921875, -18.029296875, -16.925048828125, -15.82080078125, -14.716552734375, -13.6123046875, -12.508056640625, -11.40380859375, -10.299560546875, -9.1953125, -8.091064453125, -6.98681640625, -5.882568359375, -4.7783203125, -3.674072265625, -2.56982421875, -1.465576171875, -0.361328125, 0.742919921875, 1.84716796875, 2.951416015625, 4.0556640625, 5.159912109375, 6.26416015625, 7.368408203125, 8.47265625, 9.576904296875, 10.68115234375, 11.785400390625, 12.8896484375, 13.993896484375, 15.09814453125, 16.202392578125, 17.306640625, 18.410888671875, 19.51513671875, 20.619384765625, 21.7236328125, 22.827880859375, 23.93212890625, 25.036376953125, 26.140625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 61.0, 571.0, 371.0, 10.0, 0.0, 0.0, 0.0, 1.0], "bins": [-297.1816101074219, -292.0477294921875, -286.9138488769531, -281.77996826171875, -276.6460876464844, -271.51220703125, -266.37835693359375, -261.24444580078125, -256.110595703125, -250.97671508789062, -245.84283447265625, -240.70895385742188, -235.57508850097656, -230.4412078857422, -225.3073272705078, -220.17344665527344, -215.03955078125, -209.90567016601562, -204.77178955078125, -199.63790893554688, -194.50404357910156, -189.3701629638672, -184.2362823486328, -179.10240173339844, -173.96853637695312, -168.83465576171875, -163.70077514648438, -158.56689453125, -153.4330291748047, -148.2991485595703, -143.16526794433594, -138.03138732910156, -132.8975067138672, -127.76362609863281, -122.62975311279297, -117.4958724975586, -112.36199188232422, -107.22811889648438, -102.09423828125, -96.96035766601562, -91.82647705078125, -86.69259643554688, -81.55872344970703, -76.42484283447266, -71.29096221923828, -66.15708923339844, -61.02320861816406, -55.88932800292969, -50.755455017089844, -45.621578216552734, -40.48769760131836, -35.35382080078125, -30.219942092895508, -25.086063385009766, -19.952186584472656, -14.818305969238281, -9.684427261352539, -4.550549030303955, 0.5833292007446289, 5.717206954956055, 10.851085662841797, 15.984964370727539, 21.11884117126465, 26.252721786499023, 31.386598587036133]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 8.0, 10.0, 7.0, 13.0, 8.0, 16.0, 15.0, 24.0, 15.0, 32.0, 38.0, 23.0, 31.0, 40.0, 30.0, 33.0, 42.0, 32.0, 45.0, 40.0, 36.0, 55.0, 51.0, 34.0, 35.0, 37.0, 35.0, 23.0, 23.0, 30.0, 18.0, 21.0, 18.0, 10.0, 14.0, 13.0, 9.0, 10.0, 9.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.40723419189453, -32.471710205078125, -31.536182403564453, -30.600658416748047, -29.665132522583008, -28.72960662841797, -27.79408073425293, -26.85855484008789, -25.923030853271484, -24.987504959106445, -24.051979064941406, -23.116455078125, -22.18092918395996, -21.245403289794922, -20.309877395629883, -19.374351501464844, -18.438825607299805, -17.503299713134766, -16.567773818969727, -15.632248878479004, -14.696723937988281, -13.761198043823242, -12.825672149658203, -11.890146255493164, -10.954621315002441, -10.019095420837402, -9.08357048034668, -8.14804458618164, -7.21251916885376, -6.276993751525879, -5.34146785736084, -4.405942440032959, -3.470417022705078, -2.5348916053771973, -1.5993659496307373, -0.6638402938842773, 0.2716851234436035, 1.2072105407714844, 2.1427364349365234, 3.0782618522644043, 4.013787269592285, 4.949312686920166, 5.884838104248047, 6.820363998413086, 7.755889415740967, 8.691414833068848, 9.626940727233887, 10.56246566772461, 11.497991561889648, 12.433517456054688, 13.36904239654541, 14.30456829071045, 15.240093231201172, 16.17561912536621, 17.11114501953125, 18.04667091369629, 18.982196807861328, 19.917722702026367, 20.853248596191406, 21.788772583007812, 22.72429847717285, 23.65982437133789, 24.59535026550293, 25.53087615966797, 26.466400146484375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 4.0, 8.0, 5.0, 8.0, 10.0, 12.0, 12.0, 11.0, 15.0, 18.0, 19.0, 28.0, 24.0, 25.0, 29.0, 32.0, 41.0, 44.0, 28.0, 32.0, 33.0, 44.0, 43.0, 45.0, 33.0, 32.0, 41.0, 36.0, 30.0, 34.0, 29.0, 28.0, 33.0, 25.0, 15.0, 17.0, 12.0, 18.0, 12.0, 12.0, 11.0, 6.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-5.7578125, -5.59893798828125, -5.4400634765625, -5.28118896484375, -5.122314453125, -4.96343994140625, -4.8045654296875, -4.64569091796875, -4.48681640625, -4.32794189453125, -4.1690673828125, -4.01019287109375, -3.851318359375, -3.69244384765625, -3.5335693359375, -3.37469482421875, -3.2158203125, -3.05694580078125, -2.8980712890625, -2.73919677734375, -2.580322265625, -2.42144775390625, -2.2625732421875, -2.10369873046875, -1.94482421875, -1.78594970703125, -1.6270751953125, -1.46820068359375, -1.309326171875, -1.15045166015625, -0.9915771484375, -0.83270263671875, -0.673828125, -0.51495361328125, -0.3560791015625, -0.19720458984375, -0.038330078125, 0.12054443359375, 0.2794189453125, 0.43829345703125, 0.59716796875, 0.75604248046875, 0.9149169921875, 1.07379150390625, 1.232666015625, 1.39154052734375, 1.5504150390625, 1.70928955078125, 1.8681640625, 2.02703857421875, 2.1859130859375, 2.34478759765625, 2.503662109375, 2.66253662109375, 2.8214111328125, 2.98028564453125, 3.13916015625, 3.29803466796875, 3.4569091796875, 3.61578369140625, 3.774658203125, 3.93353271484375, 4.0924072265625, 4.25128173828125, 4.41015625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 5.0, 14.0, 17.0, 25.0, 35.0, 28.0, 35.0, 44.0, 52.0, 97.0, 131.0, 134.0, 208.0, 353.0, 430.0, 667.0, 1270.0, 3719.0, 19955.0, 230932.0, 3306096.0, 585417.0, 35153.0, 5457.0, 1585.0, 720.0, 468.0, 310.0, 239.0, 168.0, 130.0, 83.0, 77.0, 59.0, 50.0, 29.0, 28.0, 17.0, 10.0, 6.0, 5.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.8125, -28.95166015625, -28.0908203125, -27.22998046875, -26.369140625, -25.50830078125, -24.6474609375, -23.78662109375, -22.92578125, -22.06494140625, -21.2041015625, -20.34326171875, -19.482421875, -18.62158203125, -17.7607421875, -16.89990234375, -16.0390625, -15.17822265625, -14.3173828125, -13.45654296875, -12.595703125, -11.73486328125, -10.8740234375, -10.01318359375, -9.15234375, -8.29150390625, -7.4306640625, -6.56982421875, -5.708984375, -4.84814453125, -3.9873046875, -3.12646484375, -2.265625, -1.40478515625, -0.5439453125, 0.31689453125, 1.177734375, 2.03857421875, 2.8994140625, 3.76025390625, 4.62109375, 5.48193359375, 6.3427734375, 7.20361328125, 8.064453125, 8.92529296875, 9.7861328125, 10.64697265625, 11.5078125, 12.36865234375, 13.2294921875, 14.09033203125, 14.951171875, 15.81201171875, 16.6728515625, 17.53369140625, 18.39453125, 19.25537109375, 20.1162109375, 20.97705078125, 21.837890625, 22.69873046875, 23.5595703125, 24.42041015625, 25.28125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 6.0, 8.0, 7.0, 5.0, 20.0, 22.0, 27.0, 42.0, 43.0, 75.0, 77.0, 111.0, 142.0, 179.0, 254.0, 281.0, 366.0, 433.0, 409.0, 329.0, 265.0, 216.0, 193.0, 139.0, 101.0, 77.0, 56.0, 47.0, 41.0, 32.0, 21.0, 21.0, 8.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.2947998046875, -8.972412109375, -8.6500244140625, -8.32763671875, -8.0052490234375, -7.682861328125, -7.3604736328125, -7.0380859375, -6.7156982421875, -6.393310546875, -6.0709228515625, -5.74853515625, -5.4261474609375, -5.103759765625, -4.7813720703125, -4.458984375, -4.1365966796875, -3.814208984375, -3.4918212890625, -3.16943359375, -2.8470458984375, -2.524658203125, -2.2022705078125, -1.8798828125, -1.5574951171875, -1.235107421875, -0.9127197265625, -0.59033203125, -0.2679443359375, 0.054443359375, 0.3768310546875, 0.69921875, 1.0216064453125, 1.343994140625, 1.6663818359375, 1.98876953125, 2.3111572265625, 2.633544921875, 2.9559326171875, 3.2783203125, 3.6007080078125, 3.923095703125, 4.2454833984375, 4.56787109375, 4.8902587890625, 5.212646484375, 5.5350341796875, 5.857421875, 6.1798095703125, 6.502197265625, 6.8245849609375, 7.14697265625, 7.4693603515625, 7.791748046875, 8.1141357421875, 8.4365234375, 8.7589111328125, 9.081298828125, 9.4036865234375, 9.72607421875, 10.0484619140625, 10.370849609375, 10.6932373046875, 11.015625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 7.0, 3.0, 14.0, 18.0, 24.0, 38.0, 70.0, 114.0, 195.0, 324.0, 610.0, 1311.0, 3016.0, 7994.0, 24293.0, 88227.0, 392800.0, 2019231.0, 1322971.0, 245744.0, 59595.0, 17199.0, 5964.0, 2340.0, 1033.0, 484.0, 253.0, 155.0, 99.0, 60.0, 39.0, 24.0, 9.0, 9.0, 5.0, 6.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.9921875, -10.6470947265625, -10.302001953125, -9.9569091796875, -9.61181640625, -9.2667236328125, -8.921630859375, -8.5765380859375, -8.2314453125, -7.8863525390625, -7.541259765625, -7.1961669921875, -6.85107421875, -6.5059814453125, -6.160888671875, -5.8157958984375, -5.470703125, -5.1256103515625, -4.780517578125, -4.4354248046875, -4.09033203125, -3.7452392578125, -3.400146484375, -3.0550537109375, -2.7099609375, -2.3648681640625, -2.019775390625, -1.6746826171875, -1.32958984375, -0.9844970703125, -0.639404296875, -0.2943115234375, 0.05078125, 0.3958740234375, 0.740966796875, 1.0860595703125, 1.43115234375, 1.7762451171875, 2.121337890625, 2.4664306640625, 2.8115234375, 3.1566162109375, 3.501708984375, 3.8468017578125, 4.19189453125, 4.5369873046875, 4.882080078125, 5.2271728515625, 5.572265625, 5.9173583984375, 6.262451171875, 6.6075439453125, 6.95263671875, 7.2977294921875, 7.642822265625, 7.9879150390625, 8.3330078125, 8.6781005859375, 9.023193359375, 9.3682861328125, 9.71337890625, 10.0584716796875, 10.403564453125, 10.7486572265625, 11.09375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 4.0, 9.0, 14.0, 23.0, 20.0, 29.0, 30.0, 45.0, 48.0, 43.0, 56.0, 66.0, 74.0, 61.0, 59.0, 54.0, 56.0, 54.0, 45.0, 35.0, 36.0, 30.0, 25.0, 16.0, 16.0, 4.0, 7.0, 7.0, 9.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.973384857177734, -60.0745735168457, -58.175758361816406, -56.276947021484375, -54.37813186645508, -52.47932052612305, -50.58050537109375, -48.68169403076172, -46.78288269042969, -44.884071350097656, -42.98525619506836, -41.08644485473633, -39.18762969970703, -37.288818359375, -35.39000701904297, -33.49119186401367, -31.592378616333008, -29.693565368652344, -27.79475212097168, -25.895938873291016, -23.997127532958984, -22.09831428527832, -20.199501037597656, -18.300689697265625, -16.401874542236328, -14.503061294555664, -12.604249000549316, -10.705435752868652, -8.806623458862305, -6.907810211181641, -5.008996963500977, -3.110184669494629, -1.2113723754882812, 0.6874405145645142, 2.5862534046173096, 4.4850664138793945, 6.3838791847229, 8.282691955566406, 10.18150520324707, 12.080317497253418, 13.979130744934082, 15.877943992614746, 17.776756286621094, 19.675569534301758, 21.574382781982422, 23.473194122314453, 25.37200927734375, 27.27082061767578, 29.169633865356445, 31.06844711303711, 32.96725845336914, 34.86607360839844, 36.76488494873047, 38.6636962890625, 40.5625114440918, 42.46132278442383, 44.360137939453125, 46.258949279785156, 48.15776443481445, 50.056575775146484, 51.95539093017578, 53.85420227050781, 55.753013610839844, 57.65182876586914, 59.55064010620117]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 4.0, 16.0, 6.0, 7.0, 11.0, 18.0, 19.0, 11.0, 24.0, 27.0, 27.0, 34.0, 39.0, 26.0, 32.0, 26.0, 45.0, 34.0, 34.0, 43.0, 43.0, 39.0, 35.0, 27.0, 25.0, 33.0, 38.0, 24.0, 30.0, 27.0, 35.0, 14.0, 20.0, 15.0, 17.0, 12.0, 12.0, 10.0, 11.0, 5.0, 3.0, 2.0, 5.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-42.24371337890625, -40.918155670166016, -39.59259796142578, -38.26704406738281, -36.94148635864258, -35.615928649902344, -34.29037094116211, -32.964813232421875, -31.639257431030273, -30.31369972229004, -28.988143920898438, -27.662586212158203, -26.33702850341797, -25.011472702026367, -23.685914993286133, -22.36035919189453, -21.034801483154297, -19.709243774414062, -18.38368797302246, -17.058130264282227, -15.732573509216309, -14.40701675415039, -13.081459045410156, -11.755902290344238, -10.43034553527832, -9.104788780212402, -7.779231548309326, -6.45367431640625, -5.128117561340332, -3.802560806274414, -2.477003574371338, -1.1514463424682617, 0.17411041259765625, 1.4996674060821533, 2.8252243995666504, 4.150781631469727, 5.4763383865356445, 6.8018951416015625, 8.127452850341797, 9.453009605407715, 10.778566360473633, 12.10412311553955, 13.429679870605469, 14.755237579345703, 16.080795288085938, 17.40635108947754, 18.731908798217773, 20.057464599609375, 21.38302230834961, 22.708580017089844, 24.034135818481445, 25.35969352722168, 26.68524932861328, 28.010807037353516, 29.33636474609375, 30.661922454833984, 31.987478256225586, 33.31303405761719, 34.63859176635742, 35.964149475097656, 37.28970718383789, 38.615264892578125, 39.940818786621094, 41.26637649536133, 42.59193420410156]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 9.0, 7.0, 12.0, 13.0, 20.0, 15.0, 24.0, 24.0, 26.0, 35.0, 36.0, 32.0, 39.0, 47.0, 52.0, 47.0, 41.0, 45.0, 33.0, 44.0, 44.0, 29.0, 31.0, 40.0, 37.0, 31.0, 18.0, 23.0, 30.0, 18.0, 12.0, 10.0, 10.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -84.7158203125, -81.994140625, -79.2724609375, -76.55078125, -73.8291015625, -71.107421875, -68.3857421875, -65.6640625, -62.9423828125, -60.220703125, -57.4990234375, -54.77734375, -52.0556640625, -49.333984375, -46.6123046875, -43.890625, -41.1689453125, -38.447265625, -35.7255859375, -33.00390625, -30.2822265625, -27.560546875, -24.8388671875, -22.1171875, -19.3955078125, -16.673828125, -13.9521484375, -11.23046875, -8.5087890625, -5.787109375, -3.0654296875, -0.34375, 2.3779296875, 5.099609375, 7.8212890625, 10.54296875, 13.2646484375, 15.986328125, 18.7080078125, 21.4296875, 24.1513671875, 26.873046875, 29.5947265625, 32.31640625, 35.0380859375, 37.759765625, 40.4814453125, 43.203125, 45.9248046875, 48.646484375, 51.3681640625, 54.08984375, 56.8115234375, 59.533203125, 62.2548828125, 64.9765625, 67.6982421875, 70.419921875, 73.1416015625, 75.86328125, 78.5849609375, 81.306640625, 84.0283203125, 86.75]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 13.0, 20.0, 19.0, 37.0, 51.0, 82.0, 104.0, 180.0, 290.0, 446.0, 672.0, 1028.0, 1681.0, 2603.0, 4014.0, 6552.0, 10801.0, 17779.0, 29940.0, 50455.0, 85083.0, 139788.0, 196485.0, 186590.0, 125568.0, 75317.0, 44665.0, 26493.0, 16038.0, 9565.0, 6067.0, 3610.0, 2332.0, 1478.0, 949.0, 560.0, 417.0, 253.0, 186.0, 123.0, 69.0, 49.0, 31.0, 22.0, 20.0, 12.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-5.07421875, -4.919921875, -4.765625, -4.611328125, -4.45703125, -4.302734375, -4.1484375, -3.994140625, -3.83984375, -3.685546875, -3.53125, -3.376953125, -3.22265625, -3.068359375, -2.9140625, -2.759765625, -2.60546875, -2.451171875, -2.296875, -2.142578125, -1.98828125, -1.833984375, -1.6796875, -1.525390625, -1.37109375, -1.216796875, -1.0625, -0.908203125, -0.75390625, -0.599609375, -0.4453125, -0.291015625, -0.13671875, 0.017578125, 0.171875, 0.326171875, 0.48046875, 0.634765625, 0.7890625, 0.943359375, 1.09765625, 1.251953125, 1.40625, 1.560546875, 1.71484375, 1.869140625, 2.0234375, 2.177734375, 2.33203125, 2.486328125, 2.640625, 2.794921875, 2.94921875, 3.103515625, 3.2578125, 3.412109375, 3.56640625, 3.720703125, 3.875, 4.029296875, 4.18359375, 4.337890625, 4.4921875, 4.646484375, 4.80078125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 12.0, 6.0, 5.0, 11.0, 6.0, 9.0, 6.0, 10.0, 14.0, 21.0, 16.0, 28.0, 18.0, 34.0, 35.0, 30.0, 37.0, 40.0, 49.0, 48.0, 46.0, 1080.0, 47.0, 37.0, 27.0, 39.0, 27.0, 30.0, 29.0, 27.0, 15.0, 27.0, 32.0, 17.0, 26.0, 18.0, 12.0, 10.0, 10.0, 6.0, 3.0, 8.0, 5.0, 0.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.53125, -51.92041015625, -50.3095703125, -48.69873046875, -47.087890625, -45.47705078125, -43.8662109375, -42.25537109375, -40.64453125, -39.03369140625, -37.4228515625, -35.81201171875, -34.201171875, -32.59033203125, -30.9794921875, -29.36865234375, -27.7578125, -26.14697265625, -24.5361328125, -22.92529296875, -21.314453125, -19.70361328125, -18.0927734375, -16.48193359375, -14.87109375, -13.26025390625, -11.6494140625, -10.03857421875, -8.427734375, -6.81689453125, -5.2060546875, -3.59521484375, -1.984375, -0.37353515625, 1.2373046875, 2.84814453125, 4.458984375, 6.06982421875, 7.6806640625, 9.29150390625, 10.90234375, 12.51318359375, 14.1240234375, 15.73486328125, 17.345703125, 18.95654296875, 20.5673828125, 22.17822265625, 23.7890625, 25.39990234375, 27.0107421875, 28.62158203125, 30.232421875, 31.84326171875, 33.4541015625, 35.06494140625, 36.67578125, 38.28662109375, 39.8974609375, 41.50830078125, 43.119140625, 44.72998046875, 46.3408203125, 47.95166015625, 49.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 11.0, 11.0, 23.0, 15.0, 33.0, 50.0, 79.0, 119.0, 154.0, 252.0, 401.0, 601.0, 960.0, 1622.0, 2346.0, 4034.0, 6228.0, 10383.0, 16844.0, 27330.0, 44796.0, 74102.0, 118233.0, 167046.0, 1231138.0, 144267.0, 94897.0, 58331.0, 35741.0, 21805.0, 13275.0, 8259.0, 5156.0, 3177.0, 1962.0, 1240.0, 839.0, 476.0, 336.0, 183.0, 142.0, 92.0, 52.0, 31.0, 23.0, 13.0, 10.0, 9.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.322265625, -3.212493896484375, -3.10272216796875, -2.992950439453125, -2.8831787109375, -2.773406982421875, -2.66363525390625, -2.553863525390625, -2.444091796875, -2.334320068359375, -2.22454833984375, -2.114776611328125, -2.0050048828125, -1.895233154296875, -1.78546142578125, -1.675689697265625, -1.56591796875, -1.456146240234375, -1.34637451171875, -1.236602783203125, -1.1268310546875, -1.017059326171875, -0.90728759765625, -0.797515869140625, -0.687744140625, -0.577972412109375, -0.46820068359375, -0.358428955078125, -0.2486572265625, -0.138885498046875, -0.02911376953125, 0.080657958984375, 0.1904296875, 0.300201416015625, 0.40997314453125, 0.519744873046875, 0.6295166015625, 0.739288330078125, 0.84906005859375, 0.958831787109375, 1.068603515625, 1.178375244140625, 1.28814697265625, 1.397918701171875, 1.5076904296875, 1.617462158203125, 1.72723388671875, 1.837005615234375, 1.94677734375, 2.056549072265625, 2.16632080078125, 2.276092529296875, 2.3858642578125, 2.495635986328125, 2.60540771484375, 2.715179443359375, 2.824951171875, 2.934722900390625, 3.04449462890625, 3.154266357421875, 3.2640380859375, 3.373809814453125, 3.48358154296875, 3.593353271484375, 3.703125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 3.0, 3.0, 9.0, 4.0, 5.0, 10.0, 16.0, 16.0, 20.0, 20.0, 21.0, 21.0, 29.0, 44.0, 49.0, 53.0, 63.0, 81.0, 82.0, 83.0, 48.0, 53.0, 36.0, 45.0, 25.0, 22.0, 16.0, 21.0, 20.0, 15.0, 9.0, 13.0, 8.0, 7.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0350341796875, -0.03394746780395508, -0.032860755920410156, -0.031774044036865234, -0.030687332153320312, -0.02960062026977539, -0.02851390838623047, -0.027427196502685547, -0.026340484619140625, -0.025253772735595703, -0.02416706085205078, -0.02308034896850586, -0.021993637084960938, -0.020906925201416016, -0.019820213317871094, -0.018733501434326172, -0.01764678955078125, -0.016560077667236328, -0.015473365783691406, -0.014386653900146484, -0.013299942016601562, -0.01221323013305664, -0.011126518249511719, -0.010039806365966797, -0.008953094482421875, -0.007866382598876953, -0.006779670715332031, -0.005692958831787109, -0.0046062469482421875, -0.0035195350646972656, -0.0024328231811523438, -0.0013461112976074219, -0.0002593994140625, 0.0008273124694824219, 0.0019140243530273438, 0.0030007362365722656, 0.0040874481201171875, 0.005174160003662109, 0.006260871887207031, 0.007347583770751953, 0.008434295654296875, 0.009521007537841797, 0.010607719421386719, 0.01169443130493164, 0.012781143188476562, 0.013867855072021484, 0.014954566955566406, 0.016041278839111328, 0.01712799072265625, 0.018214702606201172, 0.019301414489746094, 0.020388126373291016, 0.021474838256835938, 0.02256155014038086, 0.02364826202392578, 0.024734973907470703, 0.025821685791015625, 0.026908397674560547, 0.02799510955810547, 0.02908182144165039, 0.030168533325195312, 0.031255245208740234, 0.032341957092285156, 0.03342866897583008, 0.034515380859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 6.0, 11.0, 11.0, 19.0, 10.0, 23.0, 32.0, 42.0, 53.0, 94.0, 96.0, 146.0, 216.0, 341.0, 564.0, 914.0, 1748.0, 3411.0, 7244.0, 16258.0, 40188.0, 114757.0, 385594.0, 322443.0, 93233.0, 33901.0, 13839.0, 6370.0, 3043.0, 1517.0, 848.0, 517.0, 319.0, 215.0, 127.0, 97.0, 74.0, 49.0, 43.0, 40.0, 27.0, 12.0, 12.0, 20.0, 9.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17041015625, -0.16471290588378906, -0.15901565551757812, -0.1533184051513672, -0.14762115478515625, -0.1419239044189453, -0.13622665405273438, -0.13052940368652344, -0.1248321533203125, -0.11913490295410156, -0.11343765258789062, -0.10774040222167969, -0.10204315185546875, -0.09634590148925781, -0.09064865112304688, -0.08495140075683594, -0.079254150390625, -0.07355690002441406, -0.06785964965820312, -0.06216239929199219, -0.05646514892578125, -0.05076789855957031, -0.045070648193359375, -0.03937339782714844, -0.0336761474609375, -0.027978897094726562, -0.022281646728515625, -0.016584396362304688, -0.01088714599609375, -0.0051898956298828125, 0.000507354736328125, 0.0062046051025390625, 0.01190185546875, 0.017599105834960938, 0.023296356201171875, 0.028993606567382812, 0.03469085693359375, 0.04038810729980469, 0.046085357666015625, 0.05178260803222656, 0.0574798583984375, 0.06317710876464844, 0.06887435913085938, 0.07457160949707031, 0.08026885986328125, 0.08596611022949219, 0.09166336059570312, 0.09736061096191406, 0.103057861328125, 0.10875511169433594, 0.11445236206054688, 0.12014961242675781, 0.12584686279296875, 0.1315441131591797, 0.13724136352539062, 0.14293861389160156, 0.1486358642578125, 0.15433311462402344, 0.16003036499023438, 0.1657276153564453, 0.17142486572265625, 0.1771221160888672, 0.18281936645507812, 0.18851661682128906, 0.1942138671875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 2.0, 7.0, 11.0, 16.0, 16.0, 38.0, 33.0, 50.0, 87.0, 97.0, 131.0, 136.0, 151.0, 88.0, 53.0, 24.0, 20.0, 17.0, 9.0, 6.0, 2.0, 2.0], "bins": [-0.11790435761213303, -0.115700863301754, -0.11349736154079437, -0.11129386723041534, -0.10909036546945572, -0.10688687115907669, -0.10468336939811707, -0.10247987508773804, -0.10027638077735901, -0.09807288646697998, -0.09586938470602036, -0.09366589039564133, -0.0914623886346817, -0.08925889432430267, -0.08705539256334305, -0.08485189825296402, -0.0826483964920044, -0.08044490218162537, -0.07824140042066574, -0.07603790611028671, -0.07383440434932709, -0.07163091003894806, -0.06942740827798843, -0.0672239139676094, -0.06502041220664978, -0.06281691789627075, -0.06061341613531113, -0.0584099180996418, -0.05620642006397247, -0.054002925753593445, -0.05179942771792412, -0.04959592968225479, -0.04739243537187576, -0.045188937336206436, -0.04298543930053711, -0.04078194126486778, -0.038578443229198456, -0.03637494891881943, -0.0341714508831501, -0.031967952847480774, -0.029764452949166298, -0.02756095491349697, -0.025357458740472794, -0.023153960704803467, -0.02095046266913414, -0.018746964633464813, -0.016543466597795486, -0.014339970424771309, -0.012136472389101982, -0.009932974353432655, -0.007729477249085903, -0.005525979679077864, -0.0033224821090698242, -0.0011189840734004974, 0.0010845130309462547, 0.003288010135293007, 0.005491508170962334, 0.007695005740970373, 0.009898503310978413, 0.012102000415325165, 0.014305498450994492, 0.01650899648666382, 0.018712494522333145, 0.020915990695357323, 0.02311948873102665]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 9.0, 7.0, 11.0, 10.0, 20.0, 18.0, 24.0, 26.0, 21.0, 34.0, 27.0, 32.0, 25.0, 36.0, 31.0, 52.0, 51.0, 31.0, 40.0, 32.0, 40.0, 40.0, 33.0, 25.0, 30.0, 34.0, 29.0, 22.0, 29.0, 20.0, 28.0, 17.0, 18.0, 14.0, 20.0, 12.0, 6.0, 10.0, 10.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.027413129806518555, -0.02647901326417923, -0.025544894859194756, -0.02461077645421028, -0.023676659911870956, -0.02274254336953163, -0.021808424964547157, -0.020874306559562683, -0.019940190017223358, -0.019006073474884033, -0.01807195506989956, -0.017137836664915085, -0.01620372012257576, -0.01526960264891386, -0.01433548517525196, -0.013401367701590061, -0.012467250227928162, -0.011533132754266262, -0.010599015280604362, -0.009664897806942463, -0.008730780333280563, -0.007796662859618664, -0.006862545385956764, -0.005928427912294865, -0.004994310438632965, -0.0040601929649710655, -0.003126075491309166, -0.0021919580176472664, -0.0012578405439853668, -0.00032372307032346725, 0.0006103944033384323, 0.0015445118770003319, 0.0024786293506622314, 0.003412746824324131, 0.004346864297986031, 0.00528098177164793, 0.00621509924530983, 0.007149216718971729, 0.008083334192633629, 0.009017451666295528, 0.009951569139957428, 0.010885686613619328, 0.011819804087281227, 0.012753921560943127, 0.013688039034605026, 0.014622156508266926, 0.015556273981928825, 0.0164903923869133, 0.017424508929252625, 0.01835862547159195, 0.019292743876576424, 0.020226862281560898, 0.021160978823900223, 0.022095095366239548, 0.023029213771224022, 0.023963332176208496, 0.02489744871854782, 0.025831565260887146, 0.02676568366587162, 0.027699802070856094, 0.02863391861319542, 0.029568035155534744, 0.03050215356051922, 0.03143627196550369, 0.03237038850784302]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 8.0, 8.0, 12.0, 12.0, 20.0, 17.0, 23.0, 23.0, 26.0, 36.0, 36.0, 32.0, 38.0, 46.0, 52.0, 46.0, 44.0, 45.0, 32.0, 44.0, 45.0, 28.0, 31.0, 40.0, 38.0, 29.0, 20.0, 23.0, 30.0, 18.0, 11.0, 11.0, 10.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.5, -84.7783203125, -82.056640625, -79.3349609375, -76.61328125, -73.8916015625, -71.169921875, -68.4482421875, -65.7265625, -63.0048828125, -60.283203125, -57.5615234375, -54.83984375, -52.1181640625, -49.396484375, -46.6748046875, -43.953125, -41.2314453125, -38.509765625, -35.7880859375, -33.06640625, -30.3447265625, -27.623046875, -24.9013671875, -22.1796875, -19.4580078125, -16.736328125, -14.0146484375, -11.29296875, -8.5712890625, -5.849609375, -3.1279296875, -0.40625, 2.3154296875, 5.037109375, 7.7587890625, 10.48046875, 13.2021484375, 15.923828125, 18.6455078125, 21.3671875, 24.0888671875, 26.810546875, 29.5322265625, 32.25390625, 34.9755859375, 37.697265625, 40.4189453125, 43.140625, 45.8623046875, 48.583984375, 51.3056640625, 54.02734375, 56.7490234375, 59.470703125, 62.1923828125, 64.9140625, 67.6357421875, 70.357421875, 73.0791015625, 75.80078125, 78.5224609375, 81.244140625, 83.9658203125, 86.6875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 5.0, 13.0, 10.0, 19.0, 22.0, 27.0, 44.0, 70.0, 83.0, 96.0, 148.0, 216.0, 332.0, 452.0, 758.0, 1305.0, 2443.0, 5018.0, 12483.0, 35711.0, 113954.0, 332564.0, 353462.0, 125064.0, 39078.0, 13497.0, 5433.0, 2570.0, 1297.0, 746.0, 480.0, 316.0, 239.0, 152.0, 104.0, 79.0, 66.0, 59.0, 40.0, 27.0, 20.0, 14.0, 10.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.5703125, -12.177978515625, -11.78564453125, -11.393310546875, -11.0009765625, -10.608642578125, -10.21630859375, -9.823974609375, -9.431640625, -9.039306640625, -8.64697265625, -8.254638671875, -7.8623046875, -7.469970703125, -7.07763671875, -6.685302734375, -6.29296875, -5.900634765625, -5.50830078125, -5.115966796875, -4.7236328125, -4.331298828125, -3.93896484375, -3.546630859375, -3.154296875, -2.761962890625, -2.36962890625, -1.977294921875, -1.5849609375, -1.192626953125, -0.80029296875, -0.407958984375, -0.015625, 0.376708984375, 0.76904296875, 1.161376953125, 1.5537109375, 1.946044921875, 2.33837890625, 2.730712890625, 3.123046875, 3.515380859375, 3.90771484375, 4.300048828125, 4.6923828125, 5.084716796875, 5.47705078125, 5.869384765625, 6.26171875, 6.654052734375, 7.04638671875, 7.438720703125, 7.8310546875, 8.223388671875, 8.61572265625, 9.008056640625, 9.400390625, 9.792724609375, 10.18505859375, 10.577392578125, 10.9697265625, 11.362060546875, 11.75439453125, 12.146728515625, 12.5390625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 8.0, 9.0, 8.0, 10.0, 20.0, 13.0, 17.0, 24.0, 23.0, 28.0, 29.0, 44.0, 37.0, 40.0, 38.0, 59.0, 51.0, 2105.0, 42.0, 50.0, 46.0, 35.0, 32.0, 37.0, 37.0, 28.0, 25.0, 33.0, 21.0, 17.0, 12.0, 18.0, 7.0, 11.0, 11.0, 9.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-136.0, -132.4619140625, -128.923828125, -125.3857421875, -121.84765625, -118.3095703125, -114.771484375, -111.2333984375, -107.6953125, -104.1572265625, -100.619140625, -97.0810546875, -93.54296875, -90.0048828125, -86.466796875, -82.9287109375, -79.390625, -75.8525390625, -72.314453125, -68.7763671875, -65.23828125, -61.7001953125, -58.162109375, -54.6240234375, -51.0859375, -47.5478515625, -44.009765625, -40.4716796875, -36.93359375, -33.3955078125, -29.857421875, -26.3193359375, -22.78125, -19.2431640625, -15.705078125, -12.1669921875, -8.62890625, -5.0908203125, -1.552734375, 1.9853515625, 5.5234375, 9.0615234375, 12.599609375, 16.1376953125, 19.67578125, 23.2138671875, 26.751953125, 30.2900390625, 33.828125, 37.3662109375, 40.904296875, 44.4423828125, 47.98046875, 51.5185546875, 55.056640625, 58.5947265625, 62.1328125, 65.6708984375, 69.208984375, 72.7470703125, 76.28515625, 79.8232421875, 83.361328125, 86.8994140625, 90.4375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 6.0, 14.0, 16.0, 28.0, 23.0, 36.0, 37.0, 68.0, 100.0, 123.0, 179.0, 265.0, 405.0, 678.0, 1254.0, 3718.0, 22582.0, 286031.0, 2749297.0, 69192.0, 7377.0, 1883.0, 864.0, 516.0, 312.0, 196.0, 160.0, 94.0, 75.0, 53.0, 29.0, 29.0, 18.0, 9.0, 6.0, 6.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.796875, -21.024658203125, -20.25244140625, -19.480224609375, -18.7080078125, -17.935791015625, -17.16357421875, -16.391357421875, -15.619140625, -14.846923828125, -14.07470703125, -13.302490234375, -12.5302734375, -11.758056640625, -10.98583984375, -10.213623046875, -9.44140625, -8.669189453125, -7.89697265625, -7.124755859375, -6.3525390625, -5.580322265625, -4.80810546875, -4.035888671875, -3.263671875, -2.491455078125, -1.71923828125, -0.947021484375, -0.1748046875, 0.597412109375, 1.36962890625, 2.141845703125, 2.9140625, 3.686279296875, 4.45849609375, 5.230712890625, 6.0029296875, 6.775146484375, 7.54736328125, 8.319580078125, 9.091796875, 9.864013671875, 10.63623046875, 11.408447265625, 12.1806640625, 12.952880859375, 13.72509765625, 14.497314453125, 15.26953125, 16.041748046875, 16.81396484375, 17.586181640625, 18.3583984375, 19.130615234375, 19.90283203125, 20.675048828125, 21.447265625, 22.219482421875, 22.99169921875, 23.763916015625, 24.5361328125, 25.308349609375, 26.08056640625, 26.852783203125, 27.625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 9.0, 9.0, 17.0, 20.0, 47.0, 75.0, 95.0, 134.0, 144.0, 141.0, 81.0, 62.0, 42.0, 26.0, 27.0, 9.0, 10.0, 6.0, 8.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.95213317871094, -169.8813018798828, -164.8104705810547, -159.7396240234375, -154.66879272460938, -149.59796142578125, -144.52713012695312, -139.456298828125, -134.38546752929688, -129.31463623046875, -124.2437973022461, -119.17296600341797, -114.10212707519531, -109.03129577636719, -103.96046447753906, -98.88963317871094, -93.81878662109375, -88.74795532226562, -83.67711639404297, -78.60628509521484, -73.53544616699219, -68.46461486816406, -63.39378356933594, -58.32294845581055, -53.252113342285156, -48.181278228759766, -43.110443115234375, -38.03961181640625, -32.96877670288086, -27.89794158935547, -22.82710838317871, -17.756275177001953, -12.685455322265625, -7.614621162414551, -2.5437870025634766, 2.5270471572875977, 7.597881317138672, 12.668716430664062, 17.73954963684082, 22.810382843017578, 27.88121795654297, 32.95205307006836, 38.02288818359375, 43.093719482421875, 48.164554595947266, 53.235389709472656, 58.30622100830078, 63.37705612182617, 68.44789123535156, 73.51872253417969, 78.58956146240234, 83.66039276123047, 88.73123168945312, 93.80206298828125, 98.87289428710938, 103.9437255859375, 109.01456451416016, 114.08539581298828, 119.15623474121094, 124.22706604003906, 129.2978973388672, 134.36874389648438, 139.4395751953125, 144.51040649414062, 149.58123779296875]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 9.0, 8.0, 9.0, 6.0, 14.0, 19.0, 19.0, 21.0, 22.0, 24.0, 43.0, 38.0, 40.0, 33.0, 45.0, 51.0, 42.0, 50.0, 51.0, 46.0, 51.0, 46.0, 51.0, 32.0, 30.0, 30.0, 27.0, 29.0, 23.0, 15.0, 9.0, 12.0, 12.0, 6.0, 9.0, 3.0, 5.0, 4.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.3412322998047, -148.22720336914062, -143.1131591796875, -137.99913024902344, -132.88510131835938, -127.77105712890625, -122.65702819824219, -117.5429916381836, -112.428955078125, -107.3149185180664, -102.20088195800781, -97.08685302734375, -91.97281646728516, -86.85877990722656, -81.7447509765625, -76.6307144165039, -71.51667785644531, -66.40264129638672, -61.28860855102539, -56.17457580566406, -51.06053924560547, -45.946502685546875, -40.83246994018555, -35.71843719482422, -30.604400634765625, -25.490365982055664, -20.376331329345703, -15.262296676635742, -10.148262023925781, -5.03422737121582, 0.07980728149414062, 5.193840026855469, 10.307891845703125, 15.421926498413086, 20.535961151123047, 25.649995803833008, 30.76403045654297, 35.87806701660156, 40.99209976196289, 46.10613250732422, 51.22016906738281, 56.334205627441406, 61.448238372802734, 66.56227111816406, 71.67630767822266, 76.79034423828125, 81.90437316894531, 87.0184097290039, 92.1324462890625, 97.2464828491211, 102.36051940917969, 107.47454833984375, 112.58858489990234, 117.70262145996094, 122.816650390625, 127.9306869506836, 133.0447235107422, 138.15875244140625, 143.27279663085938, 148.38682556152344, 153.5008544921875, 158.61489868164062, 163.7289276123047, 168.84295654296875, 173.95700073242188]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 7.0, 9.0, 14.0, 11.0, 22.0, 27.0, 34.0, 49.0, 71.0, 94.0, 107.0, 169.0, 226.0, 320.0, 449.0, 605.0, 820.0, 1131.0, 1040485.0, 1043.0, 742.0, 583.0, 384.0, 293.0, 227.0, 164.0, 108.0, 78.0, 56.0, 58.0, 33.0, 30.0, 35.0, 17.0, 10.0, 5.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-67.7447738647461, -65.8315200805664, -63.918270111083984, -62.00502014160156, -60.091766357421875, -58.17851638793945, -56.26526641845703, -54.352012634277344, -52.43876266479492, -50.5255126953125, -48.61225891113281, -46.69900894165039, -44.78575897216797, -42.87250518798828, -40.95925521850586, -39.04600524902344, -37.13275146484375, -35.21950149536133, -33.30624771118164, -31.39299774169922, -29.479745864868164, -27.56649398803711, -25.653244018554688, -23.739992141723633, -21.826740264892578, -19.913488388061523, -18.00023651123047, -16.086986541748047, -14.173734664916992, -12.260482788085938, -10.3472318649292, -8.433980941772461, -6.520729064941406, -4.60747766494751, -2.6942262649536133, -0.7809748649597168, 1.1322765350341797, 3.0455284118652344, 4.958779335021973, 6.872030258178711, 8.785282135009766, 10.69853401184082, 12.611784934997559, 14.525035858154297, 16.43828773498535, 18.351539611816406, 20.264789581298828, 22.178041458129883, 24.091293334960938, 26.004545211791992, 27.917797088623047, 29.83104705810547, 31.744298934936523, 33.65755081176758, 35.57080078125, 37.48405456542969, 39.39730453491211, 41.31055450439453, 43.22380828857422, 45.13705825805664, 47.05030822753906, 48.96356201171875, 50.87681198120117, 52.790061950683594, 54.70331573486328]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 0.0, 16.0, 8.0, 21.0, 54.0, 119.0, 21041.0, 51441980.0, 59.0, 31.0, 13.0, 14.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2976.0, -2810.95849609375, -2645.9169921875, -2480.87548828125, -2315.833984375, -2150.79248046875, -1985.750732421875, -1820.709228515625, -1655.667724609375, -1490.626220703125, -1325.584716796875, -1160.5430908203125, -995.5015869140625, -830.4600830078125, -665.4185180664062, -500.376953125, -335.33544921875, -170.29391479492188, -5.25238037109375, 159.78915405273438, 324.8306884765625, 489.8721923828125, 654.9137573242188, 819.955322265625, 984.996826171875, 1150.038330078125, 1315.079833984375, 1480.1214599609375, 1645.1629638671875, 1810.2044677734375, 1975.24609375, 2140.28759765625, 2305.3291015625, 2470.37060546875, 2635.412109375, 2800.45361328125, 2965.4951171875, 3130.53662109375, 3295.578369140625, 3460.619873046875, 3625.661376953125, 3790.702880859375, 3955.744384765625, 4120.7861328125, 4285.82763671875, 4450.869140625, 4615.91064453125, 4780.9521484375, 4945.99365234375, 5111.03515625, 5276.07666015625, 5441.1181640625, 5606.15966796875, 5771.201171875, 5936.24267578125, 6101.2841796875, 6266.326171875, 6431.36767578125, 6596.4091796875, 6761.45068359375, 6926.4921875, 7091.53369140625, 7256.5751953125, 7421.6171875, 7586.658203125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 7.0, 3.0, 5.0, 17.0, 26.0, 32.0, 48.0, 66.0, 114.0, 179.0, 290.0, 501.0, 721.0, 1178.0, 1948.0, 2847.0, 4414.0, 6771.0, 10487.0, 16460.0, 25396.0, 40135.0, 61333.0, 94465.0, 142201.0, 209871.0, 298054.0, 391257.0, 3532374.0, 442358.0, 319296.0, 231435.0, 157487.0, 105454.0, 69049.0, 44300.0, 28729.0, 18861.0, 11943.0, 7651.0, 4841.0, 3226.0, 2103.0, 1203.0, 820.0, 510.0, 348.0, 232.0, 124.0, 106.0, 76.0, 41.0, 22.0, 15.0, 8.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0322265625, -0.9995880126953125, -0.966949462890625, -0.9343109130859375, -0.90167236328125, -0.8690338134765625, -0.836395263671875, -0.8037567138671875, -0.7711181640625, -0.7384796142578125, -0.705841064453125, -0.6732025146484375, -0.64056396484375, -0.6079254150390625, -0.575286865234375, -0.5426483154296875, -0.510009765625, -0.4773712158203125, -0.444732666015625, -0.4120941162109375, -0.37945556640625, -0.3468170166015625, -0.314178466796875, -0.2815399169921875, -0.2489013671875, -0.2162628173828125, -0.183624267578125, -0.1509857177734375, -0.11834716796875, -0.0857086181640625, -0.053070068359375, -0.0204315185546875, 0.01220703125, 0.0448455810546875, 0.077484130859375, 0.1101226806640625, 0.14276123046875, 0.1753997802734375, 0.208038330078125, 0.2406768798828125, 0.2733154296875, 0.3059539794921875, 0.338592529296875, 0.3712310791015625, 0.40386962890625, 0.4365081787109375, 0.469146728515625, 0.5017852783203125, 0.534423828125, 0.5670623779296875, 0.599700927734375, 0.6323394775390625, 0.66497802734375, 0.6976165771484375, 0.730255126953125, 0.7628936767578125, 0.7955322265625, 0.8281707763671875, 0.860809326171875, 0.8934478759765625, 0.92608642578125, 0.9587249755859375, 0.991363525390625, 1.0240020751953125, 1.056640625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 10.0, 6.0, 6.0, 5.0, 8.0, 10.0, 16.0, 15.0, 14.0, 28.0, 16.0, 13.0, 16.0, 18.0, 30.0, 31.0, 36.0, 24.0, 37.0, 40.0, 40.0, 44.0, 483.0, 616.0, 33.0, 35.0, 39.0, 40.0, 26.0, 34.0, 24.0, 26.0, 26.0, 24.0, 25.0, 14.0, 26.0, 21.0, 9.0, 11.0, 9.0, 14.0, 2.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-17.171875, -16.61767578125, -16.0634765625, -15.50927734375, -14.955078125, -14.40087890625, -13.8466796875, -13.29248046875, -12.73828125, -12.18408203125, -11.6298828125, -11.07568359375, -10.521484375, -9.96728515625, -9.4130859375, -8.85888671875, -8.3046875, -7.75048828125, -7.1962890625, -6.64208984375, -6.087890625, -5.53369140625, -4.9794921875, -4.42529296875, -3.87109375, -3.31689453125, -2.7626953125, -2.20849609375, -1.654296875, -1.10009765625, -0.5458984375, 0.00830078125, 0.5625, 1.11669921875, 1.6708984375, 2.22509765625, 2.779296875, 3.33349609375, 3.8876953125, 4.44189453125, 4.99609375, 5.55029296875, 6.1044921875, 6.65869140625, 7.212890625, 7.76708984375, 8.3212890625, 8.87548828125, 9.4296875, 9.98388671875, 10.5380859375, 11.09228515625, 11.646484375, 12.20068359375, 12.7548828125, 13.30908203125, 13.86328125, 14.41748046875, 14.9716796875, 15.52587890625, 16.080078125, 16.63427734375, 17.1884765625, 17.74267578125, 18.296875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 9.0, 3.0, 14.0, 12.0, 13.0, 28.0, 56.0, 101.0, 151.0, 280.0, 480.0, 779.0, 1351.0, 2315.0, 3753.0, 6453.0, 10414.0, 17624.0, 29847.0, 49339.0, 81048.0, 131792.0, 207542.0, 307107.0, 405985.0, 3539568.0, 493852.0, 346833.0, 245689.0, 159099.0, 99477.0, 59878.0, 36438.0, 21667.0, 13186.0, 7839.0, 4614.0, 2832.0, 1614.0, 994.0, 514.0, 363.0, 182.0, 123.0, 65.0, 38.0, 33.0, 24.0, 8.0, 6.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.09613037109375, -1.0604248046875, -1.02471923828125, -0.989013671875, -0.95330810546875, -0.9176025390625, -0.88189697265625, -0.84619140625, -0.81048583984375, -0.7747802734375, -0.73907470703125, -0.703369140625, -0.66766357421875, -0.6319580078125, -0.59625244140625, -0.560546875, -0.52484130859375, -0.4891357421875, -0.45343017578125, -0.417724609375, -0.38201904296875, -0.3463134765625, -0.31060791015625, -0.27490234375, -0.23919677734375, -0.2034912109375, -0.16778564453125, -0.132080078125, -0.09637451171875, -0.0606689453125, -0.02496337890625, 0.0107421875, 0.04644775390625, 0.0821533203125, 0.11785888671875, 0.153564453125, 0.18927001953125, 0.2249755859375, 0.26068115234375, 0.29638671875, 0.33209228515625, 0.3677978515625, 0.40350341796875, 0.439208984375, 0.47491455078125, 0.5106201171875, 0.54632568359375, 0.58203125, 0.61773681640625, 0.6534423828125, 0.68914794921875, 0.724853515625, 0.76055908203125, 0.7962646484375, 0.83197021484375, 0.86767578125, 0.90338134765625, 0.9390869140625, 0.97479248046875, 1.010498046875, 1.04620361328125, 1.0819091796875, 1.11761474609375, 1.1533203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 8.0, 8.0, 7.0, 8.0, 8.0, 12.0, 23.0, 25.0, 22.0, 19.0, 26.0, 26.0, 29.0, 40.0, 41.0, 35.0, 43.0, 40.0, 40.0, 1026.0, 92.0, 41.0, 38.0, 47.0, 27.0, 39.0, 28.0, 31.0, 27.0, 23.0, 18.0, 24.0, 15.0, 15.0, 16.0, 9.0, 7.0, 3.0, 6.0, 7.0, 3.0, 5.0, 4.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.390625, -14.885986328125, -14.38134765625, -13.876708984375, -13.3720703125, -12.867431640625, -12.36279296875, -11.858154296875, -11.353515625, -10.848876953125, -10.34423828125, -9.839599609375, -9.3349609375, -8.830322265625, -8.32568359375, -7.821044921875, -7.31640625, -6.811767578125, -6.30712890625, -5.802490234375, -5.2978515625, -4.793212890625, -4.28857421875, -3.783935546875, -3.279296875, -2.774658203125, -2.27001953125, -1.765380859375, -1.2607421875, -0.756103515625, -0.25146484375, 0.253173828125, 0.7578125, 1.262451171875, 1.76708984375, 2.271728515625, 2.7763671875, 3.281005859375, 3.78564453125, 4.290283203125, 4.794921875, 5.299560546875, 5.80419921875, 6.308837890625, 6.8134765625, 7.318115234375, 7.82275390625, 8.327392578125, 8.83203125, 9.336669921875, 9.84130859375, 10.345947265625, 10.8505859375, 11.355224609375, 11.85986328125, 12.364501953125, 12.869140625, 13.373779296875, 13.87841796875, 14.383056640625, 14.8876953125, 15.392333984375, 15.89697265625, 16.401611328125, 16.90625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 9.0, 10.0, 11.0, 14.0, 18.0, 27.0, 35.0, 31.0, 45.0, 59.0, 69.0, 106.0, 170.0, 274.0, 537.0, 1010.0, 2025.0, 4555.0, 10649.0, 28135.0, 80120.0, 274420.0, 5727979.0, 101959.0, 35653.0, 12884.0, 5296.0, 2479.0, 1253.0, 621.0, 368.0, 201.0, 129.0, 83.0, 63.0, 38.0, 26.0, 24.0, 20.0, 13.0, 6.0, 10.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.953125, -4.763427734375, -4.57373046875, -4.384033203125, -4.1943359375, -4.004638671875, -3.81494140625, -3.625244140625, -3.435546875, -3.245849609375, -3.05615234375, -2.866455078125, -2.6767578125, -2.487060546875, -2.29736328125, -2.107666015625, -1.91796875, -1.728271484375, -1.53857421875, -1.348876953125, -1.1591796875, -0.969482421875, -0.77978515625, -0.590087890625, -0.400390625, -0.210693359375, -0.02099609375, 0.168701171875, 0.3583984375, 0.548095703125, 0.73779296875, 0.927490234375, 1.1171875, 1.306884765625, 1.49658203125, 1.686279296875, 1.8759765625, 2.065673828125, 2.25537109375, 2.445068359375, 2.634765625, 2.824462890625, 3.01416015625, 3.203857421875, 3.3935546875, 3.583251953125, 3.77294921875, 3.962646484375, 4.15234375, 4.342041015625, 4.53173828125, 4.721435546875, 4.9111328125, 5.100830078125, 5.29052734375, 5.480224609375, 5.669921875, 5.859619140625, 6.04931640625, 6.239013671875, 6.4287109375, 6.618408203125, 6.80810546875, 6.997802734375, 7.1875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 12.0, 4.0, 9.0, 1.0, 11.0, 15.0, 12.0, 21.0, 21.0, 18.0, 19.0, 21.0, 32.0, 31.0, 43.0, 43.0, 38.0, 41.0, 39.0, 177.0, 933.0, 54.0, 51.0, 41.0, 42.0, 32.0, 41.0, 48.0, 31.0, 28.0, 23.0, 19.0, 13.0, 19.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5546875, -13.0728759765625, -12.591064453125, -12.1092529296875, -11.62744140625, -11.1456298828125, -10.663818359375, -10.1820068359375, -9.7001953125, -9.2183837890625, -8.736572265625, -8.2547607421875, -7.77294921875, -7.2911376953125, -6.809326171875, -6.3275146484375, -5.845703125, -5.3638916015625, -4.882080078125, -4.4002685546875, -3.91845703125, -3.4366455078125, -2.954833984375, -2.4730224609375, -1.9912109375, -1.5093994140625, -1.027587890625, -0.5457763671875, -0.06396484375, 0.4178466796875, 0.899658203125, 1.3814697265625, 1.86328125, 2.3450927734375, 2.826904296875, 3.3087158203125, 3.79052734375, 4.2723388671875, 4.754150390625, 5.2359619140625, 5.7177734375, 6.1995849609375, 6.681396484375, 7.1632080078125, 7.64501953125, 8.1268310546875, 8.608642578125, 9.0904541015625, 9.572265625, 10.0540771484375, 10.535888671875, 11.0177001953125, 11.49951171875, 11.9813232421875, 12.463134765625, 12.9449462890625, 13.4267578125, 13.9085693359375, 14.390380859375, 14.8721923828125, 15.35400390625, 15.8358154296875, 16.317626953125, 16.7994384765625, 17.28125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 17.0, 155.0, 609.0, 190.0, 22.0, 11.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.61790466308594, -97.20551300048828, -93.79312133789062, -90.3807373046875, -86.96834564208984, -83.55595397949219, -80.14356231689453, -76.73117065429688, -73.31878662109375, -69.9063949584961, -66.49400329589844, -63.08161544799805, -59.669227600097656, -56.2568359375, -52.844444274902344, -49.43205261230469, -46.01966094970703, -42.607269287109375, -39.194881439208984, -35.78248977661133, -32.37010192871094, -28.95771026611328, -25.545318603515625, -22.1329288482666, -18.720539093017578, -15.308149337768555, -11.895758628845215, -8.483367919921875, -5.070978164672852, -1.6585884094238281, 1.7538032531738281, 5.166193008422852, 8.578590393066406, 11.99098014831543, 15.40337085723877, 18.81576156616211, 22.228151321411133, 25.640541076660156, 29.052932739257812, 32.46532440185547, 35.87771224975586, 39.290103912353516, 42.702491760253906, 46.11488342285156, 49.52727508544922, 52.93966293334961, 56.352054595947266, 59.764442443847656, 63.17683410644531, 66.58922576904297, 70.00161743164062, 73.41400146484375, 76.8263931274414, 80.23878479003906, 83.65117645263672, 87.06356811523438, 90.4759521484375, 93.88834381103516, 97.30073547363281, 100.71311950683594, 104.1255111694336, 107.53790283203125, 110.9502944946289, 114.36268615722656, 117.77507781982422]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 14.0, 9.0, 21.0, 26.0, 39.0, 56.0, 78.0, 99.0, 84.0, 133.0, 96.0, 93.0, 66.0, 61.0, 47.0, 24.0, 24.0, 14.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.6602668762207, -30.982486724853516, -29.304706573486328, -27.62692642211914, -25.949146270751953, -24.271366119384766, -22.59358787536621, -20.915807723999023, -19.238027572631836, -17.56024742126465, -15.882467269897461, -14.20468807220459, -12.526907920837402, -10.849127769470215, -9.171348571777344, -7.493568420410156, -5.815788269042969, -4.138008117675781, -2.460228443145752, -0.7824487686157227, 0.8953313827514648, 2.5731115341186523, 4.250890731811523, 5.928670883178711, 7.606451034545898, 9.284231185913086, 10.962011337280273, 12.639790534973145, 14.317570686340332, 15.99535083770752, 17.67313003540039, 19.350910186767578, 21.02869415283203, 22.70647430419922, 24.384254455566406, 26.062034606933594, 27.73981475830078, 29.41759490966797, 31.095373153686523, 32.773155212402344, 34.45093536376953, 36.12871551513672, 37.806495666503906, 39.484275817871094, 41.16205596923828, 42.83983612060547, 44.517616271972656, 46.195396423339844, 47.873172760009766, 49.55095291137695, 51.22873306274414, 52.90651321411133, 54.584293365478516, 56.2620735168457, 57.939849853515625, 59.61763000488281, 61.29541015625, 62.97319030761719, 64.65097045898438, 66.32875061035156, 68.00653076171875, 69.68431091308594, 71.36209106445312, 73.03987121582031, 74.7176513671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 15.0, 12.0, 37.0, 64.0, 104.0, 231.0, 519.0, 1270.0, 3389.0, 11842.0, 99122.0, 4030010.0, 36019.0, 7172.0, 2385.0, 973.0, 490.0, 227.0, 128.0, 91.0, 54.0, 39.0, 28.0, 15.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.4305229187011719, -0.41719818115234375, -0.4038734436035156, -0.3905487060546875, -0.3772239685058594, -0.36389923095703125, -0.3505744934082031, -0.337249755859375, -0.3239250183105469, -0.31060028076171875, -0.2972755432128906, -0.2839508056640625, -0.2706260681152344, -0.25730133056640625, -0.24397659301757812, -0.23065185546875, -0.21732711791992188, -0.20400238037109375, -0.19067764282226562, -0.1773529052734375, -0.16402816772460938, -0.15070343017578125, -0.13737869262695312, -0.124053955078125, -0.11072921752929688, -0.09740447998046875, -0.08407974243164062, -0.0707550048828125, -0.057430267333984375, -0.04410552978515625, -0.030780792236328125, -0.0174560546875, -0.004131317138671875, 0.00919342041015625, 0.022518157958984375, 0.0358428955078125, 0.049167633056640625, 0.06249237060546875, 0.07581710815429688, 0.089141845703125, 0.10246658325195312, 0.11579132080078125, 0.12911605834960938, 0.1424407958984375, 0.15576553344726562, 0.16909027099609375, 0.18241500854492188, 0.19573974609375, 0.20906448364257812, 0.22238922119140625, 0.23571395874023438, 0.2490386962890625, 0.2623634338378906, 0.27568817138671875, 0.2890129089355469, 0.302337646484375, 0.3156623840332031, 0.32898712158203125, 0.3423118591308594, 0.3556365966796875, 0.3689613342285156, 0.38228607177734375, 0.3956108093261719, 0.408935546875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 0.0, 1.0, 9.0, 1.0, 4.0, 5.0, 8.0, 6.0, 11.0, 16.0, 26.0, 330.0, 480.0, 15.0, 21.0, 8.0, 14.0, 11.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.1097869873046875, -0.104827880859375, -0.0998687744140625, -0.09490966796875, -0.0899505615234375, -0.084991455078125, -0.0800323486328125, -0.0750732421875, -0.0701141357421875, -0.065155029296875, -0.0601959228515625, -0.05523681640625, -0.0502777099609375, -0.045318603515625, -0.0403594970703125, -0.035400390625, -0.0304412841796875, -0.025482177734375, -0.0205230712890625, -0.01556396484375, -0.0106048583984375, -0.005645751953125, -0.0006866455078125, 0.0042724609375, 0.0092315673828125, 0.014190673828125, 0.0191497802734375, 0.02410888671875, 0.0290679931640625, 0.034027099609375, 0.0389862060546875, 0.0439453125, 0.0489044189453125, 0.053863525390625, 0.0588226318359375, 0.06378173828125, 0.0687408447265625, 0.073699951171875, 0.0786590576171875, 0.0836181640625, 0.0885772705078125, 0.093536376953125, 0.0984954833984375, 0.10345458984375, 0.1084136962890625, 0.113372802734375, 0.1183319091796875, 0.123291015625, 0.1282501220703125, 0.133209228515625, 0.1381683349609375, 0.14312744140625, 0.1480865478515625, 0.153045654296875, 0.1580047607421875, 0.1629638671875, 0.1679229736328125, 0.172882080078125, 0.1778411865234375, 0.18280029296875, 0.1877593994140625, 0.192718505859375, 0.1976776123046875, 0.20263671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 12.0, 9.0, 9.0, 12.0, 15.0, 33.0, 42.0, 50.0, 58.0, 105.0, 162.0, 235.0, 464.0, 784.0, 1566.0, 3329.0, 7929.0, 23878.0, 96911.0, 918975.0, 2914575.0, 172603.0, 34283.0, 10348.0, 4024.0, 1765.0, 876.0, 481.0, 251.0, 160.0, 99.0, 58.0, 51.0, 34.0, 26.0, 16.0, 14.0, 21.0, 7.0, 8.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17578125, -0.16954421997070312, -0.16330718994140625, -0.15707015991210938, -0.1508331298828125, -0.14459609985351562, -0.13835906982421875, -0.13212203979492188, -0.125885009765625, -0.11964797973632812, -0.11341094970703125, -0.10717391967773438, -0.1009368896484375, -0.09469985961914062, -0.08846282958984375, -0.08222579956054688, -0.07598876953125, -0.06975173950195312, -0.06351470947265625, -0.057277679443359375, -0.0510406494140625, -0.044803619384765625, -0.03856658935546875, -0.032329559326171875, -0.026092529296875, -0.019855499267578125, -0.01361846923828125, -0.007381439208984375, -0.0011444091796875, 0.005092620849609375, 0.01132965087890625, 0.017566680908203125, 0.0238037109375, 0.030040740966796875, 0.03627777099609375, 0.042514801025390625, 0.0487518310546875, 0.054988861083984375, 0.06122589111328125, 0.06746292114257812, 0.073699951171875, 0.07993698120117188, 0.08617401123046875, 0.09241104125976562, 0.0986480712890625, 0.10488510131835938, 0.11112213134765625, 0.11735916137695312, 0.12359619140625, 0.12983322143554688, 0.13607025146484375, 0.14230728149414062, 0.1485443115234375, 0.15478134155273438, 0.16101837158203125, 0.16725540161132812, 0.173492431640625, 0.17972946166992188, 0.18596649169921875, 0.19220352172851562, 0.1984405517578125, 0.20467758178710938, 0.21091461181640625, 0.21715164184570312, 0.223388671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 1.0, 11.0, 9.0, 11.0, 20.0, 12.0, 20.0, 42.0, 46.0, 50.0, 74.0, 88.0, 132.0, 191.0, 325.0, 686.0, 966.0, 575.0, 286.0, 152.0, 100.0, 74.0, 51.0, 34.0, 21.0, 19.0, 15.0, 11.0, 9.0, 7.0, 10.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08685302734375, -0.08379173278808594, -0.08073043823242188, -0.07766914367675781, -0.07460784912109375, -0.07154655456542969, -0.06848526000976562, -0.06542396545410156, -0.0623626708984375, -0.05930137634277344, -0.056240081787109375, -0.05317878723144531, -0.05011749267578125, -0.04705619812011719, -0.043994903564453125, -0.04093360900878906, -0.037872314453125, -0.03481101989746094, -0.031749725341796875, -0.028688430786132812, -0.02562713623046875, -0.022565841674804688, -0.019504547119140625, -0.016443252563476562, -0.0133819580078125, -0.010320663452148438, -0.007259368896484375, -0.0041980743408203125, -0.00113677978515625, 0.0019245147705078125, 0.004985809326171875, 0.008047103881835938, 0.0111083984375, 0.014169692993164062, 0.017230987548828125, 0.020292282104492188, 0.02335357666015625, 0.026414871215820312, 0.029476165771484375, 0.03253746032714844, 0.0355987548828125, 0.03866004943847656, 0.041721343994140625, 0.04478263854980469, 0.04784393310546875, 0.05090522766113281, 0.053966522216796875, 0.05702781677246094, 0.060089111328125, 0.06315040588378906, 0.06621170043945312, 0.06927299499511719, 0.07233428955078125, 0.07539558410644531, 0.07845687866210938, 0.08151817321777344, 0.0845794677734375, 0.08764076232910156, 0.09070205688476562, 0.09376335144042969, 0.09682464599609375, 0.09988594055175781, 0.10294723510742188, 0.10600852966308594, 0.10906982421875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 13.0, 32.0, 105.0, 255.0, 398.0, 149.0, 28.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1389408111572266, -1.1037307977676392, -1.0685209035873413, -1.033310890197754, -0.9981009364128113, -0.9628909826278687, -0.9276809692382812, -0.8924710154533386, -0.857261061668396, -0.8220511078834534, -0.7868411540985107, -0.7516311407089233, -0.7164211869239807, -0.6812112331390381, -0.6460012197494507, -0.6107912659645081, -0.5755813121795654, -0.5403713583946228, -0.5051614046096802, -0.4699513912200928, -0.43474143743515015, -0.3995314836502075, -0.3643215000629425, -0.3291115164756775, -0.29390156269073486, -0.25869160890579224, -0.22348162531852722, -0.1882716566324234, -0.15306168794631958, -0.11785171926021576, -0.08264175057411194, -0.04743178188800812, -0.012221693992614746, 0.022988274693489075, 0.058198243379592896, 0.09340821206569672, 0.12861818075180054, 0.16382814943790436, 0.19903811812400818, 0.234248086810112, 0.2694580554962158, 0.30466800928115845, 0.33987799286842346, 0.3750879764556885, 0.4102979302406311, 0.44550788402557373, 0.48071786761283875, 0.5159278512001038, 0.5511378049850464, 0.586347758769989, 0.6215577125549316, 0.656767725944519, 0.6919776797294617, 0.7271876335144043, 0.7623976469039917, 0.7976076006889343, 0.832817554473877, 0.8680275082588196, 0.9032374620437622, 0.9384474754333496, 0.9736574292182922, 1.0088673830032349, 1.0440773963928223, 1.0792872905731201, 1.1144973039627075]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 6.0, 6.0, 12.0, 14.0, 16.0, 20.0, 24.0, 24.0, 21.0, 35.0, 29.0, 53.0, 40.0, 41.0, 42.0, 41.0, 50.0, 51.0, 51.0, 56.0, 55.0, 35.0, 43.0, 47.0, 25.0, 26.0, 35.0, 17.0, 15.0, 16.0, 8.0, 8.0, 13.0, 1.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46753746271133423, -0.45359697937965393, -0.439656525850296, -0.4257160425186157, -0.4117755889892578, -0.3978351056575775, -0.3838946223258972, -0.3699541687965393, -0.3560137152671814, -0.3420732319355011, -0.3281327784061432, -0.3141922950744629, -0.300251841545105, -0.2863113582134247, -0.2723708748817444, -0.2584304213523865, -0.24448993802070618, -0.23054946959018707, -0.21660900115966797, -0.20266851782798767, -0.18872806429862976, -0.17478758096694946, -0.16084711253643036, -0.14690664410591125, -0.13296617567539215, -0.11902570724487305, -0.10508523881435394, -0.09114476293325424, -0.07720429450273514, -0.06326382607221603, -0.04932335019111633, -0.03538288176059723, -0.021442413330078125, -0.007501943036913872, 0.0064385272562503815, 0.020378999412059784, 0.03431946784257889, 0.04825993627309799, 0.06220041215419769, 0.0761408805847168, 0.0900813490152359, 0.104021817445755, 0.11796228587627411, 0.1319027543067932, 0.1458432376384735, 0.15978369116783142, 0.17372417449951172, 0.18766464293003082, 0.20160511136054993, 0.21554557979106903, 0.22948604822158813, 0.24342653155326843, 0.25736698508262634, 0.27130746841430664, 0.28524792194366455, 0.29918840527534485, 0.31312888860702515, 0.32706937193870544, 0.34100982546806335, 0.35495030879974365, 0.36889076232910156, 0.38283124566078186, 0.39677172899246216, 0.41071218252182007, 0.424652636051178]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 6.0, 11.0, 7.0, 14.0, 27.0, 33.0, 37.0, 65.0, 110.0, 154.0, 239.0, 375.0, 611.0, 1029.0, 1906.0, 3465.0, 6643.0, 14250.0, 36177.0, 884404.0, 59652.0, 20143.0, 8912.0, 4491.0, 2387.0, 1369.0, 759.0, 445.0, 260.0, 184.0, 144.0, 74.0, 45.0, 37.0, 30.0, 12.0, 8.0, 9.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.81005859375, -0.7873687744140625, -0.764678955078125, -0.7419891357421875, -0.71929931640625, -0.6966094970703125, -0.673919677734375, -0.6512298583984375, -0.6285400390625, -0.6058502197265625, -0.583160400390625, -0.5604705810546875, -0.53778076171875, -0.5150909423828125, -0.492401123046875, -0.4697113037109375, -0.447021484375, -0.4243316650390625, -0.401641845703125, -0.3789520263671875, -0.35626220703125, -0.3335723876953125, -0.310882568359375, -0.2881927490234375, -0.2655029296875, -0.2428131103515625, -0.220123291015625, -0.1974334716796875, -0.17474365234375, -0.1520538330078125, -0.129364013671875, -0.1066741943359375, -0.083984375, -0.0612945556640625, -0.038604736328125, -0.0159149169921875, 0.00677490234375, 0.0294647216796875, 0.052154541015625, 0.0748443603515625, 0.0975341796875, 0.1202239990234375, 0.142913818359375, 0.1656036376953125, 0.18829345703125, 0.2109832763671875, 0.233673095703125, 0.2563629150390625, 0.279052734375, 0.3017425537109375, 0.324432373046875, 0.3471221923828125, 0.36981201171875, 0.3925018310546875, 0.415191650390625, 0.4378814697265625, 0.4605712890625, 0.4832611083984375, 0.505950927734375, 0.5286407470703125, 0.55133056640625, 0.5740203857421875, 0.596710205078125, 0.6194000244140625, 0.64208984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 7.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 4.0, 4.0, 11.0, 22.0, 25.0, 373.0, 440.0, 16.0, 13.0, 6.0, 17.0, 12.0, 8.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11395263671875, -0.1090230941772461, -0.10409355163574219, -0.09916400909423828, -0.09423446655273438, -0.08930492401123047, -0.08437538146972656, -0.07944583892822266, -0.07451629638671875, -0.06958675384521484, -0.06465721130371094, -0.05972766876220703, -0.054798126220703125, -0.04986858367919922, -0.04493904113769531, -0.040009498596191406, -0.0350799560546875, -0.030150413513183594, -0.025220870971679688, -0.02029132843017578, -0.015361785888671875, -0.010432243347167969, -0.0055027008056640625, -0.0005731582641601562, 0.00435638427734375, 0.009285926818847656, 0.014215469360351562, 0.01914501190185547, 0.024074554443359375, 0.02900409698486328, 0.03393363952636719, 0.038863182067871094, 0.043792724609375, 0.048722267150878906, 0.05365180969238281, 0.05858135223388672, 0.06351089477539062, 0.06844043731689453, 0.07336997985839844, 0.07829952239990234, 0.08322906494140625, 0.08815860748291016, 0.09308815002441406, 0.09801769256591797, 0.10294723510742188, 0.10787677764892578, 0.11280632019042969, 0.1177358627319336, 0.1226654052734375, 0.1275949478149414, 0.1325244903564453, 0.13745403289794922, 0.14238357543945312, 0.14731311798095703, 0.15224266052246094, 0.15717220306396484, 0.16210174560546875, 0.16703128814697266, 0.17196083068847656, 0.17689037322998047, 0.18181991577148438, 0.18674945831298828, 0.1916790008544922, 0.1966085433959961, 0.2015380859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 18.0, 13.0, 43.0, 41.0, 60.0, 88.0, 115.0, 162.0, 256.0, 398.0, 699.0, 1396.0, 3001.0, 8158.0, 25654.0, 99953.0, 444980.0, 353295.0, 77085.0, 20536.0, 6942.0, 2666.0, 1181.0, 666.0, 364.0, 239.0, 162.0, 104.0, 71.0, 59.0, 42.0, 33.0, 27.0, 15.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3466796875, -0.334259033203125, -0.32183837890625, -0.309417724609375, -0.2969970703125, -0.284576416015625, -0.27215576171875, -0.259735107421875, -0.247314453125, -0.234893798828125, -0.22247314453125, -0.210052490234375, -0.1976318359375, -0.185211181640625, -0.17279052734375, -0.160369873046875, -0.14794921875, -0.135528564453125, -0.12310791015625, -0.110687255859375, -0.0982666015625, -0.085845947265625, -0.07342529296875, -0.061004638671875, -0.048583984375, -0.036163330078125, -0.02374267578125, -0.011322021484375, 0.0010986328125, 0.013519287109375, 0.02593994140625, 0.038360595703125, 0.05078125, 0.063201904296875, 0.07562255859375, 0.088043212890625, 0.1004638671875, 0.112884521484375, 0.12530517578125, 0.137725830078125, 0.150146484375, 0.162567138671875, 0.17498779296875, 0.187408447265625, 0.1998291015625, 0.212249755859375, 0.22467041015625, 0.237091064453125, 0.24951171875, 0.261932373046875, 0.27435302734375, 0.286773681640625, 0.2991943359375, 0.311614990234375, 0.32403564453125, 0.336456298828125, 0.348876953125, 0.361297607421875, 0.37371826171875, 0.386138916015625, 0.3985595703125, 0.410980224609375, 0.42340087890625, 0.435821533203125, 0.4482421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 2.0, 6.0, 3.0, 13.0, 6.0, 4.0, 13.0, 6.0, 18.0, 23.0, 14.0, 24.0, 24.0, 29.0, 27.0, 36.0, 36.0, 43.0, 40.0, 45.0, 42.0, 46.0, 34.0, 34.0, 41.0, 36.0, 36.0, 36.0, 33.0, 26.0, 35.0, 33.0, 20.0, 19.0, 16.0, 17.0, 14.0, 14.0, 13.0, 10.0, 3.0, 6.0, 6.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.415283203125, -0.4028434753417969, -0.39040374755859375, -0.3779640197753906, -0.3655242919921875, -0.3530845642089844, -0.34064483642578125, -0.3282051086425781, -0.315765380859375, -0.3033256530761719, -0.29088592529296875, -0.2784461975097656, -0.2660064697265625, -0.2535667419433594, -0.24112701416015625, -0.22868728637695312, -0.21624755859375, -0.20380783081054688, -0.19136810302734375, -0.17892837524414062, -0.1664886474609375, -0.15404891967773438, -0.14160919189453125, -0.12916946411132812, -0.116729736328125, -0.10429000854492188, -0.09185028076171875, -0.07941055297851562, -0.0669708251953125, -0.054531097412109375, -0.04209136962890625, -0.029651641845703125, -0.0172119140625, -0.004772186279296875, 0.00766754150390625, 0.020107269287109375, 0.0325469970703125, 0.044986724853515625, 0.05742645263671875, 0.06986618041992188, 0.082305908203125, 0.09474563598632812, 0.10718536376953125, 0.11962509155273438, 0.1320648193359375, 0.14450454711914062, 0.15694427490234375, 0.16938400268554688, 0.18182373046875, 0.19426345825195312, 0.20670318603515625, 0.21914291381835938, 0.2315826416015625, 0.24402236938476562, 0.25646209716796875, 0.2689018249511719, 0.281341552734375, 0.2937812805175781, 0.30622100830078125, 0.3186607360839844, 0.3311004638671875, 0.3435401916503906, 0.35597991943359375, 0.3684196472167969, 0.380859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 9.0, 6.0, 8.0, 18.0, 19.0, 38.0, 48.0, 87.0, 153.0, 341.0, 801.0, 2794.0, 20285.0, 966633.0, 50926.0, 4455.0, 1068.0, 376.0, 200.0, 97.0, 64.0, 34.0, 25.0, 18.0, 12.0, 8.0, 5.0, 5.0, 6.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.9736328125, -0.9507980346679688, -0.9279632568359375, -0.9051284790039062, -0.882293701171875, -0.8594589233398438, -0.8366241455078125, -0.8137893676757812, -0.79095458984375, -0.7681198120117188, -0.7452850341796875, -0.7224502563476562, -0.699615478515625, -0.6767807006835938, -0.6539459228515625, -0.6311111450195312, -0.6082763671875, -0.5854415893554688, -0.5626068115234375, -0.5397720336914062, -0.516937255859375, -0.49410247802734375, -0.4712677001953125, -0.44843292236328125, -0.42559814453125, -0.40276336669921875, -0.3799285888671875, -0.35709381103515625, -0.334259033203125, -0.31142425537109375, -0.2885894775390625, -0.26575469970703125, -0.242919921875, -0.22008514404296875, -0.1972503662109375, -0.17441558837890625, -0.151580810546875, -0.12874603271484375, -0.1059112548828125, -0.08307647705078125, -0.06024169921875, -0.03740692138671875, -0.0145721435546875, 0.00826263427734375, 0.031097412109375, 0.05393218994140625, 0.0767669677734375, 0.09960174560546875, 0.1224365234375, 0.14527130126953125, 0.1681060791015625, 0.19094085693359375, 0.213775634765625, 0.23661041259765625, 0.2594451904296875, 0.28227996826171875, 0.30511474609375, 0.32794952392578125, 0.3507843017578125, 0.37361907958984375, 0.396453857421875, 0.41928863525390625, 0.4421234130859375, 0.46495819091796875, 0.48779296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 10.0, 25.0, 61.0, 201.0, 340.0, 237.0, 85.0, 27.0, 10.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.069110870361328e-05, -6.741099059581757e-05, -6.413087248802185e-05, -6.0850754380226135e-05, -5.757063627243042e-05, -5.4290518164634705e-05, -5.101040005683899e-05, -4.7730281949043274e-05, -4.445016384124756e-05, -4.117004573345184e-05, -3.788992762565613e-05, -3.460980951786041e-05, -3.13296914100647e-05, -2.8049573302268982e-05, -2.4769455194473267e-05, -2.148933708667755e-05, -1.8209218978881836e-05, -1.492910087108612e-05, -1.1648982763290405e-05, -8.36886465549469e-06, -5.088746547698975e-06, -1.8086284399032593e-06, 1.471489667892456e-06, 4.751607775688171e-06, 8.031725883483887e-06, 1.1311843991279602e-05, 1.4591962099075317e-05, 1.7872080206871033e-05, 2.1152198314666748e-05, 2.4432316422462463e-05, 2.771243453025818e-05, 3.0992552638053894e-05, 3.427267074584961e-05, 3.7552788853645325e-05, 4.083290696144104e-05, 4.4113025069236755e-05, 4.739314317703247e-05, 5.0673261284828186e-05, 5.39533793926239e-05, 5.723349750041962e-05, 6.051361560821533e-05, 6.379373371601105e-05, 6.707385182380676e-05, 7.035396993160248e-05, 7.36340880393982e-05, 7.691420614719391e-05, 8.019432425498962e-05, 8.347444236278534e-05, 8.675456047058105e-05, 9.003467857837677e-05, 9.331479668617249e-05, 9.65949147939682e-05, 9.987503290176392e-05, 0.00010315515100955963, 0.00010643526911735535, 0.00010971538722515106, 0.00011299550533294678, 0.00011627562344074249, 0.00011955574154853821, 0.00012283585965633392, 0.00012611597776412964, 0.00012939609587192535, 0.00013267621397972107, 0.00013595633208751678, 0.0001392364501953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 8.0, 8.0, 5.0, 11.0, 18.0, 36.0, 48.0, 94.0, 175.0, 321.0, 705.0, 1727.0, 5702.0, 31807.0, 607456.0, 370236.0, 22882.0, 4550.0, 1485.0, 619.0, 273.0, 140.0, 92.0, 61.0, 33.0, 18.0, 10.0, 11.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404541015625, -0.39186859130859375, -0.3791961669921875, -0.36652374267578125, -0.353851318359375, -0.34117889404296875, -0.3285064697265625, -0.31583404541015625, -0.30316162109375, -0.29048919677734375, -0.2778167724609375, -0.26514434814453125, -0.252471923828125, -0.23979949951171875, -0.2271270751953125, -0.21445465087890625, -0.2017822265625, -0.18910980224609375, -0.1764373779296875, -0.16376495361328125, -0.151092529296875, -0.13842010498046875, -0.1257476806640625, -0.11307525634765625, -0.10040283203125, -0.08773040771484375, -0.0750579833984375, -0.06238555908203125, -0.049713134765625, -0.03704071044921875, -0.0243682861328125, -0.01169586181640625, 0.0009765625, 0.01364898681640625, 0.0263214111328125, 0.03899383544921875, 0.051666259765625, 0.06433868408203125, 0.0770111083984375, 0.08968353271484375, 0.10235595703125, 0.11502838134765625, 0.1277008056640625, 0.14037322998046875, 0.153045654296875, 0.16571807861328125, 0.1783905029296875, 0.19106292724609375, 0.2037353515625, 0.21640777587890625, 0.2290802001953125, 0.24175262451171875, 0.254425048828125, 0.26709747314453125, 0.2797698974609375, 0.29244232177734375, 0.30511474609375, 0.31778717041015625, 0.3304595947265625, 0.34313201904296875, 0.355804443359375, 0.36847686767578125, 0.3811492919921875, 0.39382171630859375, 0.406494140625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 13.0, 7.0, 14.0, 38.0, 43.0, 59.0, 83.0, 110.0, 130.0, 125.0, 112.0, 82.0, 60.0, 39.0, 29.0, 19.0, 8.0, 6.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6279296875, -0.6118545532226562, -0.5957794189453125, -0.5797042846679688, -0.563629150390625, -0.5475540161132812, -0.5314788818359375, -0.5154037475585938, -0.49932861328125, -0.48325347900390625, -0.4671783447265625, -0.45110321044921875, -0.435028076171875, -0.41895294189453125, -0.4028778076171875, -0.38680267333984375, -0.3707275390625, -0.35465240478515625, -0.3385772705078125, -0.32250213623046875, -0.306427001953125, -0.29035186767578125, -0.2742767333984375, -0.25820159912109375, -0.24212646484375, -0.22605133056640625, -0.2099761962890625, -0.19390106201171875, -0.177825927734375, -0.16175079345703125, -0.1456756591796875, -0.12960052490234375, -0.113525390625, -0.09745025634765625, -0.0813751220703125, -0.06529998779296875, -0.049224853515625, -0.03314971923828125, -0.0170745849609375, -0.00099945068359375, 0.01507568359375, 0.03115081787109375, 0.0472259521484375, 0.06330108642578125, 0.079376220703125, 0.09545135498046875, 0.1115264892578125, 0.12760162353515625, 0.1436767578125, 0.15975189208984375, 0.1758270263671875, 0.19190216064453125, 0.207977294921875, 0.22405242919921875, 0.2401275634765625, 0.25620269775390625, 0.27227783203125, 0.28835296630859375, 0.3044281005859375, 0.32050323486328125, 0.336578369140625, 0.35265350341796875, 0.3687286376953125, 0.38480377197265625, 0.40087890625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 10.0, 18.0, 100.0, 482.0, 285.0, 66.0, 21.0, 12.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.553358554840088, -6.238617897033691, -5.923877239227295, -5.609136581420898, -5.294395446777344, -4.979654788970947, -4.664914131164551, -4.350172996520996, -4.035432815551758, -3.7206921577453613, -3.4059512615203857, -3.0912106037139893, -2.7764697074890137, -2.461729049682617, -2.1469883918762207, -1.8322474956512451, -1.5175065994262695, -1.2027658224105835, -0.8880251049995422, -0.573284387588501, -0.25854361057281494, 0.056197166442871094, 0.3709378242492676, 0.6856787204742432, 1.0004193782806396, 1.3151601552963257, 1.6299009323120117, 1.9446415901184082, 2.2593822479248047, 2.5741231441497803, 2.8888638019561768, 3.2036046981811523, 3.518345832824707, 3.8330864906311035, 4.1478271484375, 4.462568283081055, 4.777308940887451, 5.092049598693848, 5.406790256500244, 5.721530914306641, 6.036272048950195, 6.351012706756592, 6.665753364562988, 6.980494499206543, 7.2952351570129395, 7.609975814819336, 7.924716472625732, 8.239457130432129, 8.554197311401367, 8.868938446044922, 9.18367862701416, 9.498419761657715, 9.813159942626953, 10.127901077270508, 10.442642211914062, 10.7573823928833, 11.072123527526855, 11.38686466217041, 11.701604843139648, 12.016345977783203, 12.331086158752441, 12.645827293395996, 12.960567474365234, 13.275308609008789, 13.590049743652344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 10.0, 7.0, 11.0, 15.0, 13.0, 25.0, 49.0, 69.0, 85.0, 106.0, 146.0, 114.0, 102.0, 63.0, 46.0, 33.0, 22.0, 17.0, 9.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.674504280090332, -6.442097187042236, -6.209690093994141, -5.977282524108887, -5.744875431060791, -5.512468338012695, -5.2800612449646, -5.047654151916504, -4.81524658203125, -4.582839488983154, -4.350432395935059, -4.118024826049805, -3.885617733001709, -3.6532106399536133, -3.4208035469055176, -3.1883962154388428, -2.955989122390747, -2.7235820293426514, -2.4911746978759766, -2.258767604827881, -2.026360273361206, -1.7939531803131104, -1.561545968055725, -1.3291387557983398, -1.0967315435409546, -0.8643243312835693, -0.6319171190261841, -0.3995099663734436, -0.16710275411605835, 0.06530439853668213, 0.2977116107940674, 0.5301188230514526, 0.7625260353088379, 0.9949332475662231, 1.2273404598236084, 1.459747552871704, 1.692154884338379, 1.9245619773864746, 2.1569690704345703, 2.389376401901245, 2.62178373336792, 2.8541908264160156, 3.0865981578826904, 3.319005250930786, 3.551412582397461, 3.7838196754455566, 4.016226768493652, 4.248634338378906, 4.481040954589844, 4.7134480476379395, 4.945855140686035, 5.178262710571289, 5.410669803619385, 5.6430768966674805, 5.875483989715576, 6.107891082763672, 6.340298652648926, 6.5727057456970215, 6.805112838745117, 7.037520408630371, 7.269927501678467, 7.5023345947265625, 7.734741687774658, 7.967148780822754, 8.199556350708008]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 8.0, 10.0, 30.0, 79.0, 178.0, 472.0, 1637.0, 6544.0, 46246.0, 4027632.0, 95827.0, 10805.0, 2631.0, 1053.0, 491.0, 244.0, 133.0, 100.0, 59.0, 35.0, 21.0, 19.0, 12.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9619140625, -0.9128875732421875, -0.863861083984375, -0.8148345947265625, -0.76580810546875, -0.7167816162109375, -0.667755126953125, -0.6187286376953125, -0.5697021484375, -0.5206756591796875, -0.471649169921875, -0.4226226806640625, -0.37359619140625, -0.3245697021484375, -0.275543212890625, -0.2265167236328125, -0.177490234375, -0.1284637451171875, -0.079437255859375, -0.0304107666015625, 0.01861572265625, 0.0676422119140625, 0.116668701171875, 0.1656951904296875, 0.2147216796875, 0.2637481689453125, 0.312774658203125, 0.3618011474609375, 0.41082763671875, 0.4598541259765625, 0.508880615234375, 0.5579071044921875, 0.60693359375, 0.6559600830078125, 0.704986572265625, 0.7540130615234375, 0.80303955078125, 0.8520660400390625, 0.901092529296875, 0.9501190185546875, 0.9991455078125, 1.0481719970703125, 1.097198486328125, 1.1462249755859375, 1.19525146484375, 1.2442779541015625, 1.293304443359375, 1.3423309326171875, 1.391357421875, 1.4403839111328125, 1.489410400390625, 1.5384368896484375, 1.58746337890625, 1.6364898681640625, 1.685516357421875, 1.7345428466796875, 1.7835693359375, 1.8325958251953125, 1.881622314453125, 1.9306488037109375, 1.97967529296875, 2.0287017822265625, 2.077728271484375, 2.1267547607421875, 2.17578125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 9.0, 15.0, 18.0, 25.0, 99.0, 381.0, 293.0, 51.0, 22.0, 12.0, 20.0, 8.0, 8.0, 5.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07965087890625, -0.07546138763427734, -0.07127189636230469, -0.06708240509033203, -0.06289291381835938, -0.05870342254638672, -0.05451393127441406, -0.050324440002441406, -0.04613494873046875, -0.041945457458496094, -0.03775596618652344, -0.03356647491455078, -0.029376983642578125, -0.02518749237060547, -0.020998001098632812, -0.016808509826660156, -0.0126190185546875, -0.008429527282714844, -0.0042400360107421875, -5.054473876953125e-05, 0.004138946533203125, 0.008328437805175781, 0.012517929077148438, 0.016707420349121094, 0.02089691162109375, 0.025086402893066406, 0.029275894165039062, 0.03346538543701172, 0.037654876708984375, 0.04184436798095703, 0.04603385925292969, 0.050223350524902344, 0.054412841796875, 0.058602333068847656, 0.06279182434082031, 0.06698131561279297, 0.07117080688476562, 0.07536029815673828, 0.07954978942871094, 0.0837392807006836, 0.08792877197265625, 0.0921182632446289, 0.09630775451660156, 0.10049724578857422, 0.10468673706054688, 0.10887622833251953, 0.11306571960449219, 0.11725521087646484, 0.1214447021484375, 0.12563419342041016, 0.1298236846923828, 0.13401317596435547, 0.13820266723632812, 0.14239215850830078, 0.14658164978027344, 0.1507711410522461, 0.15496063232421875, 0.1591501235961914, 0.16333961486816406, 0.16752910614013672, 0.17171859741210938, 0.17590808868408203, 0.1800975799560547, 0.18428707122802734, 0.1884765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 19.0, 22.0, 37.0, 39.0, 63.0, 68.0, 140.0, 186.0, 374.0, 675.0, 1293.0, 3087.0, 8565.0, 31072.0, 208494.0, 3495544.0, 385223.0, 42314.0, 10378.0, 3507.0, 1460.0, 702.0, 398.0, 185.0, 129.0, 78.0, 44.0, 41.0, 40.0, 23.0, 15.0, 12.0, 9.0, 7.0, 7.0, 4.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.541015625, -0.5239028930664062, -0.5067901611328125, -0.48967742919921875, -0.472564697265625, -0.45545196533203125, -0.4383392333984375, -0.42122650146484375, -0.40411376953125, -0.38700103759765625, -0.3698883056640625, -0.35277557373046875, -0.335662841796875, -0.31855010986328125, -0.3014373779296875, -0.28432464599609375, -0.2672119140625, -0.25009918212890625, -0.2329864501953125, -0.21587371826171875, -0.198760986328125, -0.18164825439453125, -0.1645355224609375, -0.14742279052734375, -0.13031005859375, -0.11319732666015625, -0.0960845947265625, -0.07897186279296875, -0.061859130859375, -0.04474639892578125, -0.0276336669921875, -0.01052093505859375, 0.006591796875, 0.02370452880859375, 0.0408172607421875, 0.05792999267578125, 0.075042724609375, 0.09215545654296875, 0.1092681884765625, 0.12638092041015625, 0.14349365234375, 0.16060638427734375, 0.1777191162109375, 0.19483184814453125, 0.211944580078125, 0.22905731201171875, 0.2461700439453125, 0.26328277587890625, 0.2803955078125, 0.29750823974609375, 0.3146209716796875, 0.33173370361328125, 0.348846435546875, 0.36595916748046875, 0.3830718994140625, 0.40018463134765625, 0.41729736328125, 0.43441009521484375, 0.4515228271484375, 0.46863555908203125, 0.485748291015625, 0.5028610229492188, 0.5199737548828125, 0.5370864868164062, 0.55419921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 7.0, 3.0, 10.0, 14.0, 20.0, 22.0, 29.0, 34.0, 53.0, 75.0, 138.0, 219.0, 370.0, 813.0, 1215.0, 478.0, 225.0, 108.0, 72.0, 47.0, 28.0, 18.0, 21.0, 12.0, 13.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08221435546875, -0.07868480682373047, -0.07515525817871094, -0.0716257095336914, -0.06809616088867188, -0.06456661224365234, -0.06103706359863281, -0.05750751495361328, -0.05397796630859375, -0.05044841766357422, -0.04691886901855469, -0.043389320373535156, -0.039859771728515625, -0.036330223083496094, -0.03280067443847656, -0.02927112579345703, -0.0257415771484375, -0.02221202850341797, -0.018682479858398438, -0.015152931213378906, -0.011623382568359375, -0.008093833923339844, -0.0045642852783203125, -0.0010347366333007812, 0.00249481201171875, 0.006024360656738281, 0.009553909301757812, 0.013083457946777344, 0.016613006591796875, 0.020142555236816406, 0.023672103881835938, 0.02720165252685547, 0.030731201171875, 0.03426074981689453, 0.03779029846191406, 0.041319847106933594, 0.044849395751953125, 0.048378944396972656, 0.05190849304199219, 0.05543804168701172, 0.05896759033203125, 0.06249713897705078, 0.06602668762207031, 0.06955623626708984, 0.07308578491210938, 0.0766153335571289, 0.08014488220214844, 0.08367443084716797, 0.0872039794921875, 0.09073352813720703, 0.09426307678222656, 0.0977926254272461, 0.10132217407226562, 0.10485172271728516, 0.10838127136230469, 0.11191082000732422, 0.11544036865234375, 0.11896991729736328, 0.12249946594238281, 0.12602901458740234, 0.12955856323242188, 0.1330881118774414, 0.13661766052246094, 0.14014720916748047, 0.1436767578125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 13.0, 58.0, 659.0, 251.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.830989837646484, -7.671131134033203, -7.511272430419922, -7.351413726806641, -7.191555023193359, -7.031696796417236, -6.871838092803955, -6.711979389190674, -6.552120685577393, -6.392261981964111, -6.23240327835083, -6.072544574737549, -5.912686347961426, -5.7528276443481445, -5.592968940734863, -5.433110237121582, -5.273251533508301, -5.1133928298950195, -4.953534126281738, -4.793675422668457, -4.633816719055176, -4.473958492279053, -4.3140997886657715, -4.15424108505249, -3.994382381439209, -3.8345236778259277, -3.6746649742126465, -3.5148065090179443, -3.354947805404663, -3.195089101791382, -3.0352306365966797, -2.8753719329833984, -2.7155137062072754, -2.555655002593994, -2.395796298980713, -2.2359378337860107, -2.0760791301727295, -1.9162204265594482, -1.7563618421554565, -1.5965032577514648, -1.4366445541381836, -1.2767858505249023, -1.1169272661209106, -0.9570686221122742, -0.7972099781036377, -0.6373513340950012, -0.47749269008636475, -0.31763410568237305, -0.1577754020690918, 0.0020832419395446777, 0.16194188594818115, 0.3218005299568176, 0.4816591739654541, 0.6415178179740906, 0.801376461982727, 0.9612350463867188, 1.12109375, 1.2809524536132812, 1.440811038017273, 1.6006696224212646, 1.760528326034546, 1.9203870296478271, 2.0802454948425293, 2.2401041984558105, 2.399962902069092]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 13.0, 10.0, 9.0, 13.0, 17.0, 18.0, 14.0, 22.0, 30.0, 47.0, 37.0, 32.0, 44.0, 43.0, 47.0, 56.0, 59.0, 48.0, 46.0, 53.0, 49.0, 37.0, 40.0, 35.0, 26.0, 21.0, 20.0, 14.0, 16.0, 9.0, 13.0, 5.0, 8.0, 6.0, 9.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5732935667037964, -0.5500187873840332, -0.52674400806427, -0.5034692287445068, -0.48019444942474365, -0.45691967010498047, -0.4336448907852173, -0.4103701114654541, -0.3870953321456909, -0.36382055282592773, -0.34054577350616455, -0.31727099418640137, -0.2939962148666382, -0.270721435546875, -0.24744665622711182, -0.22417187690734863, -0.20089709758758545, -0.17762231826782227, -0.15434753894805908, -0.1310727596282959, -0.10779798030853271, -0.08452320098876953, -0.06124842166900635, -0.037973642349243164, -0.01469886302947998, 0.008575916290283203, 0.03185069561004639, 0.05512547492980957, 0.07840025424957275, 0.10167503356933594, 0.12494981288909912, 0.1482245922088623, 0.17149943113327026, 0.19477421045303345, 0.21804898977279663, 0.24132376909255981, 0.264598548412323, 0.2878733277320862, 0.31114810705184937, 0.33442288637161255, 0.35769766569137573, 0.3809724450111389, 0.4042472243309021, 0.4275220036506653, 0.45079678297042847, 0.47407156229019165, 0.49734634160995483, 0.520621120929718, 0.5438959002494812, 0.5671706795692444, 0.5904454588890076, 0.6137202382087708, 0.6369950175285339, 0.6602697968482971, 0.6835445761680603, 0.7068193554878235, 0.7300941348075867, 0.7533689141273499, 0.776643693447113, 0.7999184727668762, 0.8231932520866394, 0.8464680314064026, 0.8697428107261658, 0.893017590045929, 0.9162923693656921]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 7.0, 9.0, 12.0, 10.0, 20.0, 27.0, 41.0, 54.0, 85.0, 124.0, 204.0, 306.0, 473.0, 954.0, 2250.0, 6315.0, 21057.0, 204200.0, 761976.0, 35317.0, 9165.0, 3100.0, 1301.0, 627.0, 307.0, 190.0, 136.0, 92.0, 51.0, 35.0, 26.0, 24.0, 18.0, 12.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0546875, -1.0197296142578125, -0.984771728515625, -0.9498138427734375, -0.91485595703125, -0.8798980712890625, -0.844940185546875, -0.8099822998046875, -0.7750244140625, -0.7400665283203125, -0.705108642578125, -0.6701507568359375, -0.63519287109375, -0.6002349853515625, -0.565277099609375, -0.5303192138671875, -0.495361328125, -0.4604034423828125, -0.425445556640625, -0.3904876708984375, -0.35552978515625, -0.3205718994140625, -0.285614013671875, -0.2506561279296875, -0.2156982421875, -0.1807403564453125, -0.145782470703125, -0.1108245849609375, -0.07586669921875, -0.0409088134765625, -0.005950927734375, 0.0290069580078125, 0.06396484375, 0.0989227294921875, 0.133880615234375, 0.1688385009765625, 0.20379638671875, 0.2387542724609375, 0.273712158203125, 0.3086700439453125, 0.3436279296875, 0.3785858154296875, 0.413543701171875, 0.4485015869140625, 0.48345947265625, 0.5184173583984375, 0.553375244140625, 0.5883331298828125, 0.623291015625, 0.6582489013671875, 0.693206787109375, 0.7281646728515625, 0.76312255859375, 0.7980804443359375, 0.833038330078125, 0.8679962158203125, 0.9029541015625, 0.9379119873046875, 0.972869873046875, 1.0078277587890625, 1.04278564453125, 1.0777435302734375, 1.112701416015625, 1.1476593017578125, 1.1826171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 13.0, 19.0, 33.0, 85.0, 164.0, 279.0, 213.0, 90.0, 40.0, 14.0, 9.0, 8.0, 6.0, 4.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07659912109375, -0.0722665786743164, -0.06793403625488281, -0.06360149383544922, -0.059268951416015625, -0.05493640899658203, -0.05060386657714844, -0.046271324157714844, -0.04193878173828125, -0.037606239318847656, -0.03327369689941406, -0.02894115447998047, -0.024608612060546875, -0.02027606964111328, -0.015943527221679688, -0.011610984802246094, -0.0072784423828125, -0.0029458999633789062, 0.0013866424560546875, 0.005719184875488281, 0.010051727294921875, 0.014384269714355469, 0.018716812133789062, 0.023049354553222656, 0.02738189697265625, 0.031714439392089844, 0.03604698181152344, 0.04037952423095703, 0.044712066650390625, 0.04904460906982422, 0.05337715148925781, 0.057709693908691406, 0.062042236328125, 0.0663747787475586, 0.07070732116699219, 0.07503986358642578, 0.07937240600585938, 0.08370494842529297, 0.08803749084472656, 0.09237003326416016, 0.09670257568359375, 0.10103511810302734, 0.10536766052246094, 0.10970020294189453, 0.11403274536132812, 0.11836528778076172, 0.12269783020019531, 0.1270303726196289, 0.1313629150390625, 0.1356954574584961, 0.1400279998779297, 0.14436054229736328, 0.14869308471679688, 0.15302562713623047, 0.15735816955566406, 0.16169071197509766, 0.16602325439453125, 0.17035579681396484, 0.17468833923339844, 0.17902088165283203, 0.18335342407226562, 0.18768596649169922, 0.1920185089111328, 0.1963510513305664, 0.20068359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 2.0, 7.0, 7.0, 7.0, 5.0, 21.0, 23.0, 24.0, 43.0, 53.0, 68.0, 117.0, 175.0, 279.0, 505.0, 1198.0, 3089.0, 11082.0, 56209.0, 376974.0, 498375.0, 78852.0, 14506.0, 3998.0, 1410.0, 625.0, 311.0, 180.0, 102.0, 77.0, 58.0, 37.0, 35.0, 27.0, 16.0, 11.0, 15.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.51953125, -0.5033416748046875, -0.487152099609375, -0.4709625244140625, -0.45477294921875, -0.4385833740234375, -0.422393798828125, -0.4062042236328125, -0.3900146484375, -0.3738250732421875, -0.357635498046875, -0.3414459228515625, -0.32525634765625, -0.3090667724609375, -0.292877197265625, -0.2766876220703125, -0.260498046875, -0.2443084716796875, -0.228118896484375, -0.2119293212890625, -0.19573974609375, -0.1795501708984375, -0.163360595703125, -0.1471710205078125, -0.1309814453125, -0.1147918701171875, -0.098602294921875, -0.0824127197265625, -0.06622314453125, -0.0500335693359375, -0.033843994140625, -0.0176544189453125, -0.00146484375, 0.0147247314453125, 0.030914306640625, 0.0471038818359375, 0.06329345703125, 0.0794830322265625, 0.095672607421875, 0.1118621826171875, 0.1280517578125, 0.1442413330078125, 0.160430908203125, 0.1766204833984375, 0.19281005859375, 0.2089996337890625, 0.225189208984375, 0.2413787841796875, 0.257568359375, 0.2737579345703125, 0.289947509765625, 0.3061370849609375, 0.32232666015625, 0.3385162353515625, 0.354705810546875, 0.3708953857421875, 0.3870849609375, 0.4032745361328125, 0.419464111328125, 0.4356536865234375, 0.45184326171875, 0.4680328369140625, 0.484222412109375, 0.5004119873046875, 0.5166015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 4.0, 8.0, 6.0, 16.0, 22.0, 31.0, 21.0, 19.0, 33.0, 25.0, 46.0, 46.0, 34.0, 41.0, 43.0, 46.0, 40.0, 52.0, 32.0, 59.0, 45.0, 37.0, 34.0, 36.0, 33.0, 29.0, 27.0, 29.0, 21.0, 13.0, 15.0, 10.0, 13.0, 8.0, 3.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.287841796875, -0.27878570556640625, -0.2697296142578125, -0.26067352294921875, -0.251617431640625, -0.24256134033203125, -0.2335052490234375, -0.22444915771484375, -0.21539306640625, -0.20633697509765625, -0.1972808837890625, -0.18822479248046875, -0.179168701171875, -0.17011260986328125, -0.1610565185546875, -0.15200042724609375, -0.1429443359375, -0.13388824462890625, -0.1248321533203125, -0.11577606201171875, -0.106719970703125, -0.09766387939453125, -0.0886077880859375, -0.07955169677734375, -0.07049560546875, -0.06143951416015625, -0.0523834228515625, -0.04332733154296875, -0.034271240234375, -0.02521514892578125, -0.0161590576171875, -0.00710296630859375, 0.001953125, 0.01100921630859375, 0.0200653076171875, 0.02912139892578125, 0.038177490234375, 0.04723358154296875, 0.0562896728515625, 0.06534576416015625, 0.07440185546875, 0.08345794677734375, 0.0925140380859375, 0.10157012939453125, 0.110626220703125, 0.11968231201171875, 0.1287384033203125, 0.13779449462890625, 0.1468505859375, 0.15590667724609375, 0.1649627685546875, 0.17401885986328125, 0.183074951171875, 0.19213104248046875, 0.2011871337890625, 0.21024322509765625, 0.21929931640625, 0.22835540771484375, 0.2374114990234375, 0.24646759033203125, 0.255523681640625, 0.26457977294921875, 0.2736358642578125, 0.28269195556640625, 0.291748046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 14.0, 16.0, 19.0, 39.0, 72.0, 128.0, 286.0, 609.0, 2054.0, 12650.0, 957608.0, 69166.0, 4039.0, 1105.0, 361.0, 166.0, 71.0, 55.0, 26.0, 13.0, 10.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.0399627685546875, -1.003753662109375, -0.9675445556640625, -0.93133544921875, -0.8951263427734375, -0.858917236328125, -0.8227081298828125, -0.7864990234375, -0.7502899169921875, -0.714080810546875, -0.6778717041015625, -0.64166259765625, -0.6054534912109375, -0.569244384765625, -0.5330352783203125, -0.496826171875, -0.4606170654296875, -0.424407958984375, -0.3881988525390625, -0.35198974609375, -0.3157806396484375, -0.279571533203125, -0.2433624267578125, -0.2071533203125, -0.1709442138671875, -0.134735107421875, -0.0985260009765625, -0.06231689453125, -0.0261077880859375, 0.010101318359375, 0.0463104248046875, 0.08251953125, 0.1187286376953125, 0.154937744140625, 0.1911468505859375, 0.22735595703125, 0.2635650634765625, 0.299774169921875, 0.3359832763671875, 0.3721923828125, 0.4084014892578125, 0.444610595703125, 0.4808197021484375, 0.51702880859375, 0.5532379150390625, 0.589447021484375, 0.6256561279296875, 0.661865234375, 0.6980743408203125, 0.734283447265625, 0.7704925537109375, 0.80670166015625, 0.8429107666015625, 0.879119873046875, 0.9153289794921875, 0.9515380859375, 0.9877471923828125, 1.023956298828125, 1.0601654052734375, 1.09637451171875, 1.1325836181640625, 1.168792724609375, 1.2050018310546875, 1.2412109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 8.0, 13.0, 22.0, 42.0, 94.0, 160.0, 236.0, 193.0, 100.0, 63.0, 26.0, 23.0, 11.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314018249511719e-05, -3.1149014830589294e-05, -2.91578471660614e-05, -2.7166679501533508e-05, -2.5175511837005615e-05, -2.3184344172477722e-05, -2.119317650794983e-05, -1.9202008843421936e-05, -1.7210841178894043e-05, -1.521967351436615e-05, -1.3228505849838257e-05, -1.1237338185310364e-05, -9.24617052078247e-06, -7.255002856254578e-06, -5.2638351917266846e-06, -3.2726675271987915e-06, -1.2814998626708984e-06, 7.096678018569946e-07, 2.7008354663848877e-06, 4.692003130912781e-06, 6.683170795440674e-06, 8.674338459968567e-06, 1.066550612449646e-05, 1.2656673789024353e-05, 1.4647841453552246e-05, 1.663900911808014e-05, 1.8630176782608032e-05, 2.0621344447135925e-05, 2.261251211166382e-05, 2.460367977619171e-05, 2.6594847440719604e-05, 2.8586015105247498e-05, 3.057718276977539e-05, 3.2568350434303284e-05, 3.455951809883118e-05, 3.655068576335907e-05, 3.854185342788696e-05, 4.0533021092414856e-05, 4.252418875694275e-05, 4.451535642147064e-05, 4.6506524085998535e-05, 4.849769175052643e-05, 5.048885941505432e-05, 5.2480027079582214e-05, 5.447119474411011e-05, 5.6462362408638e-05, 5.8453530073165894e-05, 6.044469773769379e-05, 6.243586540222168e-05, 6.442703306674957e-05, 6.641820073127747e-05, 6.840936839580536e-05, 7.040053606033325e-05, 7.239170372486115e-05, 7.438287138938904e-05, 7.637403905391693e-05, 7.836520671844482e-05, 8.035637438297272e-05, 8.234754204750061e-05, 8.43387097120285e-05, 8.63298773765564e-05, 8.832104504108429e-05, 9.031221270561218e-05, 9.230338037014008e-05, 9.429454803466797e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 12.0, 19.0, 34.0, 44.0, 61.0, 130.0, 277.0, 753.0, 2243.0, 12136.0, 272113.0, 732733.0, 23419.0, 3114.0, 851.0, 301.0, 135.0, 68.0, 33.0, 20.0, 16.0, 13.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7412109375, -0.7212600708007812, -0.7013092041015625, -0.6813583374023438, -0.661407470703125, -0.6414566040039062, -0.6215057373046875, -0.6015548706054688, -0.58160400390625, -0.5616531372070312, -0.5417022705078125, -0.5217514038085938, -0.501800537109375, -0.48184967041015625, -0.4618988037109375, -0.44194793701171875, -0.4219970703125, -0.40204620361328125, -0.3820953369140625, -0.36214447021484375, -0.342193603515625, -0.32224273681640625, -0.3022918701171875, -0.28234100341796875, -0.26239013671875, -0.24243927001953125, -0.2224884033203125, -0.20253753662109375, -0.182586669921875, -0.16263580322265625, -0.1426849365234375, -0.12273406982421875, -0.102783203125, -0.08283233642578125, -0.0628814697265625, -0.04293060302734375, -0.022979736328125, -0.00302886962890625, 0.0169219970703125, 0.03687286376953125, 0.05682373046875, 0.07677459716796875, 0.0967254638671875, 0.11667633056640625, 0.136627197265625, 0.15657806396484375, 0.1765289306640625, 0.19647979736328125, 0.2164306640625, 0.23638153076171875, 0.2563323974609375, 0.27628326416015625, 0.296234130859375, 0.31618499755859375, 0.3361358642578125, 0.35608673095703125, 0.37603759765625, 0.39598846435546875, 0.4159393310546875, 0.43589019775390625, 0.455841064453125, 0.47579193115234375, 0.4957427978515625, 0.5156936645507812, 0.53564453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 4.0, 7.0, 11.0, 25.0, 13.0, 22.0, 32.0, 31.0, 64.0, 88.0, 91.0, 107.0, 102.0, 80.0, 85.0, 70.0, 49.0, 39.0, 26.0, 21.0, 8.0, 10.0, 8.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40478515625, -0.39360809326171875, -0.3824310302734375, -0.37125396728515625, -0.360076904296875, -0.34889984130859375, -0.3377227783203125, -0.32654571533203125, -0.31536865234375, -0.30419158935546875, -0.2930145263671875, -0.28183746337890625, -0.270660400390625, -0.25948333740234375, -0.2483062744140625, -0.23712921142578125, -0.2259521484375, -0.21477508544921875, -0.2035980224609375, -0.19242095947265625, -0.181243896484375, -0.17006683349609375, -0.1588897705078125, -0.14771270751953125, -0.13653564453125, -0.12535858154296875, -0.1141815185546875, -0.10300445556640625, -0.091827392578125, -0.08065032958984375, -0.0694732666015625, -0.05829620361328125, -0.047119140625, -0.03594207763671875, -0.0247650146484375, -0.01358795166015625, -0.002410888671875, 0.00876617431640625, 0.0199432373046875, 0.03112030029296875, 0.04229736328125, 0.05347442626953125, 0.0646514892578125, 0.07582855224609375, 0.087005615234375, 0.09818267822265625, 0.1093597412109375, 0.12053680419921875, 0.1317138671875, 0.14289093017578125, 0.1540679931640625, 0.16524505615234375, 0.176422119140625, 0.18759918212890625, 0.1987762451171875, 0.20995330810546875, 0.22113037109375, 0.23230743408203125, 0.2434844970703125, 0.25466156005859375, 0.265838623046875, 0.27701568603515625, 0.2881927490234375, 0.29936981201171875, 0.310546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 24.0, 248.0, 601.0, 93.0, 15.0, 6.0, 7.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.830286026000977, -13.503093719482422, -13.17590045928955, -12.848708152770996, -12.521514892578125, -12.19432258605957, -11.8671293258667, -11.539937019348145, -11.212743759155273, -10.885551452636719, -10.558358192443848, -10.231165885925293, -9.903972625732422, -9.576780319213867, -9.249587059020996, -8.922394752502441, -8.59520149230957, -8.268009185791016, -7.9408159255981445, -7.613623142242432, -7.286430358886719, -6.959237575531006, -6.632044792175293, -6.304852485656738, -5.977660179138184, -5.650467395782471, -5.323274612426758, -4.996081829071045, -4.668889045715332, -4.341696262359619, -4.014503479003906, -3.6873109340667725, -3.3601179122924805, -3.0329251289367676, -2.7057323455810547, -2.378539562225342, -2.051346778869629, -1.7241541147232056, -1.3969614505767822, -1.0697686672210693, -0.7425758838653564, -0.41538313031196594, -0.08819037675857544, 0.23900234699249268, 0.5661951303482056, 0.8933879137039185, 1.2205805778503418, 1.5477733612060547, 1.8749661445617676, 2.2021589279174805, 2.5293517112731934, 2.8565444946289062, 3.183737277984619, 3.510930061340332, 3.838122606277466, 4.165315628051758, 4.4925079345703125, 4.819700717926025, 5.146893501281738, 5.474086284637451, 5.801279067993164, 6.128471851348877, 6.45566463470459, 6.7828569412231445, 7.110050201416016]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 4.0, 6.0, 21.0, 30.0, 29.0, 57.0, 61.0, 72.0, 109.0, 100.0, 95.0, 82.0, 83.0, 58.0, 53.0, 37.0, 19.0, 21.0, 13.0, 11.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.019100189208984, -3.899399995803833, -3.7796995639801025, -3.659999370574951, -3.5402991771698, -3.4205989837646484, -3.300898551940918, -3.1811983585357666, -3.0614981651306152, -2.941797971725464, -2.8220975399017334, -2.702397346496582, -2.5826971530914307, -2.4629969596862793, -2.343296527862549, -2.2235963344573975, -2.103896141052246, -1.9841958284378052, -1.8644956350326538, -1.744795322418213, -1.6250951290130615, -1.5053948163986206, -1.3856945037841797, -1.2659943103790283, -1.1462938785552979, -1.026593565940857, -0.9068933725357056, -0.7871930599212646, -0.6674928665161133, -0.5477925539016724, -0.4280923008918762, -0.3083920478820801, -0.1886918544769287, -0.06899159401655197, 0.05070866644382477, 0.1704089343547821, 0.29010918736457825, 0.4098094701766968, 0.5295097231864929, 0.6492099761962891, 0.7689102292060852, 0.8886104822158813, 1.0083107948303223, 1.1280109882354736, 1.2477113008499146, 1.3674116134643555, 1.4871118068695068, 1.6068120002746582, 1.7265123128890991, 1.84621262550354, 1.9659128189086914, 2.0856130123138428, 2.2053134441375732, 2.3250136375427246, 2.444713830947876, 2.5644140243530273, 2.684114456176758, 2.803814649581909, 2.9235150814056396, 3.043215274810791, 3.1629154682159424, 3.2826156616210938, 3.402316093444824, 3.5220162868499756, 3.641716480255127]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 18.0, 20.0, 30.0, 54.0, 107.0, 201.0, 415.0, 980.0, 3144.0, 18815.0, 4089238.0, 72071.0, 5894.0, 1589.0, 641.0, 332.0, 197.0, 131.0, 97.0, 56.0, 58.0, 37.0, 28.0, 26.0, 20.0, 11.0, 10.0, 11.0, 8.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7626953125, -1.6815338134765625, -1.600372314453125, -1.5192108154296875, -1.43804931640625, -1.3568878173828125, -1.275726318359375, -1.1945648193359375, -1.1134033203125, -1.0322418212890625, -0.951080322265625, -0.8699188232421875, -0.78875732421875, -0.7075958251953125, -0.626434326171875, -0.5452728271484375, -0.464111328125, -0.3829498291015625, -0.301788330078125, -0.2206268310546875, -0.13946533203125, -0.0583038330078125, 0.022857666015625, 0.1040191650390625, 0.1851806640625, 0.2663421630859375, 0.347503662109375, 0.4286651611328125, 0.50982666015625, 0.5909881591796875, 0.672149658203125, 0.7533111572265625, 0.83447265625, 0.9156341552734375, 0.996795654296875, 1.0779571533203125, 1.15911865234375, 1.2402801513671875, 1.321441650390625, 1.4026031494140625, 1.4837646484375, 1.5649261474609375, 1.646087646484375, 1.7272491455078125, 1.80841064453125, 1.8895721435546875, 1.970733642578125, 2.0518951416015625, 2.133056640625, 2.2142181396484375, 2.295379638671875, 2.3765411376953125, 2.45770263671875, 2.5388641357421875, 2.620025634765625, 2.7011871337890625, 2.7823486328125, 2.8635101318359375, 2.944671630859375, 3.0258331298828125, 3.10699462890625, 3.1881561279296875, 3.269317626953125, 3.3504791259765625, 3.431640625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 6.0, 15.0, 22.0, 46.0, 93.0, 191.0, 279.0, 188.0, 85.0, 37.0, 14.0, 11.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.095947265625, -0.09148406982421875, -0.0870208740234375, -0.08255767822265625, -0.078094482421875, -0.07363128662109375, -0.0691680908203125, -0.06470489501953125, -0.06024169921875, -0.05577850341796875, -0.0513153076171875, -0.04685211181640625, -0.042388916015625, -0.03792572021484375, -0.0334625244140625, -0.02899932861328125, -0.0245361328125, -0.02007293701171875, -0.0156097412109375, -0.01114654541015625, -0.006683349609375, -0.00222015380859375, 0.0022430419921875, 0.00670623779296875, 0.01116943359375, 0.01563262939453125, 0.0200958251953125, 0.02455902099609375, 0.029022216796875, 0.03348541259765625, 0.0379486083984375, 0.04241180419921875, 0.046875, 0.05133819580078125, 0.0558013916015625, 0.06026458740234375, 0.064727783203125, 0.06919097900390625, 0.0736541748046875, 0.07811737060546875, 0.08258056640625, 0.08704376220703125, 0.0915069580078125, 0.09597015380859375, 0.100433349609375, 0.10489654541015625, 0.1093597412109375, 0.11382293701171875, 0.1182861328125, 0.12274932861328125, 0.1272125244140625, 0.13167572021484375, 0.136138916015625, 0.14060211181640625, 0.1450653076171875, 0.14952850341796875, 0.15399169921875, 0.15845489501953125, 0.1629180908203125, 0.16738128662109375, 0.171844482421875, 0.17630767822265625, 0.1807708740234375, 0.18523406982421875, 0.189697265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 11.0, 10.0, 8.0, 20.0, 40.0, 105.0, 219.0, 734.0, 7631.0, 4098223.0, 84878.0, 1777.0, 321.0, 133.0, 59.0, 30.0, 23.0, 12.0, 11.0, 13.0, 4.0, 6.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.21484375, -4.12066650390625, -4.0264892578125, -3.93231201171875, -3.838134765625, -3.74395751953125, -3.6497802734375, -3.55560302734375, -3.46142578125, -3.36724853515625, -3.2730712890625, -3.17889404296875, -3.084716796875, -2.99053955078125, -2.8963623046875, -2.80218505859375, -2.7080078125, -2.61383056640625, -2.5196533203125, -2.42547607421875, -2.331298828125, -2.23712158203125, -2.1429443359375, -2.04876708984375, -1.95458984375, -1.86041259765625, -1.7662353515625, -1.67205810546875, -1.577880859375, -1.48370361328125, -1.3895263671875, -1.29534912109375, -1.201171875, -1.10699462890625, -1.0128173828125, -0.91864013671875, -0.824462890625, -0.73028564453125, -0.6361083984375, -0.54193115234375, -0.44775390625, -0.35357666015625, -0.2593994140625, -0.16522216796875, -0.071044921875, 0.02313232421875, 0.1173095703125, 0.21148681640625, 0.3056640625, 0.39984130859375, 0.4940185546875, 0.58819580078125, 0.682373046875, 0.77655029296875, 0.8707275390625, 0.96490478515625, 1.05908203125, 1.15325927734375, 1.2474365234375, 1.34161376953125, 1.435791015625, 1.52996826171875, 1.6241455078125, 1.71832275390625, 1.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 6.0, 8.0, 8.0, 13.0, 18.0, 21.0, 38.0, 54.0, 92.0, 192.0, 666.0, 1746.0, 668.0, 231.0, 116.0, 67.0, 41.0, 26.0, 13.0, 11.0, 7.0, 7.0, 5.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10626220703125, -0.10109424591064453, -0.09592628479003906, -0.0907583236694336, -0.08559036254882812, -0.08042240142822266, -0.07525444030761719, -0.07008647918701172, -0.06491851806640625, -0.05975055694580078, -0.05458259582519531, -0.049414634704589844, -0.044246673583984375, -0.039078712463378906, -0.03391075134277344, -0.02874279022216797, -0.0235748291015625, -0.01840686798095703, -0.013238906860351562, -0.008070945739746094, -0.002902984619140625, 0.0022649765014648438, 0.0074329376220703125, 0.012600898742675781, 0.01776885986328125, 0.02293682098388672, 0.028104782104492188, 0.033272743225097656, 0.038440704345703125, 0.043608665466308594, 0.04877662658691406, 0.05394458770751953, 0.059112548828125, 0.06428050994873047, 0.06944847106933594, 0.0746164321899414, 0.07978439331054688, 0.08495235443115234, 0.09012031555175781, 0.09528827667236328, 0.10045623779296875, 0.10562419891357422, 0.11079216003417969, 0.11596012115478516, 0.12112808227539062, 0.1262960433959961, 0.13146400451660156, 0.13663196563720703, 0.1417999267578125, 0.14696788787841797, 0.15213584899902344, 0.1573038101196289, 0.16247177124023438, 0.16763973236083984, 0.1728076934814453, 0.17797565460205078, 0.18314361572265625, 0.18831157684326172, 0.1934795379638672, 0.19864749908447266, 0.20381546020507812, 0.2089834213256836, 0.21415138244628906, 0.21931934356689453, 0.2244873046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 17.0, 109.0, 386.0, 314.0, 105.0, 26.0, 19.0, 6.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2960350513458252, -1.2439188957214355, -1.1918028593063354, -1.1396867036819458, -1.0875705480575562, -1.035454511642456, -0.9833383560180664, -0.9312222599983215, -0.8791061639785767, -0.8269900679588318, -0.7748739123344421, -0.7227578163146973, -0.6706417202949524, -0.6185256242752075, -0.5664094686508179, -0.514293372631073, -0.46217721700668335, -0.4100610911846161, -0.3579449951648712, -0.30582886934280396, -0.2537127733230591, -0.20159664750099182, -0.14948052167892456, -0.09736442565917969, -0.04524829983711243, 0.006867814809083939, 0.058983929455280304, 0.11110004782676697, 0.16321615874767303, 0.2153322696685791, 0.26744839549064636, 0.31956449151039124, 0.3716806173324585, 0.42379674315452576, 0.47591283917427063, 0.5280289649963379, 0.5801450610160828, 0.6322611570358276, 0.6843773126602173, 0.7364934086799622, 0.788609504699707, 0.8407256007194519, 0.8928417563438416, 0.9449578523635864, 0.9970739483833313, 1.0491900444030762, 1.1013062000274658, 1.1534223556518555, 1.2055385112762451, 1.2576546669006348, 1.3097707033157349, 1.3618868589401245, 1.4140030145645142, 1.4661190509796143, 1.518235206604004, 1.5703513622283936, 1.6224673986434937, 1.6745835542678833, 1.7266995906829834, 1.778815746307373, 1.8309319019317627, 1.8830479383468628, 1.9351640939712524, 1.9872801303863525, 2.039396286010742]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 9.0, 8.0, 17.0, 15.0, 13.0, 21.0, 35.0, 22.0, 25.0, 37.0, 37.0, 47.0, 53.0, 48.0, 50.0, 54.0, 59.0, 50.0, 47.0, 54.0, 39.0, 30.0, 36.0, 29.0, 34.0, 17.0, 25.0, 13.0, 13.0, 9.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4939628839492798, -0.47825679183006287, -0.46255072951316833, -0.4468446373939514, -0.4311385750770569, -0.41543248295783997, -0.39972639083862305, -0.3840203285217285, -0.3683142364025116, -0.3526081442832947, -0.33690208196640015, -0.3211959898471832, -0.3054898977279663, -0.2897838354110718, -0.27407774329185486, -0.25837165117263794, -0.2426655888557434, -0.22695951163768768, -0.21125343441963196, -0.19554734230041504, -0.17984126508235931, -0.1641351878643036, -0.14842909574508667, -0.13272301852703094, -0.11701694130897522, -0.1013108640909195, -0.08560477942228317, -0.06989869475364685, -0.054192617535591125, -0.0384865403175354, -0.02278045564889908, -0.007074370980262756, 0.008631765842437744, 0.024337846785783768, 0.04004392772912979, 0.055750008672475815, 0.07145608961582184, 0.08716216683387756, 0.10286825150251389, 0.11857433617115021, 0.13428041338920593, 0.14998649060726166, 0.16569256782531738, 0.1813986599445343, 0.19710473716259003, 0.21281081438064575, 0.22851690649986267, 0.2442229837179184, 0.2599290609359741, 0.27563515305519104, 0.29134121537208557, 0.3070473074913025, 0.322753369808197, 0.33845946192741394, 0.35416555404663086, 0.3698716163635254, 0.3855777084827423, 0.40128380060195923, 0.41698986291885376, 0.4326959550380707, 0.4484020471572876, 0.46410810947418213, 0.47981420159339905, 0.49552029371261597, 0.5112263560295105]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 13.0, 17.0, 22.0, 25.0, 45.0, 71.0, 87.0, 147.0, 260.0, 386.0, 813.0, 2207.0, 12027.0, 666573.0, 353199.0, 9063.0, 1828.0, 691.0, 406.0, 238.0, 135.0, 89.0, 68.0, 39.0, 34.0, 14.0, 17.0, 8.0, 9.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4560546875, -1.4118499755859375, -1.367645263671875, -1.3234405517578125, -1.27923583984375, -1.2350311279296875, -1.190826416015625, -1.1466217041015625, -1.1024169921875, -1.0582122802734375, -1.014007568359375, -0.9698028564453125, -0.92559814453125, -0.8813934326171875, -0.837188720703125, -0.7929840087890625, -0.748779296875, -0.7045745849609375, -0.660369873046875, -0.6161651611328125, -0.57196044921875, -0.5277557373046875, -0.483551025390625, -0.4393463134765625, -0.3951416015625, -0.3509368896484375, -0.306732177734375, -0.2625274658203125, -0.21832275390625, -0.1741180419921875, -0.129913330078125, -0.0857086181640625, -0.04150390625, 0.0027008056640625, 0.046905517578125, 0.0911102294921875, 0.13531494140625, 0.1795196533203125, 0.223724365234375, 0.2679290771484375, 0.3121337890625, 0.3563385009765625, 0.400543212890625, 0.4447479248046875, 0.48895263671875, 0.5331573486328125, 0.577362060546875, 0.6215667724609375, 0.665771484375, 0.7099761962890625, 0.754180908203125, 0.7983856201171875, 0.84259033203125, 0.8867950439453125, 0.930999755859375, 0.9752044677734375, 1.0194091796875, 1.0636138916015625, 1.107818603515625, 1.1520233154296875, 1.19622802734375, 1.2404327392578125, 1.284637451171875, 1.3288421630859375, 1.373046875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 12.0, 30.0, 107.0, 245.0, 268.0, 196.0, 79.0, 27.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09669113159179688, -0.09218597412109375, -0.08768081665039062, -0.0831756591796875, -0.07867050170898438, -0.07416534423828125, -0.06966018676757812, -0.065155029296875, -0.060649871826171875, -0.05614471435546875, -0.051639556884765625, -0.0471343994140625, -0.042629241943359375, -0.03812408447265625, -0.033618927001953125, -0.02911376953125, -0.024608612060546875, -0.02010345458984375, -0.015598297119140625, -0.0110931396484375, -0.006587982177734375, -0.00208282470703125, 0.002422332763671875, 0.006927490234375, 0.011432647705078125, 0.01593780517578125, 0.020442962646484375, 0.0249481201171875, 0.029453277587890625, 0.03395843505859375, 0.038463592529296875, 0.04296875, 0.047473907470703125, 0.05197906494140625, 0.056484222412109375, 0.0609893798828125, 0.06549453735351562, 0.06999969482421875, 0.07450485229492188, 0.079010009765625, 0.08351516723632812, 0.08802032470703125, 0.09252548217773438, 0.0970306396484375, 0.10153579711914062, 0.10604095458984375, 0.11054611206054688, 0.11505126953125, 0.11955642700195312, 0.12406158447265625, 0.12856674194335938, 0.1330718994140625, 0.13757705688476562, 0.14208221435546875, 0.14658737182617188, 0.151092529296875, 0.15559768676757812, 0.16010284423828125, 0.16460800170898438, 0.1691131591796875, 0.17361831665039062, 0.17812347412109375, 0.18262863159179688, 0.1871337890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 9.0, 6.0, 5.0, 9.0, 17.0, 17.0, 22.0, 41.0, 49.0, 68.0, 105.0, 139.0, 183.0, 296.0, 493.0, 865.0, 2036.0, 6123.0, 23047.0, 129338.0, 662573.0, 180930.0, 29966.0, 7322.0, 2343.0, 984.0, 555.0, 312.0, 185.0, 131.0, 111.0, 68.0, 61.0, 50.0, 29.0, 17.0, 14.0, 11.0, 7.0, 10.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77587890625, -0.754669189453125, -0.73345947265625, -0.712249755859375, -0.6910400390625, -0.669830322265625, -0.64862060546875, -0.627410888671875, -0.606201171875, -0.584991455078125, -0.56378173828125, -0.542572021484375, -0.5213623046875, -0.500152587890625, -0.47894287109375, -0.457733154296875, -0.4365234375, -0.415313720703125, -0.39410400390625, -0.372894287109375, -0.3516845703125, -0.330474853515625, -0.30926513671875, -0.288055419921875, -0.266845703125, -0.245635986328125, -0.22442626953125, -0.203216552734375, -0.1820068359375, -0.160797119140625, -0.13958740234375, -0.118377685546875, -0.09716796875, -0.075958251953125, -0.05474853515625, -0.033538818359375, -0.0123291015625, 0.008880615234375, 0.03009033203125, 0.051300048828125, 0.072509765625, 0.093719482421875, 0.11492919921875, 0.136138916015625, 0.1573486328125, 0.178558349609375, 0.19976806640625, 0.220977783203125, 0.2421875, 0.263397216796875, 0.28460693359375, 0.305816650390625, 0.3270263671875, 0.348236083984375, 0.36944580078125, 0.390655517578125, 0.411865234375, 0.433074951171875, 0.45428466796875, 0.475494384765625, 0.4967041015625, 0.517913818359375, 0.53912353515625, 0.560333251953125, 0.58154296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 5.0, 5.0, 9.0, 7.0, 5.0, 24.0, 19.0, 18.0, 25.0, 31.0, 28.0, 35.0, 46.0, 52.0, 41.0, 50.0, 41.0, 61.0, 50.0, 55.0, 43.0, 40.0, 55.0, 34.0, 29.0, 25.0, 21.0, 28.0, 29.0, 12.0, 11.0, 14.0, 8.0, 9.0, 4.0, 6.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.383056640625, -0.37284088134765625, -0.3626251220703125, -0.35240936279296875, -0.342193603515625, -0.33197784423828125, -0.3217620849609375, -0.31154632568359375, -0.30133056640625, -0.29111480712890625, -0.2808990478515625, -0.27068328857421875, -0.260467529296875, -0.25025177001953125, -0.2400360107421875, -0.22982025146484375, -0.2196044921875, -0.20938873291015625, -0.1991729736328125, -0.18895721435546875, -0.178741455078125, -0.16852569580078125, -0.1583099365234375, -0.14809417724609375, -0.13787841796875, -0.12766265869140625, -0.1174468994140625, -0.10723114013671875, -0.097015380859375, -0.08679962158203125, -0.0765838623046875, -0.06636810302734375, -0.05615234375, -0.04593658447265625, -0.0357208251953125, -0.02550506591796875, -0.015289306640625, -0.00507354736328125, 0.0051422119140625, 0.01535797119140625, 0.02557373046875, 0.03578948974609375, 0.0460052490234375, 0.05622100830078125, 0.066436767578125, 0.07665252685546875, 0.0868682861328125, 0.09708404541015625, 0.1072998046875, 0.11751556396484375, 0.1277313232421875, 0.13794708251953125, 0.148162841796875, 0.15837860107421875, 0.1685943603515625, 0.17881011962890625, 0.18902587890625, 0.19924163818359375, 0.2094573974609375, 0.21967315673828125, 0.229888916015625, 0.24010467529296875, 0.2503204345703125, 0.26053619384765625, 0.270751953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 11.0, 22.0, 24.0, 37.0, 65.0, 133.0, 309.0, 845.0, 3291.0, 41978.0, 911230.0, 84166.0, 4641.0, 1032.0, 377.0, 152.0, 89.0, 46.0, 30.0, 16.0, 18.0, 8.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75244140625, -0.7270126342773438, -0.7015838623046875, -0.6761550903320312, -0.650726318359375, -0.6252975463867188, -0.5998687744140625, -0.5744400024414062, -0.54901123046875, -0.5235824584960938, -0.4981536865234375, -0.47272491455078125, -0.447296142578125, -0.42186737060546875, -0.3964385986328125, -0.37100982666015625, -0.3455810546875, -0.32015228271484375, -0.2947235107421875, -0.26929473876953125, -0.243865966796875, -0.21843719482421875, -0.1930084228515625, -0.16757965087890625, -0.14215087890625, -0.11672210693359375, -0.0912933349609375, -0.06586456298828125, -0.040435791015625, -0.01500701904296875, 0.0104217529296875, 0.03585052490234375, 0.061279296875, 0.08670806884765625, 0.1121368408203125, 0.13756561279296875, 0.162994384765625, 0.18842315673828125, 0.2138519287109375, 0.23928070068359375, 0.26470947265625, 0.29013824462890625, 0.3155670166015625, 0.34099578857421875, 0.366424560546875, 0.39185333251953125, 0.4172821044921875, 0.44271087646484375, 0.4681396484375, 0.49356842041015625, 0.5189971923828125, 0.5444259643554688, 0.569854736328125, 0.5952835083007812, 0.6207122802734375, 0.6461410522460938, 0.67156982421875, 0.6969985961914062, 0.7224273681640625, 0.7478561401367188, 0.773284912109375, 0.7987136840820312, 0.8241424560546875, 0.8495712280273438, 0.875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 4.0, 9.0, 6.0, 9.0, 25.0, 22.0, 31.0, 59.0, 83.0, 100.0, 139.0, 130.0, 101.0, 78.0, 45.0, 39.0, 22.0, 24.0, 18.0, 11.0, 5.0, 10.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0411949157714844e-05, -3.8904137909412384e-05, -3.7396326661109924e-05, -3.5888515412807465e-05, -3.4380704164505005e-05, -3.2872892916202545e-05, -3.1365081667900085e-05, -2.9857270419597626e-05, -2.8349459171295166e-05, -2.6841647922992706e-05, -2.5333836674690247e-05, -2.3826025426387787e-05, -2.2318214178085327e-05, -2.0810402929782867e-05, -1.9302591681480408e-05, -1.7794780433177948e-05, -1.6286969184875488e-05, -1.4779157936573029e-05, -1.3271346688270569e-05, -1.1763535439968109e-05, -1.025572419166565e-05, -8.74791294336319e-06, -7.24010169506073e-06, -5.73229044675827e-06, -4.2244791984558105e-06, -2.716667950153351e-06, -1.2088567018508911e-06, 2.989545464515686e-07, 1.8067657947540283e-06, 3.314577043056488e-06, 4.822388291358948e-06, 6.3301995396614075e-06, 7.838010787963867e-06, 9.345822036266327e-06, 1.0853633284568787e-05, 1.2361444532871246e-05, 1.3869255781173706e-05, 1.5377067029476166e-05, 1.6884878277778625e-05, 1.8392689526081085e-05, 1.9900500774383545e-05, 2.1408312022686005e-05, 2.2916123270988464e-05, 2.4423934519290924e-05, 2.5931745767593384e-05, 2.7439557015895844e-05, 2.8947368264198303e-05, 3.0455179512500763e-05, 3.196299076080322e-05, 3.347080200910568e-05, 3.497861325740814e-05, 3.64864245057106e-05, 3.799423575401306e-05, 3.950204700231552e-05, 4.100985825061798e-05, 4.251766949892044e-05, 4.40254807472229e-05, 4.553329199552536e-05, 4.704110324382782e-05, 4.854891449213028e-05, 5.005672574043274e-05, 5.15645369887352e-05, 5.307234823703766e-05, 5.458015948534012e-05, 5.608797073364258e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 13.0, 15.0, 42.0, 61.0, 84.0, 147.0, 334.0, 748.0, 2013.0, 10387.0, 172966.0, 812692.0, 42200.0, 4656.0, 1165.0, 451.0, 238.0, 117.0, 69.0, 54.0, 27.0, 19.0, 18.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.92578125, -0.9022140502929688, -0.8786468505859375, -0.8550796508789062, -0.831512451171875, -0.8079452514648438, -0.7843780517578125, -0.7608108520507812, -0.73724365234375, -0.7136764526367188, -0.6901092529296875, -0.6665420532226562, -0.642974853515625, -0.6194076538085938, -0.5958404541015625, -0.5722732543945312, -0.5487060546875, -0.5251388549804688, -0.5015716552734375, -0.47800445556640625, -0.454437255859375, -0.43087005615234375, -0.4073028564453125, -0.38373565673828125, -0.36016845703125, -0.33660125732421875, -0.3130340576171875, -0.28946685791015625, -0.265899658203125, -0.24233245849609375, -0.2187652587890625, -0.19519805908203125, -0.171630859375, -0.14806365966796875, -0.1244964599609375, -0.10092926025390625, -0.077362060546875, -0.05379486083984375, -0.0302276611328125, -0.00666046142578125, 0.01690673828125, 0.04047393798828125, 0.0640411376953125, 0.08760833740234375, 0.111175537109375, 0.13474273681640625, 0.1583099365234375, 0.18187713623046875, 0.2054443359375, 0.22901153564453125, 0.2525787353515625, 0.27614593505859375, 0.299713134765625, 0.32328033447265625, 0.3468475341796875, 0.37041473388671875, 0.39398193359375, 0.41754913330078125, 0.4411163330078125, 0.46468353271484375, 0.488250732421875, 0.5118179321289062, 0.5353851318359375, 0.5589523315429688, 0.58251953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 14.0, 13.0, 18.0, 17.0, 34.0, 43.0, 66.0, 56.0, 80.0, 84.0, 95.0, 86.0, 74.0, 51.0, 58.0, 44.0, 29.0, 18.0, 22.0, 14.0, 15.0, 13.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.34326171875, -0.33479881286621094, -0.3263359069824219, -0.3178730010986328, -0.30941009521484375, -0.3009471893310547, -0.2924842834472656, -0.28402137756347656, -0.2755584716796875, -0.26709556579589844, -0.2586326599121094, -0.2501697540283203, -0.24170684814453125, -0.2332439422607422, -0.22478103637695312, -0.21631813049316406, -0.207855224609375, -0.19939231872558594, -0.19092941284179688, -0.1824665069580078, -0.17400360107421875, -0.1655406951904297, -0.15707778930664062, -0.14861488342285156, -0.1401519775390625, -0.13168907165527344, -0.12322616577148438, -0.11476325988769531, -0.10630035400390625, -0.09783744812011719, -0.08937454223632812, -0.08091163635253906, -0.07244873046875, -0.06398582458496094, -0.055522918701171875, -0.04706001281738281, -0.03859710693359375, -0.030134201049804688, -0.021671295166015625, -0.013208389282226562, -0.0047454833984375, 0.0037174224853515625, 0.012180328369140625, 0.020643234252929688, 0.02910614013671875, 0.03756904602050781, 0.046031951904296875, 0.05449485778808594, 0.062957763671875, 0.07142066955566406, 0.07988357543945312, 0.08834648132324219, 0.09680938720703125, 0.10527229309082031, 0.11373519897460938, 0.12219810485839844, 0.1306610107421875, 0.13912391662597656, 0.14758682250976562, 0.1560497283935547, 0.16451263427734375, 0.1729755401611328, 0.18143844604492188, 0.18990135192871094, 0.1983642578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 22.0, 638.0, 334.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03475570678711, -32.298927307128906, -31.563098907470703, -30.8272705078125, -30.091442108154297, -29.355613708496094, -28.61978530883789, -27.883956909179688, -27.148128509521484, -26.41230010986328, -25.676471710205078, -24.940643310546875, -24.204814910888672, -23.46898651123047, -22.733158111572266, -21.997329711914062, -21.261503219604492, -20.52567481994629, -19.789846420288086, -19.054018020629883, -18.31818962097168, -17.582361221313477, -16.846534729003906, -16.110706329345703, -15.374876976013184, -14.63904857635498, -13.903220176696777, -13.16739273071289, -12.431564331054688, -11.695735931396484, -10.959907531738281, -10.224079132080078, -9.488252639770508, -8.752424240112305, -8.016595840454102, -7.280767917633057, -6.5449395179748535, -5.80911111831665, -5.0732831954956055, -4.337454795837402, -3.601626396179199, -2.865797996520996, -2.129969835281372, -1.394141674041748, -0.6583132743835449, 0.0775151252746582, 0.8133430480957031, 1.5491714477539062, 2.2849998474121094, 3.0208282470703125, 3.7566564083099365, 4.4924845695495605, 5.228312969207764, 5.964141368865967, 6.699969291687012, 7.435797691345215, 8.171626091003418, 8.907454490661621, 9.643282890319824, 10.379110336303711, 11.114938735961914, 11.850767135620117, 12.58659553527832, 13.322423934936523, 14.058252334594727]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 6.0, 11.0, 14.0, 23.0, 22.0, 33.0, 42.0, 53.0, 48.0, 59.0, 77.0, 69.0, 67.0, 82.0, 76.0, 51.0, 56.0, 51.0, 39.0, 26.0, 23.0, 17.0, 14.0, 9.0, 10.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.870981216430664, -2.7597594261169434, -2.6485376358032227, -2.537315845489502, -2.426093816757202, -2.3148720264434814, -2.2036502361297607, -2.09242844581604, -1.9812066555023193, -1.8699848651885986, -1.7587629556655884, -1.6475411653518677, -1.536319375038147, -1.4250974655151367, -1.313875675201416, -1.2026538848876953, -1.091431975364685, -0.9802101254463196, -0.8689883351325989, -0.7577664852142334, -0.6465446949005127, -0.5353228449821472, -0.42410099506378174, -0.31287920475006104, -0.20165735483169556, -0.09043552726507187, 0.02078630030155182, 0.1320081353187561, 0.2432299554347992, 0.3544517755508423, 0.46567362546920776, 0.5768954157829285, 0.688117265701294, 0.7993391156196594, 0.9105609059333801, 1.0217827558517456, 1.1330045461654663, 1.2442264556884766, 1.3554482460021973, 1.466670036315918, 1.5778918266296387, 1.6891136169433594, 1.8003355264663696, 1.9115573167800903, 2.0227792263031006, 2.1340010166168213, 2.245222806930542, 2.3564445972442627, 2.4676666259765625, 2.578888416290283, 2.690110206604004, 2.8013319969177246, 2.9125540256500244, 3.023775815963745, 3.134997606277466, 3.2462193965911865, 3.3574411869049072, 3.468662977218628, 3.5798847675323486, 3.6911067962646484, 3.802328586578369, 3.91355037689209, 4.0247721672058105, 4.135993957519531, 4.247215747833252]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 27.0, 48.0, 146.0, 570.0, 183002.0, 4008755.0, 1243.0, 283.0, 108.0, 57.0, 17.0, 13.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1015625, -5.8580322265625, -5.614501953125, -5.3709716796875, -5.12744140625, -4.8839111328125, -4.640380859375, -4.3968505859375, -4.1533203125, -3.9097900390625, -3.666259765625, -3.4227294921875, -3.17919921875, -2.9356689453125, -2.692138671875, -2.4486083984375, -2.205078125, -1.9615478515625, -1.718017578125, -1.4744873046875, -1.23095703125, -0.9874267578125, -0.743896484375, -0.5003662109375, -0.2568359375, -0.0133056640625, 0.230224609375, 0.4737548828125, 0.71728515625, 0.9608154296875, 1.204345703125, 1.4478759765625, 1.69140625, 1.9349365234375, 2.178466796875, 2.4219970703125, 2.66552734375, 2.9090576171875, 3.152587890625, 3.3961181640625, 3.6396484375, 3.8831787109375, 4.126708984375, 4.3702392578125, 4.61376953125, 4.8572998046875, 5.100830078125, 5.3443603515625, 5.587890625, 5.8314208984375, 6.074951171875, 6.3184814453125, 6.56201171875, 6.8055419921875, 7.049072265625, 7.2926025390625, 7.5361328125, 7.7796630859375, 8.023193359375, 8.2667236328125, 8.51025390625, 8.7537841796875, 8.997314453125, 9.2408447265625, 9.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 13.0, 21.0, 50.0, 130.0, 184.0, 240.0, 198.0, 95.0, 42.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.13944625854492188, -0.13350677490234375, -0.12756729125976562, -0.1216278076171875, -0.11568832397460938, -0.10974884033203125, -0.10380935668945312, -0.097869873046875, -0.09193038940429688, -0.08599090576171875, -0.08005142211914062, -0.0741119384765625, -0.06817245483398438, -0.06223297119140625, -0.056293487548828125, -0.05035400390625, -0.044414520263671875, -0.03847503662109375, -0.032535552978515625, -0.0265960693359375, -0.020656585693359375, -0.01471710205078125, -0.008777618408203125, -0.002838134765625, 0.003101348876953125, 0.00904083251953125, 0.014980316162109375, 0.0209197998046875, 0.026859283447265625, 0.03279876708984375, 0.038738250732421875, 0.044677734375, 0.050617218017578125, 0.05655670166015625, 0.062496185302734375, 0.0684356689453125, 0.07437515258789062, 0.08031463623046875, 0.08625411987304688, 0.092193603515625, 0.09813308715820312, 0.10407257080078125, 0.11001205444335938, 0.1159515380859375, 0.12189102172851562, 0.12783050537109375, 0.13376998901367188, 0.13970947265625, 0.14564895629882812, 0.15158843994140625, 0.15752792358398438, 0.1634674072265625, 0.16940689086914062, 0.17534637451171875, 0.18128585815429688, 0.187225341796875, 0.19316482543945312, 0.19910430908203125, 0.20504379272460938, 0.2109832763671875, 0.21692276000976562, 0.22286224365234375, 0.22880172729492188, 0.2347412109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 10.0, 10.0, 22.0, 37.0, 67.0, 123.0, 244.0, 503.0, 1310.0, 5085.0, 36330.0, 2877447.0, 1238934.0, 27216.0, 4597.0, 1339.0, 496.0, 233.0, 122.0, 67.0, 35.0, 20.0, 17.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9595794677734375, -0.921112060546875, -0.8826446533203125, -0.84417724609375, -0.8057098388671875, -0.767242431640625, -0.7287750244140625, -0.6903076171875, -0.6518402099609375, -0.613372802734375, -0.5749053955078125, -0.53643798828125, -0.4979705810546875, -0.459503173828125, -0.4210357666015625, -0.382568359375, -0.3441009521484375, -0.305633544921875, -0.2671661376953125, -0.22869873046875, -0.1902313232421875, -0.151763916015625, -0.1132965087890625, -0.0748291015625, -0.0363616943359375, 0.002105712890625, 0.0405731201171875, 0.07904052734375, 0.1175079345703125, 0.155975341796875, 0.1944427490234375, 0.23291015625, 0.2713775634765625, 0.309844970703125, 0.3483123779296875, 0.38677978515625, 0.4252471923828125, 0.463714599609375, 0.5021820068359375, 0.5406494140625, 0.5791168212890625, 0.617584228515625, 0.6560516357421875, 0.69451904296875, 0.7329864501953125, 0.771453857421875, 0.8099212646484375, 0.848388671875, 0.8868560791015625, 0.925323486328125, 0.9637908935546875, 1.00225830078125, 1.0407257080078125, 1.079193115234375, 1.1176605224609375, 1.1561279296875, 1.1945953369140625, 1.233062744140625, 1.2715301513671875, 1.30999755859375, 1.3484649658203125, 1.386932373046875, 1.4253997802734375, 1.4638671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 12.0, 8.0, 6.0, 18.0, 24.0, 38.0, 49.0, 87.0, 139.0, 325.0, 911.0, 1494.0, 486.0, 201.0, 120.0, 53.0, 34.0, 27.0, 18.0, 6.0, 8.0, 1.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.153564453125, -0.14722442626953125, -0.1408843994140625, -0.13454437255859375, -0.128204345703125, -0.12186431884765625, -0.1155242919921875, -0.10918426513671875, -0.10284423828125, -0.09650421142578125, -0.0901641845703125, -0.08382415771484375, -0.077484130859375, -0.07114410400390625, -0.0648040771484375, -0.05846405029296875, -0.0521240234375, -0.04578399658203125, -0.0394439697265625, -0.03310394287109375, -0.026763916015625, -0.02042388916015625, -0.0140838623046875, -0.00774383544921875, -0.00140380859375, 0.00493621826171875, 0.0112762451171875, 0.01761627197265625, 0.023956298828125, 0.03029632568359375, 0.0366363525390625, 0.04297637939453125, 0.04931640625, 0.05565643310546875, 0.0619964599609375, 0.06833648681640625, 0.074676513671875, 0.08101654052734375, 0.0873565673828125, 0.09369659423828125, 0.10003662109375, 0.10637664794921875, 0.1127166748046875, 0.11905670166015625, 0.125396728515625, 0.13173675537109375, 0.1380767822265625, 0.14441680908203125, 0.1507568359375, 0.15709686279296875, 0.1634368896484375, 0.16977691650390625, 0.176116943359375, 0.18245697021484375, 0.1887969970703125, 0.19513702392578125, 0.20147705078125, 0.20781707763671875, 0.2141571044921875, 0.22049713134765625, 0.226837158203125, 0.23317718505859375, 0.2395172119140625, 0.24585723876953125, 0.252197265625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 18.0, 56.0, 96.0, 213.0, 268.0, 210.0, 92.0, 33.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6196396350860596, -1.5725220441818237, -1.525404453277588, -1.478286862373352, -1.4311692714691162, -1.38405179977417, -1.336934208869934, -1.2898166179656982, -1.2426990270614624, -1.1955814361572266, -1.1484638452529907, -1.1013462543487549, -1.0542287826538086, -1.0071111917495728, -0.9599936008453369, -0.9128760099411011, -0.8657584190368652, -0.8186408281326294, -0.7715232372283936, -0.7244057059288025, -0.6772881150245667, -0.6301705241203308, -0.5830529928207397, -0.5359354019165039, -0.48881781101226807, -0.4417002201080322, -0.3945826590061188, -0.3474650979042053, -0.3003475069999695, -0.25322991609573364, -0.2061123549938202, -0.15899479389190674, -0.1118772029876709, -0.06475962698459625, -0.017642050981521606, 0.02947552502155304, 0.07659310102462769, 0.12371067702770233, 0.17082825303077698, 0.21794581413269043, 0.26506340503692627, 0.3121809959411621, 0.35929855704307556, 0.406416118144989, 0.45353370904922485, 0.5006512999534607, 0.5477688312530518, 0.5948864221572876, 0.6420040130615234, 0.6891216039657593, 0.7362391948699951, 0.7833567261695862, 0.830474317073822, 0.8775919079780579, 0.9247094392776489, 0.9718270301818848, 1.0189446210861206, 1.0660622119903564, 1.1131798028945923, 1.1602973937988281, 1.2074148654937744, 1.2545324563980103, 1.301650047302246, 1.348767638206482, 1.3958852291107178]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 16.0, 12.0, 10.0, 13.0, 15.0, 18.0, 31.0, 22.0, 33.0, 27.0, 48.0, 36.0, 42.0, 37.0, 46.0, 53.0, 42.0, 43.0, 43.0, 28.0, 36.0, 42.0, 41.0, 31.0, 34.0, 28.0, 26.0, 16.0, 16.0, 17.0, 15.0, 20.0, 5.0, 6.0, 7.0, 9.0, 6.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.515007734298706, -0.50058513879776, -0.4861625134944916, -0.47173991799354553, -0.4573172926902771, -0.44289469718933105, -0.428472101688385, -0.41404950618743896, -0.39962688088417053, -0.3852042853832245, -0.37078166007995605, -0.35635906457901, -0.34193646907806396, -0.32751384377479553, -0.3130912482738495, -0.29866862297058105, -0.284246027469635, -0.26982343196868896, -0.25540080666542053, -0.2409782111644745, -0.22655560076236725, -0.21213299036026, -0.19771039485931396, -0.18328778445720673, -0.1688651740550995, -0.15444256365299225, -0.140019953250885, -0.12559735774993896, -0.11117474734783173, -0.09675213694572449, -0.08232953399419785, -0.0679069310426712, -0.053484320640563965, -0.039061713963747025, -0.024639107286930084, -0.010216500610113144, 0.004206106066703796, 0.018628716468811035, 0.03305131942033768, 0.04747392237186432, 0.06189653277397156, 0.0763191431760788, 0.09074174612760544, 0.10516434907913208, 0.11958695948123932, 0.13400956988334656, 0.1484321653842926, 0.16285477578639984, 0.17727738618850708, 0.19169999659061432, 0.20612260699272156, 0.2205452024936676, 0.23496781289577484, 0.24939042329788208, 0.2638130187988281, 0.27823561429977417, 0.2926582396030426, 0.30708083510398865, 0.3215034604072571, 0.3359260559082031, 0.35034865140914917, 0.3647712767124176, 0.37919387221336365, 0.3936164975166321, 0.4080390930175781]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 7.0, 10.0, 13.0, 21.0, 37.0, 48.0, 91.0, 148.0, 207.0, 366.0, 630.0, 1418.0, 4512.0, 61711.0, 923698.0, 48494.0, 4086.0, 1372.0, 645.0, 400.0, 241.0, 130.0, 94.0, 53.0, 32.0, 26.0, 21.0, 7.0, 11.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3701171875, -1.3265838623046875, -1.283050537109375, -1.2395172119140625, -1.19598388671875, -1.1524505615234375, -1.108917236328125, -1.0653839111328125, -1.0218505859375, -0.9783172607421875, -0.934783935546875, -0.8912506103515625, -0.84771728515625, -0.8041839599609375, -0.760650634765625, -0.7171173095703125, -0.673583984375, -0.6300506591796875, -0.586517333984375, -0.5429840087890625, -0.49945068359375, -0.4559173583984375, -0.412384033203125, -0.3688507080078125, -0.3253173828125, -0.2817840576171875, -0.238250732421875, -0.1947174072265625, -0.15118408203125, -0.1076507568359375, -0.064117431640625, -0.0205841064453125, 0.02294921875, 0.0664825439453125, 0.110015869140625, 0.1535491943359375, 0.19708251953125, 0.2406158447265625, 0.284149169921875, 0.3276824951171875, 0.3712158203125, 0.4147491455078125, 0.458282470703125, 0.5018157958984375, 0.54534912109375, 0.5888824462890625, 0.632415771484375, 0.6759490966796875, 0.719482421875, 0.7630157470703125, 0.806549072265625, 0.8500823974609375, 0.89361572265625, 0.9371490478515625, 0.980682373046875, 1.0242156982421875, 1.0677490234375, 1.1112823486328125, 1.154815673828125, 1.1983489990234375, 1.24188232421875, 1.2854156494140625, 1.328948974609375, 1.3724822998046875, 1.416015625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 17.0, 27.0, 68.0, 140.0, 209.0, 214.0, 171.0, 99.0, 25.0, 13.0, 6.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.1395111083984375, -0.133758544921875, -0.1280059814453125, -0.12225341796875, -0.1165008544921875, -0.110748291015625, -0.1049957275390625, -0.0992431640625, -0.0934906005859375, -0.087738037109375, -0.0819854736328125, -0.07623291015625, -0.0704803466796875, -0.064727783203125, -0.0589752197265625, -0.05322265625, -0.0474700927734375, -0.041717529296875, -0.0359649658203125, -0.03021240234375, -0.0244598388671875, -0.018707275390625, -0.0129547119140625, -0.0072021484375, -0.0014495849609375, 0.004302978515625, 0.0100555419921875, 0.01580810546875, 0.0215606689453125, 0.027313232421875, 0.0330657958984375, 0.038818359375, 0.0445709228515625, 0.050323486328125, 0.0560760498046875, 0.06182861328125, 0.0675811767578125, 0.073333740234375, 0.0790863037109375, 0.0848388671875, 0.0905914306640625, 0.096343994140625, 0.1020965576171875, 0.10784912109375, 0.1136016845703125, 0.119354248046875, 0.1251068115234375, 0.130859375, 0.1366119384765625, 0.142364501953125, 0.1481170654296875, 0.15386962890625, 0.1596221923828125, 0.165374755859375, 0.1711273193359375, 0.1768798828125, 0.1826324462890625, 0.188385009765625, 0.1941375732421875, 0.19989013671875, 0.2056427001953125, 0.211395263671875, 0.2171478271484375, 0.222900390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 1.0, 5.0, 5.0, 14.0, 15.0, 30.0, 43.0, 77.0, 99.0, 170.0, 296.0, 529.0, 987.0, 2003.0, 6207.0, 29540.0, 244013.0, 636119.0, 105317.0, 15779.0, 3947.0, 1490.0, 777.0, 403.0, 234.0, 152.0, 98.0, 73.0, 42.0, 29.0, 20.0, 21.0, 7.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.814453125, -0.78924560546875, -0.7640380859375, -0.73883056640625, -0.713623046875, -0.68841552734375, -0.6632080078125, -0.63800048828125, -0.61279296875, -0.58758544921875, -0.5623779296875, -0.53717041015625, -0.511962890625, -0.48675537109375, -0.4615478515625, -0.43634033203125, -0.4111328125, -0.38592529296875, -0.3607177734375, -0.33551025390625, -0.310302734375, -0.28509521484375, -0.2598876953125, -0.23468017578125, -0.20947265625, -0.18426513671875, -0.1590576171875, -0.13385009765625, -0.108642578125, -0.08343505859375, -0.0582275390625, -0.03302001953125, -0.0078125, 0.01739501953125, 0.0426025390625, 0.06781005859375, 0.093017578125, 0.11822509765625, 0.1434326171875, 0.16864013671875, 0.19384765625, 0.21905517578125, 0.2442626953125, 0.26947021484375, 0.294677734375, 0.31988525390625, 0.3450927734375, 0.37030029296875, 0.3955078125, 0.42071533203125, 0.4459228515625, 0.47113037109375, 0.496337890625, 0.52154541015625, 0.5467529296875, 0.57196044921875, 0.59716796875, 0.62237548828125, 0.6475830078125, 0.67279052734375, 0.697998046875, 0.72320556640625, 0.7484130859375, 0.77362060546875, 0.798828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 12.0, 10.0, 19.0, 32.0, 34.0, 39.0, 36.0, 41.0, 47.0, 44.0, 59.0, 49.0, 56.0, 45.0, 56.0, 59.0, 50.0, 43.0, 38.0, 31.0, 29.0, 25.0, 26.0, 18.0, 20.0, 7.0, 15.0, 11.0, 7.0, 8.0, 3.0, 3.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.48931884765625, -0.4752197265625, -0.46112060546875, -0.447021484375, -0.43292236328125, -0.4188232421875, -0.40472412109375, -0.390625, -0.37652587890625, -0.3624267578125, -0.34832763671875, -0.334228515625, -0.32012939453125, -0.3060302734375, -0.29193115234375, -0.27783203125, -0.26373291015625, -0.2496337890625, -0.23553466796875, -0.221435546875, -0.20733642578125, -0.1932373046875, -0.17913818359375, -0.1650390625, -0.15093994140625, -0.1368408203125, -0.12274169921875, -0.108642578125, -0.09454345703125, -0.0804443359375, -0.06634521484375, -0.05224609375, -0.03814697265625, -0.0240478515625, -0.00994873046875, 0.004150390625, 0.01824951171875, 0.0323486328125, 0.04644775390625, 0.060546875, 0.07464599609375, 0.0887451171875, 0.10284423828125, 0.116943359375, 0.13104248046875, 0.1451416015625, 0.15924072265625, 0.17333984375, 0.18743896484375, 0.2015380859375, 0.21563720703125, 0.229736328125, 0.24383544921875, 0.2579345703125, 0.27203369140625, 0.2861328125, 0.30023193359375, 0.3143310546875, 0.32843017578125, 0.342529296875, 0.35662841796875, 0.3707275390625, 0.38482666015625, 0.39892578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 10.0, 12.0, 30.0, 51.0, 108.0, 170.0, 500.0, 2560.0, 234018.0, 805726.0, 4325.0, 609.0, 188.0, 105.0, 55.0, 30.0, 14.0, 14.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4873046875, -1.4449310302734375, -1.402557373046875, -1.3601837158203125, -1.31781005859375, -1.2754364013671875, -1.233062744140625, -1.1906890869140625, -1.1483154296875, -1.1059417724609375, -1.063568115234375, -1.0211944580078125, -0.97882080078125, -0.9364471435546875, -0.894073486328125, -0.8516998291015625, -0.809326171875, -0.7669525146484375, -0.724578857421875, -0.6822052001953125, -0.63983154296875, -0.5974578857421875, -0.555084228515625, -0.5127105712890625, -0.4703369140625, -0.4279632568359375, -0.385589599609375, -0.3432159423828125, -0.30084228515625, -0.2584686279296875, -0.216094970703125, -0.1737213134765625, -0.13134765625, -0.0889739990234375, -0.046600341796875, -0.0042266845703125, 0.03814697265625, 0.0805206298828125, 0.122894287109375, 0.1652679443359375, 0.2076416015625, 0.2500152587890625, 0.292388916015625, 0.3347625732421875, 0.37713623046875, 0.4195098876953125, 0.461883544921875, 0.5042572021484375, 0.546630859375, 0.5890045166015625, 0.631378173828125, 0.6737518310546875, 0.71612548828125, 0.7584991455078125, 0.800872802734375, 0.8432464599609375, 0.8856201171875, 0.9279937744140625, 0.970367431640625, 1.0127410888671875, 1.05511474609375, 1.0974884033203125, 1.139862060546875, 1.1822357177734375, 1.224609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 16.0, 19.0, 21.0, 27.0, 47.0, 39.0, 47.0, 78.0, 72.0, 89.0, 113.0, 105.0, 79.0, 36.0, 44.0, 37.0, 29.0, 15.0, 20.0, 15.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.49879264831543e-05, -3.378372639417648e-05, -3.257952630519867e-05, -3.1375326216220856e-05, -3.0171126127243042e-05, -2.8966926038265228e-05, -2.7762725949287415e-05, -2.65585258603096e-05, -2.5354325771331787e-05, -2.4150125682353973e-05, -2.294592559337616e-05, -2.1741725504398346e-05, -2.0537525415420532e-05, -1.933332532644272e-05, -1.8129125237464905e-05, -1.692492514848709e-05, -1.5720725059509277e-05, -1.4516524970531464e-05, -1.331232488155365e-05, -1.2108124792575836e-05, -1.0903924703598022e-05, -9.699724614620209e-06, -8.495524525642395e-06, -7.291324436664581e-06, -6.087124347686768e-06, -4.882924258708954e-06, -3.67872416973114e-06, -2.4745240807533264e-06, -1.2703239917755127e-06, -6.612390279769897e-08, 1.1380761861801147e-06, 2.3422762751579285e-06, 3.546476364135742e-06, 4.750676453113556e-06, 5.95487654209137e-06, 7.159076631069183e-06, 8.363276720046997e-06, 9.56747680902481e-06, 1.0771676898002625e-05, 1.1975876986980438e-05, 1.3180077075958252e-05, 1.4384277164936066e-05, 1.558847725391388e-05, 1.6792677342891693e-05, 1.7996877431869507e-05, 1.920107752084732e-05, 2.0405277609825134e-05, 2.1609477698802948e-05, 2.2813677787780762e-05, 2.4017877876758575e-05, 2.522207796573639e-05, 2.6426278054714203e-05, 2.7630478143692017e-05, 2.883467823266983e-05, 3.0038878321647644e-05, 3.124307841062546e-05, 3.244727849960327e-05, 3.3651478588581085e-05, 3.48556786775589e-05, 3.605987876653671e-05, 3.7264078855514526e-05, 3.846827894449234e-05, 3.9672479033470154e-05, 4.087667912244797e-05, 4.208087921142578e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 9.0, 12.0, 7.0, 13.0, 27.0, 31.0, 60.0, 120.0, 212.0, 555.0, 1617.0, 6569.0, 114105.0, 892780.0, 27324.0, 3432.0, 915.0, 360.0, 153.0, 85.0, 46.0, 37.0, 26.0, 15.0, 4.0, 11.0, 10.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97607421875, -0.9484329223632812, -0.9207916259765625, -0.8931503295898438, -0.865509033203125, -0.8378677368164062, -0.8102264404296875, -0.7825851440429688, -0.75494384765625, -0.7273025512695312, -0.6996612548828125, -0.6720199584960938, -0.644378662109375, -0.6167373657226562, -0.5890960693359375, -0.5614547729492188, -0.5338134765625, -0.5061721801757812, -0.4785308837890625, -0.45088958740234375, -0.423248291015625, -0.39560699462890625, -0.3679656982421875, -0.34032440185546875, -0.31268310546875, -0.28504180908203125, -0.2574005126953125, -0.22975921630859375, -0.202117919921875, -0.17447662353515625, -0.1468353271484375, -0.11919403076171875, -0.091552734375, -0.06391143798828125, -0.0362701416015625, -0.00862884521484375, 0.019012451171875, 0.04665374755859375, 0.0742950439453125, 0.10193634033203125, 0.12957763671875, 0.15721893310546875, 0.1848602294921875, 0.21250152587890625, 0.240142822265625, 0.26778411865234375, 0.2954254150390625, 0.32306671142578125, 0.3507080078125, 0.37834930419921875, 0.4059906005859375, 0.43363189697265625, 0.461273193359375, 0.48891448974609375, 0.5165557861328125, 0.5441970825195312, 0.57183837890625, 0.5994796752929688, 0.6271209716796875, 0.6547622680664062, 0.682403564453125, 0.7100448608398438, 0.7376861572265625, 0.7653274536132812, 0.79296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 10.0, 25.0, 24.0, 60.0, 98.0, 139.0, 157.0, 189.0, 109.0, 71.0, 40.0, 23.0, 13.0, 9.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65283203125, -0.6354904174804688, -0.6181488037109375, -0.6008071899414062, -0.583465576171875, -0.5661239624023438, -0.5487823486328125, -0.5314407348632812, -0.51409912109375, -0.49675750732421875, -0.4794158935546875, -0.46207427978515625, -0.444732666015625, -0.42739105224609375, -0.4100494384765625, -0.39270782470703125, -0.3753662109375, -0.35802459716796875, -0.3406829833984375, -0.32334136962890625, -0.305999755859375, -0.28865814208984375, -0.2713165283203125, -0.25397491455078125, -0.23663330078125, -0.21929168701171875, -0.2019500732421875, -0.18460845947265625, -0.167266845703125, -0.14992523193359375, -0.1325836181640625, -0.11524200439453125, -0.097900390625, -0.08055877685546875, -0.0632171630859375, -0.04587554931640625, -0.028533935546875, -0.01119232177734375, 0.0061492919921875, 0.02349090576171875, 0.04083251953125, 0.05817413330078125, 0.0755157470703125, 0.09285736083984375, 0.110198974609375, 0.12754058837890625, 0.1448822021484375, 0.16222381591796875, 0.1795654296875, 0.19690704345703125, 0.2142486572265625, 0.23159027099609375, 0.248931884765625, 0.26627349853515625, 0.2836151123046875, 0.30095672607421875, 0.31829833984375, 0.33563995361328125, 0.3529815673828125, 0.37032318115234375, 0.387664794921875, 0.40500640869140625, 0.4223480224609375, 0.43968963623046875, 0.45703125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 21.0, 74.0, 312.0, 357.0, 169.0, 43.0, 18.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59561014175415, -5.319100379943848, -5.042590618133545, -4.766080856323242, -4.4895710945129395, -4.213061332702637, -3.936551570892334, -3.6600418090820312, -3.3835320472717285, -3.107022285461426, -2.830512523651123, -2.5540027618408203, -2.2774930000305176, -2.000983238220215, -1.724473476409912, -1.4479637145996094, -1.1714539527893066, -0.8949441909790039, -0.6184344291687012, -0.34192466735839844, -0.0654149055480957, 0.21109485626220703, 0.48760461807250977, 0.7641143798828125, 1.0406241416931152, 1.317133903503418, 1.5936436653137207, 1.8701534271240234, 2.146663188934326, 2.423172950744629, 2.6996827125549316, 2.9761924743652344, 3.2527027130126953, 3.529212474822998, 3.805722236633301, 4.0822319984436035, 4.358741760253906, 4.635251522064209, 4.911761283874512, 5.1882710456848145, 5.464780807495117, 5.74129056930542, 6.017800331115723, 6.294310092926025, 6.570819854736328, 6.847329616546631, 7.123839378356934, 7.400349140167236, 7.676858901977539, 7.953368663787842, 8.229878425598145, 8.506387710571289, 8.78289794921875, 9.059408187866211, 9.335917472839355, 9.6124267578125, 9.888936996459961, 10.165447235107422, 10.441956520080566, 10.718465805053711, 10.994976043701172, 11.271486282348633, 11.547995567321777, 11.824504852294922, 12.101015090942383]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 16.0, 12.0, 12.0, 11.0, 10.0, 16.0, 30.0, 26.0, 29.0, 28.0, 37.0, 29.0, 41.0, 47.0, 40.0, 37.0, 43.0, 42.0, 45.0, 42.0, 41.0, 43.0, 46.0, 39.0, 25.0, 21.0, 29.0, 22.0, 26.0, 18.0, 13.0, 9.0, 6.0, 11.0, 8.0, 6.0, 10.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.4054222106933594, -2.330981731414795, -2.2565414905548096, -2.182101011276245, -2.1076605319976807, -2.033220052719116, -1.9587798118591309, -1.8843393325805664, -1.809898853302002, -1.735458493232727, -1.6610180139541626, -1.5865776538848877, -1.5121371746063232, -1.4376968145370483, -1.3632564544677734, -1.288815975189209, -1.214375615119934, -1.1399352550506592, -1.0654947757720947, -0.9910544157028198, -0.9166139364242554, -0.8421735763549805, -0.7677331566810608, -0.6932927370071411, -0.6188523173332214, -0.5444118976593018, -0.4699714779853821, -0.3955310881137848, -0.3210906684398651, -0.24665024876594543, -0.17220985889434814, -0.09776943922042847, -0.02332901954650879, 0.05111139267683029, 0.12555180490016937, 0.19999220967292786, 0.27443262934684753, 0.3488730490207672, 0.4233134388923645, 0.4977538585662842, 0.5721942782402039, 0.6466346979141235, 0.7210751175880432, 0.7955155372619629, 0.8699558973312378, 0.9443963766098022, 1.0188367366790771, 1.0932772159576416, 1.1677175760269165, 1.2421579360961914, 1.3165984153747559, 1.3910387754440308, 1.4654792547225952, 1.5399196147918701, 1.6143600940704346, 1.6888004541397095, 1.7632408142089844, 1.8376811742782593, 1.9121216535568237, 1.9865620136260986, 2.061002492904663, 2.1354429721832275, 2.209883213043213, 2.2843236923217773, 2.358764171600342]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 12.0, 14.0, 28.0, 66.0, 123.0, 521.0, 2950.0, 194358.0, 3986974.0, 7413.0, 1100.0, 357.0, 169.0, 68.0, 56.0, 32.0, 15.0, 10.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.982421875, -1.906646728515625, -1.83087158203125, -1.755096435546875, -1.6793212890625, -1.603546142578125, -1.52777099609375, -1.451995849609375, -1.376220703125, -1.300445556640625, -1.22467041015625, -1.148895263671875, -1.0731201171875, -0.997344970703125, -0.92156982421875, -0.845794677734375, -0.77001953125, -0.694244384765625, -0.61846923828125, -0.542694091796875, -0.4669189453125, -0.391143798828125, -0.31536865234375, -0.239593505859375, -0.163818359375, -0.088043212890625, -0.01226806640625, 0.063507080078125, 0.1392822265625, 0.215057373046875, 0.29083251953125, 0.366607666015625, 0.4423828125, 0.518157958984375, 0.59393310546875, 0.669708251953125, 0.7454833984375, 0.821258544921875, 0.89703369140625, 0.972808837890625, 1.048583984375, 1.124359130859375, 1.20013427734375, 1.275909423828125, 1.3516845703125, 1.427459716796875, 1.50323486328125, 1.579010009765625, 1.65478515625, 1.730560302734375, 1.80633544921875, 1.882110595703125, 1.9578857421875, 2.033660888671875, 2.10943603515625, 2.185211181640625, 2.260986328125, 2.336761474609375, 2.41253662109375, 2.488311767578125, 2.5640869140625, 2.639862060546875, 2.71563720703125, 2.791412353515625, 2.8671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 11.0, 17.0, 24.0, 44.0, 86.0, 149.0, 185.0, 177.0, 141.0, 81.0, 54.0, 19.0, 12.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.15598106384277344, -0.14948654174804688, -0.1429920196533203, -0.13649749755859375, -0.1300029754638672, -0.12350845336914062, -0.11701393127441406, -0.1105194091796875, -0.10402488708496094, -0.09753036499023438, -0.09103584289550781, -0.08454132080078125, -0.07804679870605469, -0.07155227661132812, -0.06505775451660156, -0.058563232421875, -0.05206871032714844, -0.045574188232421875, -0.03907966613769531, -0.03258514404296875, -0.026090621948242188, -0.019596099853515625, -0.013101577758789062, -0.0066070556640625, -0.0001125335693359375, 0.006381988525390625, 0.012876510620117188, 0.01937103271484375, 0.025865554809570312, 0.032360076904296875, 0.03885459899902344, 0.04534912109375, 0.05184364318847656, 0.058338165283203125, 0.06483268737792969, 0.07132720947265625, 0.07782173156738281, 0.08431625366210938, 0.09081077575683594, 0.0973052978515625, 0.10379981994628906, 0.11029434204101562, 0.11678886413574219, 0.12328338623046875, 0.1297779083251953, 0.13627243041992188, 0.14276695251464844, 0.149261474609375, 0.15575599670410156, 0.16225051879882812, 0.1687450408935547, 0.17523956298828125, 0.1817340850830078, 0.18822860717773438, 0.19472312927246094, 0.2012176513671875, 0.20771217346191406, 0.21420669555664062, 0.2207012176513672, 0.22719573974609375, 0.2336902618408203, 0.24018478393554688, 0.24667930603027344, 0.253173828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 13.0, 13.0, 14.0, 34.0, 75.0, 157.0, 284.0, 677.0, 1768.0, 6744.0, 49985.0, 3497951.0, 608694.0, 21668.0, 4057.0, 1257.0, 445.0, 213.0, 110.0, 57.0, 25.0, 14.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9085235595703125, -0.874664306640625, -0.8408050537109375, -0.80694580078125, -0.7730865478515625, -0.739227294921875, -0.7053680419921875, -0.6715087890625, -0.6376495361328125, -0.603790283203125, -0.5699310302734375, -0.53607177734375, -0.5022125244140625, -0.468353271484375, -0.4344940185546875, -0.400634765625, -0.3667755126953125, -0.332916259765625, -0.2990570068359375, -0.26519775390625, -0.2313385009765625, -0.197479248046875, -0.1636199951171875, -0.1297607421875, -0.0959014892578125, -0.062042236328125, -0.0281829833984375, 0.00567626953125, 0.0395355224609375, 0.073394775390625, 0.1072540283203125, 0.14111328125, 0.1749725341796875, 0.208831787109375, 0.2426910400390625, 0.27655029296875, 0.3104095458984375, 0.344268798828125, 0.3781280517578125, 0.4119873046875, 0.4458465576171875, 0.479705810546875, 0.5135650634765625, 0.54742431640625, 0.5812835693359375, 0.615142822265625, 0.6490020751953125, 0.682861328125, 0.7167205810546875, 0.750579833984375, 0.7844390869140625, 0.81829833984375, 0.8521575927734375, 0.886016845703125, 0.9198760986328125, 0.9537353515625, 0.9875946044921875, 1.021453857421875, 1.0553131103515625, 1.08917236328125, 1.1230316162109375, 1.156890869140625, 1.1907501220703125, 1.224609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 5.0, 9.0, 10.0, 14.0, 20.0, 43.0, 62.0, 129.0, 199.0, 528.0, 1489.0, 854.0, 350.0, 178.0, 48.0, 49.0, 32.0, 18.0, 9.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17822265625, -0.17130279541015625, -0.1643829345703125, -0.15746307373046875, -0.150543212890625, -0.14362335205078125, -0.1367034912109375, -0.12978363037109375, -0.12286376953125, -0.11594390869140625, -0.1090240478515625, -0.10210418701171875, -0.095184326171875, -0.08826446533203125, -0.0813446044921875, -0.07442474365234375, -0.0675048828125, -0.06058502197265625, -0.0536651611328125, -0.04674530029296875, -0.039825439453125, -0.03290557861328125, -0.0259857177734375, -0.01906585693359375, -0.01214599609375, -0.00522613525390625, 0.0016937255859375, 0.00861358642578125, 0.015533447265625, 0.02245330810546875, 0.0293731689453125, 0.03629302978515625, 0.043212890625, 0.05013275146484375, 0.0570526123046875, 0.06397247314453125, 0.070892333984375, 0.07781219482421875, 0.0847320556640625, 0.09165191650390625, 0.09857177734375, 0.10549163818359375, 0.1124114990234375, 0.11933135986328125, 0.126251220703125, 0.13317108154296875, 0.1400909423828125, 0.14701080322265625, 0.1539306640625, 0.16085052490234375, 0.1677703857421875, 0.17469024658203125, 0.181610107421875, 0.18852996826171875, 0.1954498291015625, 0.20236968994140625, 0.20928955078125, 0.21620941162109375, 0.2231292724609375, 0.23004913330078125, 0.236968994140625, 0.24388885498046875, 0.2508087158203125, 0.25772857666015625, 0.2646484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 26.0, 251.0, 557.0, 156.0, 13.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9330041408538818, -1.8149001598358154, -1.696796178817749, -1.5786921977996826, -1.4605882167816162, -1.3424842357635498, -1.2243801355361938, -1.1062761545181274, -0.988172173500061, -0.8700681924819946, -0.7519642114639282, -0.633860170841217, -0.5157561898231506, -0.39765220880508423, -0.27954816818237305, -0.16144418716430664, -0.043340206146240234, 0.07476378977298737, 0.19286778569221497, 0.31097179651260376, 0.42907577753067017, 0.5471797585487366, 0.6652837991714478, 0.7833877801895142, 0.9014917612075806, 1.019595742225647, 1.1376997232437134, 1.2558038234710693, 1.3739078044891357, 1.4920117855072021, 1.6101157665252686, 1.728219747543335, 1.8463239669799805, 1.9644279479980469, 2.0825319290161133, 2.2006359100341797, 2.318739891052246, 2.4368438720703125, 2.554947853088379, 2.6730518341064453, 2.7911558151245117, 2.909259796142578, 3.0273637771606445, 3.145467758178711, 3.2635717391967773, 3.3816757202148438, 3.49977970123291, 3.6178836822509766, 3.735987901687622, 3.8540918827056885, 3.972195863723755, 4.0903000831604, 4.208404064178467, 4.326508045196533, 4.4446120262146, 4.562716007232666, 4.680819988250732, 4.798923969268799, 4.917027950286865, 5.035131931304932, 5.153235912322998, 5.2713398933410645, 5.389443874359131, 5.507547855377197, 5.625651836395264]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 11.0, 4.0, 8.0, 21.0, 26.0, 17.0, 24.0, 19.0, 22.0, 39.0, 38.0, 42.0, 47.0, 45.0, 41.0, 36.0, 41.0, 47.0, 40.0, 44.0, 36.0, 30.0, 47.0, 31.0, 37.0, 28.0, 28.0, 19.0, 14.0, 18.0, 14.0, 14.0, 12.0, 10.0, 5.0, 3.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5205402374267578, -0.5043980479240417, -0.48825591802597046, -0.4721137285232544, -0.4559715688228607, -0.43982940912246704, -0.423687219619751, -0.4075450599193573, -0.3914029002189636, -0.37526074051856995, -0.35911858081817627, -0.3429763913154602, -0.32683423161506653, -0.31069207191467285, -0.2945498824119568, -0.2784077227115631, -0.26226556301116943, -0.24612340331077576, -0.2299812287092209, -0.21383905410766602, -0.19769689440727234, -0.18155473470687866, -0.1654125601053238, -0.14927038550376892, -0.13312822580337524, -0.11698605865240097, -0.1008438915014267, -0.08470172435045242, -0.06855955719947815, -0.052417390048503876, -0.0362752228975296, -0.02013305574655533, -0.003990828990936279, 0.012151338160037994, 0.028293505311012268, 0.04443567246198654, 0.060577839612960815, 0.07672000676393509, 0.09286217391490936, 0.10900434106588364, 0.1251465082168579, 0.1412886679172516, 0.15743084251880646, 0.17357301712036133, 0.189715176820755, 0.20585733652114868, 0.22199951112270355, 0.23814168572425842, 0.2542838454246521, 0.2704260051250458, 0.28656816482543945, 0.3027103543281555, 0.3188525140285492, 0.33499467372894287, 0.35113686323165894, 0.3672790229320526, 0.3834211826324463, 0.39956334233283997, 0.41570550203323364, 0.4318476915359497, 0.4479898512363434, 0.46413201093673706, 0.4802742004394531, 0.4964163601398468, 0.5125585198402405]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 11.0, 5.0, 9.0, 16.0, 13.0, 38.0, 47.0, 53.0, 75.0, 94.0, 142.0, 162.0, 253.0, 366.0, 606.0, 1045.0, 2434.0, 8622.0, 54260.0, 453817.0, 457413.0, 55196.0, 8452.0, 2416.0, 1081.0, 583.0, 343.0, 254.0, 188.0, 145.0, 97.0, 82.0, 62.0, 37.0, 31.0, 25.0, 20.0, 17.0, 10.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.73779296875, -0.716094970703125, -0.69439697265625, -0.672698974609375, -0.6510009765625, -0.629302978515625, -0.60760498046875, -0.585906982421875, -0.564208984375, -0.542510986328125, -0.52081298828125, -0.499114990234375, -0.4774169921875, -0.455718994140625, -0.43402099609375, -0.412322998046875, -0.390625, -0.368927001953125, -0.34722900390625, -0.325531005859375, -0.3038330078125, -0.282135009765625, -0.26043701171875, -0.238739013671875, -0.217041015625, -0.195343017578125, -0.17364501953125, -0.151947021484375, -0.1302490234375, -0.108551025390625, -0.08685302734375, -0.065155029296875, -0.04345703125, -0.021759033203125, -6.103515625e-05, 0.021636962890625, 0.0433349609375, 0.065032958984375, 0.08673095703125, 0.108428955078125, 0.130126953125, 0.151824951171875, 0.17352294921875, 0.195220947265625, 0.2169189453125, 0.238616943359375, 0.26031494140625, 0.282012939453125, 0.3037109375, 0.325408935546875, 0.34710693359375, 0.368804931640625, 0.3905029296875, 0.412200927734375, 0.43389892578125, 0.455596923828125, 0.477294921875, 0.498992919921875, 0.52069091796875, 0.542388916015625, 0.5640869140625, 0.585784912109375, 0.60748291015625, 0.629180908203125, 0.65087890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 12.0, 16.0, 33.0, 67.0, 113.0, 156.0, 170.0, 184.0, 122.0, 68.0, 37.0, 14.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1573486328125, -0.1509685516357422, -0.14458847045898438, -0.13820838928222656, -0.13182830810546875, -0.12544822692871094, -0.11906814575195312, -0.11268806457519531, -0.1063079833984375, -0.09992790222167969, -0.09354782104492188, -0.08716773986816406, -0.08078765869140625, -0.07440757751464844, -0.06802749633789062, -0.06164741516113281, -0.055267333984375, -0.04888725280761719, -0.042507171630859375, -0.03612709045410156, -0.02974700927734375, -0.023366928100585938, -0.016986846923828125, -0.010606765747070312, -0.0042266845703125, 0.0021533966064453125, 0.008533477783203125, 0.014913558959960938, 0.02129364013671875, 0.027673721313476562, 0.034053802490234375, 0.04043388366699219, 0.04681396484375, 0.05319404602050781, 0.059574127197265625, 0.06595420837402344, 0.07233428955078125, 0.07871437072753906, 0.08509445190429688, 0.09147453308105469, 0.0978546142578125, 0.10423469543457031, 0.11061477661132812, 0.11699485778808594, 0.12337493896484375, 0.12975502014160156, 0.13613510131835938, 0.1425151824951172, 0.148895263671875, 0.1552753448486328, 0.16165542602539062, 0.16803550720214844, 0.17441558837890625, 0.18079566955566406, 0.18717575073242188, 0.1935558319091797, 0.1999359130859375, 0.2063159942626953, 0.21269607543945312, 0.21907615661621094, 0.22545623779296875, 0.23183631896972656, 0.23821640014648438, 0.2445964813232422, 0.2509765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 9.0, 9.0, 6.0, 9.0, 6.0, 34.0, 31.0, 45.0, 71.0, 77.0, 155.0, 242.0, 357.0, 606.0, 1160.0, 2328.0, 5551.0, 15124.0, 53971.0, 245619.0, 499916.0, 165170.0, 37942.0, 11459.0, 4293.0, 1895.0, 957.0, 591.0, 306.0, 216.0, 108.0, 83.0, 59.0, 37.0, 34.0, 20.0, 21.0, 9.0, 14.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4706764221191406, -0.45282745361328125, -0.4349784851074219, -0.4171295166015625, -0.3992805480957031, -0.38143157958984375, -0.3635826110839844, -0.345733642578125, -0.3278846740722656, -0.31003570556640625, -0.2921867370605469, -0.2743377685546875, -0.2564888000488281, -0.23863983154296875, -0.22079086303710938, -0.20294189453125, -0.18509292602539062, -0.16724395751953125, -0.14939498901367188, -0.1315460205078125, -0.11369705200195312, -0.09584808349609375, -0.07799911499023438, -0.060150146484375, -0.042301177978515625, -0.02445220947265625, -0.006603240966796875, 0.0112457275390625, 0.029094696044921875, 0.04694366455078125, 0.06479263305664062, 0.0826416015625, 0.10049057006835938, 0.11833953857421875, 0.13618850708007812, 0.1540374755859375, 0.17188644409179688, 0.18973541259765625, 0.20758438110351562, 0.225433349609375, 0.24328231811523438, 0.26113128662109375, 0.2789802551269531, 0.2968292236328125, 0.3146781921386719, 0.33252716064453125, 0.3503761291503906, 0.36822509765625, 0.3860740661621094, 0.40392303466796875, 0.4217720031738281, 0.4396209716796875, 0.4574699401855469, 0.47531890869140625, 0.4931678771972656, 0.511016845703125, 0.5288658142089844, 0.5467147827148438, 0.5645637512207031, 0.5824127197265625, 0.6002616882324219, 0.6181106567382812, 0.6359596252441406, 0.65380859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 13.0, 9.0, 11.0, 15.0, 18.0, 16.0, 25.0, 41.0, 35.0, 20.0, 33.0, 43.0, 36.0, 50.0, 38.0, 32.0, 52.0, 57.0, 56.0, 47.0, 43.0, 45.0, 44.0, 31.0, 31.0, 27.0, 23.0, 13.0, 14.0, 19.0, 16.0, 12.0, 5.0, 8.0, 5.0, 3.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4541015625, -0.4398651123046875, -0.425628662109375, -0.4113922119140625, -0.39715576171875, -0.3829193115234375, -0.368682861328125, -0.3544464111328125, -0.3402099609375, -0.3259735107421875, -0.311737060546875, -0.2975006103515625, -0.28326416015625, -0.2690277099609375, -0.254791259765625, -0.2405548095703125, -0.226318359375, -0.2120819091796875, -0.197845458984375, -0.1836090087890625, -0.16937255859375, -0.1551361083984375, -0.140899658203125, -0.1266632080078125, -0.1124267578125, -0.0981903076171875, -0.083953857421875, -0.0697174072265625, -0.05548095703125, -0.0412445068359375, -0.027008056640625, -0.0127716064453125, 0.00146484375, 0.0157012939453125, 0.029937744140625, 0.0441741943359375, 0.05841064453125, 0.0726470947265625, 0.086883544921875, 0.1011199951171875, 0.1153564453125, 0.1295928955078125, 0.143829345703125, 0.1580657958984375, 0.17230224609375, 0.1865386962890625, 0.200775146484375, 0.2150115966796875, 0.229248046875, 0.2434844970703125, 0.257720947265625, 0.2719573974609375, 0.28619384765625, 0.3004302978515625, 0.314666748046875, 0.3289031982421875, 0.3431396484375, 0.3573760986328125, 0.371612548828125, 0.3858489990234375, 0.40008544921875, 0.4143218994140625, 0.428558349609375, 0.4427947998046875, 0.45703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 15.0, 10.0, 14.0, 25.0, 47.0, 53.0, 86.0, 154.0, 299.0, 593.0, 1269.0, 3610.0, 15436.0, 126273.0, 730828.0, 146482.0, 16734.0, 3921.0, 1377.0, 623.0, 292.0, 139.0, 78.0, 64.0, 32.0, 24.0, 16.0, 13.0, 13.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.31511688232421875, -0.3047943115234375, -0.29447174072265625, -0.284149169921875, -0.27382659912109375, -0.2635040283203125, -0.25318145751953125, -0.24285888671875, -0.23253631591796875, -0.2222137451171875, -0.21189117431640625, -0.201568603515625, -0.19124603271484375, -0.1809234619140625, -0.17060089111328125, -0.1602783203125, -0.14995574951171875, -0.1396331787109375, -0.12931060791015625, -0.118988037109375, -0.10866546630859375, -0.0983428955078125, -0.08802032470703125, -0.07769775390625, -0.06737518310546875, -0.0570526123046875, -0.04673004150390625, -0.036407470703125, -0.02608489990234375, -0.0157623291015625, -0.00543975830078125, 0.0048828125, 0.01520538330078125, 0.0255279541015625, 0.03585052490234375, 0.046173095703125, 0.05649566650390625, 0.0668182373046875, 0.07714080810546875, 0.08746337890625, 0.09778594970703125, 0.1081085205078125, 0.11843109130859375, 0.128753662109375, 0.13907623291015625, 0.1493988037109375, 0.15972137451171875, 0.1700439453125, 0.18036651611328125, 0.1906890869140625, 0.20101165771484375, 0.211334228515625, 0.22165679931640625, 0.2319793701171875, 0.24230194091796875, 0.25262451171875, 0.26294708251953125, 0.2732696533203125, 0.28359222412109375, 0.293914794921875, 0.30423736572265625, 0.3145599365234375, 0.32488250732421875, 0.335205078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 12.0, 9.0, 22.0, 33.0, 39.0, 54.0, 61.0, 76.0, 93.0, 89.0, 100.0, 82.0, 77.0, 66.0, 34.0, 42.0, 33.0, 21.0, 6.0, 16.0, 6.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.774332046508789e-05, -4.6552158892154694e-05, -4.5360997319221497e-05, -4.41698357462883e-05, -4.29786741733551e-05, -4.1787512600421906e-05, -4.059635102748871e-05, -3.940518945455551e-05, -3.8214027881622314e-05, -3.702286630868912e-05, -3.583170473575592e-05, -3.4640543162822723e-05, -3.3449381589889526e-05, -3.225822001695633e-05, -3.106705844402313e-05, -2.9875896871089935e-05, -2.8684735298156738e-05, -2.749357372522354e-05, -2.6302412152290344e-05, -2.5111250579357147e-05, -2.392008900642395e-05, -2.2728927433490753e-05, -2.1537765860557556e-05, -2.034660428762436e-05, -1.9155442714691162e-05, -1.7964281141757965e-05, -1.6773119568824768e-05, -1.558195799589157e-05, -1.4390796422958374e-05, -1.3199634850025177e-05, -1.200847327709198e-05, -1.0817311704158783e-05, -9.626150131225586e-06, -8.434988558292389e-06, -7.243826985359192e-06, -6.052665412425995e-06, -4.861503839492798e-06, -3.670342266559601e-06, -2.479180693626404e-06, -1.2880191206932068e-06, -9.685754776000977e-08, 1.0943040251731873e-06, 2.2854655981063843e-06, 3.4766271710395813e-06, 4.667788743972778e-06, 5.858950316905975e-06, 7.050111889839172e-06, 8.24127346277237e-06, 9.432435035705566e-06, 1.0623596608638763e-05, 1.181475818157196e-05, 1.3005919754505157e-05, 1.4197081327438354e-05, 1.538824290037155e-05, 1.657940447330475e-05, 1.7770566046237946e-05, 1.8961727619171143e-05, 2.015288919210434e-05, 2.1344050765037537e-05, 2.2535212337970734e-05, 2.372637391090393e-05, 2.4917535483837128e-05, 2.6108697056770325e-05, 2.7299858629703522e-05, 2.849102020263672e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 5.0, 1.0, 4.0, 9.0, 4.0, 9.0, 18.0, 26.0, 32.0, 27.0, 64.0, 101.0, 125.0, 216.0, 357.0, 631.0, 1212.0, 2698.0, 7270.0, 26442.0, 145265.0, 574689.0, 233724.0, 38927.0, 9995.0, 3412.0, 1459.0, 703.0, 418.0, 219.0, 165.0, 98.0, 64.0, 43.0, 31.0, 26.0, 18.0, 16.0, 7.0, 8.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1976318359375, -0.18992042541503906, -0.18220901489257812, -0.1744976043701172, -0.16678619384765625, -0.1590747833251953, -0.15136337280273438, -0.14365196228027344, -0.1359405517578125, -0.12822914123535156, -0.12051773071289062, -0.11280632019042969, -0.10509490966796875, -0.09738349914550781, -0.08967208862304688, -0.08196067810058594, -0.074249267578125, -0.06653785705566406, -0.058826446533203125, -0.05111503601074219, -0.04340362548828125, -0.03569221496582031, -0.027980804443359375, -0.020269393920898438, -0.0125579833984375, -0.0048465728759765625, 0.002864837646484375, 0.010576248168945312, 0.01828765869140625, 0.025999069213867188, 0.033710479736328125, 0.04142189025878906, 0.04913330078125, 0.05684471130371094, 0.06455612182617188, 0.07226753234863281, 0.07997894287109375, 0.08769035339355469, 0.09540176391601562, 0.10311317443847656, 0.1108245849609375, 0.11853599548339844, 0.12624740600585938, 0.1339588165283203, 0.14167022705078125, 0.1493816375732422, 0.15709304809570312, 0.16480445861816406, 0.172515869140625, 0.18022727966308594, 0.18793869018554688, 0.1956501007080078, 0.20336151123046875, 0.2110729217529297, 0.21878433227539062, 0.22649574279785156, 0.2342071533203125, 0.24191856384277344, 0.24962997436523438, 0.2573413848876953, 0.26505279541015625, 0.2727642059326172, 0.2804756164550781, 0.28818702697753906, 0.2958984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 12.0, 23.0, 27.0, 49.0, 57.0, 59.0, 79.0, 102.0, 129.0, 111.0, 80.0, 72.0, 55.0, 40.0, 32.0, 21.0, 6.0, 10.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2242431640625, -0.21547889709472656, -0.20671463012695312, -0.1979503631591797, -0.18918609619140625, -0.1804218292236328, -0.17165756225585938, -0.16289329528808594, -0.1541290283203125, -0.14536476135253906, -0.13660049438476562, -0.1278362274169922, -0.11907196044921875, -0.11030769348144531, -0.10154342651367188, -0.09277915954589844, -0.084014892578125, -0.07525062561035156, -0.06648635864257812, -0.05772209167480469, -0.04895782470703125, -0.04019355773925781, -0.031429290771484375, -0.022665023803710938, -0.0139007568359375, -0.0051364898681640625, 0.003627777099609375, 0.012392044067382812, 0.02115631103515625, 0.029920578002929688, 0.038684844970703125, 0.04744911193847656, 0.05621337890625, 0.06497764587402344, 0.07374191284179688, 0.08250617980957031, 0.09127044677734375, 0.10003471374511719, 0.10879898071289062, 0.11756324768066406, 0.1263275146484375, 0.13509178161621094, 0.14385604858398438, 0.1526203155517578, 0.16138458251953125, 0.1701488494873047, 0.17891311645507812, 0.18767738342285156, 0.196441650390625, 0.20520591735839844, 0.21397018432617188, 0.2227344512939453, 0.23149871826171875, 0.2402629852294922, 0.24902725219726562, 0.25779151916503906, 0.2665557861328125, 0.27532005310058594, 0.2840843200683594, 0.2928485870361328, 0.30161285400390625, 0.3103771209716797, 0.3191413879394531, 0.32790565490722656, 0.336669921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 10.0, 22.0, 37.0, 95.0, 183.0, 268.0, 188.0, 103.0, 48.0, 28.0, 14.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2716193199157715, -7.101199626922607, -6.930779933929443, -6.7603607177734375, -6.589941024780273, -6.419521331787109, -6.249101638793945, -6.078681945800781, -5.908262252807617, -5.737842559814453, -5.567422866821289, -5.397003173828125, -5.226583957672119, -5.056164264678955, -4.885744571685791, -4.715324878692627, -4.544905662536621, -4.374485969543457, -4.204066276550293, -4.033646583557129, -3.863227128982544, -3.692807674407959, -3.522387981414795, -3.351968288421631, -3.181548595428467, -3.0111289024353027, -2.8407094478607178, -2.6702897548675537, -2.4998700618743896, -2.3294506072998047, -2.1590309143066406, -1.9886112213134766, -1.8181915283203125, -1.647771954536438, -1.477352261543274, -1.3069326877593994, -1.1365129947662354, -0.9660934209823608, -0.7956738471984863, -0.6252541542053223, -0.45483458042144775, -0.28441494703292847, -0.11399534344673157, 0.05642426013946533, 0.22684389352798462, 0.3972635269165039, 0.5676831007003784, 0.7381027936935425, 0.908522367477417, 1.0789419412612915, 1.2493616342544556, 1.41978120803833, 1.5902009010314941, 1.7606204748153687, 1.9310400485992432, 2.1014597415924072, 2.271879196166992, 2.4422988891601562, 2.612718343734741, 2.7831380367279053, 2.9535577297210693, 3.1239771842956543, 3.2943968772888184, 3.4648165702819824, 3.6352362632751465]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 3.0, 10.0, 6.0, 5.0, 11.0, 18.0, 17.0, 13.0, 19.0, 19.0, 26.0, 27.0, 29.0, 35.0, 34.0, 46.0, 43.0, 37.0, 62.0, 49.0, 50.0, 50.0, 33.0, 53.0, 39.0, 52.0, 35.0, 24.0, 22.0, 25.0, 11.0, 16.0, 12.0, 12.0, 21.0, 12.0, 4.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.7066590785980225, -2.630539655685425, -2.554420232772827, -2.4783008098602295, -2.402181625366211, -2.3260622024536133, -2.2499427795410156, -2.173823356628418, -2.0977039337158203, -2.0215845108032227, -1.945465087890625, -1.869345784187317, -1.7932263612747192, -1.7171069383621216, -1.6409876346588135, -1.5648682117462158, -1.4887487888336182, -1.4126293659210205, -1.3365099430084229, -1.2603906393051147, -1.184271216392517, -1.1081517934799194, -1.0320324897766113, -0.9559130668640137, -0.879793643951416, -0.8036742210388184, -0.7275548577308655, -0.6514354944229126, -0.5753160715103149, -0.4991966784000397, -0.4230772852897644, -0.3469579219818115, -0.27083826065063477, -0.1947188675403595, -0.11859947443008423, -0.04248008131980896, 0.03363931179046631, 0.10975870490074158, 0.18587809801101685, 0.2619974613189697, 0.3381168842315674, 0.41423627734184265, 0.4903556704521179, 0.5664750337600708, 0.6425944566726685, 0.7187138795852661, 0.794833242893219, 0.8709526062011719, 0.9470720291137695, 1.0231914520263672, 1.0993108749389648, 1.175430178642273, 1.2515496015548706, 1.3276690244674683, 1.4037883281707764, 1.479907751083374, 1.5560271739959717, 1.6321465969085693, 1.708266019821167, 1.784385323524475, 1.8605047464370728, 1.9366241693496704, 2.0127434730529785, 2.088862895965576, 2.164982318878174]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 18.0, 39.0, 67.0, 172.0, 457.0, 1598.0, 10740.0, 680571.0, 3482359.0, 15033.0, 2047.0, 594.0, 238.0, 131.0, 69.0, 31.0, 34.0, 22.0, 15.0, 6.0, 7.0, 5.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8865127563476562, -0.8496856689453125, -0.8128585815429688, -0.776031494140625, -0.7392044067382812, -0.7023773193359375, -0.6655502319335938, -0.62872314453125, -0.5918960571289062, -0.5550689697265625, -0.5182418823242188, -0.481414794921875, -0.44458770751953125, -0.4077606201171875, -0.37093353271484375, -0.3341064453125, -0.29727935791015625, -0.2604522705078125, -0.22362518310546875, -0.186798095703125, -0.14997100830078125, -0.1131439208984375, -0.07631683349609375, -0.03948974609375, -0.00266265869140625, 0.0341644287109375, 0.07099151611328125, 0.107818603515625, 0.14464569091796875, 0.1814727783203125, 0.21829986572265625, 0.255126953125, 0.29195404052734375, 0.3287811279296875, 0.36560821533203125, 0.402435302734375, 0.43926239013671875, 0.4760894775390625, 0.5129165649414062, 0.54974365234375, 0.5865707397460938, 0.6233978271484375, 0.6602249145507812, 0.697052001953125, 0.7338790893554688, 0.7707061767578125, 0.8075332641601562, 0.8443603515625, 0.8811874389648438, 0.9180145263671875, 0.9548416137695312, 0.991668701171875, 1.0284957885742188, 1.0653228759765625, 1.1021499633789062, 1.13897705078125, 1.1758041381835938, 1.2126312255859375, 1.2494583129882812, 1.286285400390625, 1.3231124877929688, 1.3599395751953125, 1.3967666625976562, 1.43359375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 10.0, 29.0, 38.0, 77.0, 93.0, 163.0, 160.0, 135.0, 138.0, 67.0, 46.0, 22.0, 10.0, 9.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1629638671875, -0.1563396453857422, -0.14971542358398438, -0.14309120178222656, -0.13646697998046875, -0.12984275817871094, -0.12321853637695312, -0.11659431457519531, -0.1099700927734375, -0.10334587097167969, -0.09672164916992188, -0.09009742736816406, -0.08347320556640625, -0.07684898376464844, -0.07022476196289062, -0.06360054016113281, -0.056976318359375, -0.05035209655761719, -0.043727874755859375, -0.03710365295410156, -0.03047943115234375, -0.023855209350585938, -0.017230987548828125, -0.010606765747070312, -0.0039825439453125, 0.0026416778564453125, 0.009265899658203125, 0.015890121459960938, 0.02251434326171875, 0.029138565063476562, 0.035762786865234375, 0.04238700866699219, 0.04901123046875, 0.05563545227050781, 0.062259674072265625, 0.06888389587402344, 0.07550811767578125, 0.08213233947753906, 0.08875656127929688, 0.09538078308105469, 0.1020050048828125, 0.10862922668457031, 0.11525344848632812, 0.12187767028808594, 0.12850189208984375, 0.13512611389160156, 0.14175033569335938, 0.1483745574951172, 0.154998779296875, 0.1616230010986328, 0.16824722290039062, 0.17487144470214844, 0.18149566650390625, 0.18811988830566406, 0.19474411010742188, 0.2013683319091797, 0.2079925537109375, 0.2146167755126953, 0.22124099731445312, 0.22786521911621094, 0.23448944091796875, 0.24111366271972656, 0.24773788452148438, 0.2543621063232422, 0.260986328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 5.0, 14.0, 12.0, 17.0, 40.0, 59.0, 127.0, 240.0, 479.0, 1293.0, 3734.0, 16706.0, 156925.0, 3748292.0, 238946.0, 20385.0, 4358.0, 1461.0, 590.0, 285.0, 140.0, 71.0, 37.0, 26.0, 12.0, 7.0, 10.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69482421875, -0.6728134155273438, -0.6508026123046875, -0.6287918090820312, -0.606781005859375, -0.5847702026367188, -0.5627593994140625, -0.5407485961914062, -0.51873779296875, -0.49672698974609375, -0.4747161865234375, -0.45270538330078125, -0.430694580078125, -0.40868377685546875, -0.3866729736328125, -0.36466217041015625, -0.3426513671875, -0.32064056396484375, -0.2986297607421875, -0.27661895751953125, -0.254608154296875, -0.23259735107421875, -0.2105865478515625, -0.18857574462890625, -0.16656494140625, -0.14455413818359375, -0.1225433349609375, -0.10053253173828125, -0.078521728515625, -0.05651092529296875, -0.0345001220703125, -0.01248931884765625, 0.009521484375, 0.03153228759765625, 0.0535430908203125, 0.07555389404296875, 0.097564697265625, 0.11957550048828125, 0.1415863037109375, 0.16359710693359375, 0.18560791015625, 0.20761871337890625, 0.2296295166015625, 0.25164031982421875, 0.273651123046875, 0.29566192626953125, 0.3176727294921875, 0.33968353271484375, 0.3616943359375, 0.38370513916015625, 0.4057159423828125, 0.42772674560546875, 0.449737548828125, 0.47174835205078125, 0.4937591552734375, 0.5157699584960938, 0.53778076171875, 0.5597915649414062, 0.5818023681640625, 0.6038131713867188, 0.625823974609375, 0.6478347778320312, 0.6698455810546875, 0.6918563842773438, 0.7138671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 18.0, 19.0, 32.0, 51.0, 76.0, 181.0, 342.0, 886.0, 1520.0, 473.0, 191.0, 110.0, 64.0, 34.0, 17.0, 16.0, 9.0, 7.0, 4.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.1854076385498047, -0.17965316772460938, -0.17389869689941406, -0.16814422607421875, -0.16238975524902344, -0.15663528442382812, -0.1508808135986328, -0.1451263427734375, -0.1393718719482422, -0.13361740112304688, -0.12786293029785156, -0.12210845947265625, -0.11635398864746094, -0.11059951782226562, -0.10484504699707031, -0.099090576171875, -0.09333610534667969, -0.08758163452148438, -0.08182716369628906, -0.07607269287109375, -0.07031822204589844, -0.06456375122070312, -0.05880928039550781, -0.0530548095703125, -0.04730033874511719, -0.041545867919921875, -0.03579139709472656, -0.03003692626953125, -0.024282455444335938, -0.018527984619140625, -0.012773513793945312, -0.00701904296875, -0.0012645721435546875, 0.004489898681640625, 0.010244369506835938, 0.01599884033203125, 0.021753311157226562, 0.027507781982421875, 0.03326225280761719, 0.0390167236328125, 0.04477119445800781, 0.050525665283203125, 0.05628013610839844, 0.06203460693359375, 0.06778907775878906, 0.07354354858398438, 0.07929801940917969, 0.085052490234375, 0.09080696105957031, 0.09656143188476562, 0.10231590270996094, 0.10807037353515625, 0.11382484436035156, 0.11957931518554688, 0.1253337860107422, 0.1310882568359375, 0.1368427276611328, 0.14259719848632812, 0.14835166931152344, 0.15410614013671875, 0.15986061096191406, 0.16561508178710938, 0.1713695526123047, 0.1771240234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 13.0, 67.0, 213.0, 362.0, 243.0, 72.0, 24.0, 3.0, 4.0, 1.0, 3.0], "bins": [-3.4961936473846436, -3.4345080852508545, -3.3728227615356445, -3.3111371994018555, -3.2494516372680664, -3.1877663135528564, -3.1260807514190674, -3.0643951892852783, -3.0027098655700684, -2.9410243034362793, -2.8793389797210693, -2.8176534175872803, -2.755967855453491, -2.6942825317382812, -2.632596969604492, -2.570911407470703, -2.509225845336914, -2.447540283203125, -2.385854959487915, -2.324169397354126, -2.262483835220337, -2.200798511505127, -2.139112949371338, -2.077427387237549, -2.015742063522339, -1.9540566205978394, -1.8923710584640503, -1.8306856155395508, -1.7690001726150513, -1.7073147296905518, -1.6456291675567627, -1.5839437246322632, -1.5222581624984741, -1.4605727195739746, -1.3988871574401855, -1.337201714515686, -1.2755162715911865, -1.2138307094573975, -1.152145266532898, -1.0904598236083984, -1.0287742614746094, -0.9670887589454651, -0.9054033160209656, -0.8437178134918213, -0.7820323705673218, -0.7203468680381775, -0.6586613655090332, -0.5969759225845337, -0.5352904796600342, -0.4736050069332123, -0.4119195342063904, -0.3502340316772461, -0.2885485589504242, -0.2268630862236023, -0.165177583694458, -0.10349211096763611, -0.04180663824081421, 0.019878841936588287, 0.08156432211399078, 0.14324980974197388, 0.20493528246879578, 0.2666207551956177, 0.32830625772476196, 0.38999173045158386, 0.45167720317840576]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 10.0, 9.0, 12.0, 17.0, 11.0, 27.0, 35.0, 35.0, 33.0, 49.0, 43.0, 55.0, 49.0, 62.0, 62.0, 58.0, 67.0, 57.0, 45.0, 51.0, 52.0, 33.0, 29.0, 38.0, 20.0, 19.0, 12.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5984569787979126, -0.5785012245178223, -0.5585454702377319, -0.5385897159576416, -0.5186339616775513, -0.49867817759513855, -0.47872239351272583, -0.4587666392326355, -0.43881088495254517, -0.41885513067245483, -0.3988993763923645, -0.3789435923099518, -0.35898783802986145, -0.3390320837497711, -0.3190762996673584, -0.29912054538726807, -0.27916479110717773, -0.2592090368270874, -0.23925326764583588, -0.21929749846458435, -0.19934174418449402, -0.1793859899044037, -0.15943022072315216, -0.13947445154190063, -0.1195186972618103, -0.09956293553113937, -0.07960717380046844, -0.059651412069797516, -0.03969565033912659, -0.019739888608455658, 0.000215873122215271, 0.020171642303466797, 0.040127336978912354, 0.06008309870958328, 0.08003886044025421, 0.09999462217092514, 0.11995038390159607, 0.1399061381816864, 0.15986190736293793, 0.17981767654418945, 0.19977343082427979, 0.21972918510437012, 0.23968495428562164, 0.25964072346687317, 0.2795964777469635, 0.29955223202705383, 0.31950801610946655, 0.3394637703895569, 0.3594195246696472, 0.37937527894973755, 0.3993310332298279, 0.4192868173122406, 0.43924257159233093, 0.45919832587242126, 0.479154109954834, 0.4991098642349243, 0.5190656185150146, 0.539021372795105, 0.5589771270751953, 0.5789328813552856, 0.598888635635376, 0.6188444495201111, 0.6388002038002014, 0.6587559580802917, 0.6787117123603821]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 10.0, 9.0, 13.0, 21.0, 30.0, 41.0, 58.0, 87.0, 122.0, 160.0, 281.0, 419.0, 697.0, 1649.0, 5441.0, 29911.0, 259126.0, 628834.0, 102061.0, 13657.0, 3198.0, 1095.0, 553.0, 343.0, 232.0, 137.0, 99.0, 87.0, 53.0, 39.0, 19.0, 22.0, 12.0, 10.0, 13.0, 5.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5693359375, -0.5458984375, -0.5224609375, -0.4990234375, -0.4755859375, -0.4521484375, -0.4287109375, -0.4052734375, -0.3818359375, -0.3583984375, -0.3349609375, -0.3115234375, -0.2880859375, -0.2646484375, -0.2412109375, -0.2177734375, -0.1943359375, -0.1708984375, -0.1474609375, -0.1240234375, -0.1005859375, -0.0771484375, -0.0537109375, -0.0302734375, -0.0068359375, 0.0166015625, 0.0400390625, 0.0634765625, 0.0869140625, 0.1103515625, 0.1337890625, 0.1572265625, 0.1806640625, 0.2041015625, 0.2275390625, 0.2509765625, 0.2744140625, 0.2978515625, 0.3212890625, 0.3447265625, 0.3681640625, 0.3916015625, 0.4150390625, 0.4384765625, 0.4619140625, 0.4853515625, 0.5087890625, 0.5322265625, 0.5556640625, 0.5791015625, 0.6025390625, 0.6259765625, 0.6494140625, 0.6728515625, 0.6962890625, 0.7197265625, 0.7431640625, 0.7666015625, 0.7900390625, 0.8134765625, 0.8369140625, 0.8603515625, 0.8837890625, 0.9072265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 14.0, 24.0, 34.0, 63.0, 100.0, 134.0, 141.0, 157.0, 134.0, 92.0, 48.0, 34.0, 13.0, 9.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.15595054626464844, -0.14942550659179688, -0.1429004669189453, -0.13637542724609375, -0.1298503875732422, -0.12332534790039062, -0.11680030822753906, -0.1102752685546875, -0.10375022888183594, -0.09722518920898438, -0.09070014953613281, -0.08417510986328125, -0.07765007019042969, -0.07112503051757812, -0.06459999084472656, -0.058074951171875, -0.05154991149902344, -0.045024871826171875, -0.03849983215332031, -0.03197479248046875, -0.025449752807617188, -0.018924713134765625, -0.012399673461914062, -0.0058746337890625, 0.0006504058837890625, 0.007175445556640625, 0.013700485229492188, 0.02022552490234375, 0.026750564575195312, 0.033275604248046875, 0.03980064392089844, 0.04632568359375, 0.05285072326660156, 0.059375762939453125, 0.06590080261230469, 0.07242584228515625, 0.07895088195800781, 0.08547592163085938, 0.09200096130371094, 0.0985260009765625, 0.10505104064941406, 0.11157608032226562, 0.11810111999511719, 0.12462615966796875, 0.1311511993408203, 0.13767623901367188, 0.14420127868652344, 0.150726318359375, 0.15725135803222656, 0.16377639770507812, 0.1703014373779297, 0.17682647705078125, 0.1833515167236328, 0.18987655639648438, 0.19640159606933594, 0.2029266357421875, 0.20945167541503906, 0.21597671508789062, 0.2225017547607422, 0.22902679443359375, 0.2355518341064453, 0.24207687377929688, 0.24860191345214844, 0.255126953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 14.0, 6.0, 4.0, 18.0, 14.0, 27.0, 33.0, 58.0, 64.0, 118.0, 149.0, 266.0, 405.0, 697.0, 1224.0, 2572.0, 5955.0, 16560.0, 54385.0, 203580.0, 453103.0, 220104.0, 59051.0, 17697.0, 6460.0, 2703.0, 1345.0, 724.0, 418.0, 244.0, 159.0, 107.0, 86.0, 62.0, 38.0, 33.0, 15.0, 20.0, 9.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.430908203125, -0.4163169860839844, -0.40172576904296875, -0.3871345520019531, -0.3725433349609375, -0.3579521179199219, -0.34336090087890625, -0.3287696838378906, -0.314178466796875, -0.2995872497558594, -0.28499603271484375, -0.2704048156738281, -0.2558135986328125, -0.24122238159179688, -0.22663116455078125, -0.21203994750976562, -0.19744873046875, -0.18285751342773438, -0.16826629638671875, -0.15367507934570312, -0.1390838623046875, -0.12449264526367188, -0.10990142822265625, -0.09531021118164062, -0.080718994140625, -0.06612777709960938, -0.05153656005859375, -0.036945343017578125, -0.0223541259765625, -0.007762908935546875, 0.00682830810546875, 0.021419525146484375, 0.0360107421875, 0.050601959228515625, 0.06519317626953125, 0.07978439331054688, 0.0943756103515625, 0.10896682739257812, 0.12355804443359375, 0.13814926147460938, 0.152740478515625, 0.16733169555664062, 0.18192291259765625, 0.19651412963867188, 0.2111053466796875, 0.22569656372070312, 0.24028778076171875, 0.2548789978027344, 0.26947021484375, 0.2840614318847656, 0.29865264892578125, 0.3132438659667969, 0.3278350830078125, 0.3424263000488281, 0.35701751708984375, 0.3716087341308594, 0.386199951171875, 0.4007911682128906, 0.41538238525390625, 0.4299736022949219, 0.4445648193359375, 0.4591560363769531, 0.47374725341796875, 0.4883384704589844, 0.5029296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 8.0, 10.0, 11.0, 9.0, 15.0, 15.0, 17.0, 26.0, 30.0, 25.0, 38.0, 37.0, 36.0, 52.0, 42.0, 43.0, 55.0, 46.0, 46.0, 63.0, 45.0, 46.0, 29.0, 34.0, 29.0, 35.0, 34.0, 26.0, 16.0, 18.0, 15.0, 12.0, 11.0, 10.0, 3.0, 9.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.411407470703125, -0.39801025390625, -0.384613037109375, -0.3712158203125, -0.357818603515625, -0.34442138671875, -0.331024169921875, -0.317626953125, -0.304229736328125, -0.29083251953125, -0.277435302734375, -0.2640380859375, -0.250640869140625, -0.23724365234375, -0.223846435546875, -0.21044921875, -0.197052001953125, -0.18365478515625, -0.170257568359375, -0.1568603515625, -0.143463134765625, -0.13006591796875, -0.116668701171875, -0.103271484375, -0.089874267578125, -0.07647705078125, -0.063079833984375, -0.0496826171875, -0.036285400390625, -0.02288818359375, -0.009490966796875, 0.00390625, 0.017303466796875, 0.03070068359375, 0.044097900390625, 0.0574951171875, 0.070892333984375, 0.08428955078125, 0.097686767578125, 0.111083984375, 0.124481201171875, 0.13787841796875, 0.151275634765625, 0.1646728515625, 0.178070068359375, 0.19146728515625, 0.204864501953125, 0.21826171875, 0.231658935546875, 0.24505615234375, 0.258453369140625, 0.2718505859375, 0.285247802734375, 0.29864501953125, 0.312042236328125, 0.325439453125, 0.338836669921875, 0.35223388671875, 0.365631103515625, 0.3790283203125, 0.392425537109375, 0.40582275390625, 0.419219970703125, 0.4326171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 17.0, 19.0, 47.0, 77.0, 139.0, 330.0, 671.0, 1990.0, 8441.0, 84819.0, 796476.0, 140112.0, 11461.0, 2435.0, 793.0, 360.0, 159.0, 80.0, 40.0, 20.0, 17.0, 14.0, 11.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48974609375, -0.476715087890625, -0.46368408203125, -0.450653076171875, -0.4376220703125, -0.424591064453125, -0.41156005859375, -0.398529052734375, -0.385498046875, -0.372467041015625, -0.35943603515625, -0.346405029296875, -0.3333740234375, -0.320343017578125, -0.30731201171875, -0.294281005859375, -0.28125, -0.268218994140625, -0.25518798828125, -0.242156982421875, -0.2291259765625, -0.216094970703125, -0.20306396484375, -0.190032958984375, -0.177001953125, -0.163970947265625, -0.15093994140625, -0.137908935546875, -0.1248779296875, -0.111846923828125, -0.09881591796875, -0.085784912109375, -0.07275390625, -0.059722900390625, -0.04669189453125, -0.033660888671875, -0.0206298828125, -0.007598876953125, 0.00543212890625, 0.018463134765625, 0.031494140625, 0.044525146484375, 0.05755615234375, 0.070587158203125, 0.0836181640625, 0.096649169921875, 0.10968017578125, 0.122711181640625, 0.1357421875, 0.148773193359375, 0.16180419921875, 0.174835205078125, 0.1878662109375, 0.200897216796875, 0.21392822265625, 0.226959228515625, 0.239990234375, 0.253021240234375, 0.26605224609375, 0.279083251953125, 0.2921142578125, 0.305145263671875, 0.31817626953125, 0.331207275390625, 0.34423828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 5.0, 9.0, 13.0, 15.0, 29.0, 51.0, 67.0, 85.0, 122.0, 130.0, 127.0, 84.0, 67.0, 48.0, 36.0, 23.0, 23.0, 12.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.416704177856445e-05, -4.255678504705429e-05, -4.094652831554413e-05, -3.9336271584033966e-05, -3.7726014852523804e-05, -3.611575812101364e-05, -3.450550138950348e-05, -3.289524465799332e-05, -3.1284987926483154e-05, -2.9674731194972992e-05, -2.806447446346283e-05, -2.6454217731952667e-05, -2.4843961000442505e-05, -2.3233704268932343e-05, -2.162344753742218e-05, -2.0013190805912018e-05, -1.8402934074401855e-05, -1.6792677342891693e-05, -1.518242061138153e-05, -1.3572163879871368e-05, -1.1961907148361206e-05, -1.0351650416851044e-05, -8.741393685340881e-06, -7.131136953830719e-06, -5.520880222320557e-06, -3.910623490810394e-06, -2.300366759300232e-06, -6.901100277900696e-07, 9.201467037200928e-07, 2.530403435230255e-06, 4.1406601667404175e-06, 5.75091689825058e-06, 7.361173629760742e-06, 8.971430361270905e-06, 1.0581687092781067e-05, 1.219194382429123e-05, 1.3802200555801392e-05, 1.5412457287311554e-05, 1.7022714018821716e-05, 1.863297075033188e-05, 2.024322748184204e-05, 2.1853484213352203e-05, 2.3463740944862366e-05, 2.5073997676372528e-05, 2.668425440788269e-05, 2.8294511139392853e-05, 2.9904767870903015e-05, 3.151502460241318e-05, 3.312528133392334e-05, 3.47355380654335e-05, 3.6345794796943665e-05, 3.795605152845383e-05, 3.956630825996399e-05, 4.117656499147415e-05, 4.2786821722984314e-05, 4.4397078454494476e-05, 4.600733518600464e-05, 4.76175919175148e-05, 4.922784864902496e-05, 5.0838105380535126e-05, 5.244836211204529e-05, 5.405861884355545e-05, 5.566887557506561e-05, 5.7279132306575775e-05, 5.888938903808594e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 5.0, 13.0, 12.0, 33.0, 34.0, 54.0, 77.0, 113.0, 200.0, 363.0, 845.0, 2137.0, 7157.0, 38272.0, 399227.0, 535369.0, 51155.0, 8992.0, 2507.0, 942.0, 469.0, 221.0, 125.0, 84.0, 42.0, 32.0, 17.0, 16.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31982421875, -0.3080101013183594, -0.29619598388671875, -0.2843818664550781, -0.2725677490234375, -0.2607536315917969, -0.24893951416015625, -0.23712539672851562, -0.225311279296875, -0.21349716186523438, -0.20168304443359375, -0.18986892700195312, -0.1780548095703125, -0.16624069213867188, -0.15442657470703125, -0.14261245727539062, -0.13079833984375, -0.11898422241210938, -0.10717010498046875, -0.09535598754882812, -0.0835418701171875, -0.07172775268554688, -0.05991363525390625, -0.048099517822265625, -0.036285400390625, -0.024471282958984375, -0.01265716552734375, -0.000843048095703125, 0.0109710693359375, 0.022785186767578125, 0.03459930419921875, 0.046413421630859375, 0.0582275390625, 0.07004165649414062, 0.08185577392578125, 0.09366989135742188, 0.1054840087890625, 0.11729812622070312, 0.12911224365234375, 0.14092636108398438, 0.152740478515625, 0.16455459594726562, 0.17636871337890625, 0.18818283081054688, 0.1999969482421875, 0.21181106567382812, 0.22362518310546875, 0.23543930053710938, 0.24725341796875, 0.2590675354003906, 0.27088165283203125, 0.2826957702636719, 0.2945098876953125, 0.3063240051269531, 0.31813812255859375, 0.3299522399902344, 0.341766357421875, 0.3535804748535156, 0.36539459228515625, 0.3772087097167969, 0.3890228271484375, 0.4008369445800781, 0.41265106201171875, 0.4244651794433594, 0.436279296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 1.0, 9.0, 14.0, 21.0, 29.0, 34.0, 61.0, 84.0, 102.0, 146.0, 137.0, 114.0, 80.0, 59.0, 36.0, 26.0, 17.0, 16.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.2656059265136719, -0.25411224365234375, -0.24261856079101562, -0.2311248779296875, -0.21963119506835938, -0.20813751220703125, -0.19664382934570312, -0.185150146484375, -0.17365646362304688, -0.16216278076171875, -0.15066909790039062, -0.1391754150390625, -0.12768173217773438, -0.11618804931640625, -0.10469436645507812, -0.09320068359375, -0.08170700073242188, -0.07021331787109375, -0.058719635009765625, -0.0472259521484375, -0.035732269287109375, -0.02423858642578125, -0.012744903564453125, -0.001251220703125, 0.010242462158203125, 0.02173614501953125, 0.033229827880859375, 0.0447235107421875, 0.056217193603515625, 0.06771087646484375, 0.07920455932617188, 0.0906982421875, 0.10219192504882812, 0.11368560791015625, 0.12517929077148438, 0.1366729736328125, 0.14816665649414062, 0.15966033935546875, 0.17115402221679688, 0.182647705078125, 0.19414138793945312, 0.20563507080078125, 0.21712875366210938, 0.2286224365234375, 0.24011611938476562, 0.25160980224609375, 0.2631034851074219, 0.27459716796875, 0.2860908508300781, 0.29758453369140625, 0.3090782165527344, 0.3205718994140625, 0.3320655822753906, 0.34355926513671875, 0.3550529479980469, 0.366546630859375, 0.3780403137207031, 0.38953399658203125, 0.4010276794433594, 0.4125213623046875, 0.4240150451660156, 0.43550872802734375, 0.4470024108886719, 0.45849609375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 64.0, 375.0, 420.0, 102.0, 23.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.604852676391602, -7.226531028747559, -6.848209381103516, -6.469887733459473, -6.091566562652588, -5.713244915008545, -5.334923267364502, -4.956602096557617, -4.578280448913574, -4.199958801269531, -3.8216373920440674, -3.4433157444000244, -3.0649943351745605, -2.6866726875305176, -2.3083510398864746, -1.9300296306610107, -1.5517077445983887, -1.1733862161636353, -0.7950646281242371, -0.41674304008483887, -0.03842151165008545, 0.33990001678466797, 0.7182216644287109, 1.0965430736541748, 1.4748647212982178, 1.8531862497329712, 2.2315077781677246, 2.6098294258117676, 2.9881510734558105, 3.3664724826812744, 3.7447941303253174, 4.123115539550781, 4.501437187194824, 4.879758834838867, 5.25808048248291, 5.636402130126953, 6.014723300933838, 6.393044948577881, 6.771366596221924, 7.149687767028809, 7.528009414672852, 7.9063310623168945, 8.284652709960938, 8.66297435760498, 9.041296005249023, 9.41961669921875, 9.79793930053711, 10.176259994506836, 10.554582595825195, 10.932904243469238, 11.311225891113281, 11.689547538757324, 12.067869186401367, 12.446189880371094, 12.824512481689453, 13.20283317565918, 13.581154823303223, 13.959476470947266, 14.337798118591309, 14.716119766235352, 15.094441413879395, 15.472763061523438, 15.851083755493164, 16.229406356811523, 16.60772705078125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 9.0, 9.0, 8.0, 9.0, 24.0, 32.0, 24.0, 43.0, 39.0, 48.0, 54.0, 52.0, 57.0, 64.0, 56.0, 58.0, 54.0, 61.0, 49.0, 53.0, 39.0, 28.0, 32.0, 25.0, 19.0, 15.0, 10.0, 9.0, 3.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7594268321990967, -2.6691651344299316, -2.5789031982421875, -2.4886415004730225, -2.3983798027038574, -2.3081181049346924, -2.2178564071655273, -2.127594470977783, -2.037332773208618, -1.9470710754394531, -1.8568092584609985, -1.766547441482544, -1.676285743713379, -1.5860240459442139, -1.4957622289657593, -1.4055004119873047, -1.3152387142181396, -1.2249770164489746, -1.13471519947052, -1.0444533824920654, -0.9541916847229004, -0.8639299273490906, -0.7736681699752808, -0.683406412601471, -0.5931446552276611, -0.5028828978538513, -0.4126211404800415, -0.3223593831062317, -0.23209762573242188, -0.14183586835861206, -0.051574110984802246, 0.03868764638900757, 0.12894916534423828, 0.2192109227180481, 0.3094726800918579, 0.3997344374656677, 0.48999619483947754, 0.5802579522132874, 0.6705197095870972, 0.760781466960907, 0.8510432243347168, 0.9413049817085266, 1.0315667390823364, 1.121828556060791, 1.212090253829956, 1.302351951599121, 1.3926137685775757, 1.4828755855560303, 1.5731372833251953, 1.6633989810943604, 1.753660798072815, 1.8439226150512695, 1.9341843128204346, 2.0244460105895996, 2.1147079467773438, 2.204969644546509, 2.295231342315674, 2.385493040084839, 2.475754737854004, 2.566016674041748, 2.656278371810913, 2.746540069580078, 2.8368020057678223, 2.9270637035369873, 3.0173254013061523]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 11.0, 21.0, 21.0, 64.0, 125.0, 356.0, 1135.0, 7057.0, 209656.0, 3944151.0, 27219.0, 2925.0, 800.0, 317.0, 155.0, 88.0, 52.0, 44.0, 21.0, 21.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.0391998291015625, -0.996368408203125, -0.9535369873046875, -0.91070556640625, -0.8678741455078125, -0.825042724609375, -0.7822113037109375, -0.7393798828125, -0.6965484619140625, -0.653717041015625, -0.6108856201171875, -0.56805419921875, -0.5252227783203125, -0.482391357421875, -0.4395599365234375, -0.396728515625, -0.3538970947265625, -0.311065673828125, -0.2682342529296875, -0.22540283203125, -0.1825714111328125, -0.139739990234375, -0.0969085693359375, -0.0540771484375, -0.0112457275390625, 0.031585693359375, 0.0744171142578125, 0.11724853515625, 0.1600799560546875, 0.202911376953125, 0.2457427978515625, 0.28857421875, 0.3314056396484375, 0.374237060546875, 0.4170684814453125, 0.45989990234375, 0.5027313232421875, 0.545562744140625, 0.5883941650390625, 0.6312255859375, 0.6740570068359375, 0.716888427734375, 0.7597198486328125, 0.80255126953125, 0.8453826904296875, 0.888214111328125, 0.9310455322265625, 0.973876953125, 1.0167083740234375, 1.059539794921875, 1.1023712158203125, 1.14520263671875, 1.1880340576171875, 1.230865478515625, 1.2736968994140625, 1.3165283203125, 1.3593597412109375, 1.402191162109375, 1.4450225830078125, 1.48785400390625, 1.5306854248046875, 1.573516845703125, 1.6163482666015625, 1.6591796875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 11.0, 15.0, 50.0, 73.0, 114.0, 133.0, 167.0, 146.0, 116.0, 78.0, 40.0, 29.0, 18.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1712646484375, -0.16431236267089844, -0.15736007690429688, -0.1504077911376953, -0.14345550537109375, -0.1365032196044922, -0.12955093383789062, -0.12259864807128906, -0.1156463623046875, -0.10869407653808594, -0.10174179077148438, -0.09478950500488281, -0.08783721923828125, -0.08088493347167969, -0.07393264770507812, -0.06698036193847656, -0.060028076171875, -0.05307579040527344, -0.046123504638671875, -0.03917121887207031, -0.03221893310546875, -0.025266647338867188, -0.018314361572265625, -0.011362075805664062, -0.0044097900390625, 0.0025424957275390625, 0.009494781494140625, 0.016447067260742188, 0.02339935302734375, 0.030351638793945312, 0.037303924560546875, 0.04425621032714844, 0.05120849609375, 0.05816078186035156, 0.06511306762695312, 0.07206535339355469, 0.07901763916015625, 0.08596992492675781, 0.09292221069335938, 0.09987449645996094, 0.1068267822265625, 0.11377906799316406, 0.12073135375976562, 0.1276836395263672, 0.13463592529296875, 0.1415882110595703, 0.14854049682617188, 0.15549278259277344, 0.162445068359375, 0.16939735412597656, 0.17634963989257812, 0.1833019256591797, 0.19025421142578125, 0.1972064971923828, 0.20415878295898438, 0.21111106872558594, 0.2180633544921875, 0.22501564025878906, 0.23196792602539062, 0.2389202117919922, 0.24587249755859375, 0.2528247833251953, 0.2597770690917969, 0.26672935485839844, 0.273681640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 13.0, 7.0, 4.0, 20.0, 17.0, 29.0, 36.0, 63.0, 76.0, 148.0, 281.0, 465.0, 987.0, 2407.0, 6893.0, 26211.0, 229146.0, 3572443.0, 312442.0, 30299.0, 7311.0, 2599.0, 1079.0, 533.0, 303.0, 156.0, 86.0, 81.0, 42.0, 40.0, 27.0, 11.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5830078125, -0.5632781982421875, -0.543548583984375, -0.5238189697265625, -0.50408935546875, -0.4843597412109375, -0.464630126953125, -0.4449005126953125, -0.4251708984375, -0.4054412841796875, -0.385711669921875, -0.3659820556640625, -0.34625244140625, -0.3265228271484375, -0.306793212890625, -0.2870635986328125, -0.267333984375, -0.2476043701171875, -0.227874755859375, -0.2081451416015625, -0.18841552734375, -0.1686859130859375, -0.148956298828125, -0.1292266845703125, -0.1094970703125, -0.0897674560546875, -0.070037841796875, -0.0503082275390625, -0.03057861328125, -0.0108489990234375, 0.008880615234375, 0.0286102294921875, 0.04833984375, 0.0680694580078125, 0.087799072265625, 0.1075286865234375, 0.12725830078125, 0.1469879150390625, 0.166717529296875, 0.1864471435546875, 0.2061767578125, 0.2259063720703125, 0.245635986328125, 0.2653656005859375, 0.28509521484375, 0.3048248291015625, 0.324554443359375, 0.3442840576171875, 0.364013671875, 0.3837432861328125, 0.403472900390625, 0.4232025146484375, 0.44293212890625, 0.4626617431640625, 0.482391357421875, 0.5021209716796875, 0.5218505859375, 0.5415802001953125, 0.561309814453125, 0.5810394287109375, 0.60076904296875, 0.6204986572265625, 0.640228271484375, 0.6599578857421875, 0.6796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 7.0, 4.0, 7.0, 7.0, 15.0, 17.0, 32.0, 49.0, 75.0, 165.0, 345.0, 857.0, 1386.0, 558.0, 252.0, 128.0, 65.0, 33.0, 20.0, 17.0, 14.0, 5.0, 8.0, 1.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2369384765625, -0.22757530212402344, -0.21821212768554688, -0.2088489532470703, -0.19948577880859375, -0.1901226043701172, -0.18075942993164062, -0.17139625549316406, -0.1620330810546875, -0.15266990661621094, -0.14330673217773438, -0.1339435577392578, -0.12458038330078125, -0.11521720886230469, -0.10585403442382812, -0.09649085998535156, -0.087127685546875, -0.07776451110839844, -0.06840133666992188, -0.05903816223144531, -0.04967498779296875, -0.04031181335449219, -0.030948638916015625, -0.021585464477539062, -0.0122222900390625, -0.0028591156005859375, 0.006504058837890625, 0.015867233276367188, 0.02523040771484375, 0.03459358215332031, 0.043956756591796875, 0.05331993103027344, 0.06268310546875, 0.07204627990722656, 0.08140945434570312, 0.09077262878417969, 0.10013580322265625, 0.10949897766113281, 0.11886215209960938, 0.12822532653808594, 0.1375885009765625, 0.14695167541503906, 0.15631484985351562, 0.1656780242919922, 0.17504119873046875, 0.1844043731689453, 0.19376754760742188, 0.20313072204589844, 0.212493896484375, 0.22185707092285156, 0.23122024536132812, 0.2405834197998047, 0.24994659423828125, 0.2593097686767578, 0.2686729431152344, 0.27803611755371094, 0.2873992919921875, 0.29676246643066406, 0.3061256408691406, 0.3154888153076172, 0.32485198974609375, 0.3342151641845703, 0.3435783386230469, 0.35294151306152344, 0.3623046875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 20.0, 45.0, 121.0, 239.0, 291.0, 163.0, 81.0, 24.0, 8.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.337876319885254, -2.2604382038116455, -2.183000326156616, -2.105562210083008, -2.0281243324279785, -1.9506863355636597, -1.8732483386993408, -1.7958102226257324, -1.7183723449707031, -1.6409343481063843, -1.5634963512420654, -1.4860583543777466, -1.4086203575134277, -1.3311823606491089, -1.25374436378479, -1.1763062477111816, -1.0988682508468628, -1.021430253982544, -0.9439922571182251, -0.8665542602539062, -0.7891162633895874, -0.7116782665252686, -0.6342402100563049, -0.5568022131919861, -0.47936421632766724, -0.4019262194633484, -0.32448822259902954, -0.2470501959323883, -0.16961219906806946, -0.09217420220375061, -0.014736175537109375, 0.06270182132720947, 0.14013981819152832, 0.21757781505584717, 0.295015811920166, 0.37245383858680725, 0.4498918354511261, 0.5273298025131226, 0.6047678589820862, 0.682205855846405, 0.7596438527107239, 0.8370818495750427, 0.9145198464393616, 0.9919579029083252, 1.069395899772644, 1.146833896636963, 1.2242718935012817, 1.3017098903656006, 1.3791478872299194, 1.4565858840942383, 1.5340238809585571, 1.611461877822876, 1.6888998746871948, 1.7663378715515137, 1.843775987625122, 1.9212138652801514, 1.9986519813537598, 2.076090097427368, 2.1535279750823975, 2.230966091156006, 2.308403968811035, 2.3858420848846436, 2.463279962539673, 2.5407180786132812, 2.6181559562683105]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 1.0, 4.0, 11.0, 7.0, 12.0, 17.0, 18.0, 18.0, 19.0, 27.0, 28.0, 35.0, 41.0, 43.0, 42.0, 50.0, 43.0, 52.0, 48.0, 38.0, 46.0, 51.0, 40.0, 43.0, 32.0, 43.0, 38.0, 30.0, 22.0, 20.0, 24.0, 13.0, 7.0, 13.0, 6.0, 4.0, 0.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8928328156471252, -0.8664751648902893, -0.8401175141334534, -0.8137598633766174, -0.7874022126197815, -0.7610445618629456, -0.7346868515014648, -0.7083292007446289, -0.681971549987793, -0.655613899230957, -0.6292562484741211, -0.6028985977172852, -0.5765409469604492, -0.5501832962036133, -0.5238256454467773, -0.497467964887619, -0.47111034393310547, -0.44475269317626953, -0.4183950424194336, -0.39203739166259766, -0.3656797409057617, -0.3393220901489258, -0.31296440958976746, -0.2866067588329315, -0.2602491080760956, -0.23389145731925964, -0.2075338065624237, -0.18117614090442657, -0.15481849014759064, -0.1284608393907547, -0.10210317373275757, -0.07574552297592163, -0.04938781261444092, -0.023030158132314682, 0.003327496349811554, 0.02968515455722809, 0.056042805314064026, 0.08240045607089996, 0.1087581217288971, 0.13511577248573303, 0.16147342324256897, 0.1878310739994049, 0.21418872475624084, 0.24054639041423798, 0.2669040560722351, 0.29326170682907104, 0.319619357585907, 0.3459770083427429, 0.37233465909957886, 0.3986923098564148, 0.42504996061325073, 0.45140761137008667, 0.4777652621269226, 0.5041229128837585, 0.5304806232452393, 0.5568382740020752, 0.5831959247589111, 0.6095535755157471, 0.635911226272583, 0.662268877029419, 0.6886265277862549, 0.7149841785430908, 0.7413418292999268, 0.7676994800567627, 0.7940571308135986]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 14.0, 20.0, 21.0, 50.0, 53.0, 71.0, 113.0, 151.0, 238.0, 378.0, 592.0, 1202.0, 2972.0, 11372.0, 73599.0, 587786.0, 321872.0, 36751.0, 6747.0, 2104.0, 971.0, 486.0, 321.0, 186.0, 139.0, 89.0, 66.0, 35.0, 34.0, 36.0, 18.0, 9.0, 13.0, 6.0, 7.0, 4.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77978515625, -0.7544937133789062, -0.7292022705078125, -0.7039108276367188, -0.678619384765625, -0.6533279418945312, -0.6280364990234375, -0.6027450561523438, -0.57745361328125, -0.5521621704101562, -0.5268707275390625, -0.5015792846679688, -0.476287841796875, -0.45099639892578125, -0.4257049560546875, -0.40041351318359375, -0.3751220703125, -0.34983062744140625, -0.3245391845703125, -0.29924774169921875, -0.273956298828125, -0.24866485595703125, -0.2233734130859375, -0.19808197021484375, -0.17279052734375, -0.14749908447265625, -0.1222076416015625, -0.09691619873046875, -0.071624755859375, -0.04633331298828125, -0.0210418701171875, 0.00424957275390625, 0.029541015625, 0.05483245849609375, 0.0801239013671875, 0.10541534423828125, 0.130706787109375, 0.15599822998046875, 0.1812896728515625, 0.20658111572265625, 0.23187255859375, 0.25716400146484375, 0.2824554443359375, 0.30774688720703125, 0.333038330078125, 0.35832977294921875, 0.3836212158203125, 0.40891265869140625, 0.4342041015625, 0.45949554443359375, 0.4847869873046875, 0.5100784301757812, 0.535369873046875, 0.5606613159179688, 0.5859527587890625, 0.6112442016601562, 0.63653564453125, 0.6618270874023438, 0.6871185302734375, 0.7124099731445312, 0.737701416015625, 0.7629928588867188, 0.7882843017578125, 0.8135757446289062, 0.8388671875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 12.0, 17.0, 52.0, 63.0, 83.0, 134.0, 145.0, 155.0, 121.0, 100.0, 53.0, 32.0, 17.0, 11.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.15865325927734375, -0.1520233154296875, -0.14539337158203125, -0.138763427734375, -0.13213348388671875, -0.1255035400390625, -0.11887359619140625, -0.11224365234375, -0.10561370849609375, -0.0989837646484375, -0.09235382080078125, -0.085723876953125, -0.07909393310546875, -0.0724639892578125, -0.06583404541015625, -0.0592041015625, -0.05257415771484375, -0.0459442138671875, -0.03931427001953125, -0.032684326171875, -0.02605438232421875, -0.0194244384765625, -0.01279449462890625, -0.00616455078125, 0.00046539306640625, 0.0070953369140625, 0.01372528076171875, 0.020355224609375, 0.02698516845703125, 0.0336151123046875, 0.04024505615234375, 0.046875, 0.05350494384765625, 0.0601348876953125, 0.06676483154296875, 0.073394775390625, 0.08002471923828125, 0.0866546630859375, 0.09328460693359375, 0.09991455078125, 0.10654449462890625, 0.1131744384765625, 0.11980438232421875, 0.126434326171875, 0.13306427001953125, 0.1396942138671875, 0.14632415771484375, 0.1529541015625, 0.15958404541015625, 0.1662139892578125, 0.17284393310546875, 0.179473876953125, 0.18610382080078125, 0.1927337646484375, 0.19936370849609375, 0.20599365234375, 0.21262359619140625, 0.2192535400390625, 0.22588348388671875, 0.232513427734375, 0.23914337158203125, 0.2457733154296875, 0.25240325927734375, 0.259033203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 10.0, 10.0, 10.0, 15.0, 17.0, 49.0, 57.0, 86.0, 150.0, 252.0, 401.0, 712.0, 1464.0, 3159.0, 7810.0, 24275.0, 99876.0, 442132.0, 359652.0, 76800.0, 19583.0, 6523.0, 2669.0, 1243.0, 571.0, 379.0, 239.0, 140.0, 81.0, 62.0, 35.0, 26.0, 13.0, 16.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51220703125, -0.49385833740234375, -0.4755096435546875, -0.45716094970703125, -0.438812255859375, -0.42046356201171875, -0.4021148681640625, -0.38376617431640625, -0.36541748046875, -0.34706878662109375, -0.3287200927734375, -0.31037139892578125, -0.292022705078125, -0.27367401123046875, -0.2553253173828125, -0.23697662353515625, -0.2186279296875, -0.20027923583984375, -0.1819305419921875, -0.16358184814453125, -0.145233154296875, -0.12688446044921875, -0.1085357666015625, -0.09018707275390625, -0.07183837890625, -0.05348968505859375, -0.0351409912109375, -0.01679229736328125, 0.001556396484375, 0.01990509033203125, 0.0382537841796875, 0.05660247802734375, 0.074951171875, 0.09329986572265625, 0.1116485595703125, 0.12999725341796875, 0.148345947265625, 0.16669464111328125, 0.1850433349609375, 0.20339202880859375, 0.22174072265625, 0.24008941650390625, 0.2584381103515625, 0.27678680419921875, 0.295135498046875, 0.31348419189453125, 0.3318328857421875, 0.35018157958984375, 0.3685302734375, 0.38687896728515625, 0.4052276611328125, 0.42357635498046875, 0.441925048828125, 0.46027374267578125, 0.4786224365234375, 0.49697113037109375, 0.51531982421875, 0.5336685180664062, 0.5520172119140625, 0.5703659057617188, 0.588714599609375, 0.6070632934570312, 0.6254119873046875, 0.6437606811523438, 0.662109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 10.0, 8.0, 11.0, 17.0, 27.0, 23.0, 36.0, 28.0, 34.0, 36.0, 48.0, 53.0, 51.0, 49.0, 50.0, 46.0, 63.0, 46.0, 45.0, 44.0, 29.0, 29.0, 37.0, 39.0, 28.0, 12.0, 18.0, 11.0, 8.0, 14.0, 7.0, 11.0, 3.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.54248046875, -0.5281410217285156, -0.5138015747070312, -0.4994621276855469, -0.4851226806640625, -0.4707832336425781, -0.45644378662109375, -0.4421043395996094, -0.427764892578125, -0.4134254455566406, -0.39908599853515625, -0.3847465515136719, -0.3704071044921875, -0.3560676574707031, -0.34172821044921875, -0.3273887634277344, -0.31304931640625, -0.2987098693847656, -0.28437042236328125, -0.2700309753417969, -0.2556915283203125, -0.24135208129882812, -0.22701263427734375, -0.21267318725585938, -0.198333740234375, -0.18399429321289062, -0.16965484619140625, -0.15531539916992188, -0.1409759521484375, -0.12663650512695312, -0.11229705810546875, -0.09795761108398438, -0.0836181640625, -0.06927871704101562, -0.05493927001953125, -0.040599822998046875, -0.0262603759765625, -0.011920928955078125, 0.00241851806640625, 0.016757965087890625, 0.031097412109375, 0.045436859130859375, 0.05977630615234375, 0.07411575317382812, 0.0884552001953125, 0.10279464721679688, 0.11713409423828125, 0.13147354125976562, 0.14581298828125, 0.16015243530273438, 0.17449188232421875, 0.18883132934570312, 0.2031707763671875, 0.21751022338867188, 0.23184967041015625, 0.24618911743164062, 0.260528564453125, 0.2748680114746094, 0.28920745849609375, 0.3035469055175781, 0.3178863525390625, 0.3322257995605469, 0.34656524658203125, 0.3609046936035156, 0.375244140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 9.0, 12.0, 12.0, 11.0, 30.0, 53.0, 68.0, 120.0, 212.0, 407.0, 860.0, 2069.0, 6345.0, 37417.0, 691071.0, 283529.0, 19245.0, 4165.0, 1506.0, 648.0, 301.0, 175.0, 93.0, 65.0, 38.0, 23.0, 15.0, 13.0, 9.0, 7.0, 1.0, 4.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.4105682373046875, -0.396331787109375, -0.3820953369140625, -0.36785888671875, -0.3536224365234375, -0.339385986328125, -0.3251495361328125, -0.3109130859375, -0.2966766357421875, -0.282440185546875, -0.2682037353515625, -0.25396728515625, -0.2397308349609375, -0.225494384765625, -0.2112579345703125, -0.197021484375, -0.1827850341796875, -0.168548583984375, -0.1543121337890625, -0.14007568359375, -0.1258392333984375, -0.111602783203125, -0.0973663330078125, -0.0831298828125, -0.0688934326171875, -0.054656982421875, -0.0404205322265625, -0.02618408203125, -0.0119476318359375, 0.002288818359375, 0.0165252685546875, 0.03076171875, 0.0449981689453125, 0.059234619140625, 0.0734710693359375, 0.08770751953125, 0.1019439697265625, 0.116180419921875, 0.1304168701171875, 0.1446533203125, 0.1588897705078125, 0.173126220703125, 0.1873626708984375, 0.20159912109375, 0.2158355712890625, 0.230072021484375, 0.2443084716796875, 0.258544921875, 0.2727813720703125, 0.287017822265625, 0.3012542724609375, 0.31549072265625, 0.3297271728515625, 0.343963623046875, 0.3582000732421875, 0.3724365234375, 0.3866729736328125, 0.400909423828125, 0.4151458740234375, 0.42938232421875, 0.4436187744140625, 0.457855224609375, 0.4720916748046875, 0.486328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 24.0, 33.0, 39.0, 74.0, 107.0, 142.0, 161.0, 113.0, 97.0, 61.0, 46.0, 31.0, 20.0, 7.0, 9.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.982948303222656e-05, -4.8072077333927155e-05, -4.6314671635627747e-05, -4.455726593732834e-05, -4.279986023902893e-05, -4.104245454072952e-05, -3.9285048842430115e-05, -3.752764314413071e-05, -3.57702374458313e-05, -3.401283174753189e-05, -3.225542604923248e-05, -3.0498020350933075e-05, -2.8740614652633667e-05, -2.698320895433426e-05, -2.522580325603485e-05, -2.3468397557735443e-05, -2.1710991859436035e-05, -1.9953586161136627e-05, -1.819618046283722e-05, -1.643877476453781e-05, -1.4681369066238403e-05, -1.2923963367938995e-05, -1.1166557669639587e-05, -9.40915197134018e-06, -7.651746273040771e-06, -5.8943405747413635e-06, -4.1369348764419556e-06, -2.3795291781425476e-06, -6.221234798431396e-07, 1.1352822184562683e-06, 2.8926879167556763e-06, 4.650093615055084e-06, 6.407499313354492e-06, 8.1649050116539e-06, 9.922310709953308e-06, 1.1679716408252716e-05, 1.3437122106552124e-05, 1.5194527804851532e-05, 1.695193350315094e-05, 1.8709339201450348e-05, 2.0466744899749756e-05, 2.2224150598049164e-05, 2.3981556296348572e-05, 2.573896199464798e-05, 2.7496367692947388e-05, 2.9253773391246796e-05, 3.1011179089546204e-05, 3.276858478784561e-05, 3.452599048614502e-05, 3.628339618444443e-05, 3.8040801882743835e-05, 3.9798207581043243e-05, 4.155561327934265e-05, 4.331301897764206e-05, 4.507042467594147e-05, 4.6827830374240875e-05, 4.858523607254028e-05, 5.034264177083969e-05, 5.21000474691391e-05, 5.385745316743851e-05, 5.5614858865737915e-05, 5.737226456403732e-05, 5.912967026233673e-05, 6.088707596063614e-05, 6.264448165893555e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 12.0, 20.0, 20.0, 34.0, 50.0, 70.0, 147.0, 232.0, 415.0, 920.0, 2204.0, 6209.0, 23061.0, 130981.0, 670724.0, 174165.0, 27655.0, 7236.0, 2348.0, 989.0, 468.0, 213.0, 137.0, 80.0, 48.0, 31.0, 22.0, 16.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2451171875, -0.23622512817382812, -0.22733306884765625, -0.21844100952148438, -0.2095489501953125, -0.20065689086914062, -0.19176483154296875, -0.18287277221679688, -0.173980712890625, -0.16508865356445312, -0.15619659423828125, -0.14730453491210938, -0.1384124755859375, -0.12952041625976562, -0.12062835693359375, -0.11173629760742188, -0.10284423828125, -0.09395217895507812, -0.08506011962890625, -0.07616806030273438, -0.0672760009765625, -0.058383941650390625, -0.04949188232421875, -0.040599822998046875, -0.031707763671875, -0.022815704345703125, -0.01392364501953125, -0.005031585693359375, 0.0038604736328125, 0.012752532958984375, 0.02164459228515625, 0.030536651611328125, 0.0394287109375, 0.048320770263671875, 0.05721282958984375, 0.06610488891601562, 0.0749969482421875, 0.08388900756835938, 0.09278106689453125, 0.10167312622070312, 0.110565185546875, 0.11945724487304688, 0.12834930419921875, 0.13724136352539062, 0.1461334228515625, 0.15502548217773438, 0.16391754150390625, 0.17280960083007812, 0.18170166015625, 0.19059371948242188, 0.19948577880859375, 0.20837783813476562, 0.2172698974609375, 0.22616195678710938, 0.23505401611328125, 0.24394607543945312, 0.252838134765625, 0.2617301940917969, 0.27062225341796875, 0.2795143127441406, 0.2884063720703125, 0.2972984313964844, 0.30619049072265625, 0.3150825500488281, 0.323974609375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 8.0, 8.0, 19.0, 21.0, 18.0, 32.0, 47.0, 61.0, 57.0, 100.0, 106.0, 113.0, 100.0, 83.0, 47.0, 42.0, 33.0, 28.0, 17.0, 10.0, 10.0, 5.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15450477600097656, -0.14677810668945312, -0.1390514373779297, -0.13132476806640625, -0.12359809875488281, -0.11587142944335938, -0.10814476013183594, -0.1004180908203125, -0.09269142150878906, -0.08496475219726562, -0.07723808288574219, -0.06951141357421875, -0.06178474426269531, -0.054058074951171875, -0.04633140563964844, -0.038604736328125, -0.030878067016601562, -0.023151397705078125, -0.015424728393554688, -0.00769805908203125, 2.86102294921875e-05, 0.007755279541015625, 0.015481948852539062, 0.0232086181640625, 0.030935287475585938, 0.038661956787109375, 0.04638862609863281, 0.05411529541015625, 0.06184196472167969, 0.06956863403320312, 0.07729530334472656, 0.08502197265625, 0.09274864196777344, 0.10047531127929688, 0.10820198059082031, 0.11592864990234375, 0.12365531921386719, 0.13138198852539062, 0.13910865783691406, 0.1468353271484375, 0.15456199645996094, 0.16228866577148438, 0.1700153350830078, 0.17774200439453125, 0.1854686737060547, 0.19319534301757812, 0.20092201232910156, 0.208648681640625, 0.21637535095214844, 0.22410202026367188, 0.2318286895751953, 0.23955535888671875, 0.2472820281982422, 0.2550086975097656, 0.26273536682128906, 0.2704620361328125, 0.27818870544433594, 0.2859153747558594, 0.2936420440673828, 0.30136871337890625, 0.3090953826904297, 0.3168220520019531, 0.32454872131347656, 0.332275390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 14.0, 23.0, 37.0, 67.0, 106.0, 115.0, 147.0, 122.0, 119.0, 73.0, 51.0, 35.0, 19.0, 16.0, 9.0, 11.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2507643699645996, -2.142014741897583, -2.0332651138305664, -1.9245154857635498, -1.8157657384872437, -1.707016110420227, -1.5982664823532104, -1.4895167350769043, -1.3807671070098877, -1.272017478942871, -1.1632678508758545, -1.054518222808838, -0.9457684755325317, -0.8370188474655151, -0.7282692193984985, -0.6195195317268372, -0.5107699632644653, -0.40202030539512634, -0.29327064752578735, -0.18452101945877075, -0.07577136158943176, 0.03297829627990723, 0.14172792434692383, 0.2504776120185852, 0.3592272400856018, 0.4679768979549408, 0.5767265558242798, 0.6854761838912964, 0.794225811958313, 0.9029754996299744, 1.0117251873016357, 1.1204748153686523, 1.229224443435669, 1.3379740715026855, 1.4467236995697021, 1.5554733276367188, 1.664223074913025, 1.7729727029800415, 1.881722331047058, 1.9904720783233643, 2.099221706390381, 2.2079713344573975, 2.316720962524414, 2.4254705905914307, 2.5342202186584473, 2.642970085144043, 2.7517194747924805, 2.860469341278076, 2.9692187309265137, 3.0779683589935303, 3.186717987060547, 3.2954676151275635, 3.40421724319458, 3.512967109680176, 3.6217164993286133, 3.730466365814209, 3.8392159938812256, 3.947965621948242, 4.056715488433838, 4.165464878082275, 4.274214744567871, 4.382964134216309, 4.491714000701904, 4.600463390350342, 4.7092132568359375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 10.0, 9.0, 9.0, 8.0, 10.0, 9.0, 13.0, 29.0, 25.0, 32.0, 24.0, 36.0, 46.0, 53.0, 48.0, 41.0, 33.0, 34.0, 46.0, 44.0, 47.0, 50.0, 36.0, 43.0, 42.0, 36.0, 38.0, 22.0, 19.0, 16.0, 16.0, 8.0, 12.0, 24.0, 7.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3538997173309326, -2.277125120162964, -2.200350522994995, -2.1235759258270264, -2.0468015670776367, -1.9700268507003784, -1.8932523727416992, -1.8164777755737305, -1.7397031784057617, -1.662928581237793, -1.5861539840698242, -1.509379506111145, -1.4326049089431763, -1.3558303117752075, -1.2790558338165283, -1.2022812366485596, -1.1255066394805908, -1.048732042312622, -0.9719575047492981, -0.8951829671859741, -0.8184083700180054, -0.7416337728500366, -0.6648592352867126, -0.5880846977233887, -0.5113101005554199, -0.43453553318977356, -0.3577609658241272, -0.28098639845848083, -0.20421183109283447, -0.1274372637271881, -0.05066269636154175, 0.026111841201782227, 0.10288667678833008, 0.17966124415397644, 0.2564358115196228, 0.33321037888526917, 0.4099849462509155, 0.4867595136165619, 0.5635340809822083, 0.6403086185455322, 0.717083215713501, 0.7938578128814697, 0.8706323504447937, 0.9474068880081177, 1.0241814851760864, 1.1009560823440552, 1.1777305603027344, 1.2545051574707031, 1.3312797546386719, 1.4080543518066406, 1.4848289489746094, 1.5616034269332886, 1.6383780241012573, 1.715152621269226, 1.7919270992279053, 1.868701696395874, 1.9454762935638428, 2.0222508907318115, 2.0990254878997803, 2.175800085067749, 2.2525744438171387, 2.3293490409851074, 2.406123638153076, 2.482898235321045, 2.5596728324890137]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 12.0, 21.0, 31.0, 55.0, 89.0, 209.0, 523.0, 1553.0, 6073.0, 51958.0, 3878125.0, 238793.0, 12724.0, 2518.0, 811.0, 334.0, 176.0, 97.0, 56.0, 28.0, 23.0, 16.0, 16.0, 11.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.6609649658203125, -0.630523681640625, -0.6000823974609375, -0.56964111328125, -0.5391998291015625, -0.508758544921875, -0.4783172607421875, -0.4478759765625, -0.4174346923828125, -0.386993408203125, -0.3565521240234375, -0.32611083984375, -0.2956695556640625, -0.265228271484375, -0.2347869873046875, -0.204345703125, -0.1739044189453125, -0.143463134765625, -0.1130218505859375, -0.08258056640625, -0.0521392822265625, -0.021697998046875, 0.0087432861328125, 0.0391845703125, 0.0696258544921875, 0.100067138671875, 0.1305084228515625, 0.16094970703125, 0.1913909912109375, 0.221832275390625, 0.2522735595703125, 0.28271484375, 0.3131561279296875, 0.343597412109375, 0.3740386962890625, 0.40447998046875, 0.4349212646484375, 0.465362548828125, 0.4958038330078125, 0.5262451171875, 0.5566864013671875, 0.587127685546875, 0.6175689697265625, 0.64801025390625, 0.6784515380859375, 0.708892822265625, 0.7393341064453125, 0.769775390625, 0.8002166748046875, 0.830657958984375, 0.8610992431640625, 0.89154052734375, 0.9219818115234375, 0.952423095703125, 0.9828643798828125, 1.0133056640625, 1.0437469482421875, 1.074188232421875, 1.1046295166015625, 1.13507080078125, 1.1655120849609375, 1.195953369140625, 1.2263946533203125, 1.2568359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 12.0, 21.0, 30.0, 54.0, 65.0, 87.0, 91.0, 136.0, 143.0, 118.0, 88.0, 68.0, 42.0, 25.0, 14.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.1639270782470703, -0.15707778930664062, -0.15022850036621094, -0.14337921142578125, -0.13652992248535156, -0.12968063354492188, -0.12283134460449219, -0.1159820556640625, -0.10913276672363281, -0.10228347778320312, -0.09543418884277344, -0.08858489990234375, -0.08173561096191406, -0.07488632202148438, -0.06803703308105469, -0.061187744140625, -0.05433845520019531, -0.047489166259765625, -0.04063987731933594, -0.03379058837890625, -0.026941299438476562, -0.020092010498046875, -0.013242721557617188, -0.0063934326171875, 0.0004558563232421875, 0.007305145263671875, 0.014154434204101562, 0.02100372314453125, 0.027853012084960938, 0.034702301025390625, 0.04155158996582031, 0.04840087890625, 0.05525016784667969, 0.062099456787109375, 0.06894874572753906, 0.07579803466796875, 0.08264732360839844, 0.08949661254882812, 0.09634590148925781, 0.1031951904296875, 0.11004447937011719, 0.11689376831054688, 0.12374305725097656, 0.13059234619140625, 0.13744163513183594, 0.14429092407226562, 0.1511402130126953, 0.157989501953125, 0.1648387908935547, 0.17168807983398438, 0.17853736877441406, 0.18538665771484375, 0.19223594665527344, 0.19908523559570312, 0.2059345245361328, 0.2127838134765625, 0.2196331024169922, 0.22648239135742188, 0.23333168029785156, 0.24018096923828125, 0.24703025817871094, 0.2538795471191406, 0.2607288360595703, 0.267578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 11.0, 28.0, 30.0, 73.0, 102.0, 211.0, 398.0, 739.0, 1790.0, 5146.0, 22036.0, 224116.0, 3710531.0, 200059.0, 20697.0, 5047.0, 1678.0, 700.0, 382.0, 208.0, 134.0, 60.0, 40.0, 27.0, 19.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7841796875, -0.7614364624023438, -0.7386932373046875, -0.7159500122070312, -0.693206787109375, -0.6704635620117188, -0.6477203369140625, -0.6249771118164062, -0.60223388671875, -0.5794906616210938, -0.5567474365234375, -0.5340042114257812, -0.511260986328125, -0.48851776123046875, -0.4657745361328125, -0.44303131103515625, -0.4202880859375, -0.39754486083984375, -0.3748016357421875, -0.35205841064453125, -0.329315185546875, -0.30657196044921875, -0.2838287353515625, -0.26108551025390625, -0.23834228515625, -0.21559906005859375, -0.1928558349609375, -0.17011260986328125, -0.147369384765625, -0.12462615966796875, -0.1018829345703125, -0.07913970947265625, -0.056396484375, -0.03365325927734375, -0.0109100341796875, 0.01183319091796875, 0.034576416015625, 0.05731964111328125, 0.0800628662109375, 0.10280609130859375, 0.12554931640625, 0.14829254150390625, 0.1710357666015625, 0.19377899169921875, 0.216522216796875, 0.23926544189453125, 0.2620086669921875, 0.28475189208984375, 0.3074951171875, 0.33023834228515625, 0.3529815673828125, 0.37572479248046875, 0.398468017578125, 0.42121124267578125, 0.4439544677734375, 0.46669769287109375, 0.48944091796875, 0.5121841430664062, 0.5349273681640625, 0.5576705932617188, 0.580413818359375, 0.6031570434570312, 0.6259002685546875, 0.6486434936523438, 0.67138671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 11.0, 13.0, 8.0, 29.0, 42.0, 83.0, 173.0, 409.0, 1187.0, 1294.0, 396.0, 166.0, 100.0, 58.0, 33.0, 19.0, 18.0, 10.0, 3.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271240234375, -0.2624969482421875, -0.253753662109375, -0.2450103759765625, -0.23626708984375, -0.2275238037109375, -0.218780517578125, -0.2100372314453125, -0.2012939453125, -0.1925506591796875, -0.183807373046875, -0.1750640869140625, -0.16632080078125, -0.1575775146484375, -0.148834228515625, -0.1400909423828125, -0.13134765625, -0.1226043701171875, -0.113861083984375, -0.1051177978515625, -0.09637451171875, -0.0876312255859375, -0.078887939453125, -0.0701446533203125, -0.0614013671875, -0.0526580810546875, -0.043914794921875, -0.0351715087890625, -0.02642822265625, -0.0176849365234375, -0.008941650390625, -0.0001983642578125, 0.008544921875, 0.0172882080078125, 0.026031494140625, 0.0347747802734375, 0.04351806640625, 0.0522613525390625, 0.061004638671875, 0.0697479248046875, 0.0784912109375, 0.0872344970703125, 0.095977783203125, 0.1047210693359375, 0.11346435546875, 0.1222076416015625, 0.130950927734375, 0.1396942138671875, 0.1484375, 0.1571807861328125, 0.165924072265625, 0.1746673583984375, 0.18341064453125, 0.1921539306640625, 0.200897216796875, 0.2096405029296875, 0.2183837890625, 0.2271270751953125, 0.235870361328125, 0.2446136474609375, 0.25335693359375, 0.2621002197265625, 0.270843505859375, 0.2795867919921875, 0.288330078125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 14.0, 59.0, 244.0, 381.0, 217.0, 73.0, 20.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25734543800354, -1.1465258598327637, -1.0357062816619873, -0.9248865842819214, -0.814067006111145, -0.7032474279403687, -0.5924277901649475, -0.48160815238952637, -0.37078857421875, -0.25996896624565125, -0.1491493582725525, -0.038329750299453735, 0.07248985767364502, 0.1833094358444214, 0.29412907361984253, 0.40494871139526367, 0.51576828956604, 0.6265878677368164, 0.7374075055122375, 0.8482271432876587, 0.9590467214584351, 1.0698662996292114, 1.1806859970092773, 1.2915055751800537, 1.40232515335083, 1.5131447315216064, 1.6239643096923828, 1.7347840070724487, 1.845603585243225, 1.9564231634140015, 2.0672428607940674, 2.1780624389648438, 2.288882255554199, 2.3997018337249756, 2.510521411895752, 2.6213409900665283, 2.7321605682373047, 2.84298038482666, 2.9537999629974365, 3.064619541168213, 3.1754391193389893, 3.2862586975097656, 3.397078275680542, 3.5078978538513184, 3.618717670440674, 3.729537010192871, 3.8403568267822266, 3.951176404953003, 4.061995983123779, 4.172815799713135, 4.283635139465332, 4.3944549560546875, 4.505274295806885, 4.61609411239624, 4.7269134521484375, 4.837733268737793, 4.948553085327148, 5.059372901916504, 5.170192241668701, 5.281012058258057, 5.391831398010254, 5.502651214599609, 5.613470554351807, 5.724290370941162, 5.835109710693359]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 13.0, 8.0, 11.0, 18.0, 12.0, 20.0, 18.0, 28.0, 36.0, 37.0, 48.0, 43.0, 44.0, 51.0, 57.0, 50.0, 48.0, 58.0, 41.0, 40.0, 37.0, 27.0, 46.0, 30.0, 39.0, 23.0, 23.0, 22.0, 22.0, 8.0, 9.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8965288400650024, -0.8705176115036011, -0.8445063829421997, -0.8184951543807983, -0.792483925819397, -0.7664726972579956, -0.7404614090919495, -0.7144501805305481, -0.6884389519691467, -0.6624277234077454, -0.636416494846344, -0.6104052662849426, -0.5843939781188965, -0.5583827495574951, -0.5323715209960938, -0.5063602924346924, -0.480349063873291, -0.45433783531188965, -0.4283266067504883, -0.4023153483867645, -0.37630411982536316, -0.3502928912639618, -0.32428163290023804, -0.29827040433883667, -0.2722591757774353, -0.24624794721603394, -0.22023670375347137, -0.1942254602909088, -0.16821423172950745, -0.14220300316810608, -0.11619175970554352, -0.09018051624298096, -0.06416922807693481, -0.03815799206495285, -0.012146756052970886, 0.013864479959011078, 0.03987571597099304, 0.06588694453239441, 0.09189818799495697, 0.11790943145751953, 0.1439206600189209, 0.16993188858032227, 0.19594313204288483, 0.2219543755054474, 0.24796560406684875, 0.2739768326282501, 0.2999880909919739, 0.32599931955337524, 0.3520105481147766, 0.378021776676178, 0.40403300523757935, 0.4300442636013031, 0.45605549216270447, 0.48206672072410583, 0.5080779790878296, 0.534089207649231, 0.5601004362106323, 0.5861116647720337, 0.6121228933334351, 0.6381341218948364, 0.6641453504562378, 0.6901565790176392, 0.7161678671836853, 0.7421790957450867, 0.768190324306488]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 7.0, 8.0, 6.0, 9.0, 14.0, 27.0, 26.0, 34.0, 52.0, 76.0, 92.0, 128.0, 183.0, 332.0, 558.0, 1012.0, 2149.0, 5887.0, 23432.0, 138701.0, 594854.0, 230096.0, 36757.0, 8385.0, 2834.0, 1231.0, 624.0, 335.0, 227.0, 129.0, 93.0, 73.0, 61.0, 33.0, 27.0, 20.0, 11.0, 8.0, 9.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78857421875, -0.7628326416015625, -0.737091064453125, -0.7113494873046875, -0.68560791015625, -0.6598663330078125, -0.634124755859375, -0.6083831787109375, -0.5826416015625, -0.5569000244140625, -0.531158447265625, -0.5054168701171875, -0.47967529296875, -0.4539337158203125, -0.428192138671875, -0.4024505615234375, -0.376708984375, -0.3509674072265625, -0.325225830078125, -0.2994842529296875, -0.27374267578125, -0.2480010986328125, -0.222259521484375, -0.1965179443359375, -0.1707763671875, -0.1450347900390625, -0.119293212890625, -0.0935516357421875, -0.06781005859375, -0.0420684814453125, -0.016326904296875, 0.0094146728515625, 0.03515625, 0.0608978271484375, 0.086639404296875, 0.1123809814453125, 0.13812255859375, 0.1638641357421875, 0.189605712890625, 0.2153472900390625, 0.2410888671875, 0.2668304443359375, 0.292572021484375, 0.3183135986328125, 0.34405517578125, 0.3697967529296875, 0.395538330078125, 0.4212799072265625, 0.447021484375, 0.4727630615234375, 0.498504638671875, 0.5242462158203125, 0.54998779296875, 0.5757293701171875, 0.601470947265625, 0.6272125244140625, 0.6529541015625, 0.6786956787109375, 0.704437255859375, 0.7301788330078125, 0.75592041015625, 0.7816619873046875, 0.807403564453125, 0.8331451416015625, 0.85888671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 25.0, 21.0, 36.0, 68.0, 68.0, 90.0, 105.0, 134.0, 109.0, 109.0, 79.0, 62.0, 40.0, 20.0, 14.0, 10.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.167724609375, -0.16116714477539062, -0.15460968017578125, -0.14805221557617188, -0.1414947509765625, -0.13493728637695312, -0.12837982177734375, -0.12182235717773438, -0.115264892578125, -0.10870742797851562, -0.10214996337890625, -0.09559249877929688, -0.0890350341796875, -0.08247756958007812, -0.07592010498046875, -0.06936264038085938, -0.06280517578125, -0.056247711181640625, -0.04969024658203125, -0.043132781982421875, -0.0365753173828125, -0.030017852783203125, -0.02346038818359375, -0.016902923583984375, -0.010345458984375, -0.003787994384765625, 0.00276947021484375, 0.009326934814453125, 0.0158843994140625, 0.022441864013671875, 0.02899932861328125, 0.035556793212890625, 0.0421142578125, 0.048671722412109375, 0.05522918701171875, 0.061786651611328125, 0.0683441162109375, 0.07490158081054688, 0.08145904541015625, 0.08801651000976562, 0.094573974609375, 0.10113143920898438, 0.10768890380859375, 0.11424636840820312, 0.1208038330078125, 0.12736129760742188, 0.13391876220703125, 0.14047622680664062, 0.14703369140625, 0.15359115600585938, 0.16014862060546875, 0.16670608520507812, 0.1732635498046875, 0.17982101440429688, 0.18637847900390625, 0.19293594360351562, 0.199493408203125, 0.20605087280273438, 0.21260833740234375, 0.21916580200195312, 0.2257232666015625, 0.23228073120117188, 0.23883819580078125, 0.24539566040039062, 0.251953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 16.0, 26.0, 45.0, 46.0, 82.0, 112.0, 218.0, 355.0, 687.0, 1224.0, 2488.0, 5628.0, 14380.0, 42972.0, 159378.0, 443398.0, 267284.0, 73014.0, 21942.0, 8054.0, 3525.0, 1688.0, 819.0, 439.0, 247.0, 157.0, 106.0, 72.0, 48.0, 27.0, 21.0, 15.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.5791015625, -0.561920166015625, -0.54473876953125, -0.527557373046875, -0.5103759765625, -0.493194580078125, -0.47601318359375, -0.458831787109375, -0.441650390625, -0.424468994140625, -0.40728759765625, -0.390106201171875, -0.3729248046875, -0.355743408203125, -0.33856201171875, -0.321380615234375, -0.30419921875, -0.287017822265625, -0.26983642578125, -0.252655029296875, -0.2354736328125, -0.218292236328125, -0.20111083984375, -0.183929443359375, -0.166748046875, -0.149566650390625, -0.13238525390625, -0.115203857421875, -0.0980224609375, -0.080841064453125, -0.06365966796875, -0.046478271484375, -0.029296875, -0.012115478515625, 0.00506591796875, 0.022247314453125, 0.0394287109375, 0.056610107421875, 0.07379150390625, 0.090972900390625, 0.108154296875, 0.125335693359375, 0.14251708984375, 0.159698486328125, 0.1768798828125, 0.194061279296875, 0.21124267578125, 0.228424072265625, 0.24560546875, 0.262786865234375, 0.27996826171875, 0.297149658203125, 0.3143310546875, 0.331512451171875, 0.34869384765625, 0.365875244140625, 0.383056640625, 0.400238037109375, 0.41741943359375, 0.434600830078125, 0.4517822265625, 0.468963623046875, 0.48614501953125, 0.503326416015625, 0.5205078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 5.0, 7.0, 15.0, 6.0, 16.0, 26.0, 25.0, 21.0, 31.0, 26.0, 42.0, 31.0, 51.0, 66.0, 55.0, 63.0, 64.0, 42.0, 43.0, 48.0, 49.0, 44.0, 39.0, 37.0, 30.0, 20.0, 27.0, 12.0, 11.0, 9.0, 17.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.67138671875, -0.6540603637695312, -0.6367340087890625, -0.6194076538085938, -0.602081298828125, -0.5847549438476562, -0.5674285888671875, -0.5501022338867188, -0.53277587890625, -0.5154495239257812, -0.4981231689453125, -0.48079681396484375, -0.463470458984375, -0.44614410400390625, -0.4288177490234375, -0.41149139404296875, -0.3941650390625, -0.37683868408203125, -0.3595123291015625, -0.34218597412109375, -0.324859619140625, -0.30753326416015625, -0.2902069091796875, -0.27288055419921875, -0.25555419921875, -0.23822784423828125, -0.2209014892578125, -0.20357513427734375, -0.186248779296875, -0.16892242431640625, -0.1515960693359375, -0.13426971435546875, -0.116943359375, -0.09961700439453125, -0.0822906494140625, -0.06496429443359375, -0.047637939453125, -0.03031158447265625, -0.0129852294921875, 0.00434112548828125, 0.02166748046875, 0.03899383544921875, 0.0563201904296875, 0.07364654541015625, 0.090972900390625, 0.10829925537109375, 0.1256256103515625, 0.14295196533203125, 0.1602783203125, 0.17760467529296875, 0.1949310302734375, 0.21225738525390625, 0.229583740234375, 0.24691009521484375, 0.2642364501953125, 0.28156280517578125, 0.29888916015625, 0.31621551513671875, 0.3335418701171875, 0.35086822509765625, 0.368194580078125, 0.38552093505859375, 0.4028472900390625, 0.42017364501953125, 0.4375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 7.0, 12.0, 14.0, 25.0, 38.0, 95.0, 221.0, 438.0, 1213.0, 4061.0, 24765.0, 829073.0, 176063.0, 8978.0, 2199.0, 735.0, 296.0, 144.0, 63.0, 49.0, 17.0, 10.0, 6.0, 3.0, 2.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.7147598266601562, -0.6907501220703125, -0.6667404174804688, -0.642730712890625, -0.6187210083007812, -0.5947113037109375, -0.5707015991210938, -0.54669189453125, -0.5226821899414062, -0.4986724853515625, -0.47466278076171875, -0.450653076171875, -0.42664337158203125, -0.4026336669921875, -0.37862396240234375, -0.3546142578125, -0.33060455322265625, -0.3065948486328125, -0.28258514404296875, -0.258575439453125, -0.23456573486328125, -0.2105560302734375, -0.18654632568359375, -0.16253662109375, -0.13852691650390625, -0.1145172119140625, -0.09050750732421875, -0.066497802734375, -0.04248809814453125, -0.0184783935546875, 0.00553131103515625, 0.029541015625, 0.05355072021484375, 0.0775604248046875, 0.10157012939453125, 0.125579833984375, 0.14958953857421875, 0.1735992431640625, 0.19760894775390625, 0.22161865234375, 0.24562835693359375, 0.2696380615234375, 0.29364776611328125, 0.317657470703125, 0.34166717529296875, 0.3656768798828125, 0.38968658447265625, 0.4136962890625, 0.43770599365234375, 0.4617156982421875, 0.48572540283203125, 0.509735107421875, 0.5337448120117188, 0.5577545166015625, 0.5817642211914062, 0.60577392578125, 0.6297836303710938, 0.6537933349609375, 0.6778030395507812, 0.701812744140625, 0.7258224487304688, 0.7498321533203125, 0.7738418579101562, 0.7978515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 9.0, 7.0, 12.0, 27.0, 46.0, 67.0, 155.0, 222.0, 184.0, 120.0, 68.0, 29.0, 25.0, 16.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.522106170654297e-05, -7.206760346889496e-05, -6.891414523124695e-05, -6.576068699359894e-05, -6.260722875595093e-05, -5.945377051830292e-05, -5.630031228065491e-05, -5.31468540430069e-05, -4.999339580535889e-05, -4.6839937567710876e-05, -4.3686479330062866e-05, -4.0533021092414856e-05, -3.7379562854766846e-05, -3.4226104617118835e-05, -3.1072646379470825e-05, -2.7919188141822815e-05, -2.4765729904174805e-05, -2.1612271666526794e-05, -1.8458813428878784e-05, -1.5305355191230774e-05, -1.2151896953582764e-05, -8.998438715934753e-06, -5.844980478286743e-06, -2.691522240638733e-06, 4.6193599700927734e-07, 3.6153942346572876e-06, 6.768852472305298e-06, 9.922310709953308e-06, 1.3075768947601318e-05, 1.622922718524933e-05, 1.938268542289734e-05, 2.253614366054535e-05, 2.568960189819336e-05, 2.884306013584137e-05, 3.199651837348938e-05, 3.514997661113739e-05, 3.83034348487854e-05, 4.145689308643341e-05, 4.461035132408142e-05, 4.776380956172943e-05, 5.091726779937744e-05, 5.407072603702545e-05, 5.722418427467346e-05, 6.037764251232147e-05, 6.353110074996948e-05, 6.668455898761749e-05, 6.98380172252655e-05, 7.299147546291351e-05, 7.614493370056152e-05, 7.929839193820953e-05, 8.245185017585754e-05, 8.560530841350555e-05, 8.875876665115356e-05, 9.191222488880157e-05, 9.506568312644958e-05, 9.82191413640976e-05, 0.0001013725996017456, 0.00010452605783939362, 0.00010767951607704163, 0.00011083297431468964, 0.00011398643255233765, 0.00011713989078998566, 0.00012029334902763367, 0.00012344680726528168, 0.0001266002655029297]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 12.0, 16.0, 14.0, 26.0, 49.0, 85.0, 139.0, 271.0, 615.0, 1799.0, 6740.0, 54137.0, 796201.0, 171104.0, 12770.0, 2805.0, 942.0, 351.0, 212.0, 98.0, 65.0, 28.0, 15.0, 17.0, 10.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54833984375, -0.5304718017578125, -0.512603759765625, -0.4947357177734375, -0.47686767578125, -0.4589996337890625, -0.441131591796875, -0.4232635498046875, -0.4053955078125, -0.3875274658203125, -0.369659423828125, -0.3517913818359375, -0.33392333984375, -0.3160552978515625, -0.298187255859375, -0.2803192138671875, -0.262451171875, -0.2445831298828125, -0.226715087890625, -0.2088470458984375, -0.19097900390625, -0.1731109619140625, -0.155242919921875, -0.1373748779296875, -0.1195068359375, -0.1016387939453125, -0.083770751953125, -0.0659027099609375, -0.04803466796875, -0.0301666259765625, -0.012298583984375, 0.0055694580078125, 0.0234375, 0.0413055419921875, 0.059173583984375, 0.0770416259765625, 0.09490966796875, 0.1127777099609375, 0.130645751953125, 0.1485137939453125, 0.1663818359375, 0.1842498779296875, 0.202117919921875, 0.2199859619140625, 0.23785400390625, 0.2557220458984375, 0.273590087890625, 0.2914581298828125, 0.309326171875, 0.3271942138671875, 0.345062255859375, 0.3629302978515625, 0.38079833984375, 0.3986663818359375, 0.416534423828125, 0.4344024658203125, 0.4522705078125, 0.4701385498046875, 0.488006591796875, 0.5058746337890625, 0.52374267578125, 0.5416107177734375, 0.559478759765625, 0.5773468017578125, 0.59521484375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 9.0, 8.0, 16.0, 12.0, 28.0, 41.0, 69.0, 95.0, 145.0, 146.0, 145.0, 100.0, 59.0, 36.0, 34.0, 9.0, 17.0, 7.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4873046875, -0.47351837158203125, -0.4597320556640625, -0.44594573974609375, -0.432159423828125, -0.41837310791015625, -0.4045867919921875, -0.39080047607421875, -0.37701416015625, -0.36322784423828125, -0.3494415283203125, -0.33565521240234375, -0.321868896484375, -0.30808258056640625, -0.2942962646484375, -0.28050994873046875, -0.2667236328125, -0.25293731689453125, -0.2391510009765625, -0.22536468505859375, -0.211578369140625, -0.19779205322265625, -0.1840057373046875, -0.17021942138671875, -0.15643310546875, -0.14264678955078125, -0.1288604736328125, -0.11507415771484375, -0.101287841796875, -0.08750152587890625, -0.0737152099609375, -0.05992889404296875, -0.046142578125, -0.03235626220703125, -0.0185699462890625, -0.00478363037109375, 0.009002685546875, 0.02278900146484375, 0.0365753173828125, 0.05036163330078125, 0.06414794921875, 0.07793426513671875, 0.0917205810546875, 0.10550689697265625, 0.119293212890625, 0.13307952880859375, 0.1468658447265625, 0.16065216064453125, 0.1744384765625, 0.18822479248046875, 0.2020111083984375, 0.21579742431640625, 0.229583740234375, 0.24337005615234375, 0.2571563720703125, 0.27094268798828125, 0.28472900390625, 0.29851531982421875, 0.3123016357421875, 0.32608795166015625, 0.339874267578125, 0.35366058349609375, 0.3674468994140625, 0.38123321533203125, 0.39501953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 21.0, 43.0, 128.0, 275.0, 281.0, 138.0, 61.0, 29.0, 12.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.318408012390137, -4.0066657066345215, -3.6949236392974854, -3.383181571960449, -3.071439266204834, -2.759697198867798, -2.4479551315307617, -2.1362128257751465, -1.8244707584381104, -1.5127285718917847, -1.200986385345459, -0.8892443180084229, -0.5775021314620972, -0.2657599449157715, 0.04598212242126465, 0.3577244281768799, 0.669466495513916, 0.9812086820602417, 1.2929508686065674, 1.6046929359436035, 1.9164351224899292, 2.228177309036255, 2.539919376373291, 2.8516616821289062, 3.1634037494659424, 3.4751458168029785, 3.7868881225585938, 4.098629951477051, 4.410372257232666, 4.722114562988281, 5.033856391906738, 5.345599174499512, 5.657341003417969, 5.969083309173584, 6.280825138092041, 6.592567443847656, 6.9043097496032715, 7.216052055358887, 7.527793884277344, 7.839536190032959, 8.151278495788574, 8.463020324707031, 8.774763107299805, 9.086504936218262, 9.398246765136719, 9.709989547729492, 10.02173137664795, 10.333473205566406, 10.64521598815918, 10.956957817077637, 11.26870059967041, 11.580442428588867, 11.892184257507324, 12.203927040100098, 12.515668869018555, 12.827411651611328, 13.139152526855469, 13.450894355773926, 13.7626371383667, 14.074378967285156, 14.386120796203613, 14.697863578796387, 15.009605407714844, 15.321348190307617, 15.633090019226074]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 5.0, 4.0, 10.0, 11.0, 12.0, 12.0, 21.0, 25.0, 20.0, 21.0, 32.0, 36.0, 39.0, 45.0, 48.0, 48.0, 49.0, 44.0, 39.0, 50.0, 40.0, 33.0, 40.0, 34.0, 38.0, 44.0, 25.0, 24.0, 17.0, 20.0, 18.0, 12.0, 13.0, 18.0, 12.0, 9.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.916163444519043, -2.8265156745910645, -2.736867904663086, -2.6472201347351074, -2.557572364807129, -2.4679245948791504, -2.378276824951172, -2.2886290550231934, -2.198981285095215, -2.1093335151672363, -2.019685745239258, -1.9300379753112793, -1.8403902053833008, -1.7507424354553223, -1.6610946655273438, -1.5714468955993652, -1.4817990064620972, -1.3921512365341187, -1.3025034666061401, -1.2128556966781616, -1.123207926750183, -1.0335601568222046, -0.9439123272895813, -0.8542645573616028, -0.7646167874336243, -0.6749690175056458, -0.5853212475776672, -0.49567344784736633, -0.4060256779193878, -0.3163779079914093, -0.2267301082611084, -0.13708233833312988, -0.04743456840515137, 0.042213208973407745, 0.13186098635196686, 0.22150877118110657, 0.3111565411090851, 0.4008043110370636, 0.4904521107673645, 0.580099880695343, 0.6697476506233215, 0.7593954205513, 0.8490431904792786, 0.9386910200119019, 1.0283387899398804, 1.1179865598678589, 1.2076343297958374, 1.297282099723816, 1.3869298696517944, 1.476577639579773, 1.5662254095077515, 1.65587317943573, 1.7455209493637085, 1.835168719291687, 1.924816608428955, 2.0144643783569336, 2.104112148284912, 2.1937599182128906, 2.283407688140869, 2.3730554580688477, 2.462703227996826, 2.5523509979248047, 2.641998767852783, 2.7316465377807617, 2.8212943077087402]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 10.0, 11.0, 13.0, 26.0, 31.0, 68.0, 109.0, 212.0, 469.0, 1166.0, 3943.0, 22251.0, 836951.0, 3290671.0, 30947.0, 4691.0, 1517.0, 587.0, 265.0, 126.0, 68.0, 44.0, 22.0, 14.0, 18.0, 14.0, 7.0, 4.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.953125, -0.9179229736328125, -0.882720947265625, -0.8475189208984375, -0.81231689453125, -0.7771148681640625, -0.741912841796875, -0.7067108154296875, -0.6715087890625, -0.6363067626953125, -0.601104736328125, -0.5659027099609375, -0.53070068359375, -0.4954986572265625, -0.460296630859375, -0.4250946044921875, -0.389892578125, -0.3546905517578125, -0.319488525390625, -0.2842864990234375, -0.24908447265625, -0.2138824462890625, -0.178680419921875, -0.1434783935546875, -0.1082763671875, -0.0730743408203125, -0.037872314453125, -0.0026702880859375, 0.03253173828125, 0.0677337646484375, 0.102935791015625, 0.1381378173828125, 0.17333984375, 0.2085418701171875, 0.243743896484375, 0.2789459228515625, 0.31414794921875, 0.3493499755859375, 0.384552001953125, 0.4197540283203125, 0.4549560546875, 0.4901580810546875, 0.525360107421875, 0.5605621337890625, 0.59576416015625, 0.6309661865234375, 0.666168212890625, 0.7013702392578125, 0.736572265625, 0.7717742919921875, 0.806976318359375, 0.8421783447265625, 0.87738037109375, 0.9125823974609375, 0.947784423828125, 0.9829864501953125, 1.0181884765625, 1.0533905029296875, 1.088592529296875, 1.1237945556640625, 1.15899658203125, 1.1941986083984375, 1.229400634765625, 1.2646026611328125, 1.2998046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 15.0, 15.0, 32.0, 57.0, 81.0, 88.0, 68.0, 90.0, 94.0, 104.0, 84.0, 80.0, 57.0, 38.0, 40.0, 19.0, 5.0, 6.0, 9.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1722412109375, -0.16544532775878906, -0.15864944458007812, -0.1518535614013672, -0.14505767822265625, -0.1382617950439453, -0.13146591186523438, -0.12467002868652344, -0.1178741455078125, -0.11107826232910156, -0.10428237915039062, -0.09748649597167969, -0.09069061279296875, -0.08389472961425781, -0.07709884643554688, -0.07030296325683594, -0.063507080078125, -0.05671119689941406, -0.049915313720703125, -0.04311943054199219, -0.03632354736328125, -0.029527664184570312, -0.022731781005859375, -0.015935897827148438, -0.0091400146484375, -0.0023441314697265625, 0.004451751708984375, 0.011247634887695312, 0.01804351806640625, 0.024839401245117188, 0.031635284423828125, 0.03843116760253906, 0.04522705078125, 0.05202293395996094, 0.058818817138671875, 0.06561470031738281, 0.07241058349609375, 0.07920646667480469, 0.08600234985351562, 0.09279823303222656, 0.0995941162109375, 0.10638999938964844, 0.11318588256835938, 0.11998176574707031, 0.12677764892578125, 0.1335735321044922, 0.14036941528320312, 0.14716529846191406, 0.153961181640625, 0.16075706481933594, 0.16755294799804688, 0.1743488311767578, 0.18114471435546875, 0.1879405975341797, 0.19473648071289062, 0.20153236389160156, 0.2083282470703125, 0.21512413024902344, 0.22192001342773438, 0.2287158966064453, 0.23551177978515625, 0.2423076629638672, 0.24910354614257812, 0.25589942932128906, 0.2626953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 8.0, 7.0, 17.0, 46.0, 44.0, 93.0, 182.0, 310.0, 601.0, 1417.0, 3881.0, 14035.0, 111448.0, 3816352.0, 218432.0, 19278.0, 4855.0, 1746.0, 750.0, 353.0, 190.0, 99.0, 67.0, 30.0, 18.0, 9.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.7190093994140625, -0.684112548828125, -0.6492156982421875, -0.61431884765625, -0.5794219970703125, -0.544525146484375, -0.5096282958984375, -0.4747314453125, -0.4398345947265625, -0.404937744140625, -0.3700408935546875, -0.33514404296875, -0.3002471923828125, -0.265350341796875, -0.2304534912109375, -0.195556640625, -0.1606597900390625, -0.125762939453125, -0.0908660888671875, -0.05596923828125, -0.0210723876953125, 0.013824462890625, 0.0487213134765625, 0.0836181640625, 0.1185150146484375, 0.153411865234375, 0.1883087158203125, 0.22320556640625, 0.2581024169921875, 0.292999267578125, 0.3278961181640625, 0.36279296875, 0.3976898193359375, 0.432586669921875, 0.4674835205078125, 0.50238037109375, 0.5372772216796875, 0.572174072265625, 0.6070709228515625, 0.6419677734375, 0.6768646240234375, 0.711761474609375, 0.7466583251953125, 0.78155517578125, 0.8164520263671875, 0.851348876953125, 0.8862457275390625, 0.921142578125, 0.9560394287109375, 0.990936279296875, 1.0258331298828125, 1.06072998046875, 1.0956268310546875, 1.130523681640625, 1.1654205322265625, 1.2003173828125, 1.2352142333984375, 1.270111083984375, 1.3050079345703125, 1.33990478515625, 1.3748016357421875, 1.409698486328125, 1.4445953369140625, 1.4794921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 7.0, 12.0, 17.0, 28.0, 28.0, 57.0, 116.0, 291.0, 994.0, 1745.0, 419.0, 147.0, 80.0, 50.0, 22.0, 17.0, 5.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.576171875, -0.5614738464355469, -0.5467758178710938, -0.5320777893066406, -0.5173797607421875, -0.5026817321777344, -0.48798370361328125, -0.4732856750488281, -0.458587646484375, -0.4438896179199219, -0.42919158935546875, -0.4144935607910156, -0.3997955322265625, -0.3850975036621094, -0.37039947509765625, -0.3557014465332031, -0.34100341796875, -0.3263053894042969, -0.31160736083984375, -0.2969093322753906, -0.2822113037109375, -0.2675132751464844, -0.25281524658203125, -0.23811721801757812, -0.223419189453125, -0.20872116088867188, -0.19402313232421875, -0.17932510375976562, -0.1646270751953125, -0.14992904663085938, -0.13523101806640625, -0.12053298950195312, -0.1058349609375, -0.09113693237304688, -0.07643890380859375, -0.061740875244140625, -0.0470428466796875, -0.032344818115234375, -0.01764678955078125, -0.002948760986328125, 0.011749267578125, 0.026447296142578125, 0.04114532470703125, 0.055843353271484375, 0.0705413818359375, 0.08523941040039062, 0.09993743896484375, 0.11463546752929688, 0.12933349609375, 0.14403152465820312, 0.15872955322265625, 0.17342758178710938, 0.1881256103515625, 0.20282363891601562, 0.21752166748046875, 0.23221969604492188, 0.246917724609375, 0.2616157531738281, 0.27631378173828125, 0.2910118103027344, 0.3057098388671875, 0.3204078674316406, 0.33510589599609375, 0.3498039245605469, 0.364501953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 10.0, 18.0, 19.0, 33.0, 55.0, 75.0, 96.0, 133.0, 104.0, 124.0, 102.0, 77.0, 46.0, 40.0, 19.0, 15.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.5243358612060547, -2.469132900238037, -2.4139299392700195, -2.358727216720581, -2.3035242557525635, -2.248321294784546, -2.1931183338165283, -2.1379153728485107, -2.0827126502990723, -2.0275096893310547, -1.9723068475723267, -1.917103886604309, -1.861901044845581, -1.8066980838775635, -1.751495122909546, -1.6962921619415283, -1.6410892009735107, -1.5858862400054932, -1.5306833982467651, -1.4754804372787476, -1.4202775955200195, -1.365074634552002, -1.3098716735839844, -1.2546687126159668, -1.1994658708572388, -1.1442629098892212, -1.0890600681304932, -1.0338571071624756, -0.9786542057991028, -0.92345130443573, -0.8682483434677124, -0.8130454421043396, -0.7578424215316772, -0.7026395201683044, -0.6474366188049316, -0.5922336578369141, -0.5370307564735413, -0.48182785511016846, -0.42662492394447327, -0.3714219927787781, -0.3162190914154053, -0.26101619005203247, -0.20581325888633728, -0.15061034262180328, -0.09540742635726929, -0.040204524993896484, 0.014998406171798706, 0.0702013373374939, 0.1254042387008667, 0.1806071549654007, 0.2358100712299347, 0.2910130023956299, 0.3462159037590027, 0.4014188051223755, 0.4566217362880707, 0.5118246674537659, 0.5670275688171387, 0.6222304701805115, 0.6774333715438843, 0.7326363325119019, 0.7878392338752747, 0.8430421352386475, 0.898245096206665, 0.9534479975700378, 1.0086508989334106]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 8.0, 19.0, 11.0, 19.0, 14.0, 20.0, 22.0, 24.0, 38.0, 28.0, 32.0, 51.0, 38.0, 46.0, 56.0, 63.0, 45.0, 40.0, 43.0, 51.0, 51.0, 44.0, 34.0, 32.0, 29.0, 18.0, 20.0, 15.0, 11.0, 9.0, 16.0, 9.0, 5.0, 7.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.186760425567627, -1.1497776508331299, -1.1127947568893433, -1.0758118629455566, -1.0388290882110596, -1.0018463134765625, -0.9648634195327759, -0.927880585193634, -0.8908977508544922, -0.8539149165153503, -0.8169320821762085, -0.7799492478370667, -0.7429664134979248, -0.705983579158783, -0.6690007448196411, -0.6320179104804993, -0.5950350761413574, -0.5580522418022156, -0.5210694074630737, -0.4840865731239319, -0.44710373878479004, -0.4101209044456482, -0.37313807010650635, -0.3361552357673645, -0.29917240142822266, -0.2621895670890808, -0.22520673274993896, -0.18822389841079712, -0.15124106407165527, -0.11425822973251343, -0.07727539539337158, -0.040292561054229736, -0.0033098459243774414, 0.033672988414764404, 0.07065582275390625, 0.1076386570930481, 0.14462149143218994, 0.1816043257713318, 0.21858716011047363, 0.2555699944496155, 0.2925528287887573, 0.32953566312789917, 0.366518497467041, 0.40350133180618286, 0.4404841661453247, 0.47746700048446655, 0.5144498348236084, 0.5514326691627502, 0.5884155035018921, 0.6253983378410339, 0.6623811721801758, 0.6993640065193176, 0.7363468408584595, 0.7733296751976013, 0.8103125095367432, 0.847295343875885, 0.8842781782150269, 0.9212610125541687, 0.9582438468933105, 0.9952266812324524, 1.0322095155715942, 1.0691924095153809, 1.106175184249878, 1.143157958984375, 1.1801408529281616]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 12.0, 10.0, 16.0, 13.0, 14.0, 27.0, 54.0, 60.0, 97.0, 111.0, 175.0, 273.0, 472.0, 816.0, 1768.0, 4002.0, 10383.0, 32757.0, 135846.0, 646303.0, 158917.0, 36594.0, 11436.0, 4264.0, 1884.0, 859.0, 484.0, 281.0, 171.0, 121.0, 87.0, 51.0, 38.0, 37.0, 24.0, 22.0, 19.0, 9.0, 10.0, 5.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7366256713867188, -0.7125091552734375, -0.6883926391601562, -0.664276123046875, -0.6401596069335938, -0.6160430908203125, -0.5919265747070312, -0.56781005859375, -0.5436935424804688, -0.5195770263671875, -0.49546051025390625, -0.471343994140625, -0.44722747802734375, -0.4231109619140625, -0.39899444580078125, -0.3748779296875, -0.35076141357421875, -0.3266448974609375, -0.30252838134765625, -0.278411865234375, -0.25429534912109375, -0.2301788330078125, -0.20606231689453125, -0.18194580078125, -0.15782928466796875, -0.1337127685546875, -0.10959625244140625, -0.085479736328125, -0.06136322021484375, -0.0372467041015625, -0.01313018798828125, 0.010986328125, 0.03510284423828125, 0.0592193603515625, 0.08333587646484375, 0.107452392578125, 0.13156890869140625, 0.1556854248046875, 0.17980194091796875, 0.20391845703125, 0.22803497314453125, 0.2521514892578125, 0.27626800537109375, 0.300384521484375, 0.32450103759765625, 0.3486175537109375, 0.37273406982421875, 0.3968505859375, 0.42096710205078125, 0.4450836181640625, 0.46920013427734375, 0.493316650390625, 0.5174331665039062, 0.5415496826171875, 0.5656661987304688, 0.58978271484375, 0.6138992309570312, 0.6380157470703125, 0.6621322631835938, 0.686248779296875, 0.7103652954101562, 0.7344818115234375, 0.7585983276367188, 0.78271484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 9.0, 7.0, 15.0, 29.0, 32.0, 59.0, 72.0, 79.0, 104.0, 88.0, 98.0, 93.0, 74.0, 63.0, 57.0, 40.0, 36.0, 13.0, 13.0, 7.0, 6.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179443359375, -0.1725616455078125, -0.165679931640625, -0.1587982177734375, -0.15191650390625, -0.1450347900390625, -0.138153076171875, -0.1312713623046875, -0.1243896484375, -0.1175079345703125, -0.110626220703125, -0.1037445068359375, -0.09686279296875, -0.0899810791015625, -0.083099365234375, -0.0762176513671875, -0.0693359375, -0.0624542236328125, -0.055572509765625, -0.0486907958984375, -0.04180908203125, -0.0349273681640625, -0.028045654296875, -0.0211639404296875, -0.0142822265625, -0.0074005126953125, -0.000518798828125, 0.0063629150390625, 0.01324462890625, 0.0201263427734375, 0.027008056640625, 0.0338897705078125, 0.040771484375, 0.0476531982421875, 0.054534912109375, 0.0614166259765625, 0.06829833984375, 0.0751800537109375, 0.082061767578125, 0.0889434814453125, 0.0958251953125, 0.1027069091796875, 0.109588623046875, 0.1164703369140625, 0.12335205078125, 0.1302337646484375, 0.137115478515625, 0.1439971923828125, 0.15087890625, 0.1577606201171875, 0.164642333984375, 0.1715240478515625, 0.17840576171875, 0.1852874755859375, 0.192169189453125, 0.1990509033203125, 0.2059326171875, 0.2128143310546875, 0.219696044921875, 0.2265777587890625, 0.23345947265625, 0.2403411865234375, 0.247222900390625, 0.2541046142578125, 0.260986328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 13.0, 14.0, 13.0, 25.0, 35.0, 42.0, 63.0, 98.0, 162.0, 224.0, 414.0, 741.0, 1364.0, 2723.0, 5637.0, 13930.0, 37519.0, 130096.0, 627021.0, 157808.0, 42526.0, 15316.0, 6459.0, 2861.0, 1467.0, 757.0, 457.0, 270.0, 144.0, 118.0, 69.0, 53.0, 31.0, 16.0, 17.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60986328125, -0.5885086059570312, -0.5671539306640625, -0.5457992553710938, -0.524444580078125, -0.5030899047851562, -0.4817352294921875, -0.46038055419921875, -0.43902587890625, -0.41767120361328125, -0.3963165283203125, -0.37496185302734375, -0.353607177734375, -0.33225250244140625, -0.3108978271484375, -0.28954315185546875, -0.2681884765625, -0.24683380126953125, -0.2254791259765625, -0.20412445068359375, -0.182769775390625, -0.16141510009765625, -0.1400604248046875, -0.11870574951171875, -0.09735107421875, -0.07599639892578125, -0.0546417236328125, -0.03328704833984375, -0.011932373046875, 0.00942230224609375, 0.0307769775390625, 0.05213165283203125, 0.073486328125, 0.09484100341796875, 0.1161956787109375, 0.13755035400390625, 0.158905029296875, 0.18025970458984375, 0.2016143798828125, 0.22296905517578125, 0.24432373046875, 0.26567840576171875, 0.2870330810546875, 0.30838775634765625, 0.329742431640625, 0.35109710693359375, 0.3724517822265625, 0.39380645751953125, 0.4151611328125, 0.43651580810546875, 0.4578704833984375, 0.47922515869140625, 0.500579833984375, 0.5219345092773438, 0.5432891845703125, 0.5646438598632812, 0.58599853515625, 0.6073532104492188, 0.6287078857421875, 0.6500625610351562, 0.671417236328125, 0.6927719116210938, 0.7141265869140625, 0.7354812622070312, 0.7568359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 11.0, 7.0, 7.0, 9.0, 13.0, 15.0, 9.0, 16.0, 12.0, 17.0, 25.0, 23.0, 14.0, 25.0, 43.0, 33.0, 49.0, 41.0, 54.0, 51.0, 53.0, 43.0, 43.0, 37.0, 29.0, 41.0, 36.0, 34.0, 32.0, 30.0, 27.0, 18.0, 27.0, 12.0, 14.0, 10.0, 4.0, 7.0, 9.0, 5.0, 0.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4501953125, -0.43389892578125, -0.4176025390625, -0.40130615234375, -0.385009765625, -0.36871337890625, -0.3524169921875, -0.33612060546875, -0.31982421875, -0.30352783203125, -0.2872314453125, -0.27093505859375, -0.254638671875, -0.23834228515625, -0.2220458984375, -0.20574951171875, -0.189453125, -0.17315673828125, -0.1568603515625, -0.14056396484375, -0.124267578125, -0.10797119140625, -0.0916748046875, -0.07537841796875, -0.05908203125, -0.04278564453125, -0.0264892578125, -0.01019287109375, 0.006103515625, 0.02239990234375, 0.0386962890625, 0.05499267578125, 0.0712890625, 0.08758544921875, 0.1038818359375, 0.12017822265625, 0.136474609375, 0.15277099609375, 0.1690673828125, 0.18536376953125, 0.20166015625, 0.21795654296875, 0.2342529296875, 0.25054931640625, 0.266845703125, 0.28314208984375, 0.2994384765625, 0.31573486328125, 0.33203125, 0.34832763671875, 0.3646240234375, 0.38092041015625, 0.397216796875, 0.41351318359375, 0.4298095703125, 0.44610595703125, 0.46240234375, 0.47869873046875, 0.4949951171875, 0.51129150390625, 0.527587890625, 0.54388427734375, 0.5601806640625, 0.57647705078125, 0.5927734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 10.0, 12.0, 32.0, 51.0, 127.0, 234.0, 634.0, 2027.0, 12694.0, 318661.0, 690227.0, 19821.0, 2764.0, 722.0, 277.0, 144.0, 49.0, 32.0, 13.0, 8.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5141754150390625, -0.493682861328125, -0.4731903076171875, -0.45269775390625, -0.4322052001953125, -0.411712646484375, -0.3912200927734375, -0.3707275390625, -0.3502349853515625, -0.329742431640625, -0.3092498779296875, -0.28875732421875, -0.2682647705078125, -0.247772216796875, -0.2272796630859375, -0.206787109375, -0.1862945556640625, -0.165802001953125, -0.1453094482421875, -0.12481689453125, -0.1043243408203125, -0.083831787109375, -0.0633392333984375, -0.0428466796875, -0.0223541259765625, -0.001861572265625, 0.0186309814453125, 0.03912353515625, 0.0596160888671875, 0.080108642578125, 0.1006011962890625, 0.12109375, 0.1415863037109375, 0.162078857421875, 0.1825714111328125, 0.20306396484375, 0.2235565185546875, 0.244049072265625, 0.2645416259765625, 0.2850341796875, 0.3055267333984375, 0.326019287109375, 0.3465118408203125, 0.36700439453125, 0.3874969482421875, 0.407989501953125, 0.4284820556640625, 0.448974609375, 0.4694671630859375, 0.489959716796875, 0.5104522705078125, 0.53094482421875, 0.5514373779296875, 0.571929931640625, 0.5924224853515625, 0.6129150390625, 0.6334075927734375, 0.653900146484375, 0.6743927001953125, 0.69488525390625, 0.7153778076171875, 0.735870361328125, 0.7563629150390625, 0.77685546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 8.0, 5.0, 12.0, 9.0, 16.0, 24.0, 22.0, 32.0, 31.0, 43.0, 69.0, 102.0, 162.0, 121.0, 83.0, 65.0, 42.0, 23.0, 27.0, 21.0, 14.0, 8.0, 12.0, 5.0, 5.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.23347407579422e-05, -5.0786882638931274e-05, -4.923902451992035e-05, -4.7691166400909424e-05, -4.61433082818985e-05, -4.459545016288757e-05, -4.304759204387665e-05, -4.149973392486572e-05, -3.99518758058548e-05, -3.840401768684387e-05, -3.685615956783295e-05, -3.530830144882202e-05, -3.3760443329811096e-05, -3.221258521080017e-05, -3.0664727091789246e-05, -2.911686897277832e-05, -2.7569010853767395e-05, -2.602115273475647e-05, -2.4473294615745544e-05, -2.292543649673462e-05, -2.1377578377723694e-05, -1.982972025871277e-05, -1.8281862139701843e-05, -1.6734004020690918e-05, -1.5186145901679993e-05, -1.3638287782669067e-05, -1.2090429663658142e-05, -1.0542571544647217e-05, -8.994713425636292e-06, -7.446855306625366e-06, -5.898997187614441e-06, -4.351139068603516e-06, -2.8032809495925903e-06, -1.255422830581665e-06, 2.9243528842926025e-07, 1.8402934074401855e-06, 3.388151526451111e-06, 4.936009645462036e-06, 6.4838677644729614e-06, 8.031725883483887e-06, 9.579584002494812e-06, 1.1127442121505737e-05, 1.2675300240516663e-05, 1.4223158359527588e-05, 1.5771016478538513e-05, 1.731887459754944e-05, 1.8866732716560364e-05, 2.041459083557129e-05, 2.1962448954582214e-05, 2.351030707359314e-05, 2.5058165192604065e-05, 2.660602331161499e-05, 2.8153881430625916e-05, 2.970173954963684e-05, 3.1249597668647766e-05, 3.279745578765869e-05, 3.434531390666962e-05, 3.589317202568054e-05, 3.744103014469147e-05, 3.898888826370239e-05, 4.053674638271332e-05, 4.208460450172424e-05, 4.363246262073517e-05, 4.5180320739746094e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 11.0, 10.0, 29.0, 56.0, 141.0, 282.0, 833.0, 3070.0, 32528.0, 915898.0, 88698.0, 5189.0, 1130.0, 377.0, 145.0, 59.0, 31.0, 21.0, 18.0, 11.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8271942138671875, -0.801849365234375, -0.7765045166015625, -0.75115966796875, -0.7258148193359375, -0.700469970703125, -0.6751251220703125, -0.6497802734375, -0.6244354248046875, -0.599090576171875, -0.5737457275390625, -0.54840087890625, -0.5230560302734375, -0.497711181640625, -0.4723663330078125, -0.447021484375, -0.4216766357421875, -0.396331787109375, -0.3709869384765625, -0.34564208984375, -0.3202972412109375, -0.294952392578125, -0.2696075439453125, -0.2442626953125, -0.2189178466796875, -0.193572998046875, -0.1682281494140625, -0.14288330078125, -0.1175384521484375, -0.092193603515625, -0.0668487548828125, -0.04150390625, -0.0161590576171875, 0.009185791015625, 0.0345306396484375, 0.05987548828125, 0.0852203369140625, 0.110565185546875, 0.1359100341796875, 0.1612548828125, 0.1865997314453125, 0.211944580078125, 0.2372894287109375, 0.26263427734375, 0.2879791259765625, 0.313323974609375, 0.3386688232421875, 0.364013671875, 0.3893585205078125, 0.414703369140625, 0.4400482177734375, 0.46539306640625, 0.4907379150390625, 0.516082763671875, 0.5414276123046875, 0.5667724609375, 0.5921173095703125, 0.617462158203125, 0.6428070068359375, 0.66815185546875, 0.6934967041015625, 0.718841552734375, 0.7441864013671875, 0.76953125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 9.0, 21.0, 23.0, 29.0, 52.0, 75.0, 134.0, 231.0, 166.0, 77.0, 53.0, 33.0, 24.0, 21.0, 14.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.4174842834472656, -0.40381622314453125, -0.3901481628417969, -0.3764801025390625, -0.3628120422363281, -0.34914398193359375, -0.3354759216308594, -0.321807861328125, -0.3081398010253906, -0.29447174072265625, -0.2808036804199219, -0.2671356201171875, -0.2534675598144531, -0.23979949951171875, -0.22613143920898438, -0.21246337890625, -0.19879531860351562, -0.18512725830078125, -0.17145919799804688, -0.1577911376953125, -0.14412307739257812, -0.13045501708984375, -0.11678695678710938, -0.103118896484375, -0.08945083618164062, -0.07578277587890625, -0.062114715576171875, -0.0484466552734375, -0.034778594970703125, -0.02111053466796875, -0.007442474365234375, 0.0062255859375, 0.019893646240234375, 0.03356170654296875, 0.047229766845703125, 0.0608978271484375, 0.07456588745117188, 0.08823394775390625, 0.10190200805664062, 0.115570068359375, 0.12923812866210938, 0.14290618896484375, 0.15657424926757812, 0.1702423095703125, 0.18391036987304688, 0.19757843017578125, 0.21124649047851562, 0.22491455078125, 0.23858261108398438, 0.25225067138671875, 0.2659187316894531, 0.2795867919921875, 0.2932548522949219, 0.30692291259765625, 0.3205909729003906, 0.334259033203125, 0.3479270935058594, 0.36159515380859375, 0.3752632141113281, 0.3889312744140625, 0.4025993347167969, 0.41626739501953125, 0.4299354553222656, 0.443603515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 17.0, 116.0, 496.0, 317.0, 49.0, 9.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.888079643249512, -4.258939266204834, -3.6297993659973145, -3.0006589889526367, -2.371518850326538, -1.7423787117004395, -1.1132383346557617, -0.4840984344482422, 0.14504194259643555, 0.774182140827179, 1.4033223390579224, 2.0324625968933105, 2.661602735519409, 3.290742874145508, 3.9198832511901855, 4.549023151397705, 5.178163528442383, 5.8073039054870605, 6.43644380569458, 7.065584182739258, 7.694724082946777, 8.323863983154297, 8.953004837036133, 9.582144737243652, 10.211284637451172, 10.840424537658691, 11.469565391540527, 12.098705291748047, 12.727845191955566, 13.356985092163086, 13.986125946044922, 14.615265846252441, 15.244405746459961, 15.87354564666748, 16.502685546875, 17.131826400756836, 17.760967254638672, 18.390106201171875, 19.01924705505371, 19.648387908935547, 20.27752685546875, 20.906667709350586, 21.53580665588379, 22.164947509765625, 22.79408836364746, 23.423227310180664, 24.0523681640625, 24.681507110595703, 25.310649871826172, 25.939790725708008, 26.56892967224121, 27.198070526123047, 27.827211380004883, 28.456350326538086, 29.085491180419922, 29.714630126953125, 30.34377098083496, 30.972911834716797, 31.60205078125, 32.23119354248047, 32.86033248901367, 33.489471435546875, 34.118614196777344, 34.74775314331055, 35.37689208984375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 5.0, 5.0, 8.0, 16.0, 17.0, 19.0, 21.0, 20.0, 27.0, 43.0, 31.0, 32.0, 45.0, 51.0, 35.0, 48.0, 46.0, 59.0, 44.0, 45.0, 45.0, 38.0, 44.0, 43.0, 28.0, 23.0, 24.0, 18.0, 20.0, 24.0, 16.0, 17.0, 9.0, 8.0, 6.0, 7.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2176380157470703, -3.1202192306518555, -3.0228004455566406, -2.9253814220428467, -2.827962636947632, -2.730543851852417, -2.633124828338623, -2.535706043243408, -2.4382872581481934, -2.3408684730529785, -2.2434496879577637, -2.1460306644439697, -2.048611879348755, -1.95119309425354, -1.8537741899490356, -1.7563552856445312, -1.6589365005493164, -1.5615177154541016, -1.4640988111495972, -1.3666799068450928, -1.269261121749878, -1.171842336654663, -1.0744234323501587, -0.9770045876502991, -0.8795857429504395, -0.7821668982505798, -0.6847480535507202, -0.5873292088508606, -0.489910364151001, -0.39249151945114136, -0.29507267475128174, -0.19765383005142212, -0.1002349853515625, -0.002816140651702881, 0.09460270404815674, 0.19202154874801636, 0.289440393447876, 0.3868592381477356, 0.4842780828475952, 0.5816969275474548, 0.6791157722473145, 0.7765346169471741, 0.8739534616470337, 0.9713723063468933, 1.068791151046753, 1.1662099361419678, 1.2636288404464722, 1.3610477447509766, 1.4584665298461914, 1.5558853149414062, 1.6533042192459106, 1.750723123550415, 1.8481419086456299, 1.9455606937408447, 2.0429797172546387, 2.1403985023498535, 2.2378172874450684, 2.335236072540283, 2.432654857635498, 2.530073881149292, 2.627492666244507, 2.7249114513397217, 2.8223304748535156, 2.9197492599487305, 3.0171680450439453]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 8.0, 17.0, 21.0, 49.0, 85.0, 139.0, 294.0, 895.0, 3898.0, 34849.0, 3879678.0, 260242.0, 11199.0, 1844.0, 562.0, 227.0, 120.0, 58.0, 33.0, 25.0, 16.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.603515625, -1.561065673828125, -1.51861572265625, -1.476165771484375, -1.4337158203125, -1.391265869140625, -1.34881591796875, -1.306365966796875, -1.263916015625, -1.221466064453125, -1.17901611328125, -1.136566162109375, -1.0941162109375, -1.051666259765625, -1.00921630859375, -0.966766357421875, -0.92431640625, -0.881866455078125, -0.83941650390625, -0.796966552734375, -0.7545166015625, -0.712066650390625, -0.66961669921875, -0.627166748046875, -0.584716796875, -0.542266845703125, -0.49981689453125, -0.457366943359375, -0.4149169921875, -0.372467041015625, -0.33001708984375, -0.287567138671875, -0.2451171875, -0.202667236328125, -0.16021728515625, -0.117767333984375, -0.0753173828125, -0.032867431640625, 0.00958251953125, 0.052032470703125, 0.094482421875, 0.136932373046875, 0.17938232421875, 0.221832275390625, 0.2642822265625, 0.306732177734375, 0.34918212890625, 0.391632080078125, 0.43408203125, 0.476531982421875, 0.51898193359375, 0.561431884765625, 0.6038818359375, 0.646331787109375, 0.68878173828125, 0.731231689453125, 0.773681640625, 0.816131591796875, 0.85858154296875, 0.901031494140625, 0.9434814453125, 0.985931396484375, 1.02838134765625, 1.070831298828125, 1.11328125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 14.0, 21.0, 29.0, 46.0, 51.0, 73.0, 74.0, 85.0, 101.0, 99.0, 85.0, 83.0, 64.0, 57.0, 46.0, 23.0, 13.0, 12.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218994140625, -0.21142959594726562, -0.20386505126953125, -0.19630050659179688, -0.1887359619140625, -0.18117141723632812, -0.17360687255859375, -0.16604232788085938, -0.158477783203125, -0.15091323852539062, -0.14334869384765625, -0.13578414916992188, -0.1282196044921875, -0.12065505981445312, -0.11309051513671875, -0.10552597045898438, -0.09796142578125, -0.09039688110351562, -0.08283233642578125, -0.07526779174804688, -0.0677032470703125, -0.060138702392578125, -0.05257415771484375, -0.045009613037109375, -0.037445068359375, -0.029880523681640625, -0.02231597900390625, -0.014751434326171875, -0.0071868896484375, 0.000377655029296875, 0.00794219970703125, 0.015506744384765625, 0.0230712890625, 0.030635833740234375, 0.03820037841796875, 0.045764923095703125, 0.0533294677734375, 0.060894012451171875, 0.06845855712890625, 0.07602310180664062, 0.083587646484375, 0.09115219116210938, 0.09871673583984375, 0.10628128051757812, 0.1138458251953125, 0.12141036987304688, 0.12897491455078125, 0.13653945922851562, 0.14410400390625, 0.15166854858398438, 0.15923309326171875, 0.16679763793945312, 0.1743621826171875, 0.18192672729492188, 0.18949127197265625, 0.19705581665039062, 0.204620361328125, 0.21218490600585938, 0.21974945068359375, 0.22731399536132812, 0.2348785400390625, 0.24244308471679688, 0.25000762939453125, 0.2575721740722656, 0.26513671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 15.0, 15.0, 23.0, 28.0, 29.0, 58.0, 77.0, 139.0, 256.0, 463.0, 973.0, 2515.0, 7206.0, 32077.0, 525338.0, 3542934.0, 64715.0, 11294.0, 3406.0, 1402.0, 562.0, 284.0, 158.0, 91.0, 67.0, 46.0, 17.0, 24.0, 13.0, 18.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.2451171875, -1.210693359375, -1.17626953125, -1.141845703125, -1.107421875, -1.072998046875, -1.03857421875, -1.004150390625, -0.9697265625, -0.935302734375, -0.90087890625, -0.866455078125, -0.83203125, -0.797607421875, -0.76318359375, -0.728759765625, -0.6943359375, -0.659912109375, -0.62548828125, -0.591064453125, -0.556640625, -0.522216796875, -0.48779296875, -0.453369140625, -0.4189453125, -0.384521484375, -0.35009765625, -0.315673828125, -0.28125, -0.246826171875, -0.21240234375, -0.177978515625, -0.1435546875, -0.109130859375, -0.07470703125, -0.040283203125, -0.005859375, 0.028564453125, 0.06298828125, 0.097412109375, 0.1318359375, 0.166259765625, 0.20068359375, 0.235107421875, 0.26953125, 0.303955078125, 0.33837890625, 0.372802734375, 0.4072265625, 0.441650390625, 0.47607421875, 0.510498046875, 0.544921875, 0.579345703125, 0.61376953125, 0.648193359375, 0.6826171875, 0.717041015625, 0.75146484375, 0.785888671875, 0.8203125, 0.854736328125, 0.88916015625, 0.923583984375, 0.9580078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 13.0, 18.0, 36.0, 53.0, 114.0, 314.0, 1699.0, 1256.0, 285.0, 116.0, 66.0, 25.0, 16.0, 12.0, 9.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3727569580078125, -0.357818603515625, -0.3428802490234375, -0.32794189453125, -0.3130035400390625, -0.298065185546875, -0.2831268310546875, -0.2681884765625, -0.2532501220703125, -0.238311767578125, -0.2233734130859375, -0.20843505859375, -0.1934967041015625, -0.178558349609375, -0.1636199951171875, -0.148681640625, -0.1337432861328125, -0.118804931640625, -0.1038665771484375, -0.08892822265625, -0.0739898681640625, -0.059051513671875, -0.0441131591796875, -0.0291748046875, -0.0142364501953125, 0.000701904296875, 0.0156402587890625, 0.03057861328125, 0.0455169677734375, 0.060455322265625, 0.0753936767578125, 0.09033203125, 0.1052703857421875, 0.120208740234375, 0.1351470947265625, 0.15008544921875, 0.1650238037109375, 0.179962158203125, 0.1949005126953125, 0.2098388671875, 0.2247772216796875, 0.239715576171875, 0.2546539306640625, 0.26959228515625, 0.2845306396484375, 0.299468994140625, 0.3144073486328125, 0.329345703125, 0.3442840576171875, 0.359222412109375, 0.3741607666015625, 0.38909912109375, 0.4040374755859375, 0.418975830078125, 0.4339141845703125, 0.4488525390625, 0.4637908935546875, 0.478729248046875, 0.4936676025390625, 0.50860595703125, 0.5235443115234375, 0.538482666015625, 0.5534210205078125, 0.568359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 18.0, 49.0, 108.0, 262.0, 301.0, 181.0, 52.0, 14.0, 10.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.051361083984375, -4.9226837158203125, -4.79400634765625, -4.6653289794921875, -4.536651611328125, -4.407974720001221, -4.279297351837158, -4.150619983673096, -4.021942615509033, -3.8932652473449707, -3.764587879180908, -3.635910749435425, -3.5072333812713623, -3.3785560131073, -3.2498788833618164, -3.121201515197754, -2.9925241470336914, -2.863846778869629, -2.7351694107055664, -2.606492280960083, -2.4778149127960205, -2.349137544631958, -2.2204604148864746, -2.091783046722412, -1.9631056785583496, -1.834428310394287, -1.7057510614395142, -1.5770738124847412, -1.4483964443206787, -1.3197190761566162, -1.1910418272018433, -1.0623645782470703, -0.9336874485015869, -0.8050101399421692, -0.6763328313827515, -0.5476555228233337, -0.418978214263916, -0.2903009057044983, -0.16162359714508057, -0.03294628858566284, 0.09573101997375488, 0.2244083285331726, 0.35308563709259033, 0.48176294565200806, 0.6104402542114258, 0.7391175627708435, 0.8677948713302612, 0.996472179889679, 1.1251494884490967, 1.2538268566131592, 1.3825041055679321, 1.511181354522705, 1.6398587226867676, 1.76853609085083, 1.897213339805603, 2.025890588760376, 2.1545679569244385, 2.283245325088501, 2.4119224548339844, 2.540599822998047, 2.6692771911621094, 2.797954559326172, 2.9266319274902344, 3.0553090572357178, 3.1839864253997803]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 3.0, 6.0, 11.0, 7.0, 10.0, 19.0, 22.0, 23.0, 28.0, 28.0, 39.0, 44.0, 47.0, 61.0, 57.0, 56.0, 67.0, 70.0, 51.0, 64.0, 51.0, 54.0, 30.0, 29.0, 25.0, 21.0, 14.0, 23.0, 11.0, 10.0, 9.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3676822185516357, -1.3287575244903564, -1.2898327112197876, -1.2509080171585083, -1.211983323097229, -1.1730585098266602, -1.1341338157653809, -1.0952091217041016, -1.0562844276428223, -1.017359733581543, -0.9784349799156189, -0.9395102262496948, -0.9005855321884155, -0.8616607785224915, -0.8227360248565674, -0.7838113307952881, -0.7448865175247192, -0.7059617638587952, -0.6670370697975159, -0.6281123161315918, -0.5891876220703125, -0.5502628684043884, -0.5113381147384644, -0.47241339087486267, -0.433488667011261, -0.3945639431476593, -0.3556392192840576, -0.31671446561813354, -0.27778974175453186, -0.23886501789093018, -0.1999402791261673, -0.16101554036140442, -0.12209093570709229, -0.08316620439291, -0.04424147307872772, -0.005316741764545441, 0.03360798954963684, 0.07253271341323853, 0.1114574521780014, 0.15038219094276428, 0.18930691480636597, 0.22823163866996765, 0.26715636253356934, 0.3060811161994934, 0.3450058400630951, 0.3839305639266968, 0.42285531759262085, 0.46178004145622253, 0.5007047653198242, 0.5396295189857483, 0.5785542130470276, 0.6174789667129517, 0.656403660774231, 0.695328414440155, 0.7342531681060791, 0.7731778621673584, 0.8121026158332825, 0.8510273694992065, 0.8899520635604858, 0.9288768172264099, 0.967801570892334, 1.0067262649536133, 1.0456509590148926, 1.0845757722854614, 1.1235004663467407]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 5.0, 5.0, 9.0, 12.0, 14.0, 31.0, 26.0, 56.0, 81.0, 131.0, 204.0, 365.0, 692.0, 1472.0, 3662.0, 10821.0, 36780.0, 162311.0, 628389.0, 151478.0, 35331.0, 10249.0, 3390.0, 1404.0, 670.0, 369.0, 197.0, 125.0, 101.0, 59.0, 32.0, 22.0, 18.0, 13.0, 7.0, 2.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.861328125, -0.835601806640625, -0.80987548828125, -0.784149169921875, -0.7584228515625, -0.732696533203125, -0.70697021484375, -0.681243896484375, -0.655517578125, -0.629791259765625, -0.60406494140625, -0.578338623046875, -0.5526123046875, -0.526885986328125, -0.50115966796875, -0.475433349609375, -0.44970703125, -0.423980712890625, -0.39825439453125, -0.372528076171875, -0.3468017578125, -0.321075439453125, -0.29534912109375, -0.269622802734375, -0.243896484375, -0.218170166015625, -0.19244384765625, -0.166717529296875, -0.1409912109375, -0.115264892578125, -0.08953857421875, -0.063812255859375, -0.0380859375, -0.012359619140625, 0.01336669921875, 0.039093017578125, 0.0648193359375, 0.090545654296875, 0.11627197265625, 0.141998291015625, 0.167724609375, 0.193450927734375, 0.21917724609375, 0.244903564453125, 0.2706298828125, 0.296356201171875, 0.32208251953125, 0.347808837890625, 0.37353515625, 0.399261474609375, 0.42498779296875, 0.450714111328125, 0.4764404296875, 0.502166748046875, 0.52789306640625, 0.553619384765625, 0.579345703125, 0.605072021484375, 0.63079833984375, 0.656524658203125, 0.6822509765625, 0.707977294921875, 0.73370361328125, 0.759429931640625, 0.78515625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 8.0, 24.0, 21.0, 31.0, 37.0, 53.0, 60.0, 49.0, 82.0, 84.0, 77.0, 88.0, 86.0, 61.0, 57.0, 61.0, 40.0, 21.0, 17.0, 12.0, 13.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.19822120666503906, -0.19099807739257812, -0.1837749481201172, -0.17655181884765625, -0.1693286895751953, -0.16210556030273438, -0.15488243103027344, -0.1476593017578125, -0.14043617248535156, -0.13321304321289062, -0.1259899139404297, -0.11876678466796875, -0.11154365539550781, -0.10432052612304688, -0.09709739685058594, -0.089874267578125, -0.08265113830566406, -0.07542800903320312, -0.06820487976074219, -0.06098175048828125, -0.05375862121582031, -0.046535491943359375, -0.03931236267089844, -0.0320892333984375, -0.024866104125976562, -0.017642974853515625, -0.010419845581054688, -0.00319671630859375, 0.0040264129638671875, 0.011249542236328125, 0.018472671508789062, 0.02569580078125, 0.03291893005371094, 0.040142059326171875, 0.04736518859863281, 0.05458831787109375, 0.06181144714355469, 0.06903457641601562, 0.07625770568847656, 0.0834808349609375, 0.09070396423339844, 0.09792709350585938, 0.10515022277832031, 0.11237335205078125, 0.11959648132324219, 0.12681961059570312, 0.13404273986816406, 0.141265869140625, 0.14848899841308594, 0.15571212768554688, 0.1629352569580078, 0.17015838623046875, 0.1773815155029297, 0.18460464477539062, 0.19182777404785156, 0.1990509033203125, 0.20627403259277344, 0.21349716186523438, 0.2207202911376953, 0.22794342041015625, 0.2351665496826172, 0.24238967895507812, 0.24961280822753906, 0.2568359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 2.0, 6.0, 5.0, 13.0, 20.0, 31.0, 47.0, 52.0, 86.0, 151.0, 265.0, 461.0, 904.0, 1829.0, 4417.0, 11809.0, 35957.0, 130789.0, 603674.0, 185924.0, 46822.0, 15078.0, 5492.0, 2355.0, 1045.0, 562.0, 282.0, 170.0, 90.0, 70.0, 48.0, 26.0, 21.0, 17.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5924835205078125, -0.570220947265625, -0.5479583740234375, -0.52569580078125, -0.5034332275390625, -0.481170654296875, -0.4589080810546875, -0.4366455078125, -0.4143829345703125, -0.392120361328125, -0.3698577880859375, -0.34759521484375, -0.3253326416015625, -0.303070068359375, -0.2808074951171875, -0.258544921875, -0.2362823486328125, -0.214019775390625, -0.1917572021484375, -0.16949462890625, -0.1472320556640625, -0.124969482421875, -0.1027069091796875, -0.0804443359375, -0.0581817626953125, -0.035919189453125, -0.0136566162109375, 0.00860595703125, 0.0308685302734375, 0.053131103515625, 0.0753936767578125, 0.09765625, 0.1199188232421875, 0.142181396484375, 0.1644439697265625, 0.18670654296875, 0.2089691162109375, 0.231231689453125, 0.2534942626953125, 0.2757568359375, 0.2980194091796875, 0.320281982421875, 0.3425445556640625, 0.36480712890625, 0.3870697021484375, 0.409332275390625, 0.4315948486328125, 0.453857421875, 0.4761199951171875, 0.498382568359375, 0.5206451416015625, 0.54290771484375, 0.5651702880859375, 0.587432861328125, 0.6096954345703125, 0.6319580078125, 0.6542205810546875, 0.676483154296875, 0.6987457275390625, 0.72100830078125, 0.7432708740234375, 0.765533447265625, 0.7877960205078125, 0.81005859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 5.0, 5.0, 5.0, 7.0, 23.0, 11.0, 19.0, 32.0, 24.0, 23.0, 24.0, 41.0, 40.0, 35.0, 49.0, 60.0, 50.0, 56.0, 53.0, 32.0, 52.0, 40.0, 45.0, 44.0, 35.0, 32.0, 27.0, 28.0, 20.0, 22.0, 16.0, 10.0, 8.0, 9.0, 7.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6318359375, -0.6089324951171875, -0.586029052734375, -0.5631256103515625, -0.54022216796875, -0.5173187255859375, -0.494415283203125, -0.4715118408203125, -0.4486083984375, -0.4257049560546875, -0.402801513671875, -0.3798980712890625, -0.35699462890625, -0.3340911865234375, -0.311187744140625, -0.2882843017578125, -0.265380859375, -0.2424774169921875, -0.219573974609375, -0.1966705322265625, -0.17376708984375, -0.1508636474609375, -0.127960205078125, -0.1050567626953125, -0.0821533203125, -0.0592498779296875, -0.036346435546875, -0.0134429931640625, 0.00946044921875, 0.0323638916015625, 0.055267333984375, 0.0781707763671875, 0.10107421875, 0.1239776611328125, 0.146881103515625, 0.1697845458984375, 0.19268798828125, 0.2155914306640625, 0.238494873046875, 0.2613983154296875, 0.2843017578125, 0.3072052001953125, 0.330108642578125, 0.3530120849609375, 0.37591552734375, 0.3988189697265625, 0.421722412109375, 0.4446258544921875, 0.467529296875, 0.4904327392578125, 0.513336181640625, 0.5362396240234375, 0.55914306640625, 0.5820465087890625, 0.604949951171875, 0.6278533935546875, 0.6507568359375, 0.6736602783203125, 0.696563720703125, 0.7194671630859375, 0.74237060546875, 0.7652740478515625, 0.788177490234375, 0.8110809326171875, 0.833984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 11.0, 16.0, 24.0, 25.0, 44.0, 51.0, 74.0, 128.0, 208.0, 449.0, 1013.0, 2673.0, 10276.0, 68956.0, 627560.0, 296423.0, 31310.0, 5966.0, 1795.0, 703.0, 321.0, 177.0, 103.0, 59.0, 48.0, 43.0, 33.0, 13.0, 11.0, 10.0, 7.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.331298828125, -0.32088470458984375, -0.3104705810546875, -0.30005645751953125, -0.289642333984375, -0.27922821044921875, -0.2688140869140625, -0.25839996337890625, -0.24798583984375, -0.23757171630859375, -0.2271575927734375, -0.21674346923828125, -0.206329345703125, -0.19591522216796875, -0.1855010986328125, -0.17508697509765625, -0.1646728515625, -0.15425872802734375, -0.1438446044921875, -0.13343048095703125, -0.123016357421875, -0.11260223388671875, -0.1021881103515625, -0.09177398681640625, -0.08135986328125, -0.07094573974609375, -0.0605316162109375, -0.05011749267578125, -0.039703369140625, -0.02928924560546875, -0.0188751220703125, -0.00846099853515625, 0.001953125, 0.01236724853515625, 0.0227813720703125, 0.03319549560546875, 0.043609619140625, 0.05402374267578125, 0.0644378662109375, 0.07485198974609375, 0.08526611328125, 0.09568023681640625, 0.1060943603515625, 0.11650848388671875, 0.126922607421875, 0.13733673095703125, 0.1477508544921875, 0.15816497802734375, 0.1685791015625, 0.17899322509765625, 0.1894073486328125, 0.19982147216796875, 0.210235595703125, 0.22064971923828125, 0.2310638427734375, 0.24147796630859375, 0.25189208984375, 0.26230621337890625, 0.2727203369140625, 0.28313446044921875, 0.293548583984375, 0.30396270751953125, 0.3143768310546875, 0.32479095458984375, 0.335205078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 13.0, 21.0, 43.0, 94.0, 148.0, 227.0, 204.0, 103.0, 63.0, 28.0, 18.0, 9.0, 13.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012069940567016602, -0.00011780578643083572, -0.00011491216719150543, -0.00011201854795217514, -0.00010912492871284485, -0.00010623130947351456, -0.00010333769023418427, -0.00010044407099485397, -9.755045175552368e-05, -9.465683251619339e-05, -9.17632132768631e-05, -8.88695940375328e-05, -8.597597479820251e-05, -8.308235555887222e-05, -8.018873631954193e-05, -7.729511708021164e-05, -7.440149784088135e-05, -7.150787860155106e-05, -6.861425936222076e-05, -6.572064012289047e-05, -6.282702088356018e-05, -5.993340164422989e-05, -5.70397824048996e-05, -5.4146163165569305e-05, -5.1252543926239014e-05, -4.835892468690872e-05, -4.546530544757843e-05, -4.257168620824814e-05, -3.967806696891785e-05, -3.6784447729587555e-05, -3.389082849025726e-05, -3.099720925092697e-05, -2.810359001159668e-05, -2.5209970772266388e-05, -2.2316351532936096e-05, -1.9422732293605804e-05, -1.6529113054275513e-05, -1.3635493814945221e-05, -1.074187457561493e-05, -7.848255336284637e-06, -4.954636096954346e-06, -2.061016857624054e-06, 8.326023817062378e-07, 3.7262216210365295e-06, 6.619840860366821e-06, 9.513460099697113e-06, 1.2407079339027405e-05, 1.5300698578357697e-05, 1.8194317817687988e-05, 2.108793705701828e-05, 2.3981556296348572e-05, 2.6875175535678864e-05, 2.9768794775009155e-05, 3.266241401433945e-05, 3.555603325366974e-05, 3.844965249300003e-05, 4.134327173233032e-05, 4.4236890971660614e-05, 4.7130510210990906e-05, 5.00241294503212e-05, 5.291774868965149e-05, 5.581136792898178e-05, 5.870498716831207e-05, 6.159860640764236e-05, 6.449222564697266e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 12.0, 14.0, 16.0, 35.0, 42.0, 77.0, 127.0, 253.0, 561.0, 1250.0, 3676.0, 13451.0, 85073.0, 714689.0, 196364.0, 23986.0, 5522.0, 1881.0, 745.0, 326.0, 170.0, 112.0, 54.0, 37.0, 24.0, 14.0, 9.0, 8.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300048828125, -0.2888031005859375, -0.277557373046875, -0.2663116455078125, -0.25506591796875, -0.2438201904296875, -0.232574462890625, -0.2213287353515625, -0.2100830078125, -0.1988372802734375, -0.187591552734375, -0.1763458251953125, -0.16510009765625, -0.1538543701171875, -0.142608642578125, -0.1313629150390625, -0.1201171875, -0.1088714599609375, -0.097625732421875, -0.0863800048828125, -0.07513427734375, -0.0638885498046875, -0.052642822265625, -0.0413970947265625, -0.0301513671875, -0.0189056396484375, -0.007659912109375, 0.0035858154296875, 0.01483154296875, 0.0260772705078125, 0.037322998046875, 0.0485687255859375, 0.059814453125, 0.0710601806640625, 0.082305908203125, 0.0935516357421875, 0.10479736328125, 0.1160430908203125, 0.127288818359375, 0.1385345458984375, 0.1497802734375, 0.1610260009765625, 0.172271728515625, 0.1835174560546875, 0.19476318359375, 0.2060089111328125, 0.217254638671875, 0.2285003662109375, 0.23974609375, 0.2509918212890625, 0.262237548828125, 0.2734832763671875, 0.28472900390625, 0.2959747314453125, 0.307220458984375, 0.3184661865234375, 0.3297119140625, 0.3409576416015625, 0.352203369140625, 0.3634490966796875, 0.37469482421875, 0.3859405517578125, 0.397186279296875, 0.4084320068359375, 0.419677734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 8.0, 13.0, 12.0, 22.0, 16.0, 24.0, 27.0, 45.0, 82.0, 115.0, 170.0, 141.0, 96.0, 67.0, 29.0, 26.0, 30.0, 25.0, 14.0, 12.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.30533599853515625, -0.2949981689453125, -0.28466033935546875, -0.274322509765625, -0.26398468017578125, -0.2536468505859375, -0.24330902099609375, -0.23297119140625, -0.22263336181640625, -0.2122955322265625, -0.20195770263671875, -0.191619873046875, -0.18128204345703125, -0.1709442138671875, -0.16060638427734375, -0.1502685546875, -0.13993072509765625, -0.1295928955078125, -0.11925506591796875, -0.108917236328125, -0.09857940673828125, -0.0882415771484375, -0.07790374755859375, -0.06756591796875, -0.05722808837890625, -0.0468902587890625, -0.03655242919921875, -0.026214599609375, -0.01587677001953125, -0.0055389404296875, 0.00479888916015625, 0.01513671875, 0.02547454833984375, 0.0358123779296875, 0.04615020751953125, 0.056488037109375, 0.06682586669921875, 0.0771636962890625, 0.08750152587890625, 0.09783935546875, 0.10817718505859375, 0.1185150146484375, 0.12885284423828125, 0.139190673828125, 0.14952850341796875, 0.1598663330078125, 0.17020416259765625, 0.1805419921875, 0.19087982177734375, 0.2012176513671875, 0.21155548095703125, 0.221893310546875, 0.23223114013671875, 0.2425689697265625, 0.25290679931640625, 0.26324462890625, 0.27358245849609375, 0.2839202880859375, 0.29425811767578125, 0.304595947265625, 0.31493377685546875, 0.3252716064453125, 0.33560943603515625, 0.345947265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 8.0, 35.0, 105.0, 164.0, 245.0, 212.0, 114.0, 44.0, 40.0, 14.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89292573928833, -4.676269054412842, -4.459611892700195, -4.242955207824707, -4.026298522949219, -3.8096415996551514, -3.592984676361084, -3.3763279914855957, -3.1596710681915283, -2.943014144897461, -2.7263574600219727, -2.5097005367279053, -2.293043613433838, -2.0763869285583496, -1.8597300052642822, -1.6430732011795044, -1.4264163970947266, -1.2097595930099487, -0.9931027293205261, -0.7764458656311035, -0.5597890615463257, -0.34313225746154785, -0.12647533416748047, 0.09018146991729736, 0.3068382740020752, 0.523495078086853, 0.7401519417762756, 0.9568088054656982, 1.173465609550476, 1.390122413635254, 1.6067793369293213, 1.8234361410140991, 2.040093421936035, 2.2567503452301025, 2.473407030105591, 2.690063953399658, 2.9067206382751465, 3.123377561569214, 3.3400344848632812, 3.5566911697387695, 3.773348093032837, 3.9900050163269043, 4.206661701202393, 4.423318862915039, 4.639975547790527, 4.856632232666016, 5.073288917541504, 5.28994607925415, 5.506602764129639, 5.723259449005127, 5.939916610717773, 6.156573295593262, 6.37322998046875, 6.589886665344238, 6.806543827056885, 7.023200511932373, 7.2398576736450195, 7.456514358520508, 7.673171520233154, 7.889828205108643, 8.106485366821289, 8.323142051696777, 8.539798736572266, 8.756455421447754, 8.973112106323242]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 5.0, 14.0, 15.0, 18.0, 13.0, 19.0, 21.0, 33.0, 28.0, 43.0, 41.0, 54.0, 46.0, 62.0, 34.0, 50.0, 47.0, 54.0, 41.0, 42.0, 52.0, 41.0, 40.0, 31.0, 29.0, 17.0, 16.0, 14.0, 16.0, 18.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.764763832092285, -2.6621859073638916, -2.559607982635498, -2.4570302963256836, -2.35445237159729, -2.2518744468688965, -2.149296760559082, -2.0467188358306885, -1.944140911102295, -1.8415629863739014, -1.7389851808547974, -1.6364073753356934, -1.5338294506072998, -1.4312515258789062, -1.3286737203598022, -1.2260959148406982, -1.1235179901123047, -1.0209400653839111, -0.9183622598648071, -0.8157843947410583, -0.7132065296173096, -0.6106286644935608, -0.508050799369812, -0.40547293424606323, -0.30289506912231445, -0.20031720399856567, -0.0977393388748169, 0.004838526248931885, 0.10741639137268066, 0.20999425649642944, 0.3125721216201782, 0.415149986743927, 0.5177278518676758, 0.6203057169914246, 0.7228835821151733, 0.8254614472389221, 0.9280393123626709, 1.0306172370910645, 1.1331950426101685, 1.2357728481292725, 1.338350772857666, 1.4409286975860596, 1.5435065031051636, 1.6460843086242676, 1.7486622333526611, 1.8512401580810547, 1.9538179636001587, 2.0563957691192627, 2.1589736938476562, 2.26155161857605, 2.3641295433044434, 2.466707229614258, 2.5692851543426514, 2.671863079071045, 2.7744407653808594, 2.877018690109253, 2.9795966148376465, 3.08217453956604, 3.1847524642944336, 3.287330150604248, 3.3899080753326416, 3.492486000061035, 3.5950636863708496, 3.697641611099243, 3.8002195358276367]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 10.0, 12.0, 12.0, 28.0, 43.0, 75.0, 146.0, 208.0, 404.0, 896.0, 2405.0, 10357.0, 113783.0, 3992980.0, 61636.0, 7615.0, 2051.0, 764.0, 348.0, 192.0, 122.0, 82.0, 39.0, 20.0, 15.0, 11.0, 6.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9794921875, -1.923583984375, -1.86767578125, -1.811767578125, -1.755859375, -1.699951171875, -1.64404296875, -1.588134765625, -1.5322265625, -1.476318359375, -1.42041015625, -1.364501953125, -1.30859375, -1.252685546875, -1.19677734375, -1.140869140625, -1.0849609375, -1.029052734375, -0.97314453125, -0.917236328125, -0.861328125, -0.805419921875, -0.74951171875, -0.693603515625, -0.6376953125, -0.581787109375, -0.52587890625, -0.469970703125, -0.4140625, -0.358154296875, -0.30224609375, -0.246337890625, -0.1904296875, -0.134521484375, -0.07861328125, -0.022705078125, 0.033203125, 0.089111328125, 0.14501953125, 0.200927734375, 0.2568359375, 0.312744140625, 0.36865234375, 0.424560546875, 0.48046875, 0.536376953125, 0.59228515625, 0.648193359375, 0.7041015625, 0.760009765625, 0.81591796875, 0.871826171875, 0.927734375, 0.983642578125, 1.03955078125, 1.095458984375, 1.1513671875, 1.207275390625, 1.26318359375, 1.319091796875, 1.375, 1.430908203125, 1.48681640625, 1.542724609375, 1.5986328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 9.0, 12.0, 13.0, 29.0, 25.0, 29.0, 49.0, 56.0, 57.0, 64.0, 77.0, 78.0, 81.0, 72.0, 77.0, 68.0, 45.0, 38.0, 40.0, 26.0, 17.0, 9.0, 11.0, 6.0, 1.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.1971302032470703, -0.18979263305664062, -0.18245506286621094, -0.17511749267578125, -0.16777992248535156, -0.16044235229492188, -0.1531047821044922, -0.1457672119140625, -0.1384296417236328, -0.13109207153320312, -0.12375450134277344, -0.11641693115234375, -0.10907936096191406, -0.10174179077148438, -0.09440422058105469, -0.087066650390625, -0.07972908020019531, -0.07239151000976562, -0.06505393981933594, -0.05771636962890625, -0.05037879943847656, -0.043041229248046875, -0.03570365905761719, -0.0283660888671875, -0.021028518676757812, -0.013690948486328125, -0.0063533782958984375, 0.00098419189453125, 0.008321762084960938, 0.015659332275390625, 0.022996902465820312, 0.03033447265625, 0.03767204284667969, 0.045009613037109375, 0.05234718322753906, 0.05968475341796875, 0.06702232360839844, 0.07435989379882812, 0.08169746398925781, 0.0890350341796875, 0.09637260437011719, 0.10371017456054688, 0.11104774475097656, 0.11838531494140625, 0.12572288513183594, 0.13306045532226562, 0.1403980255126953, 0.147735595703125, 0.1550731658935547, 0.16241073608398438, 0.16974830627441406, 0.17708587646484375, 0.18442344665527344, 0.19176101684570312, 0.1990985870361328, 0.2064361572265625, 0.2137737274169922, 0.22111129760742188, 0.22844886779785156, 0.23578643798828125, 0.24312400817871094, 0.2504615783691406, 0.2577991485595703, 0.26513671875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 12.0, 10.0, 31.0, 39.0, 56.0, 109.0, 158.0, 274.0, 426.0, 756.0, 1486.0, 3380.0, 11200.0, 67649.0, 3834324.0, 242645.0, 21808.0, 5263.0, 2114.0, 1089.0, 606.0, 316.0, 218.0, 124.0, 66.0, 44.0, 20.0, 20.0, 16.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.4383392333984375, -1.386444091796875, -1.3345489501953125, -1.28265380859375, -1.2307586669921875, -1.178863525390625, -1.1269683837890625, -1.0750732421875, -1.0231781005859375, -0.971282958984375, -0.9193878173828125, -0.86749267578125, -0.8155975341796875, -0.763702392578125, -0.7118072509765625, -0.659912109375, -0.6080169677734375, -0.556121826171875, -0.5042266845703125, -0.45233154296875, -0.4004364013671875, -0.348541259765625, -0.2966461181640625, -0.2447509765625, -0.1928558349609375, -0.140960693359375, -0.0890655517578125, -0.03717041015625, 0.0147247314453125, 0.066619873046875, 0.1185150146484375, 0.17041015625, 0.2223052978515625, 0.274200439453125, 0.3260955810546875, 0.37799072265625, 0.4298858642578125, 0.481781005859375, 0.5336761474609375, 0.5855712890625, 0.6374664306640625, 0.689361572265625, 0.7412567138671875, 0.79315185546875, 0.8450469970703125, 0.896942138671875, 0.9488372802734375, 1.000732421875, 1.0526275634765625, 1.104522705078125, 1.1564178466796875, 1.20831298828125, 1.2602081298828125, 1.312103271484375, 1.3639984130859375, 1.4158935546875, 1.4677886962890625, 1.519683837890625, 1.5715789794921875, 1.62347412109375, 1.6753692626953125, 1.727264404296875, 1.7791595458984375, 1.8310546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 9.0, 15.0, 36.0, 49.0, 109.0, 359.0, 2858.0, 406.0, 111.0, 40.0, 30.0, 15.0, 9.0, 3.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0126953125, -0.98638916015625, -0.9600830078125, -0.93377685546875, -0.907470703125, -0.88116455078125, -0.8548583984375, -0.82855224609375, -0.80224609375, -0.77593994140625, -0.7496337890625, -0.72332763671875, -0.697021484375, -0.67071533203125, -0.6444091796875, -0.61810302734375, -0.591796875, -0.56549072265625, -0.5391845703125, -0.51287841796875, -0.486572265625, -0.46026611328125, -0.4339599609375, -0.40765380859375, -0.38134765625, -0.35504150390625, -0.3287353515625, -0.30242919921875, -0.276123046875, -0.24981689453125, -0.2235107421875, -0.19720458984375, -0.1708984375, -0.14459228515625, -0.1182861328125, -0.09197998046875, -0.065673828125, -0.03936767578125, -0.0130615234375, 0.01324462890625, 0.03955078125, 0.06585693359375, 0.0921630859375, 0.11846923828125, 0.144775390625, 0.17108154296875, 0.1973876953125, 0.22369384765625, 0.25, 0.27630615234375, 0.3026123046875, 0.32891845703125, 0.355224609375, 0.38153076171875, 0.4078369140625, 0.43414306640625, 0.46044921875, 0.48675537109375, 0.5130615234375, 0.53936767578125, 0.565673828125, 0.59197998046875, 0.6182861328125, 0.64459228515625, 0.6708984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 17.0, 37.0, 94.0, 205.0, 248.0, 211.0, 104.0, 55.0, 21.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.13153076171875, -3.996438503265381, -3.861346483230591, -3.726254463195801, -3.5911622047424316, -3.4560699462890625, -3.3209779262542725, -3.1858859062194824, -3.0507936477661133, -2.915701389312744, -2.780609369277954, -2.645517349243164, -2.510425090789795, -2.375332832336426, -2.2402408123016357, -2.1051487922668457, -1.9700565338134766, -1.834964394569397, -1.6998722553253174, -1.5647801160812378, -1.4296879768371582, -1.2945958375930786, -1.159503698348999, -1.0244115591049194, -0.8893194198608398, -0.7542272806167603, -0.6191351413726807, -0.4840430021286011, -0.3489508628845215, -0.2138587236404419, -0.0787665843963623, 0.056325554847717285, 0.19141769409179688, 0.32650983333587646, 0.46160197257995605, 0.5966941118240356, 0.7317862510681152, 0.8668783903121948, 1.0019705295562744, 1.137062668800354, 1.2721548080444336, 1.4072469472885132, 1.5423390865325928, 1.6774312257766724, 1.812523365020752, 1.9476155042648315, 2.082707643508911, 2.217799663543701, 2.3528919219970703, 2.4879841804504395, 2.6230762004852295, 2.7581682205200195, 2.8932604789733887, 3.028352737426758, 3.163444757461548, 3.298536777496338, 3.433629035949707, 3.568721294403076, 3.703813314437866, 3.8389053344726562, 3.9739975929260254, 4.1090898513793945, 4.2441816329956055, 4.379273891448975, 4.514366149902344]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 7.0, 6.0, 11.0, 19.0, 15.0, 10.0, 26.0, 24.0, 33.0, 34.0, 28.0, 41.0, 38.0, 38.0, 42.0, 55.0, 35.0, 41.0, 48.0, 56.0, 46.0, 44.0, 44.0, 45.0, 33.0, 28.0, 26.0, 20.0, 14.0, 13.0, 17.0, 9.0, 7.0, 4.0, 9.0, 7.0, 7.0, 3.0, 4.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2076120376586914, -1.1650186777114868, -1.1224253177642822, -1.0798319578170776, -1.037238597869873, -0.9946452379226685, -0.9520519375801086, -0.909458577632904, -0.8668652176856995, -0.8242718577384949, -0.7816784977912903, -0.7390851974487305, -0.6964918375015259, -0.6538984775543213, -0.6113051176071167, -0.5687117576599121, -0.5261183977127075, -0.48352503776550293, -0.44093167781829834, -0.39833834767341614, -0.35574498772621155, -0.31315162777900696, -0.27055829763412476, -0.22796493768692017, -0.18537157773971558, -0.142778217792511, -0.10018487274646759, -0.057591527700424194, -0.014998167753219604, 0.027595192193984985, 0.07018852233886719, 0.11278188228607178, 0.15537524223327637, 0.19796860218048096, 0.24056194722652435, 0.28315529227256775, 0.32574865221977234, 0.36834201216697693, 0.41093534231185913, 0.4535287022590637, 0.4961220622062683, 0.5387154221534729, 0.5813087821006775, 0.6239020824432373, 0.6664954423904419, 0.7090888023376465, 0.7516821622848511, 0.7942755222320557, 0.8368688821792603, 0.8794622421264648, 0.9220556020736694, 0.964648962020874, 1.0072423219680786, 1.0498356819152832, 1.0924289226531982, 1.1350224018096924, 1.1776156425476074, 1.220209002494812, 1.2628023624420166, 1.3053957223892212, 1.3479890823364258, 1.3905824422836304, 1.433175802230835, 1.47576904296875, 1.5183625221252441]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 8.0, 14.0, 12.0, 7.0, 21.0, 24.0, 45.0, 71.0, 73.0, 148.0, 271.0, 474.0, 875.0, 1796.0, 4030.0, 9979.0, 29922.0, 118723.0, 477406.0, 302716.0, 69593.0, 19277.0, 7012.0, 2906.0, 1418.0, 729.0, 370.0, 210.0, 150.0, 78.0, 62.0, 32.0, 25.0, 18.0, 13.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0195159912109375, -0.985321044921875, -0.9511260986328125, -0.91693115234375, -0.8827362060546875, -0.848541259765625, -0.8143463134765625, -0.7801513671875, -0.7459564208984375, -0.711761474609375, -0.6775665283203125, -0.64337158203125, -0.6091766357421875, -0.574981689453125, -0.5407867431640625, -0.506591796875, -0.4723968505859375, -0.438201904296875, -0.4040069580078125, -0.36981201171875, -0.3356170654296875, -0.301422119140625, -0.2672271728515625, -0.2330322265625, -0.1988372802734375, -0.164642333984375, -0.1304473876953125, -0.09625244140625, -0.0620574951171875, -0.027862548828125, 0.0063323974609375, 0.04052734375, 0.0747222900390625, 0.108917236328125, 0.1431121826171875, 0.17730712890625, 0.2115020751953125, 0.245697021484375, 0.2798919677734375, 0.3140869140625, 0.3482818603515625, 0.382476806640625, 0.4166717529296875, 0.45086669921875, 0.4850616455078125, 0.519256591796875, 0.5534515380859375, 0.587646484375, 0.6218414306640625, 0.656036376953125, 0.6902313232421875, 0.72442626953125, 0.7586212158203125, 0.792816162109375, 0.8270111083984375, 0.8612060546875, 0.8954010009765625, 0.929595947265625, 0.9637908935546875, 0.99798583984375, 1.0321807861328125, 1.066375732421875, 1.1005706787109375, 1.134765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 10.0, 17.0, 13.0, 21.0, 26.0, 30.0, 42.0, 45.0, 72.0, 66.0, 68.0, 70.0, 70.0, 60.0, 62.0, 57.0, 45.0, 41.0, 40.0, 40.0, 16.0, 18.0, 19.0, 11.0, 2.0, 9.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22119140625, -0.21384429931640625, -0.2064971923828125, -0.19915008544921875, -0.191802978515625, -0.18445587158203125, -0.1771087646484375, -0.16976165771484375, -0.16241455078125, -0.15506744384765625, -0.1477203369140625, -0.14037322998046875, -0.133026123046875, -0.12567901611328125, -0.1183319091796875, -0.11098480224609375, -0.1036376953125, -0.09629058837890625, -0.0889434814453125, -0.08159637451171875, -0.074249267578125, -0.06690216064453125, -0.0595550537109375, -0.05220794677734375, -0.04486083984375, -0.03751373291015625, -0.0301666259765625, -0.02281951904296875, -0.015472412109375, -0.00812530517578125, -0.0007781982421875, 0.00656890869140625, 0.013916015625, 0.02126312255859375, 0.0286102294921875, 0.03595733642578125, 0.043304443359375, 0.05065155029296875, 0.0579986572265625, 0.06534576416015625, 0.07269287109375, 0.08003997802734375, 0.0873870849609375, 0.09473419189453125, 0.102081298828125, 0.10942840576171875, 0.1167755126953125, 0.12412261962890625, 0.1314697265625, 0.13881683349609375, 0.1461639404296875, 0.15351104736328125, 0.160858154296875, 0.16820526123046875, 0.1755523681640625, 0.18289947509765625, 0.19024658203125, 0.19759368896484375, 0.2049407958984375, 0.21228790283203125, 0.219635009765625, 0.22698211669921875, 0.2343292236328125, 0.24167633056640625, 0.2490234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 14.0, 14.0, 27.0, 47.0, 94.0, 190.0, 290.0, 614.0, 1344.0, 3792.0, 14216.0, 98026.0, 773057.0, 132638.0, 17001.0, 4296.0, 1530.0, 635.0, 300.0, 181.0, 95.0, 63.0, 28.0, 25.0, 4.0, 6.0, 4.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.916015625, -1.8511962890625, -1.786376953125, -1.7215576171875, -1.65673828125, -1.5919189453125, -1.527099609375, -1.4622802734375, -1.3974609375, -1.3326416015625, -1.267822265625, -1.2030029296875, -1.13818359375, -1.0733642578125, -1.008544921875, -0.9437255859375, -0.87890625, -0.8140869140625, -0.749267578125, -0.6844482421875, -0.61962890625, -0.5548095703125, -0.489990234375, -0.4251708984375, -0.3603515625, -0.2955322265625, -0.230712890625, -0.1658935546875, -0.10107421875, -0.0362548828125, 0.028564453125, 0.0933837890625, 0.158203125, 0.2230224609375, 0.287841796875, 0.3526611328125, 0.41748046875, 0.4822998046875, 0.547119140625, 0.6119384765625, 0.6767578125, 0.7415771484375, 0.806396484375, 0.8712158203125, 0.93603515625, 1.0008544921875, 1.065673828125, 1.1304931640625, 1.1953125, 1.2601318359375, 1.324951171875, 1.3897705078125, 1.45458984375, 1.5194091796875, 1.584228515625, 1.6490478515625, 1.7138671875, 1.7786865234375, 1.843505859375, 1.9083251953125, 1.97314453125, 2.0379638671875, 2.102783203125, 2.1676025390625, 2.232421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 6.0, 11.0, 9.0, 20.0, 24.0, 18.0, 37.0, 27.0, 46.0, 46.0, 57.0, 62.0, 74.0, 78.0, 59.0, 59.0, 59.0, 50.0, 43.0, 31.0, 29.0, 30.0, 29.0, 15.0, 19.0, 8.0, 10.0, 5.0, 8.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.083770751953125, -1.04351806640625, -1.003265380859375, -0.9630126953125, -0.922760009765625, -0.88250732421875, -0.842254638671875, -0.802001953125, -0.761749267578125, -0.72149658203125, -0.681243896484375, -0.6409912109375, -0.600738525390625, -0.56048583984375, -0.520233154296875, -0.47998046875, -0.439727783203125, -0.39947509765625, -0.359222412109375, -0.3189697265625, -0.278717041015625, -0.23846435546875, -0.198211669921875, -0.157958984375, -0.117706298828125, -0.07745361328125, -0.037200927734375, 0.0030517578125, 0.043304443359375, 0.08355712890625, 0.123809814453125, 0.1640625, 0.204315185546875, 0.24456787109375, 0.284820556640625, 0.3250732421875, 0.365325927734375, 0.40557861328125, 0.445831298828125, 0.486083984375, 0.526336669921875, 0.56658935546875, 0.606842041015625, 0.6470947265625, 0.687347412109375, 0.72760009765625, 0.767852783203125, 0.80810546875, 0.848358154296875, 0.88861083984375, 0.928863525390625, 0.9691162109375, 1.009368896484375, 1.04962158203125, 1.089874267578125, 1.130126953125, 1.170379638671875, 1.21063232421875, 1.250885009765625, 1.2911376953125, 1.331390380859375, 1.37164306640625, 1.411895751953125, 1.4521484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 6.0, 4.0, 7.0, 20.0, 18.0, 32.0, 47.0, 71.0, 106.0, 168.0, 266.0, 402.0, 651.0, 1190.0, 2482.0, 6381.0, 25019.0, 327803.0, 634647.0, 35033.0, 7787.0, 3011.0, 1345.0, 804.0, 447.0, 275.0, 171.0, 110.0, 73.0, 48.0, 32.0, 27.0, 23.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84423828125, -0.8161849975585938, -0.7881317138671875, -0.7600784301757812, -0.732025146484375, -0.7039718627929688, -0.6759185791015625, -0.6478652954101562, -0.61981201171875, -0.5917587280273438, -0.5637054443359375, -0.5356521606445312, -0.507598876953125, -0.47954559326171875, -0.4514923095703125, -0.42343902587890625, -0.3953857421875, -0.36733245849609375, -0.3392791748046875, -0.31122589111328125, -0.283172607421875, -0.25511932373046875, -0.2270660400390625, -0.19901275634765625, -0.17095947265625, -0.14290618896484375, -0.1148529052734375, -0.08679962158203125, -0.058746337890625, -0.03069305419921875, -0.0026397705078125, 0.02541351318359375, 0.053466796875, 0.08152008056640625, 0.1095733642578125, 0.13762664794921875, 0.165679931640625, 0.19373321533203125, 0.2217864990234375, 0.24983978271484375, 0.27789306640625, 0.30594635009765625, 0.3339996337890625, 0.36205291748046875, 0.390106201171875, 0.41815948486328125, 0.4462127685546875, 0.47426605224609375, 0.5023193359375, 0.5303726196289062, 0.5584259033203125, 0.5864791870117188, 0.614532470703125, 0.6425857543945312, 0.6706390380859375, 0.6986923217773438, 0.72674560546875, 0.7547988891601562, 0.7828521728515625, 0.8109054565429688, 0.838958740234375, 0.8670120239257812, 0.8950653076171875, 0.9231185913085938, 0.951171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 3.0, 12.0, 11.0, 14.0, 42.0, 56.0, 85.0, 143.0, 215.0, 140.0, 92.0, 63.0, 34.0, 23.0, 17.0, 18.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010031461715698242, -9.692087769508362e-05, -9.352713823318481e-05, -9.013339877128601e-05, -8.673965930938721e-05, -8.33459198474884e-05, -7.99521803855896e-05, -7.65584409236908e-05, -7.316470146179199e-05, -6.977096199989319e-05, -6.637722253799438e-05, -6.298348307609558e-05, -5.958974361419678e-05, -5.6196004152297974e-05, -5.280226469039917e-05, -4.9408525228500366e-05, -4.601478576660156e-05, -4.262104630470276e-05, -3.9227306842803955e-05, -3.583356738090515e-05, -3.243982791900635e-05, -2.9046088457107544e-05, -2.565234899520874e-05, -2.2258609533309937e-05, -1.8864870071411133e-05, -1.547113060951233e-05, -1.2077391147613525e-05, -8.683651685714722e-06, -5.289912223815918e-06, -1.8961727619171143e-06, 1.4975666999816895e-06, 4.891306161880493e-06, 8.285045623779297e-06, 1.16787850856781e-05, 1.5072524547576904e-05, 1.8466264009475708e-05, 2.1860003471374512e-05, 2.5253742933273315e-05, 2.864748239517212e-05, 3.204122185707092e-05, 3.5434961318969727e-05, 3.882870078086853e-05, 4.2222440242767334e-05, 4.561617970466614e-05, 4.900991916656494e-05, 5.2403658628463745e-05, 5.579739809036255e-05, 5.919113755226135e-05, 6.258487701416016e-05, 6.597861647605896e-05, 6.937235593795776e-05, 7.276609539985657e-05, 7.615983486175537e-05, 7.955357432365417e-05, 8.294731378555298e-05, 8.634105324745178e-05, 8.973479270935059e-05, 9.312853217124939e-05, 9.65222716331482e-05, 9.9916011095047e-05, 0.0001033097505569458, 0.0001067034900188446, 0.00011009722948074341, 0.00011349096894264221, 0.00011688470840454102]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 2.0, 5.0, 8.0, 7.0, 22.0, 26.0, 35.0, 43.0, 85.0, 111.0, 175.0, 302.0, 622.0, 1622.0, 6205.0, 46206.0, 874017.0, 105462.0, 9569.0, 2308.0, 796.0, 365.0, 178.0, 122.0, 80.0, 53.0, 30.0, 30.0, 21.0, 15.0, 15.0, 11.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2841796875, -1.2491226196289062, -1.2140655517578125, -1.1790084838867188, -1.143951416015625, -1.1088943481445312, -1.0738372802734375, -1.0387802124023438, -1.00372314453125, -0.9686660766601562, -0.9336090087890625, -0.8985519409179688, -0.863494873046875, -0.8284378051757812, -0.7933807373046875, -0.7583236694335938, -0.7232666015625, -0.6882095336914062, -0.6531524658203125, -0.6180953979492188, -0.583038330078125, -0.5479812622070312, -0.5129241943359375, -0.47786712646484375, -0.44281005859375, -0.40775299072265625, -0.3726959228515625, -0.33763885498046875, -0.302581787109375, -0.26752471923828125, -0.2324676513671875, -0.19741058349609375, -0.162353515625, -0.12729644775390625, -0.0922393798828125, -0.05718231201171875, -0.022125244140625, 0.01293182373046875, 0.0479888916015625, 0.08304595947265625, 0.11810302734375, 0.15316009521484375, 0.1882171630859375, 0.22327423095703125, 0.258331298828125, 0.29338836669921875, 0.3284454345703125, 0.36350250244140625, 0.3985595703125, 0.43361663818359375, 0.4686737060546875, 0.5037307739257812, 0.538787841796875, 0.5738449096679688, 0.6089019775390625, 0.6439590454101562, 0.67901611328125, 0.7140731811523438, 0.7491302490234375, 0.7841873168945312, 0.819244384765625, 0.8543014526367188, 0.8893585205078125, 0.9244155883789062, 0.95947265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 7.0, 6.0, 7.0, 10.0, 20.0, 21.0, 54.0, 110.0, 206.0, 258.0, 124.0, 67.0, 33.0, 17.0, 19.0, 9.0, 5.0, 9.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1904296875, -1.15460205078125, -1.1187744140625, -1.08294677734375, -1.047119140625, -1.01129150390625, -0.9754638671875, -0.93963623046875, -0.90380859375, -0.86798095703125, -0.8321533203125, -0.79632568359375, -0.760498046875, -0.72467041015625, -0.6888427734375, -0.65301513671875, -0.6171875, -0.58135986328125, -0.5455322265625, -0.50970458984375, -0.473876953125, -0.43804931640625, -0.4022216796875, -0.36639404296875, -0.33056640625, -0.29473876953125, -0.2589111328125, -0.22308349609375, -0.187255859375, -0.15142822265625, -0.1156005859375, -0.07977294921875, -0.0439453125, -0.00811767578125, 0.0277099609375, 0.06353759765625, 0.099365234375, 0.13519287109375, 0.1710205078125, 0.20684814453125, 0.24267578125, 0.27850341796875, 0.3143310546875, 0.35015869140625, 0.385986328125, 0.42181396484375, 0.4576416015625, 0.49346923828125, 0.529296875, 0.56512451171875, 0.6009521484375, 0.63677978515625, 0.672607421875, 0.70843505859375, 0.7442626953125, 0.78009033203125, 0.81591796875, 0.85174560546875, 0.8875732421875, 0.92340087890625, 0.959228515625, 0.99505615234375, 1.0308837890625, 1.06671142578125, 1.1025390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 8.0, 6.0, 11.0, 20.0, 34.0, 61.0, 101.0, 128.0, 126.0, 146.0, 116.0, 76.0, 60.0, 42.0, 20.0, 21.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.41312026977539, -14.06708812713623, -13.72105598449707, -13.375022888183594, -13.028990745544434, -12.682958602905273, -12.336925506591797, -11.990893363952637, -11.644861221313477, -11.298829078674316, -10.952796936035156, -10.60676383972168, -10.26073169708252, -9.91469955444336, -9.568666458129883, -9.222634315490723, -8.876602172851562, -8.530570030212402, -8.184537887573242, -7.838504791259766, -7.4924726486206055, -7.146440505981445, -6.800407886505127, -6.454375267028809, -6.108343124389648, -5.762310981750488, -5.41627836227417, -5.070245742797852, -4.724213600158691, -4.378181457519531, -4.032148838043213, -3.6861164569854736, -3.340083599090576, -2.994051218032837, -2.6480188369750977, -2.3019864559173584, -1.9559540748596191, -1.6099216938018799, -1.2638893127441406, -0.9178569316864014, -0.5718245506286621, -0.22579216957092285, 0.1202402114868164, 0.46627259254455566, 0.8123049736022949, 1.1583373546600342, 1.5043697357177734, 1.8504021167755127, 2.196434497833252, 2.542466878890991, 2.8884992599487305, 3.2345316410064697, 3.580564022064209, 3.9265964031219482, 4.2726287841796875, 4.618660926818848, 4.964693546295166, 5.310726165771484, 5.6567583084106445, 6.002790451049805, 6.348823070526123, 6.694855690002441, 7.040887832641602, 7.386919975280762, 7.73295259475708]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 9.0, 12.0, 12.0, 8.0, 8.0, 15.0, 18.0, 15.0, 25.0, 33.0, 36.0, 33.0, 25.0, 41.0, 35.0, 34.0, 47.0, 49.0, 43.0, 57.0, 49.0, 37.0, 41.0, 37.0, 42.0, 29.0, 27.0, 24.0, 26.0, 22.0, 19.0, 24.0, 11.0, 12.0, 7.0, 14.0, 5.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.124138832092285, -4.946420669555664, -4.768702983856201, -4.59098482131958, -4.413266658782959, -4.235548496246338, -4.057830810546875, -3.880112648010254, -3.702394485473633, -3.524676561355591, -3.3469583988189697, -3.1692404747009277, -2.9915223121643066, -2.8138043880462646, -2.6360864639282227, -2.4583683013916016, -2.2806503772735596, -2.1029324531555176, -1.9252142906188965, -1.7474963665008545, -1.5697782039642334, -1.3920602798461914, -1.2143422365188599, -1.0366241931915283, -0.8589061498641968, -0.6811881065368652, -0.5034700632095337, -0.3257520794868469, -0.14803403615951538, 0.029684007167816162, 0.20740199089050293, 0.3851200342178345, 0.562838077545166, 0.7405561208724976, 0.9182741641998291, 1.095992088317871, 1.2737102508544922, 1.4514281749725342, 1.6291462182998657, 1.8068642616271973, 1.9845823049545288, 2.1623003482818604, 2.3400182723999023, 2.5177364349365234, 2.6954543590545654, 2.8731725215911865, 3.0508904457092285, 3.2286086082458496, 3.4063265323638916, 3.5840444564819336, 3.7617626190185547, 3.9394805431365967, 4.117198467254639, 4.29491662979126, 4.472634792327881, 4.650352478027344, 4.828070640563965, 5.005788803100586, 5.183506488800049, 5.36122465133667, 5.538942813873291, 5.716660976409912, 5.894378662109375, 6.072096824645996, 6.249814987182617]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 12.0, 9.0, 14.0, 19.0, 19.0, 38.0, 55.0, 81.0, 118.0, 183.0, 311.0, 504.0, 867.0, 1846.0, 4328.0, 13789.0, 78362.0, 3735110.0, 316256.0, 29230.0, 7281.0, 2738.0, 1281.0, 662.0, 430.0, 244.0, 163.0, 102.0, 67.0, 54.0, 32.0, 18.0, 19.0, 15.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7821502685546875, -1.729339599609375, -1.6765289306640625, -1.62371826171875, -1.5709075927734375, -1.518096923828125, -1.4652862548828125, -1.4124755859375, -1.3596649169921875, -1.306854248046875, -1.2540435791015625, -1.20123291015625, -1.1484222412109375, -1.095611572265625, -1.0428009033203125, -0.989990234375, -0.9371795654296875, -0.884368896484375, -0.8315582275390625, -0.77874755859375, -0.7259368896484375, -0.673126220703125, -0.6203155517578125, -0.5675048828125, -0.5146942138671875, -0.461883544921875, -0.4090728759765625, -0.35626220703125, -0.3034515380859375, -0.250640869140625, -0.1978302001953125, -0.14501953125, -0.0922088623046875, -0.039398193359375, 0.0134124755859375, 0.06622314453125, 0.1190338134765625, 0.171844482421875, 0.2246551513671875, 0.2774658203125, 0.3302764892578125, 0.383087158203125, 0.4358978271484375, 0.48870849609375, 0.5415191650390625, 0.594329833984375, 0.6471405029296875, 0.699951171875, 0.7527618408203125, 0.805572509765625, 0.8583831787109375, 0.91119384765625, 0.9640045166015625, 1.016815185546875, 1.0696258544921875, 1.1224365234375, 1.1752471923828125, 1.228057861328125, 1.2808685302734375, 1.33367919921875, 1.3864898681640625, 1.439300537109375, 1.4921112060546875, 1.544921875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 4.0, 6.0, 3.0, 8.0, 5.0, 14.0, 15.0, 14.0, 23.0, 28.0, 30.0, 38.0, 37.0, 53.0, 38.0, 62.0, 48.0, 51.0, 62.0, 53.0, 52.0, 44.0, 35.0, 48.0, 32.0, 30.0, 38.0, 28.0, 17.0, 21.0, 15.0, 16.0, 10.0, 5.0, 5.0, 7.0, 2.0, 2.0, 6.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2415771484375, -0.23392295837402344, -0.22626876831054688, -0.2186145782470703, -0.21096038818359375, -0.2033061981201172, -0.19565200805664062, -0.18799781799316406, -0.1803436279296875, -0.17268943786621094, -0.16503524780273438, -0.1573810577392578, -0.14972686767578125, -0.1420726776123047, -0.13441848754882812, -0.12676429748535156, -0.119110107421875, -0.11145591735839844, -0.10380172729492188, -0.09614753723144531, -0.08849334716796875, -0.08083915710449219, -0.07318496704101562, -0.06553077697753906, -0.0578765869140625, -0.05022239685058594, -0.042568206787109375, -0.03491401672363281, -0.02725982666015625, -0.019605636596679688, -0.011951446533203125, -0.0042972564697265625, 0.00335693359375, 0.011011123657226562, 0.018665313720703125, 0.026319503784179688, 0.03397369384765625, 0.04162788391113281, 0.049282073974609375, 0.05693626403808594, 0.0645904541015625, 0.07224464416503906, 0.07989883422851562, 0.08755302429199219, 0.09520721435546875, 0.10286140441894531, 0.11051559448242188, 0.11816978454589844, 0.125823974609375, 0.13347816467285156, 0.14113235473632812, 0.1487865447998047, 0.15644073486328125, 0.1640949249267578, 0.17174911499023438, 0.17940330505371094, 0.1870574951171875, 0.19471168518066406, 0.20236587524414062, 0.2100200653076172, 0.21767425537109375, 0.2253284454345703, 0.23298263549804688, 0.24063682556152344, 0.248291015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 4.0, 2.0, 6.0, 9.0, 7.0, 18.0, 28.0, 27.0, 23.0, 35.0, 51.0, 69.0, 94.0, 145.0, 286.0, 457.0, 919.0, 2072.0, 5565.0, 25128.0, 318198.0, 3746820.0, 75867.0, 11910.0, 3401.0, 1397.0, 705.0, 358.0, 206.0, 120.0, 92.0, 67.0, 41.0, 37.0, 32.0, 20.0, 10.0, 9.0, 14.0, 7.0, 5.0, 1.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.196441650390625, -2.12139892578125, -2.046356201171875, -1.9713134765625, -1.896270751953125, -1.82122802734375, -1.746185302734375, -1.671142578125, -1.596099853515625, -1.52105712890625, -1.446014404296875, -1.3709716796875, -1.295928955078125, -1.22088623046875, -1.145843505859375, -1.07080078125, -0.995758056640625, -0.92071533203125, -0.845672607421875, -0.7706298828125, -0.695587158203125, -0.62054443359375, -0.545501708984375, -0.470458984375, -0.395416259765625, -0.32037353515625, -0.245330810546875, -0.1702880859375, -0.095245361328125, -0.02020263671875, 0.054840087890625, 0.1298828125, 0.204925537109375, 0.27996826171875, 0.355010986328125, 0.4300537109375, 0.505096435546875, 0.58013916015625, 0.655181884765625, 0.730224609375, 0.805267333984375, 0.88031005859375, 0.955352783203125, 1.0303955078125, 1.105438232421875, 1.18048095703125, 1.255523681640625, 1.33056640625, 1.405609130859375, 1.48065185546875, 1.555694580078125, 1.6307373046875, 1.705780029296875, 1.78082275390625, 1.855865478515625, 1.930908203125, 2.005950927734375, 2.08099365234375, 2.156036376953125, 2.2310791015625, 2.306121826171875, 2.38116455078125, 2.456207275390625, 2.53125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 22.0, 53.0, 184.0, 1408.0, 2117.0, 177.0, 51.0, 29.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.79058837890625, -1.7218017578125, -1.65301513671875, -1.584228515625, -1.51544189453125, -1.4466552734375, -1.37786865234375, -1.30908203125, -1.24029541015625, -1.1715087890625, -1.10272216796875, -1.033935546875, -0.96514892578125, -0.8963623046875, -0.82757568359375, -0.7587890625, -0.69000244140625, -0.6212158203125, -0.55242919921875, -0.483642578125, -0.41485595703125, -0.3460693359375, -0.27728271484375, -0.20849609375, -0.13970947265625, -0.0709228515625, -0.00213623046875, 0.066650390625, 0.13543701171875, 0.2042236328125, 0.27301025390625, 0.341796875, 0.41058349609375, 0.4793701171875, 0.54815673828125, 0.616943359375, 0.68572998046875, 0.7545166015625, 0.82330322265625, 0.89208984375, 0.96087646484375, 1.0296630859375, 1.09844970703125, 1.167236328125, 1.23602294921875, 1.3048095703125, 1.37359619140625, 1.4423828125, 1.51116943359375, 1.5799560546875, 1.64874267578125, 1.717529296875, 1.78631591796875, 1.8551025390625, 1.92388916015625, 1.99267578125, 2.06146240234375, 2.1302490234375, 2.19903564453125, 2.267822265625, 2.33660888671875, 2.4053955078125, 2.47418212890625, 2.54296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 14.0, 35.0, 86.0, 193.0, 269.0, 221.0, 100.0, 48.0, 21.0, 10.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.477922439575195, -5.183712005615234, -4.889501094818115, -4.595290184020996, -4.301079750061035, -4.006869316101074, -3.712658405303955, -3.418447732925415, -3.124237060546875, -2.830026388168335, -2.535815715789795, -2.241605043411255, -1.9473943710327148, -1.6531836986541748, -1.3589730262756348, -1.0647623538970947, -0.7705516815185547, -0.47634100914001465, -0.1821303367614746, 0.11208033561706543, 0.40629100799560547, 0.7005016803741455, 0.9947123527526855, 1.2889230251312256, 1.5831336975097656, 1.8773443698883057, 2.1715550422668457, 2.4657657146453857, 2.759976387023926, 3.054187059402466, 3.348397731781006, 3.642608404159546, 3.9368181228637695, 4.2310285568237305, 4.52523946762085, 4.819450378417969, 5.11366081237793, 5.407871246337891, 5.70208215713501, 5.996293067932129, 6.29050350189209, 6.584713935852051, 6.87892484664917, 7.173135757446289, 7.46734619140625, 7.761556625366211, 8.055767059326172, 8.34997844696045, 8.64418888092041, 8.938399314880371, 9.232610702514648, 9.52682113647461, 9.82103157043457, 10.115242004394531, 10.409452438354492, 10.70366382598877, 10.99787425994873, 11.292084693908691, 11.586296081542969, 11.88050651550293, 12.17471694946289, 12.468927383422852, 12.763137817382812, 13.05734920501709, 13.35155963897705]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 8.0, 10.0, 11.0, 16.0, 12.0, 17.0, 26.0, 31.0, 35.0, 37.0, 37.0, 40.0, 51.0, 49.0, 66.0, 70.0, 51.0, 58.0, 51.0, 49.0, 51.0, 32.0, 36.0, 30.0, 30.0, 28.0, 18.0, 9.0, 11.0, 11.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15971040725708, -3.0415139198303223, -2.9233171939849854, -2.8051207065582275, -2.6869239807128906, -2.568727493286133, -2.450530767440796, -2.332334280014038, -2.214137554168701, -2.0959410667419434, -1.9777443408966064, -1.859547734260559, -1.7413511276245117, -1.623154640197754, -1.504957914352417, -1.3867614269256592, -1.2685648202896118, -1.1503682136535645, -1.032171607017517, -0.9139750003814697, -0.7957783937454224, -0.6775818467140198, -0.5593852400779724, -0.44118863344192505, -0.3229920268058777, -0.20479542016983032, -0.08659882843494415, 0.03159776329994202, 0.14979436993598938, 0.26799094676971436, 0.3861875534057617, 0.5043841600418091, 0.6225807666778564, 0.7407773733139038, 0.8589739799499512, 0.9771705865859985, 1.095367193222046, 1.2135636806488037, 1.3317604064941406, 1.4499568939208984, 1.5681536197662354, 1.6863502264022827, 1.80454683303833, 1.9227434396743774, 2.040940046310425, 2.1591365337371826, 2.2773332595825195, 2.3955297470092773, 2.513726234436035, 2.631922721862793, 2.75011944770813, 2.8683159351348877, 2.9865126609802246, 3.1047091484069824, 3.2229058742523193, 3.341102361679077, 3.459299087524414, 3.577495574951172, 3.695692300796509, 3.8138887882232666, 3.9320855140686035, 4.050282001495361, 4.168478488922119, 4.286675453186035, 4.404871940612793]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 3.0, 3.0, 3.0, 6.0, 11.0, 24.0, 20.0, 34.0, 54.0, 76.0, 142.0, 249.0, 346.0, 591.0, 964.0, 1681.0, 2838.0, 5058.0, 9447.0, 18602.0, 39401.0, 89051.0, 200304.0, 310631.0, 200730.0, 88494.0, 39338.0, 18658.0, 9596.0, 5153.0, 2824.0, 1694.0, 985.0, 587.0, 325.0, 245.0, 158.0, 81.0, 59.0, 34.0, 22.0, 9.0, 12.0, 3.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9678115844726562, -0.9370880126953125, -0.9063644409179688, -0.875640869140625, -0.8449172973632812, -0.8141937255859375, -0.7834701538085938, -0.75274658203125, -0.7220230102539062, -0.6912994384765625, -0.6605758666992188, -0.629852294921875, -0.5991287231445312, -0.5684051513671875, -0.5376815795898438, -0.5069580078125, -0.47623443603515625, -0.4455108642578125, -0.41478729248046875, -0.384063720703125, -0.35334014892578125, -0.3226165771484375, -0.29189300537109375, -0.26116943359375, -0.23044586181640625, -0.1997222900390625, -0.16899871826171875, -0.138275146484375, -0.10755157470703125, -0.0768280029296875, -0.04610443115234375, -0.015380859375, 0.01534271240234375, 0.0460662841796875, 0.07678985595703125, 0.107513427734375, 0.13823699951171875, 0.1689605712890625, 0.19968414306640625, 0.23040771484375, 0.26113128662109375, 0.2918548583984375, 0.32257843017578125, 0.353302001953125, 0.38402557373046875, 0.4147491455078125, 0.44547271728515625, 0.4761962890625, 0.5069198608398438, 0.5376434326171875, 0.5683670043945312, 0.599090576171875, 0.6298141479492188, 0.6605377197265625, 0.6912612915039062, 0.72198486328125, 0.7527084350585938, 0.7834320068359375, 0.8141555786132812, 0.844879150390625, 0.8756027221679688, 0.9063262939453125, 0.9370498657226562, 0.9677734375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 10.0, 8.0, 15.0, 13.0, 19.0, 13.0, 21.0, 46.0, 28.0, 32.0, 45.0, 39.0, 47.0, 45.0, 54.0, 54.0, 48.0, 32.0, 45.0, 50.0, 42.0, 46.0, 30.0, 20.0, 33.0, 19.0, 21.0, 19.0, 17.0, 11.0, 14.0, 6.0, 6.0, 11.0, 5.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.3232421875, -0.3142814636230469, -0.30532073974609375, -0.2963600158691406, -0.2873992919921875, -0.2784385681152344, -0.26947784423828125, -0.2605171203613281, -0.251556396484375, -0.24259567260742188, -0.23363494873046875, -0.22467422485351562, -0.2157135009765625, -0.20675277709960938, -0.19779205322265625, -0.18883132934570312, -0.17987060546875, -0.17090988159179688, -0.16194915771484375, -0.15298843383789062, -0.1440277099609375, -0.13506698608398438, -0.12610626220703125, -0.11714553833007812, -0.108184814453125, -0.09922409057617188, -0.09026336669921875, -0.08130264282226562, -0.0723419189453125, -0.06338119506835938, -0.05442047119140625, -0.045459747314453125, -0.0364990234375, -0.027538299560546875, -0.01857757568359375, -0.009616851806640625, -0.0006561279296875, 0.008304595947265625, 0.01726531982421875, 0.026226043701171875, 0.035186767578125, 0.044147491455078125, 0.05310821533203125, 0.062068939208984375, 0.0710296630859375, 0.07999038696289062, 0.08895111083984375, 0.09791183471679688, 0.10687255859375, 0.11583328247070312, 0.12479400634765625, 0.13375473022460938, 0.1427154541015625, 0.15167617797851562, 0.16063690185546875, 0.16959762573242188, 0.178558349609375, 0.18751907348632812, 0.19647979736328125, 0.20544052124023438, 0.2144012451171875, 0.22336196899414062, 0.23232269287109375, 0.24128341674804688, 0.250244140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 9.0, 7.0, 8.0, 11.0, 12.0, 16.0, 37.0, 39.0, 62.0, 75.0, 112.0, 127.0, 236.0, 263.0, 458.0, 615.0, 1040.0, 1609.0, 2675.0, 4504.0, 8108.0, 16355.0, 35877.0, 92039.0, 259596.0, 366916.0, 152109.0, 55834.0, 23429.0, 11252.0, 5928.0, 3359.0, 1993.0, 1266.0, 807.0, 585.0, 310.0, 245.0, 172.0, 125.0, 91.0, 75.0, 47.0, 34.0, 21.0, 24.0, 15.0, 9.0, 6.0, 5.0, 6.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.2431640625, -1.2046051025390625, -1.166046142578125, -1.1274871826171875, -1.08892822265625, -1.0503692626953125, -1.011810302734375, -0.9732513427734375, -0.9346923828125, -0.8961334228515625, -0.857574462890625, -0.8190155029296875, -0.78045654296875, -0.7418975830078125, -0.703338623046875, -0.6647796630859375, -0.626220703125, -0.5876617431640625, -0.549102783203125, -0.5105438232421875, -0.47198486328125, -0.4334259033203125, -0.394866943359375, -0.3563079833984375, -0.3177490234375, -0.2791900634765625, -0.240631103515625, -0.2020721435546875, -0.16351318359375, -0.1249542236328125, -0.086395263671875, -0.0478363037109375, -0.00927734375, 0.0292816162109375, 0.067840576171875, 0.1063995361328125, 0.14495849609375, 0.1835174560546875, 0.222076416015625, 0.2606353759765625, 0.2991943359375, 0.3377532958984375, 0.376312255859375, 0.4148712158203125, 0.45343017578125, 0.4919891357421875, 0.530548095703125, 0.5691070556640625, 0.607666015625, 0.6462249755859375, 0.684783935546875, 0.7233428955078125, 0.76190185546875, 0.8004608154296875, 0.839019775390625, 0.8775787353515625, 0.9161376953125, 0.9546966552734375, 0.993255615234375, 1.0318145751953125, 1.07037353515625, 1.1089324951171875, 1.147491455078125, 1.1860504150390625, 1.224609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 9.0, 6.0, 18.0, 12.0, 21.0, 17.0, 18.0, 25.0, 25.0, 32.0, 40.0, 34.0, 49.0, 61.0, 60.0, 56.0, 59.0, 55.0, 51.0, 51.0, 43.0, 45.0, 35.0, 37.0, 20.0, 24.0, 14.0, 17.0, 15.0, 8.0, 11.0, 7.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.251953125, -2.1875762939453125, -2.123199462890625, -2.0588226318359375, -1.99444580078125, -1.9300689697265625, -1.865692138671875, -1.8013153076171875, -1.7369384765625, -1.6725616455078125, -1.608184814453125, -1.5438079833984375, -1.47943115234375, -1.4150543212890625, -1.350677490234375, -1.2863006591796875, -1.221923828125, -1.1575469970703125, -1.093170166015625, -1.0287933349609375, -0.96441650390625, -0.9000396728515625, -0.835662841796875, -0.7712860107421875, -0.7069091796875, -0.6425323486328125, -0.578155517578125, -0.5137786865234375, -0.44940185546875, -0.3850250244140625, -0.320648193359375, -0.2562713623046875, -0.19189453125, -0.1275177001953125, -0.063140869140625, 0.0012359619140625, 0.06561279296875, 0.1299896240234375, 0.194366455078125, 0.2587432861328125, 0.3231201171875, 0.3874969482421875, 0.451873779296875, 0.5162506103515625, 0.58062744140625, 0.6450042724609375, 0.709381103515625, 0.7737579345703125, 0.838134765625, 0.9025115966796875, 0.966888427734375, 1.0312652587890625, 1.09564208984375, 1.1600189208984375, 1.224395751953125, 1.2887725830078125, 1.3531494140625, 1.4175262451171875, 1.481903076171875, 1.5462799072265625, 1.61065673828125, 1.6750335693359375, 1.739410400390625, 1.8037872314453125, 1.8681640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 5.0, 6.0, 7.0, 9.0, 6.0, 15.0, 22.0, 17.0, 39.0, 60.0, 76.0, 151.0, 333.0, 611.0, 1447.0, 4262.0, 25750.0, 757091.0, 241550.0, 12093.0, 2866.0, 1047.0, 459.0, 221.0, 142.0, 83.0, 54.0, 27.0, 24.0, 28.0, 11.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.61328125, -2.54766845703125, -2.4820556640625, -2.41644287109375, -2.350830078125, -2.28521728515625, -2.2196044921875, -2.15399169921875, -2.08837890625, -2.02276611328125, -1.9571533203125, -1.89154052734375, -1.825927734375, -1.76031494140625, -1.6947021484375, -1.62908935546875, -1.5634765625, -1.49786376953125, -1.4322509765625, -1.36663818359375, -1.301025390625, -1.23541259765625, -1.1697998046875, -1.10418701171875, -1.03857421875, -0.97296142578125, -0.9073486328125, -0.84173583984375, -0.776123046875, -0.71051025390625, -0.6448974609375, -0.57928466796875, -0.513671875, -0.44805908203125, -0.3824462890625, -0.31683349609375, -0.251220703125, -0.18560791015625, -0.1199951171875, -0.05438232421875, 0.01123046875, 0.07684326171875, 0.1424560546875, 0.20806884765625, 0.273681640625, 0.33929443359375, 0.4049072265625, 0.47052001953125, 0.5361328125, 0.60174560546875, 0.6673583984375, 0.73297119140625, 0.798583984375, 0.86419677734375, 0.9298095703125, 0.99542236328125, 1.06103515625, 1.12664794921875, 1.1922607421875, 1.25787353515625, 1.323486328125, 1.38909912109375, 1.4547119140625, 1.52032470703125, 1.5859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 2.0, 13.0, 17.0, 34.0, 70.0, 129.0, 192.0, 218.0, 155.0, 76.0, 44.0, 17.0, 10.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003876686096191406, -0.000378461554646492, -0.0003692544996738434, -0.00036004744470119476, -0.00035084038972854614, -0.0003416333347558975, -0.0003324262797832489, -0.0003232192248106003, -0.00031401216983795166, -0.00030480511486530304, -0.0002955980598926544, -0.0002863910049200058, -0.0002771839499473572, -0.00026797689497470856, -0.00025876984000205994, -0.0002495627850294113, -0.0002403557300567627, -0.00023114867508411407, -0.00022194162011146545, -0.00021273456513881683, -0.0002035275101661682, -0.0001943204551935196, -0.00018511340022087097, -0.00017590634524822235, -0.00016669929027557373, -0.0001574922353029251, -0.0001482851803302765, -0.00013907812535762787, -0.00012987107038497925, -0.00012066401541233063, -0.00011145696043968201, -0.00010224990546703339, -9.304285049438477e-05, -8.383579552173615e-05, -7.462874054908752e-05, -6.54216855764389e-05, -5.621463060379028e-05, -4.700757563114166e-05, -3.780052065849304e-05, -2.859346568584442e-05, -1.93864107131958e-05, -1.017935574054718e-05, -9.723007678985596e-07, 8.234754204750061e-06, 1.744180917739868e-05, 2.6648864150047302e-05, 3.585591912269592e-05, 4.5062974095344543e-05, 5.4270029067993164e-05, 6.347708404064178e-05, 7.26841390132904e-05, 8.189119398593903e-05, 9.109824895858765e-05, 0.00010030530393123627, 0.00010951235890388489, 0.00011871941387653351, 0.00012792646884918213, 0.00013713352382183075, 0.00014634057879447937, 0.000155547633767128, 0.0001647546887397766, 0.00017396174371242523, 0.00018316879868507385, 0.00019237585365772247, 0.0002015829086303711]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 6.0, 0.0, 8.0, 7.0, 8.0, 17.0, 21.0, 40.0, 41.0, 65.0, 118.0, 151.0, 260.0, 463.0, 792.0, 1682.0, 3622.0, 9998.0, 41300.0, 327957.0, 566550.0, 71795.0, 14364.0, 4792.0, 2076.0, 1060.0, 549.0, 301.0, 177.0, 113.0, 75.0, 43.0, 25.0, 30.0, 21.0, 13.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1552734375, -1.1214447021484375, -1.087615966796875, -1.0537872314453125, -1.01995849609375, -0.9861297607421875, -0.952301025390625, -0.9184722900390625, -0.8846435546875, -0.8508148193359375, -0.816986083984375, -0.7831573486328125, -0.74932861328125, -0.7154998779296875, -0.681671142578125, -0.6478424072265625, -0.614013671875, -0.5801849365234375, -0.546356201171875, -0.5125274658203125, -0.47869873046875, -0.4448699951171875, -0.411041259765625, -0.3772125244140625, -0.3433837890625, -0.3095550537109375, -0.275726318359375, -0.2418975830078125, -0.20806884765625, -0.1742401123046875, -0.140411376953125, -0.1065826416015625, -0.07275390625, -0.0389251708984375, -0.005096435546875, 0.0287322998046875, 0.06256103515625, 0.0963897705078125, 0.130218505859375, 0.1640472412109375, 0.1978759765625, 0.2317047119140625, 0.265533447265625, 0.2993621826171875, 0.33319091796875, 0.3670196533203125, 0.400848388671875, 0.4346771240234375, 0.468505859375, 0.5023345947265625, 0.536163330078125, 0.5699920654296875, 0.60382080078125, 0.6376495361328125, 0.671478271484375, 0.7053070068359375, 0.7391357421875, 0.7729644775390625, 0.806793212890625, 0.8406219482421875, 0.87445068359375, 0.9082794189453125, 0.942108154296875, 0.9759368896484375, 1.009765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 10.0, 9.0, 13.0, 8.0, 39.0, 32.0, 61.0, 77.0, 100.0, 147.0, 146.0, 99.0, 68.0, 57.0, 32.0, 32.0, 13.0, 15.0, 6.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5290374755859375, -1.483856201171875, -1.4386749267578125, -1.39349365234375, -1.3483123779296875, -1.303131103515625, -1.2579498291015625, -1.2127685546875, -1.1675872802734375, -1.122406005859375, -1.0772247314453125, -1.03204345703125, -0.9868621826171875, -0.941680908203125, -0.8964996337890625, -0.851318359375, -0.8061370849609375, -0.760955810546875, -0.7157745361328125, -0.67059326171875, -0.6254119873046875, -0.580230712890625, -0.5350494384765625, -0.4898681640625, -0.4446868896484375, -0.399505615234375, -0.3543243408203125, -0.30914306640625, -0.2639617919921875, -0.218780517578125, -0.1735992431640625, -0.12841796875, -0.0832366943359375, -0.038055419921875, 0.0071258544921875, 0.05230712890625, 0.0974884033203125, 0.142669677734375, 0.1878509521484375, 0.2330322265625, 0.2782135009765625, 0.323394775390625, 0.3685760498046875, 0.41375732421875, 0.4589385986328125, 0.504119873046875, 0.5493011474609375, 0.594482421875, 0.6396636962890625, 0.684844970703125, 0.7300262451171875, 0.77520751953125, 0.8203887939453125, 0.865570068359375, 0.9107513427734375, 0.9559326171875, 1.0011138916015625, 1.046295166015625, 1.0914764404296875, 1.13665771484375, 1.1818389892578125, 1.227020263671875, 1.2722015380859375, 1.3173828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [5.0, 5.0, 27.0, 102.0, 296.0, 341.0, 173.0, 46.0, 17.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33753776550293, -5.923418998718262, -4.509300231933594, -3.095181465148926, -1.6810626983642578, -0.26694393157958984, 1.1471748352050781, 2.561293601989746, 3.975412368774414, 5.389531135559082, 6.80364990234375, 8.217768669128418, 9.631887435913086, 11.046006202697754, 12.460124969482422, 13.87424373626709, 15.288362503051758, 16.70248031616211, 18.116600036621094, 19.530719757080078, 20.94483757019043, 22.35895538330078, 23.773075103759766, 25.18719482421875, 26.6013126373291, 28.015430450439453, 29.429550170898438, 30.843669891357422, 32.257789611816406, 33.671905517578125, 35.08602523803711, 36.500144958496094, 37.91426086425781, 39.3283805847168, 40.74250030517578, 42.1566162109375, 43.570735931396484, 44.98485565185547, 46.39897155761719, 47.81309127807617, 49.227210998535156, 50.64133071899414, 52.055450439453125, 53.469566345214844, 54.88368606567383, 56.29780578613281, 57.71192169189453, 59.126041412353516, 60.5401611328125, 61.954280853271484, 63.36840057373047, 64.78251647949219, 66.19664001464844, 67.61075592041016, 69.02487182617188, 70.43899536132812, 71.85311126708984, 73.26722717285156, 74.68135070800781, 76.09546661376953, 77.50958251953125, 78.9237060546875, 80.33782196044922, 81.75194549560547, 83.16606140136719]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 0.0, 7.0, 4.0, 7.0, 5.0, 12.0, 6.0, 14.0, 11.0, 9.0, 17.0, 21.0, 25.0, 30.0, 37.0, 42.0, 30.0, 45.0, 41.0, 44.0, 46.0, 44.0, 42.0, 55.0, 40.0, 34.0, 49.0, 33.0, 27.0, 26.0, 22.0, 19.0, 22.0, 20.0, 19.0, 22.0, 12.0, 12.0, 11.0, 9.0, 9.0, 5.0, 3.0, 2.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-9.561294555664062, -9.258480072021484, -8.95566463470459, -8.652850151062012, -8.350035667419434, -8.047220230102539, -7.744405746459961, -7.441591262817383, -7.1387763023376465, -6.83596134185791, -6.533146858215332, -6.230331897735596, -5.927516937255859, -5.624702453613281, -5.321887493133545, -5.019072532653809, -4.7162580490112305, -4.413443088531494, -4.110628604888916, -3.8078136444091797, -3.5049989223480225, -3.2021842002868652, -2.899369239807129, -2.5965545177459717, -2.2937397956848145, -1.9909250736236572, -1.6881102323532104, -1.3852953910827637, -1.0824806690216064, -0.7796659469604492, -0.47685110569000244, -0.17403626441955566, 0.12877941131591797, 0.43159419298171997, 0.734408974647522, 1.0372238159179688, 1.340038537979126, 1.6428532600402832, 1.94566810131073, 2.2484829425811768, 2.551297664642334, 2.854112386703491, 3.1569271087646484, 3.4597420692443848, 3.762556791305542, 4.065371513366699, 4.3681864738464355, 4.671001434326172, 4.97381591796875, 5.276630878448486, 5.5794453620910645, 5.882260322570801, 6.185074806213379, 6.487889766693115, 6.790704727172852, 7.09351921081543, 7.396334171295166, 7.699149131774902, 8.00196361541748, 8.304778099060059, 8.607593536376953, 8.910408020019531, 9.21322250366211, 9.516037940979004, 9.818852424621582]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 7.0, 11.0, 17.0, 18.0, 17.0, 27.0, 39.0, 52.0, 71.0, 102.0, 164.0, 224.0, 315.0, 476.0, 761.0, 1230.0, 2111.0, 4218.0, 9454.0, 29863.0, 3956508.0, 151453.0, 21026.0, 7530.0, 3493.0, 1854.0, 1110.0, 646.0, 411.0, 297.0, 215.0, 151.0, 103.0, 78.0, 53.0, 50.0, 31.0, 28.0, 13.0, 13.0, 10.0, 8.0, 3.0, 5.0, 7.0, 7.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.4979705810546875, -1.442230224609375, -1.3864898681640625, -1.33074951171875, -1.2750091552734375, -1.219268798828125, -1.1635284423828125, -1.1077880859375, -1.0520477294921875, -0.996307373046875, -0.9405670166015625, -0.88482666015625, -0.8290863037109375, -0.773345947265625, -0.7176055908203125, -0.661865234375, -0.6061248779296875, -0.550384521484375, -0.4946441650390625, -0.43890380859375, -0.3831634521484375, -0.327423095703125, -0.2716827392578125, -0.2159423828125, -0.1602020263671875, -0.104461669921875, -0.0487213134765625, 0.00701904296875, 0.0627593994140625, 0.118499755859375, 0.1742401123046875, 0.22998046875, 0.2857208251953125, 0.341461181640625, 0.3972015380859375, 0.45294189453125, 0.5086822509765625, 0.564422607421875, 0.6201629638671875, 0.6759033203125, 0.7316436767578125, 0.787384033203125, 0.8431243896484375, 0.89886474609375, 0.9546051025390625, 1.010345458984375, 1.0660858154296875, 1.121826171875, 1.1775665283203125, 1.233306884765625, 1.2890472412109375, 1.34478759765625, 1.4005279541015625, 1.456268310546875, 1.5120086669921875, 1.5677490234375, 1.6234893798828125, 1.679229736328125, 1.7349700927734375, 1.79071044921875, 1.8464508056640625, 1.902191162109375, 1.9579315185546875, 2.013671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 7.0, 5.0, 7.0, 8.0, 8.0, 29.0, 20.0, 20.0, 37.0, 48.0, 35.0, 49.0, 48.0, 56.0, 46.0, 67.0, 71.0, 49.0, 43.0, 44.0, 38.0, 31.0, 37.0, 39.0, 28.0, 27.0, 15.0, 18.0, 16.0, 16.0, 8.0, 11.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4638671875, -0.4490966796875, -0.434326171875, -0.4195556640625, -0.40478515625, -0.3900146484375, -0.375244140625, -0.3604736328125, -0.345703125, -0.3309326171875, -0.316162109375, -0.3013916015625, -0.28662109375, -0.2718505859375, -0.257080078125, -0.2423095703125, -0.2275390625, -0.2127685546875, -0.197998046875, -0.1832275390625, -0.16845703125, -0.1536865234375, -0.138916015625, -0.1241455078125, -0.109375, -0.0946044921875, -0.079833984375, -0.0650634765625, -0.05029296875, -0.0355224609375, -0.020751953125, -0.0059814453125, 0.0087890625, 0.0235595703125, 0.038330078125, 0.0531005859375, 0.06787109375, 0.0826416015625, 0.097412109375, 0.1121826171875, 0.126953125, 0.1417236328125, 0.156494140625, 0.1712646484375, 0.18603515625, 0.2008056640625, 0.215576171875, 0.2303466796875, 0.2451171875, 0.2598876953125, 0.274658203125, 0.2894287109375, 0.30419921875, 0.3189697265625, 0.333740234375, 0.3485107421875, 0.36328125, 0.3780517578125, 0.392822265625, 0.4075927734375, 0.42236328125, 0.4371337890625, 0.451904296875, 0.4666748046875, 0.4814453125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 7.0, 10.0, 17.0, 12.0, 17.0, 23.0, 30.0, 51.0, 74.0, 128.0, 236.0, 550.0, 1231.0, 3096.0, 9451.0, 55452.0, 4067709.0, 43333.0, 8111.0, 2665.0, 1035.0, 440.0, 240.0, 119.0, 64.0, 36.0, 28.0, 33.0, 16.0, 16.0, 8.0, 7.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.52850341796875, -4.4007568359375, -4.27301025390625, -4.145263671875, -4.01751708984375, -3.8897705078125, -3.76202392578125, -3.63427734375, -3.50653076171875, -3.3787841796875, -3.25103759765625, -3.123291015625, -2.99554443359375, -2.8677978515625, -2.74005126953125, -2.6123046875, -2.48455810546875, -2.3568115234375, -2.22906494140625, -2.101318359375, -1.97357177734375, -1.8458251953125, -1.71807861328125, -1.59033203125, -1.46258544921875, -1.3348388671875, -1.20709228515625, -1.079345703125, -0.95159912109375, -0.8238525390625, -0.69610595703125, -0.568359375, -0.44061279296875, -0.3128662109375, -0.18511962890625, -0.057373046875, 0.07037353515625, 0.1981201171875, 0.32586669921875, 0.45361328125, 0.58135986328125, 0.7091064453125, 0.83685302734375, 0.964599609375, 1.09234619140625, 1.2200927734375, 1.34783935546875, 1.4755859375, 1.60333251953125, 1.7310791015625, 1.85882568359375, 1.986572265625, 2.11431884765625, 2.2420654296875, 2.36981201171875, 2.49755859375, 2.62530517578125, 2.7530517578125, 2.88079833984375, 3.008544921875, 3.13629150390625, 3.2640380859375, 3.39178466796875, 3.51953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 5.0, 9.0, 9.0, 18.0, 22.0, 51.0, 181.0, 3595.0, 99.0, 39.0, 14.0, 12.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3212890625, -1.2933006286621094, -1.2653121948242188, -1.2373237609863281, -1.2093353271484375, -1.1813468933105469, -1.1533584594726562, -1.1253700256347656, -1.097381591796875, -1.0693931579589844, -1.0414047241210938, -1.0134162902832031, -0.9854278564453125, -0.9574394226074219, -0.9294509887695312, -0.9014625549316406, -0.87347412109375, -0.8454856872558594, -0.8174972534179688, -0.7895088195800781, -0.7615203857421875, -0.7335319519042969, -0.7055435180664062, -0.6775550842285156, -0.649566650390625, -0.6215782165527344, -0.5935897827148438, -0.5656013488769531, -0.5376129150390625, -0.5096244812011719, -0.48163604736328125, -0.4536476135253906, -0.4256591796875, -0.3976707458496094, -0.36968231201171875, -0.3416938781738281, -0.3137054443359375, -0.2857170104980469, -0.25772857666015625, -0.22974014282226562, -0.201751708984375, -0.17376327514648438, -0.14577484130859375, -0.11778640747070312, -0.0897979736328125, -0.061809539794921875, -0.03382110595703125, -0.005832672119140625, 0.02215576171875, 0.050144195556640625, 0.07813262939453125, 0.10612106323242188, 0.1341094970703125, 0.16209793090820312, 0.19008636474609375, 0.21807479858398438, 0.246063232421875, 0.2740516662597656, 0.30204010009765625, 0.3300285339355469, 0.3580169677734375, 0.3860054016113281, 0.41399383544921875, 0.4419822692871094, 0.469970703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 17.0, 17.0, 46.0, 116.0, 217.0, 261.0, 204.0, 74.0, 41.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.69999361038208, -7.559330940246582, -7.418668746948242, -7.278006076812744, -7.137343883514404, -6.996681213378906, -6.856019020080566, -6.715356349945068, -6.57469367980957, -6.434031009674072, -6.293368816375732, -6.152706146240234, -6.0120439529418945, -5.8713812828063965, -5.730718612670898, -5.590056419372559, -5.449394226074219, -5.308731555938721, -5.168069362640381, -5.027406692504883, -4.886744499206543, -4.746081829071045, -4.605419158935547, -4.464756965637207, -4.324094295501709, -4.183431625366211, -4.042769432067871, -3.902106761932373, -3.761444330215454, -3.620781898498535, -3.480119466781616, -3.3394570350646973, -3.198794364929199, -3.0581319332122803, -2.9174695014953613, -2.7768068313598633, -2.6361443996429443, -2.4954819679260254, -2.3548195362091064, -2.2141571044921875, -2.0734944343566895, -1.9328320026397705, -1.792169451713562, -1.651507019996643, -1.5108444690704346, -1.3701820373535156, -1.2295196056365967, -1.0888571739196777, -0.9481947422027588, -0.8075322508811951, -0.6668697595596313, -0.5262073278427124, -0.3855448365211487, -0.24488234519958496, -0.10421991348266602, 0.036442577838897705, 0.17710506916046143, 0.31776756048202515, 0.4584300220012665, 0.5990924835205078, 0.7397549748420715, 0.8804174661636353, 1.0210798978805542, 1.1617424488067627, 1.3024048805236816]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 9.0, 17.0, 15.0, 24.0, 16.0, 28.0, 25.0, 31.0, 28.0, 39.0, 35.0, 48.0, 46.0, 45.0, 44.0, 51.0, 52.0, 47.0, 43.0, 33.0, 43.0, 33.0, 39.0, 32.0, 26.0, 19.0, 24.0, 20.0, 16.0, 11.0, 13.0, 10.0, 1.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.7674553394317627, -1.7209059000015259, -1.674356460571289, -1.6278070211410522, -1.5812575817108154, -1.5347081422805786, -1.4881587028503418, -1.4416091442108154, -1.3950598239898682, -1.3485103845596313, -1.3019609451293945, -1.2554115056991577, -1.208862066268921, -1.162312626838684, -1.1157631874084473, -1.069213628768921, -1.022664189338684, -0.9761147499084473, -0.9295653104782104, -0.8830158710479736, -0.8364664316177368, -0.7899169921875, -0.7433674931526184, -0.6968180537223816, -0.6502686142921448, -0.603719174861908, -0.5571697354316711, -0.5106202363967896, -0.4640708267688751, -0.4175213873386383, -0.3709719181060791, -0.3244224786758423, -0.2778729200363159, -0.2313234806060791, -0.1847740262746811, -0.13822457194328308, -0.09167513251304626, -0.04512569308280945, 0.0014237761497497559, 0.04797321557998657, 0.09452265501022339, 0.1410720944404602, 0.18762154877185822, 0.23417100310325623, 0.28072044253349304, 0.32726988196372986, 0.37381935119628906, 0.4203687906265259, 0.4669182300567627, 0.5134676694869995, 0.5600171089172363, 0.6065665483474731, 0.65311598777771, 0.6996654272079468, 0.7462149262428284, 0.7927643656730652, 0.839313805103302, 0.8858632445335388, 0.9324126839637756, 0.9789621829986572, 1.025511622428894, 1.0720610618591309, 1.1186105012893677, 1.1651599407196045, 1.2117093801498413]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 8.0, 9.0, 21.0, 30.0, 53.0, 71.0, 133.0, 274.0, 509.0, 1037.0, 2478.0, 6101.0, 17668.0, 63239.0, 274755.0, 487282.0, 141670.0, 34966.0, 10969.0, 4040.0, 1670.0, 707.0, 362.0, 180.0, 93.0, 64.0, 41.0, 29.0, 19.0, 12.0, 19.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.796875, -2.71282958984375, -2.6287841796875, -2.54473876953125, -2.460693359375, -2.37664794921875, -2.2926025390625, -2.20855712890625, -2.12451171875, -2.04046630859375, -1.9564208984375, -1.87237548828125, -1.788330078125, -1.70428466796875, -1.6202392578125, -1.53619384765625, -1.4521484375, -1.36810302734375, -1.2840576171875, -1.20001220703125, -1.115966796875, -1.03192138671875, -0.9478759765625, -0.86383056640625, -0.77978515625, -0.69573974609375, -0.6116943359375, -0.52764892578125, -0.443603515625, -0.35955810546875, -0.2755126953125, -0.19146728515625, -0.107421875, -0.02337646484375, 0.0606689453125, 0.14471435546875, 0.228759765625, 0.31280517578125, 0.3968505859375, 0.48089599609375, 0.56494140625, 0.64898681640625, 0.7330322265625, 0.81707763671875, 0.901123046875, 0.98516845703125, 1.0692138671875, 1.15325927734375, 1.2373046875, 1.32135009765625, 1.4053955078125, 1.48944091796875, 1.573486328125, 1.65753173828125, 1.7415771484375, 1.82562255859375, 1.90966796875, 1.99371337890625, 2.0777587890625, 2.16180419921875, 2.245849609375, 2.32989501953125, 2.4139404296875, 2.49798583984375, 2.58203125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 6.0, 16.0, 14.0, 14.0, 17.0, 19.0, 16.0, 23.0, 27.0, 28.0, 34.0, 50.0, 43.0, 62.0, 62.0, 57.0, 46.0, 62.0, 35.0, 49.0, 36.0, 36.0, 43.0, 27.0, 23.0, 28.0, 22.0, 16.0, 20.0, 13.0, 8.0, 13.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4393348693847656, -0.42334747314453125, -0.4073600769042969, -0.3913726806640625, -0.3753852844238281, -0.35939788818359375, -0.3434104919433594, -0.327423095703125, -0.3114356994628906, -0.29544830322265625, -0.2794609069824219, -0.2634735107421875, -0.24748611450195312, -0.23149871826171875, -0.21551132202148438, -0.19952392578125, -0.18353652954101562, -0.16754913330078125, -0.15156173706054688, -0.1355743408203125, -0.11958694458007812, -0.10359954833984375, -0.08761215209960938, -0.071624755859375, -0.055637359619140625, -0.03964996337890625, -0.023662567138671875, -0.0076751708984375, 0.008312225341796875, 0.02429962158203125, 0.040287017822265625, 0.0562744140625, 0.07226181030273438, 0.08824920654296875, 0.10423660278320312, 0.1202239990234375, 0.13621139526367188, 0.15219879150390625, 0.16818618774414062, 0.184173583984375, 0.20016098022460938, 0.21614837646484375, 0.23213577270507812, 0.2481231689453125, 0.2641105651855469, 0.28009796142578125, 0.2960853576660156, 0.31207275390625, 0.3280601501464844, 0.34404754638671875, 0.3600349426269531, 0.3760223388671875, 0.3920097351074219, 0.40799713134765625, 0.4239845275878906, 0.439971923828125, 0.4559593200683594, 0.47194671630859375, 0.4879341125488281, 0.5039215087890625, 0.5199089050292969, 0.5358963012695312, 0.5518836975097656, 0.56787109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 7.0, 7.0, 14.0, 24.0, 32.0, 48.0, 92.0, 201.0, 438.0, 1520.0, 6689.0, 60893.0, 839965.0, 125128.0, 10341.0, 2085.0, 592.0, 229.0, 111.0, 41.0, 33.0, 20.0, 15.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.71429443359375, -7.5145263671875, -7.31475830078125, -7.114990234375, -6.91522216796875, -6.7154541015625, -6.51568603515625, -6.31591796875, -6.11614990234375, -5.9163818359375, -5.71661376953125, -5.516845703125, -5.31707763671875, -5.1173095703125, -4.91754150390625, -4.7177734375, -4.51800537109375, -4.3182373046875, -4.11846923828125, -3.918701171875, -3.71893310546875, -3.5191650390625, -3.31939697265625, -3.11962890625, -2.91986083984375, -2.7200927734375, -2.52032470703125, -2.320556640625, -2.12078857421875, -1.9210205078125, -1.72125244140625, -1.521484375, -1.32171630859375, -1.1219482421875, -0.92218017578125, -0.722412109375, -0.52264404296875, -0.3228759765625, -0.12310791015625, 0.07666015625, 0.27642822265625, 0.4761962890625, 0.67596435546875, 0.875732421875, 1.07550048828125, 1.2752685546875, 1.47503662109375, 1.6748046875, 1.87457275390625, 2.0743408203125, 2.27410888671875, 2.473876953125, 2.67364501953125, 2.8734130859375, 3.07318115234375, 3.27294921875, 3.47271728515625, 3.6724853515625, 3.87225341796875, 4.072021484375, 4.27178955078125, 4.4715576171875, 4.67132568359375, 4.87109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 14.0, 12.0, 19.0, 19.0, 22.0, 30.0, 38.0, 37.0, 47.0, 57.0, 50.0, 72.0, 62.0, 76.0, 56.0, 73.0, 41.0, 47.0, 38.0, 47.0, 26.0, 25.0, 29.0, 10.0, 9.0, 9.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.65234375, -4.533660888671875, -4.41497802734375, -4.296295166015625, -4.1776123046875, -4.058929443359375, -3.94024658203125, -3.821563720703125, -3.702880859375, -3.584197998046875, -3.46551513671875, -3.346832275390625, -3.2281494140625, -3.109466552734375, -2.99078369140625, -2.872100830078125, -2.75341796875, -2.634735107421875, -2.51605224609375, -2.397369384765625, -2.2786865234375, -2.160003662109375, -2.04132080078125, -1.922637939453125, -1.803955078125, -1.685272216796875, -1.56658935546875, -1.447906494140625, -1.3292236328125, -1.210540771484375, -1.09185791015625, -0.973175048828125, -0.8544921875, -0.735809326171875, -0.61712646484375, -0.498443603515625, -0.3797607421875, -0.261077880859375, -0.14239501953125, -0.023712158203125, 0.094970703125, 0.213653564453125, 0.33233642578125, 0.451019287109375, 0.5697021484375, 0.688385009765625, 0.80706787109375, 0.925750732421875, 1.04443359375, 1.163116455078125, 1.28179931640625, 1.400482177734375, 1.5191650390625, 1.637847900390625, 1.75653076171875, 1.875213623046875, 1.993896484375, 2.112579345703125, 2.23126220703125, 2.349945068359375, 2.4686279296875, 2.587310791015625, 2.70599365234375, 2.824676513671875, 2.943359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 12.0, 20.0, 30.0, 44.0, 70.0, 104.0, 237.0, 513.0, 2123.0, 19412.0, 1016664.0, 7243.0, 1233.0, 399.0, 203.0, 97.0, 62.0, 27.0, 24.0, 14.0, 9.0, 8.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.4837646484375, -13.053466796875, -12.6231689453125, -12.19287109375, -11.7625732421875, -11.332275390625, -10.9019775390625, -10.4716796875, -10.0413818359375, -9.611083984375, -9.1807861328125, -8.75048828125, -8.3201904296875, -7.889892578125, -7.4595947265625, -7.029296875, -6.5989990234375, -6.168701171875, -5.7384033203125, -5.30810546875, -4.8778076171875, -4.447509765625, -4.0172119140625, -3.5869140625, -3.1566162109375, -2.726318359375, -2.2960205078125, -1.86572265625, -1.4354248046875, -1.005126953125, -0.5748291015625, -0.14453125, 0.2857666015625, 0.716064453125, 1.1463623046875, 1.57666015625, 2.0069580078125, 2.437255859375, 2.8675537109375, 3.2978515625, 3.7281494140625, 4.158447265625, 4.5887451171875, 5.01904296875, 5.4493408203125, 5.879638671875, 6.3099365234375, 6.740234375, 7.1705322265625, 7.600830078125, 8.0311279296875, 8.46142578125, 8.8917236328125, 9.322021484375, 9.7523193359375, 10.1826171875, 10.6129150390625, 11.043212890625, 11.4735107421875, 11.90380859375, 12.3341064453125, 12.764404296875, 13.1947021484375, 13.625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 14.0, 15.0, 39.0, 109.0, 214.0, 280.0, 167.0, 76.0, 28.0, 22.0, 6.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007610321044921875, -0.0007426217198371887, -0.0007242113351821899, -0.0007058009505271912, -0.0006873905658721924, -0.0006689801812171936, -0.0006505697965621948, -0.000632159411907196, -0.0006137490272521973, -0.0005953386425971985, -0.0005769282579421997, -0.0005585178732872009, -0.0005401074886322021, -0.0005216971039772034, -0.0005032867193222046, -0.0004848763346672058, -0.00046646595001220703, -0.00044805556535720825, -0.00042964518070220947, -0.0004112347960472107, -0.0003928244113922119, -0.00037441402673721313, -0.00035600364208221436, -0.0003375932574272156, -0.0003191828727722168, -0.000300772488117218, -0.00028236210346221924, -0.00026395171880722046, -0.0002455413341522217, -0.0002271309494972229, -0.00020872056484222412, -0.00019031018018722534, -0.00017189979553222656, -0.00015348941087722778, -0.000135079026222229, -0.00011666864156723022, -9.825825691223145e-05, -7.984787225723267e-05, -6.143748760223389e-05, -4.302710294723511e-05, -2.4616718292236328e-05, -6.206333637237549e-06, 1.220405101776123e-05, 3.061443567276001e-05, 4.902482032775879e-05, 6.743520498275757e-05, 8.584558963775635e-05, 0.00010425597429275513, 0.0001226663589477539, 0.00014107674360275269, 0.00015948712825775146, 0.00017789751291275024, 0.00019630789756774902, 0.0002147182822227478, 0.00023312866687774658, 0.00025153905153274536, 0.00026994943618774414, 0.0002883598208427429, 0.0003067702054977417, 0.0003251805901527405, 0.00034359097480773926, 0.00036200135946273804, 0.0003804117441177368, 0.0003988221287727356, 0.0004172325134277344]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 9.0, 8.0, 14.0, 10.0, 21.0, 42.0, 45.0, 58.0, 113.0, 201.0, 398.0, 808.0, 1786.0, 5012.0, 28170.0, 961630.0, 40532.0, 5861.0, 1929.0, 847.0, 471.0, 219.0, 124.0, 75.0, 47.0, 27.0, 34.0, 14.0, 9.0, 11.0, 11.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0], "bins": [-5.54296875, -5.382568359375, -5.22216796875, -5.061767578125, -4.9013671875, -4.740966796875, -4.58056640625, -4.420166015625, -4.259765625, -4.099365234375, -3.93896484375, -3.778564453125, -3.6181640625, -3.457763671875, -3.29736328125, -3.136962890625, -2.9765625, -2.816162109375, -2.65576171875, -2.495361328125, -2.3349609375, -2.174560546875, -2.01416015625, -1.853759765625, -1.693359375, -1.532958984375, -1.37255859375, -1.212158203125, -1.0517578125, -0.891357421875, -0.73095703125, -0.570556640625, -0.41015625, -0.249755859375, -0.08935546875, 0.071044921875, 0.2314453125, 0.391845703125, 0.55224609375, 0.712646484375, 0.873046875, 1.033447265625, 1.19384765625, 1.354248046875, 1.5146484375, 1.675048828125, 1.83544921875, 1.995849609375, 2.15625, 2.316650390625, 2.47705078125, 2.637451171875, 2.7978515625, 2.958251953125, 3.11865234375, 3.279052734375, 3.439453125, 3.599853515625, 3.76025390625, 3.920654296875, 4.0810546875, 4.241455078125, 4.40185546875, 4.562255859375, 4.72265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 15.0, 67.0, 332.0, 432.0, 92.0, 24.0, 11.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -11.0889892578125, -10.763916015625, -10.4388427734375, -10.11376953125, -9.7886962890625, -9.463623046875, -9.1385498046875, -8.8134765625, -8.4884033203125, -8.163330078125, -7.8382568359375, -7.51318359375, -7.1881103515625, -6.863037109375, -6.5379638671875, -6.212890625, -5.8878173828125, -5.562744140625, -5.2376708984375, -4.91259765625, -4.5875244140625, -4.262451171875, -3.9373779296875, -3.6123046875, -3.2872314453125, -2.962158203125, -2.6370849609375, -2.31201171875, -1.9869384765625, -1.661865234375, -1.3367919921875, -1.01171875, -0.6866455078125, -0.361572265625, -0.0364990234375, 0.28857421875, 0.6136474609375, 0.938720703125, 1.2637939453125, 1.5888671875, 1.9139404296875, 2.239013671875, 2.5640869140625, 2.88916015625, 3.2142333984375, 3.539306640625, 3.8643798828125, 4.189453125, 4.5145263671875, 4.839599609375, 5.1646728515625, 5.48974609375, 5.8148193359375, 6.139892578125, 6.4649658203125, 6.7900390625, 7.1151123046875, 7.440185546875, 7.7652587890625, 8.09033203125, 8.4154052734375, 8.740478515625, 9.0655517578125, 9.390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 11.0, 19.0, 60.0, 142.0, 248.0, 238.0, 151.0, 70.0, 31.0, 14.0, 10.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.30011749267578, -24.12108612060547, -21.942054748535156, -19.763023376464844, -17.58399200439453, -15.404960632324219, -13.225929260253906, -11.046897888183594, -8.867866516113281, -6.688835144042969, -4.509803771972656, -2.3307723999023438, -0.15174102783203125, 2.0272903442382812, 4.206321716308594, 6.385353088378906, 8.564384460449219, 10.743415832519531, 12.922447204589844, 15.101478576660156, 17.28050994873047, 19.45954132080078, 21.638572692871094, 23.817604064941406, 25.99663543701172, 28.17566680908203, 30.354698181152344, 32.533729553222656, 34.71276092529297, 36.89179229736328, 39.070823669433594, 41.249855041503906, 43.42889404296875, 45.60792541503906, 47.786956787109375, 49.96598815917969, 52.14501953125, 54.32405090332031, 56.503082275390625, 58.68211364746094, 60.86114501953125, 63.04017639160156, 65.21920776367188, 67.39823913574219, 69.5772705078125, 71.75630187988281, 73.93533325195312, 76.11436462402344, 78.29339599609375, 80.47242736816406, 82.65145874023438, 84.83049011230469, 87.009521484375, 89.18855285644531, 91.36758422851562, 93.54661560058594, 95.72564697265625, 97.90467834472656, 100.08370971679688, 102.26274108886719, 104.4417724609375, 106.62080383300781, 108.79983520507812, 110.97886657714844, 113.15789794921875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 15.0, 12.0, 19.0, 22.0, 38.0, 36.0, 43.0, 44.0, 46.0, 51.0, 77.0, 65.0, 75.0, 65.0, 57.0, 58.0, 54.0, 46.0, 36.0, 39.0, 18.0, 16.0, 19.0, 14.0, 10.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.195693969726562, -20.445283889770508, -19.694873809814453, -18.944461822509766, -18.19405174255371, -17.443641662597656, -16.6932315826416, -15.942821502685547, -15.192410469055176, -14.442000389099121, -13.69158935546875, -12.941179275512695, -12.19076919555664, -11.44035816192627, -10.689948081970215, -9.939537048339844, -9.189126968383789, -8.438716888427734, -7.688305854797363, -6.937895774841309, -6.187485218048096, -5.437074661254883, -4.686664581298828, -3.9362540245056152, -3.1858434677124023, -2.4354329109191895, -1.6850225925445557, -0.9346122741699219, -0.18420171737670898, 0.5662088394165039, 1.3166189193725586, 2.0670294761657715, 2.8174400329589844, 3.5678505897521973, 4.31826114654541, 5.068671226501465, 5.819081783294678, 6.569492340087891, 7.319902420043945, 8.0703125, 8.820723533630371, 9.571133613586426, 10.321544647216797, 11.071954727172852, 11.822364807128906, 12.572775840759277, 13.323185920715332, 14.073596954345703, 14.824007034301758, 15.574417114257812, 16.324827194213867, 17.075237274169922, 17.82564926147461, 18.576059341430664, 19.32646942138672, 20.076879501342773, 20.827289581298828, 21.577699661254883, 22.328109741210938, 23.078521728515625, 23.82893180847168, 24.579341888427734, 25.32975196838379, 26.080162048339844, 26.83057403564453]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 4.0, 2.0, 6.0, 7.0, 14.0, 14.0, 23.0, 46.0, 63.0, 83.0, 106.0, 224.0, 398.0, 879.0, 2429.0, 9353.0, 156025.0, 4007243.0, 12106.0, 2927.0, 1051.0, 491.0, 288.0, 151.0, 90.0, 57.0, 53.0, 39.0, 30.0, 20.0, 10.0, 16.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.29791259765625, -5.0684814453125, -4.83905029296875, -4.609619140625, -4.38018798828125, -4.1507568359375, -3.92132568359375, -3.69189453125, -3.46246337890625, -3.2330322265625, -3.00360107421875, -2.774169921875, -2.54473876953125, -2.3153076171875, -2.08587646484375, -1.8564453125, -1.62701416015625, -1.3975830078125, -1.16815185546875, -0.938720703125, -0.70928955078125, -0.4798583984375, -0.25042724609375, -0.02099609375, 0.20843505859375, 0.4378662109375, 0.66729736328125, 0.896728515625, 1.12615966796875, 1.3555908203125, 1.58502197265625, 1.814453125, 2.04388427734375, 2.2733154296875, 2.50274658203125, 2.732177734375, 2.96160888671875, 3.1910400390625, 3.42047119140625, 3.64990234375, 3.87933349609375, 4.1087646484375, 4.33819580078125, 4.567626953125, 4.79705810546875, 5.0264892578125, 5.25592041015625, 5.4853515625, 5.71478271484375, 5.9442138671875, 6.17364501953125, 6.403076171875, 6.63250732421875, 6.8619384765625, 7.09136962890625, 7.32080078125, 7.55023193359375, 7.7796630859375, 8.00909423828125, 8.238525390625, 8.46795654296875, 8.6973876953125, 8.92681884765625, 9.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 8.0, 10.0, 8.0, 14.0, 25.0, 25.0, 26.0, 32.0, 44.0, 57.0, 53.0, 67.0, 69.0, 62.0, 84.0, 58.0, 61.0, 47.0, 40.0, 39.0, 38.0, 27.0, 21.0, 26.0, 12.0, 8.0, 5.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.642578125, -0.6177749633789062, -0.5929718017578125, -0.5681686401367188, -0.543365478515625, -0.5185623168945312, -0.4937591552734375, -0.46895599365234375, -0.44415283203125, -0.41934967041015625, -0.3945465087890625, -0.36974334716796875, -0.344940185546875, -0.32013702392578125, -0.2953338623046875, -0.27053070068359375, -0.2457275390625, -0.22092437744140625, -0.1961212158203125, -0.17131805419921875, -0.146514892578125, -0.12171173095703125, -0.0969085693359375, -0.07210540771484375, -0.04730224609375, -0.02249908447265625, 0.0023040771484375, 0.02710723876953125, 0.051910400390625, 0.07671356201171875, 0.1015167236328125, 0.12631988525390625, 0.151123046875, 0.17592620849609375, 0.2007293701171875, 0.22553253173828125, 0.250335693359375, 0.27513885498046875, 0.2999420166015625, 0.32474517822265625, 0.34954833984375, 0.37435150146484375, 0.3991546630859375, 0.42395782470703125, 0.448760986328125, 0.47356414794921875, 0.4983673095703125, 0.5231704711914062, 0.5479736328125, 0.5727767944335938, 0.5975799560546875, 0.6223831176757812, 0.647186279296875, 0.6719894409179688, 0.6967926025390625, 0.7215957641601562, 0.74639892578125, 0.7712020874023438, 0.7960052490234375, 0.8208084106445312, 0.845611572265625, 0.8704147338867188, 0.8952178955078125, 0.9200210571289062, 0.94482421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 7.0, 7.0, 14.0, 13.0, 20.0, 32.0, 38.0, 52.0, 67.0, 91.0, 130.0, 206.0, 241.0, 363.0, 521.0, 855.0, 1480.0, 2594.0, 5315.0, 15096.0, 105820.0, 4001037.0, 41147.0, 9513.0, 3990.0, 2098.0, 1192.0, 748.0, 438.0, 314.0, 215.0, 166.0, 103.0, 90.0, 74.0, 49.0, 32.0, 27.0, 21.0, 16.0, 15.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.4765625, -8.2142333984375, -7.951904296875, -7.6895751953125, -7.42724609375, -7.1649169921875, -6.902587890625, -6.6402587890625, -6.3779296875, -6.1156005859375, -5.853271484375, -5.5909423828125, -5.32861328125, -5.0662841796875, -4.803955078125, -4.5416259765625, -4.279296875, -4.0169677734375, -3.754638671875, -3.4923095703125, -3.22998046875, -2.9676513671875, -2.705322265625, -2.4429931640625, -2.1806640625, -1.9183349609375, -1.656005859375, -1.3936767578125, -1.13134765625, -0.8690185546875, -0.606689453125, -0.3443603515625, -0.08203125, 0.1802978515625, 0.442626953125, 0.7049560546875, 0.96728515625, 1.2296142578125, 1.491943359375, 1.7542724609375, 2.0166015625, 2.2789306640625, 2.541259765625, 2.8035888671875, 3.06591796875, 3.3282470703125, 3.590576171875, 3.8529052734375, 4.115234375, 4.3775634765625, 4.639892578125, 4.9022216796875, 5.16455078125, 5.4268798828125, 5.689208984375, 5.9515380859375, 6.2138671875, 6.4761962890625, 6.738525390625, 7.0008544921875, 7.26318359375, 7.5255126953125, 7.787841796875, 8.0501708984375, 8.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 13.0, 19.0, 60.0, 268.0, 3518.0, 102.0, 40.0, 11.0, 10.0, 3.0, 10.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.41357421875, -3.3076171875, -3.20166015625, -3.095703125, -2.98974609375, -2.8837890625, -2.77783203125, -2.671875, -2.56591796875, -2.4599609375, -2.35400390625, -2.248046875, -2.14208984375, -2.0361328125, -1.93017578125, -1.82421875, -1.71826171875, -1.6123046875, -1.50634765625, -1.400390625, -1.29443359375, -1.1884765625, -1.08251953125, -0.9765625, -0.87060546875, -0.7646484375, -0.65869140625, -0.552734375, -0.44677734375, -0.3408203125, -0.23486328125, -0.12890625, -0.02294921875, 0.0830078125, 0.18896484375, 0.294921875, 0.40087890625, 0.5068359375, 0.61279296875, 0.71875, 0.82470703125, 0.9306640625, 1.03662109375, 1.142578125, 1.24853515625, 1.3544921875, 1.46044921875, 1.56640625, 1.67236328125, 1.7783203125, 1.88427734375, 1.990234375, 2.09619140625, 2.2021484375, 2.30810546875, 2.4140625, 2.52001953125, 2.6259765625, 2.73193359375, 2.837890625, 2.94384765625, 3.0498046875, 3.15576171875, 3.26171875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 8.0, 17.0, 25.0, 36.0, 63.0, 68.0, 102.0, 148.0, 131.0, 108.0, 78.0, 49.0, 38.0, 27.0, 26.0, 17.0, 11.0, 11.0, 6.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.978202819824219, -7.711091041564941, -7.443979263305664, -7.176867485046387, -6.909755706787109, -6.642643928527832, -6.3755316734313965, -6.108419895172119, -5.841308116912842, -5.5741963386535645, -5.307084560394287, -5.03997278213501, -4.772860527038574, -4.505748748779297, -4.2386369705200195, -3.971525192260742, -3.704413414001465, -3.4373016357421875, -3.17018985748291, -2.9030778408050537, -2.6359660625457764, -2.368854284286499, -2.1017422676086426, -1.8346304893493652, -1.567518711090088, -1.3004069328308105, -1.0332950353622437, -0.7661831974983215, -0.4990713596343994, -0.23195958137512207, 0.035152316093444824, 0.3022642135620117, 0.5693750381469727, 0.8364868760108948, 1.103598713874817, 1.3707106113433838, 1.6378223896026611, 1.9049341678619385, 2.172046184539795, 2.4391579627990723, 2.7062697410583496, 2.973381519317627, 3.2404932975769043, 3.5076053142547607, 3.774717092514038, 4.0418291091918945, 4.308940887451172, 4.576052665710449, 4.843164443969727, 5.110276222229004, 5.377388000488281, 5.644499778747559, 5.911611557006836, 6.178723335266113, 6.445835590362549, 6.712947368621826, 6.9800591468811035, 7.247170925140381, 7.514282703399658, 7.7813944816589355, 8.048506736755371, 8.315618515014648, 8.582730293273926, 8.849842071533203, 9.11695384979248]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 16.0, 12.0, 13.0, 18.0, 27.0, 19.0, 38.0, 29.0, 39.0, 49.0, 30.0, 33.0, 40.0, 53.0, 45.0, 40.0, 57.0, 41.0, 48.0, 49.0, 37.0, 37.0, 25.0, 37.0, 27.0, 17.0, 18.0, 11.0, 15.0, 12.0, 11.0, 9.0, 11.0, 2.0, 3.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.956532955169678, -5.777316570281982, -5.598100185394287, -5.418883800506592, -5.2396674156188965, -5.060451030731201, -4.881234645843506, -4.7020182609558105, -4.522801876068115, -4.34358549118042, -4.164369106292725, -3.9851527214050293, -3.805936336517334, -3.6267199516296387, -3.4475035667419434, -3.268287181854248, -3.0890707969665527, -2.9098544120788574, -2.730638027191162, -2.551421642303467, -2.3722052574157715, -2.192988872528076, -2.013772487640381, -1.8345561027526855, -1.6553397178649902, -1.476123332977295, -1.2969069480895996, -1.1176905632019043, -0.938474178314209, -0.7592577934265137, -0.5800414085388184, -0.40082502365112305, -0.22160911560058594, -0.042392730712890625, 0.1368236541748047, 0.3160400390625, 0.4952564239501953, 0.6744728088378906, 0.8536891937255859, 1.0329055786132812, 1.2121219635009766, 1.3913383483886719, 1.5705547332763672, 1.7497711181640625, 1.9289875030517578, 2.108203887939453, 2.2874202728271484, 2.4666366577148438, 2.645853042602539, 2.8250694274902344, 3.0042858123779297, 3.183502197265625, 3.3627185821533203, 3.5419349670410156, 3.721151351928711, 3.9003677368164062, 4.079584121704102, 4.258800506591797, 4.438016891479492, 4.6172332763671875, 4.796449661254883, 4.975666046142578, 5.154882431030273, 5.334098815917969, 5.513315200805664]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 3.0, 5.0, 10.0, 18.0, 18.0, 11.0, 26.0, 29.0, 40.0, 69.0, 89.0, 124.0, 157.0, 247.0, 378.0, 533.0, 812.0, 1300.0, 2176.0, 3572.0, 6177.0, 11230.0, 21074.0, 44065.0, 101700.0, 261242.0, 335821.0, 140026.0, 57885.0, 27129.0, 13655.0, 7524.0, 4307.0, 2524.0, 1575.0, 956.0, 584.0, 450.0, 310.0, 222.0, 124.0, 94.0, 76.0, 50.0, 37.0, 21.0, 21.0, 13.0, 16.0, 4.0, 7.0, 9.0, 1.0, 2.0, 0.0, 5.0, 3.0], "bins": [-2.43359375, -2.3602294921875, -2.286865234375, -2.2135009765625, -2.14013671875, -2.0667724609375, -1.993408203125, -1.9200439453125, -1.8466796875, -1.7733154296875, -1.699951171875, -1.6265869140625, -1.55322265625, -1.4798583984375, -1.406494140625, -1.3331298828125, -1.259765625, -1.1864013671875, -1.113037109375, -1.0396728515625, -0.96630859375, -0.8929443359375, -0.819580078125, -0.7462158203125, -0.6728515625, -0.5994873046875, -0.526123046875, -0.4527587890625, -0.37939453125, -0.3060302734375, -0.232666015625, -0.1593017578125, -0.0859375, -0.0125732421875, 0.060791015625, 0.1341552734375, 0.20751953125, 0.2808837890625, 0.354248046875, 0.4276123046875, 0.5009765625, 0.5743408203125, 0.647705078125, 0.7210693359375, 0.79443359375, 0.8677978515625, 0.941162109375, 1.0145263671875, 1.087890625, 1.1612548828125, 1.234619140625, 1.3079833984375, 1.38134765625, 1.4547119140625, 1.528076171875, 1.6014404296875, 1.6748046875, 1.7481689453125, 1.821533203125, 1.8948974609375, 1.96826171875, 2.0416259765625, 2.114990234375, 2.1883544921875, 2.26171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 8.0, 10.0, 13.0, 19.0, 14.0, 12.0, 12.0, 21.0, 31.0, 26.0, 29.0, 35.0, 44.0, 53.0, 54.0, 54.0, 51.0, 62.0, 59.0, 51.0, 31.0, 43.0, 38.0, 39.0, 32.0, 26.0, 20.0, 10.0, 17.0, 7.0, 12.0, 11.0, 10.0, 7.0, 6.0, 4.0, 5.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1318359375, -1.0953216552734375, -1.058807373046875, -1.0222930908203125, -0.98577880859375, -0.9492645263671875, -0.912750244140625, -0.8762359619140625, -0.8397216796875, -0.8032073974609375, -0.766693115234375, -0.7301788330078125, -0.69366455078125, -0.6571502685546875, -0.620635986328125, -0.5841217041015625, -0.547607421875, -0.5110931396484375, -0.474578857421875, -0.4380645751953125, -0.40155029296875, -0.3650360107421875, -0.328521728515625, -0.2920074462890625, -0.2554931640625, -0.2189788818359375, -0.182464599609375, -0.1459503173828125, -0.10943603515625, -0.0729217529296875, -0.036407470703125, 0.0001068115234375, 0.03662109375, 0.0731353759765625, 0.109649658203125, 0.1461639404296875, 0.18267822265625, 0.2191925048828125, 0.255706787109375, 0.2922210693359375, 0.3287353515625, 0.3652496337890625, 0.401763916015625, 0.4382781982421875, 0.47479248046875, 0.5113067626953125, 0.547821044921875, 0.5843353271484375, 0.620849609375, 0.6573638916015625, 0.693878173828125, 0.7303924560546875, 0.76690673828125, 0.8034210205078125, 0.839935302734375, 0.8764495849609375, 0.9129638671875, 0.9494781494140625, 0.985992431640625, 1.0225067138671875, 1.05902099609375, 1.0955352783203125, 1.132049560546875, 1.1685638427734375, 1.205078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 4.0, 6.0, 7.0, 12.0, 11.0, 11.0, 11.0, 22.0, 40.0, 53.0, 73.0, 116.0, 204.0, 395.0, 751.0, 1597.0, 4410.0, 16849.0, 137378.0, 800447.0, 68839.0, 11314.0, 3228.0, 1302.0, 631.0, 286.0, 170.0, 106.0, 82.0, 66.0, 28.0, 32.0, 11.0, 8.0, 13.0, 12.0, 4.0, 1.0, 3.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.375, -9.0662841796875, -8.757568359375, -8.4488525390625, -8.14013671875, -7.8314208984375, -7.522705078125, -7.2139892578125, -6.9052734375, -6.5965576171875, -6.287841796875, -5.9791259765625, -5.67041015625, -5.3616943359375, -5.052978515625, -4.7442626953125, -4.435546875, -4.1268310546875, -3.818115234375, -3.5093994140625, -3.20068359375, -2.8919677734375, -2.583251953125, -2.2745361328125, -1.9658203125, -1.6571044921875, -1.348388671875, -1.0396728515625, -0.73095703125, -0.4222412109375, -0.113525390625, 0.1951904296875, 0.50390625, 0.8126220703125, 1.121337890625, 1.4300537109375, 1.73876953125, 2.0474853515625, 2.356201171875, 2.6649169921875, 2.9736328125, 3.2823486328125, 3.591064453125, 3.8997802734375, 4.20849609375, 4.5172119140625, 4.825927734375, 5.1346435546875, 5.443359375, 5.7520751953125, 6.060791015625, 6.3695068359375, 6.67822265625, 6.9869384765625, 7.295654296875, 7.6043701171875, 7.9130859375, 8.2218017578125, 8.530517578125, 8.8392333984375, 9.14794921875, 9.4566650390625, 9.765380859375, 10.0740966796875, 10.3828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 20.0, 25.0, 18.0, 34.0, 42.0, 43.0, 47.0, 54.0, 64.0, 75.0, 72.0, 72.0, 60.0, 51.0, 47.0, 47.0, 36.0, 31.0, 24.0, 20.0, 22.0, 9.0, 9.0, 7.0, 11.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0625, -9.7213134765625, -9.380126953125, -9.0389404296875, -8.69775390625, -8.3565673828125, -8.015380859375, -7.6741943359375, -7.3330078125, -6.9918212890625, -6.650634765625, -6.3094482421875, -5.96826171875, -5.6270751953125, -5.285888671875, -4.9447021484375, -4.603515625, -4.2623291015625, -3.921142578125, -3.5799560546875, -3.23876953125, -2.8975830078125, -2.556396484375, -2.2152099609375, -1.8740234375, -1.5328369140625, -1.191650390625, -0.8504638671875, -0.50927734375, -0.1680908203125, 0.173095703125, 0.5142822265625, 0.85546875, 1.1966552734375, 1.537841796875, 1.8790283203125, 2.22021484375, 2.5614013671875, 2.902587890625, 3.2437744140625, 3.5849609375, 3.9261474609375, 4.267333984375, 4.6085205078125, 4.94970703125, 5.2908935546875, 5.632080078125, 5.9732666015625, 6.314453125, 6.6556396484375, 6.996826171875, 7.3380126953125, 7.67919921875, 8.0203857421875, 8.361572265625, 8.7027587890625, 9.0439453125, 9.3851318359375, 9.726318359375, 10.0675048828125, 10.40869140625, 10.7498779296875, 11.091064453125, 11.4322509765625, 11.7734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 9.0, 9.0, 13.0, 12.0, 28.0, 36.0, 76.0, 142.0, 270.0, 710.0, 2358.0, 21529.0, 1013023.0, 7838.0, 1498.0, 502.0, 206.0, 114.0, 67.0, 43.0, 27.0, 15.0, 5.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.4771728515625, -12.899658203125, -12.3221435546875, -11.74462890625, -11.1671142578125, -10.589599609375, -10.0120849609375, -9.4345703125, -8.8570556640625, -8.279541015625, -7.7020263671875, -7.12451171875, -6.5469970703125, -5.969482421875, -5.3919677734375, -4.814453125, -4.2369384765625, -3.659423828125, -3.0819091796875, -2.50439453125, -1.9268798828125, -1.349365234375, -0.7718505859375, -0.1943359375, 0.3831787109375, 0.960693359375, 1.5382080078125, 2.11572265625, 2.6932373046875, 3.270751953125, 3.8482666015625, 4.42578125, 5.0032958984375, 5.580810546875, 6.1583251953125, 6.73583984375, 7.3133544921875, 7.890869140625, 8.4683837890625, 9.0458984375, 9.6234130859375, 10.200927734375, 10.7784423828125, 11.35595703125, 11.9334716796875, 12.510986328125, 13.0885009765625, 13.666015625, 14.2435302734375, 14.821044921875, 15.3985595703125, 15.97607421875, 16.5535888671875, 17.131103515625, 17.7086181640625, 18.2861328125, 18.8636474609375, 19.441162109375, 20.0186767578125, 20.59619140625, 21.1737060546875, 21.751220703125, 22.3287353515625, 22.90625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 18.0, 34.0, 145.0, 378.0, 272.0, 93.0, 36.0, 11.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010042190551757812, -0.0009478181600570679, -0.0008914172649383545, -0.0008350163698196411, -0.0007786154747009277, -0.0007222145795822144, -0.000665813684463501, -0.0006094127893447876, -0.0005530118942260742, -0.0004966109991073608, -0.00044021010398864746, -0.0003838092088699341, -0.0003274083137512207, -0.0002710074186325073, -0.00021460652351379395, -0.00015820562839508057, -0.00010180473327636719, -4.540383815765381e-05, 1.099705696105957e-05, 6.739795207977295e-05, 0.00012379884719848633, 0.0001801997423171997, 0.00023660063743591309, 0.00029300153255462646, 0.00034940242767333984, 0.0004058033227920532, 0.0004622042179107666, 0.00051860511302948, 0.0005750060081481934, 0.0006314069032669067, 0.0006878077983856201, 0.0007442086935043335, 0.0008006095886230469, 0.0008570104837417603, 0.0009134113788604736, 0.000969812273979187, 0.0010262131690979004, 0.0010826140642166138, 0.0011390149593353271, 0.0011954158544540405, 0.001251816749572754, 0.0013082176446914673, 0.0013646185398101807, 0.001421019434928894, 0.0014774203300476074, 0.0015338212251663208, 0.0015902221202850342, 0.0016466230154037476, 0.001703023910522461, 0.0017594248056411743, 0.0018158257007598877, 0.001872226595878601, 0.0019286274909973145, 0.001985028386116028, 0.002041429281234741, 0.0020978301763534546, 0.002154231071472168, 0.0022106319665908813, 0.0022670328617095947, 0.002323433756828308, 0.0023798346519470215, 0.002436235547065735, 0.0024926364421844482, 0.0025490373373031616, 0.002605438232421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 10.0, 16.0, 24.0, 19.0, 69.0, 98.0, 169.0, 315.0, 695.0, 1863.0, 6586.0, 241645.0, 783818.0, 9267.0, 2179.0, 892.0, 386.0, 195.0, 97.0, 80.0, 40.0, 26.0, 15.0, 9.0, 6.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9609375, -9.640625, -9.3203125, -9.0, -8.6796875, -8.359375, -8.0390625, -7.71875, -7.3984375, -7.078125, -6.7578125, -6.4375, -6.1171875, -5.796875, -5.4765625, -5.15625, -4.8359375, -4.515625, -4.1953125, -3.875, -3.5546875, -3.234375, -2.9140625, -2.59375, -2.2734375, -1.953125, -1.6328125, -1.3125, -0.9921875, -0.671875, -0.3515625, -0.03125, 0.2890625, 0.609375, 0.9296875, 1.25, 1.5703125, 1.890625, 2.2109375, 2.53125, 2.8515625, 3.171875, 3.4921875, 3.8125, 4.1328125, 4.453125, 4.7734375, 5.09375, 5.4140625, 5.734375, 6.0546875, 6.375, 6.6953125, 7.015625, 7.3359375, 7.65625, 7.9765625, 8.296875, 8.6171875, 8.9375, 9.2578125, 9.578125, 9.8984375, 10.21875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 9.0, 13.0, 30.0, 53.0, 154.0, 245.0, 254.0, 126.0, 45.0, 17.0, 13.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -4.93157958984375, -4.6951904296875, -4.45880126953125, -4.222412109375, -3.98602294921875, -3.7496337890625, -3.51324462890625, -3.27685546875, -3.04046630859375, -2.8040771484375, -2.56768798828125, -2.331298828125, -2.09490966796875, -1.8585205078125, -1.62213134765625, -1.3857421875, -1.14935302734375, -0.9129638671875, -0.67657470703125, -0.440185546875, -0.20379638671875, 0.0325927734375, 0.26898193359375, 0.50537109375, 0.74176025390625, 0.9781494140625, 1.21453857421875, 1.450927734375, 1.68731689453125, 1.9237060546875, 2.16009521484375, 2.396484375, 2.63287353515625, 2.8692626953125, 3.10565185546875, 3.342041015625, 3.57843017578125, 3.8148193359375, 4.05120849609375, 4.28759765625, 4.52398681640625, 4.7603759765625, 4.99676513671875, 5.233154296875, 5.46954345703125, 5.7059326171875, 5.94232177734375, 6.1787109375, 6.41510009765625, 6.6514892578125, 6.88787841796875, 7.124267578125, 7.36065673828125, 7.5970458984375, 7.83343505859375, 8.06982421875, 8.30621337890625, 8.5426025390625, 8.77899169921875, 9.015380859375, 9.25177001953125, 9.4881591796875, 9.72454833984375, 9.9609375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 10.0, 12.0, 35.0, 62.0, 104.0, 129.0, 202.0, 166.0, 117.0, 68.0, 40.0, 19.0, 14.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.17869567871094, -113.3948974609375, -110.61109924316406, -107.82730102539062, -105.04350280761719, -102.25971221923828, -99.47591400146484, -96.6921157836914, -93.90831756591797, -91.12451934814453, -88.3407211303711, -85.55692291259766, -82.77313232421875, -79.98933410644531, -77.20553588867188, -74.42173767089844, -71.637939453125, -68.85414123535156, -66.07034301757812, -63.28654861450195, -60.502750396728516, -57.71895217895508, -54.935157775878906, -52.15135955810547, -49.36756134033203, -46.583763122558594, -43.799964904785156, -41.016170501708984, -38.23237228393555, -35.44857406616211, -32.66477966308594, -29.8809814453125, -27.097179412841797, -24.31338119506836, -21.529584884643555, -18.74578857421875, -15.961990356445312, -13.178193092346191, -10.39439582824707, -7.610599517822266, -4.826801300048828, -2.043004035949707, 0.7407932281494141, 3.524590492248535, 6.308387756347656, 9.092185020446777, 11.875982284545898, 14.659778594970703, 17.44357681274414, 20.227375030517578, 23.011171340942383, 25.794967651367188, 28.578765869140625, 31.362564086914062, 34.1463623046875, 36.93015670776367, 39.71395492553711, 42.49775314331055, 45.28154754638672, 48.065345764160156, 50.849143981933594, 53.63294219970703, 56.41674041748047, 59.20053482055664, 61.98433303833008]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 5.0, 4.0, 11.0, 10.0, 14.0, 11.0, 14.0, 17.0, 23.0, 34.0, 36.0, 51.0, 38.0, 61.0, 57.0, 69.0, 75.0, 64.0, 66.0, 59.0, 51.0, 34.0, 42.0, 35.0, 25.0, 30.0, 16.0, 9.0, 10.0, 9.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.84660339355469, -49.072959899902344, -47.29931640625, -45.525672912597656, -43.75202941894531, -41.97838592529297, -40.204742431640625, -38.43109893798828, -36.65745544433594, -34.883811950683594, -33.11016845703125, -31.336524963378906, -29.562881469726562, -27.78923797607422, -26.015592575073242, -24.2419490814209, -22.468303680419922, -20.694660186767578, -18.921016693115234, -17.14737319946289, -15.37372875213623, -13.600085258483887, -11.826440811157227, -10.052797317504883, -8.279153823852539, -6.505510330200195, -4.731866359710693, -2.9582223892211914, -1.1845788955688477, 0.5890645980834961, 2.3627090454101562, 4.1363525390625, 5.909992218017578, 7.683635711669922, 9.457279205322266, 11.230923652648926, 13.00456714630127, 14.778210639953613, 16.551855087280273, 18.325498580932617, 20.09914207458496, 21.872785568237305, 23.64642906188965, 25.420074462890625, 27.19371795654297, 28.967361450195312, 30.741004943847656, 32.5146484375, 34.288291931152344, 36.06193542480469, 37.83557891845703, 39.609222412109375, 41.38286590576172, 43.15650939941406, 44.930152893066406, 46.70379638671875, 48.477439880371094, 50.25108337402344, 52.02472686767578, 53.798370361328125, 55.57201385498047, 57.34565734863281, 59.119300842285156, 60.8929443359375, 62.66659164428711]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 2.0, 7.0, 5.0, 11.0, 14.0, 17.0, 41.0, 66.0, 94.0, 199.0, 336.0, 888.0, 2450.0, 19629.0, 4161394.0, 6295.0, 1553.0, 618.0, 304.0, 147.0, 74.0, 44.0, 29.0, 18.0, 12.0, 15.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9609375, -15.4339599609375, -14.906982421875, -14.3800048828125, -13.85302734375, -13.3260498046875, -12.799072265625, -12.2720947265625, -11.7451171875, -11.2181396484375, -10.691162109375, -10.1641845703125, -9.63720703125, -9.1102294921875, -8.583251953125, -8.0562744140625, -7.529296875, -7.0023193359375, -6.475341796875, -5.9483642578125, -5.42138671875, -4.8944091796875, -4.367431640625, -3.8404541015625, -3.3134765625, -2.7864990234375, -2.259521484375, -1.7325439453125, -1.20556640625, -0.6785888671875, -0.151611328125, 0.3753662109375, 0.90234375, 1.4293212890625, 1.956298828125, 2.4832763671875, 3.01025390625, 3.5372314453125, 4.064208984375, 4.5911865234375, 5.1181640625, 5.6451416015625, 6.172119140625, 6.6990966796875, 7.22607421875, 7.7530517578125, 8.280029296875, 8.8070068359375, 9.333984375, 9.8609619140625, 10.387939453125, 10.9149169921875, 11.44189453125, 11.9688720703125, 12.495849609375, 13.0228271484375, 13.5498046875, 14.0767822265625, 14.603759765625, 15.1307373046875, 15.65771484375, 16.1846923828125, 16.711669921875, 17.2386474609375, 17.765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 12.0, 11.0, 13.0, 17.0, 24.0, 25.0, 38.0, 73.0, 84.0, 110.0, 131.0, 97.0, 98.0, 83.0, 56.0, 31.0, 27.0, 19.0, 14.0, 12.0, 7.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.541015625, -2.44964599609375, -2.3582763671875, -2.26690673828125, -2.175537109375, -2.08416748046875, -1.9927978515625, -1.90142822265625, -1.81005859375, -1.71868896484375, -1.6273193359375, -1.53594970703125, -1.444580078125, -1.35321044921875, -1.2618408203125, -1.17047119140625, -1.0791015625, -0.98773193359375, -0.8963623046875, -0.80499267578125, -0.713623046875, -0.62225341796875, -0.5308837890625, -0.43951416015625, -0.34814453125, -0.25677490234375, -0.1654052734375, -0.07403564453125, 0.017333984375, 0.10870361328125, 0.2000732421875, 0.29144287109375, 0.3828125, 0.47418212890625, 0.5655517578125, 0.65692138671875, 0.748291015625, 0.83966064453125, 0.9310302734375, 1.02239990234375, 1.11376953125, 1.20513916015625, 1.2965087890625, 1.38787841796875, 1.479248046875, 1.57061767578125, 1.6619873046875, 1.75335693359375, 1.8447265625, 1.93609619140625, 2.0274658203125, 2.11883544921875, 2.210205078125, 2.30157470703125, 2.3929443359375, 2.48431396484375, 2.57568359375, 2.66705322265625, 2.7584228515625, 2.84979248046875, 2.941162109375, 3.03253173828125, 3.1239013671875, 3.21527099609375, 3.306640625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 17.0, 11.0, 12.0, 26.0, 25.0, 42.0, 58.0, 69.0, 104.0, 133.0, 245.0, 373.0, 599.0, 1204.0, 2999.0, 16462.0, 4147414.0, 18296.0, 3169.0, 1187.0, 599.0, 389.0, 257.0, 151.0, 136.0, 86.0, 68.0, 39.0, 23.0, 27.0, 19.0, 4.0, 7.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.68603515625, -22.9345703125, -22.18310546875, -21.431640625, -20.68017578125, -19.9287109375, -19.17724609375, -18.42578125, -17.67431640625, -16.9228515625, -16.17138671875, -15.419921875, -14.66845703125, -13.9169921875, -13.16552734375, -12.4140625, -11.66259765625, -10.9111328125, -10.15966796875, -9.408203125, -8.65673828125, -7.9052734375, -7.15380859375, -6.40234375, -5.65087890625, -4.8994140625, -4.14794921875, -3.396484375, -2.64501953125, -1.8935546875, -1.14208984375, -0.390625, 0.36083984375, 1.1123046875, 1.86376953125, 2.615234375, 3.36669921875, 4.1181640625, 4.86962890625, 5.62109375, 6.37255859375, 7.1240234375, 7.87548828125, 8.626953125, 9.37841796875, 10.1298828125, 10.88134765625, 11.6328125, 12.38427734375, 13.1357421875, 13.88720703125, 14.638671875, 15.39013671875, 16.1416015625, 16.89306640625, 17.64453125, 18.39599609375, 19.1474609375, 19.89892578125, 20.650390625, 21.40185546875, 22.1533203125, 22.90478515625, 23.65625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 17.0, 66.0, 3906.0, 45.0, 17.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.96875, -9.753814697265625, -9.53887939453125, -9.323944091796875, -9.1090087890625, -8.894073486328125, -8.67913818359375, -8.464202880859375, -8.249267578125, -8.034332275390625, -7.81939697265625, -7.604461669921875, -7.3895263671875, -7.174591064453125, -6.95965576171875, -6.744720458984375, -6.52978515625, -6.314849853515625, -6.09991455078125, -5.884979248046875, -5.6700439453125, -5.455108642578125, -5.24017333984375, -5.025238037109375, -4.810302734375, -4.595367431640625, -4.38043212890625, -4.165496826171875, -3.9505615234375, -3.735626220703125, -3.52069091796875, -3.305755615234375, -3.0908203125, -2.875885009765625, -2.66094970703125, -2.446014404296875, -2.2310791015625, -2.016143798828125, -1.80120849609375, -1.586273193359375, -1.371337890625, -1.156402587890625, -0.94146728515625, -0.726531982421875, -0.5115966796875, -0.296661376953125, -0.08172607421875, 0.133209228515625, 0.34814453125, 0.563079833984375, 0.77801513671875, 0.992950439453125, 1.2078857421875, 1.422821044921875, 1.63775634765625, 1.852691650390625, 2.067626953125, 2.282562255859375, 2.49749755859375, 2.712432861328125, 2.9273681640625, 3.142303466796875, 3.35723876953125, 3.572174072265625, 3.787109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 15.0, 19.0, 21.0, 44.0, 79.0, 90.0, 136.0, 208.0, 148.0, 98.0, 64.0, 37.0, 14.0, 8.0, 10.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.866958618164062, -8.324224472045898, -7.781489372253418, -7.238755226135254, -6.696020126342773, -6.153285980224609, -5.610551357269287, -5.067816734313965, -4.525082111358643, -3.9823474884033203, -3.439612865447998, -2.896878480911255, -2.3541438579559326, -1.8114092350006104, -1.2686748504638672, -0.7259402275085449, -0.18320560455322266, 0.35952895879745483, 0.9022635221481323, 1.444998025894165, 1.9877326488494873, 2.5304672718048096, 3.0732016563415527, 3.615936279296875, 4.158670902252197, 4.7014055252075195, 5.244140148162842, 5.786874771118164, 6.329608917236328, 6.872344017028809, 7.415078163146973, 7.957812786102295, 8.500547409057617, 9.043281555175781, 9.586016654968262, 10.128750801086426, 10.671485900878906, 11.21422004699707, 11.756954193115234, 12.299689292907715, 12.842424392700195, 13.38515853881836, 13.92789363861084, 14.470627784729004, 15.013362884521484, 15.556097030639648, 16.098831176757812, 16.64156723022461, 17.18429946899414, 17.727033615112305, 18.26976776123047, 18.812503814697266, 19.35523796081543, 19.897972106933594, 20.440706253051758, 20.983440399169922, 21.52617645263672, 22.068910598754883, 22.611644744873047, 23.154380798339844, 23.697114944458008, 24.239849090576172, 24.782583236694336, 25.3253173828125, 25.868053436279297]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 2.0, 6.0, 5.0, 6.0, 10.0, 7.0, 10.0, 17.0, 18.0, 19.0, 25.0, 24.0, 20.0, 28.0, 26.0, 27.0, 25.0, 35.0, 39.0, 51.0, 57.0, 43.0, 46.0, 35.0, 37.0, 36.0, 33.0, 38.0, 25.0, 26.0, 24.0, 31.0, 24.0, 27.0, 20.0, 14.0, 15.0, 10.0, 10.0, 10.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.033512115478516, -7.784408092498779, -7.535304069519043, -7.286200046539307, -7.03709602355957, -6.787991523742676, -6.5388875007629395, -6.289783477783203, -6.040679454803467, -5.7915754318237305, -5.542471408843994, -5.293367385864258, -5.044262886047363, -4.795159339904785, -4.546054840087891, -4.296950817108154, -4.047846794128418, -3.7987427711486816, -3.5496387481689453, -3.30053448677063, -3.0514304637908936, -2.8023264408111572, -2.553222179412842, -2.3041181564331055, -2.055014133453369, -1.8059101104736328, -1.556805968284607, -1.307701826095581, -1.0585978031158447, -0.8094937801361084, -0.5603896379470825, -0.31128549575805664, -0.062181949615478516, 0.1869221329689026, 0.4360262155532837, 0.6851302981376648, 0.9342343807220459, 1.1833384037017822, 1.432442545890808, 1.681546688079834, 1.9306507110595703, 2.1797547340393066, 2.428858757019043, 2.6779630184173584, 2.9270670413970947, 3.176171064376831, 3.4252753257751465, 3.674379348754883, 3.923483371734619, 4.1725873947143555, 4.421691417694092, 4.670795440673828, 4.919899940490723, 5.169003486633301, 5.418107986450195, 5.667212009429932, 5.916316032409668, 6.165420055389404, 6.414524078369141, 6.663628101348877, 6.912732124328613, 7.161836624145508, 7.410940647125244, 7.6600446701049805, 7.909148693084717]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 13.0, 20.0, 30.0, 37.0, 59.0, 106.0, 190.0, 347.0, 685.0, 1548.0, 3568.0, 10180.0, 35413.0, 167717.0, 618764.0, 159630.0, 33906.0, 9939.0, 3474.0, 1388.0, 652.0, 344.0, 221.0, 93.0, 69.0, 42.0, 33.0, 21.0, 16.0, 7.0, 10.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.59375, -5.374267578125, -5.15478515625, -4.935302734375, -4.7158203125, -4.496337890625, -4.27685546875, -4.057373046875, -3.837890625, -3.618408203125, -3.39892578125, -3.179443359375, -2.9599609375, -2.740478515625, -2.52099609375, -2.301513671875, -2.08203125, -1.862548828125, -1.64306640625, -1.423583984375, -1.2041015625, -0.984619140625, -0.76513671875, -0.545654296875, -0.326171875, -0.106689453125, 0.11279296875, 0.332275390625, 0.5517578125, 0.771240234375, 0.99072265625, 1.210205078125, 1.4296875, 1.649169921875, 1.86865234375, 2.088134765625, 2.3076171875, 2.527099609375, 2.74658203125, 2.966064453125, 3.185546875, 3.405029296875, 3.62451171875, 3.843994140625, 4.0634765625, 4.282958984375, 4.50244140625, 4.721923828125, 4.94140625, 5.160888671875, 5.38037109375, 5.599853515625, 5.8193359375, 6.038818359375, 6.25830078125, 6.477783203125, 6.697265625, 6.916748046875, 7.13623046875, 7.355712890625, 7.5751953125, 7.794677734375, 8.01416015625, 8.233642578125, 8.453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 7.0, 12.0, 5.0, 14.0, 14.0, 31.0, 24.0, 31.0, 26.0, 32.0, 55.0, 62.0, 62.0, 77.0, 69.0, 74.0, 60.0, 61.0, 54.0, 41.0, 35.0, 39.0, 18.0, 15.0, 12.0, 18.0, 11.0, 7.0, 9.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.413848876953125, -2.31988525390625, -2.225921630859375, -2.1319580078125, -2.037994384765625, -1.94403076171875, -1.850067138671875, -1.756103515625, -1.662139892578125, -1.56817626953125, -1.474212646484375, -1.3802490234375, -1.286285400390625, -1.19232177734375, -1.098358154296875, -1.00439453125, -0.910430908203125, -0.81646728515625, -0.722503662109375, -0.6285400390625, -0.534576416015625, -0.44061279296875, -0.346649169921875, -0.252685546875, -0.158721923828125, -0.06475830078125, 0.029205322265625, 0.1231689453125, 0.217132568359375, 0.31109619140625, 0.405059814453125, 0.4990234375, 0.592987060546875, 0.68695068359375, 0.780914306640625, 0.8748779296875, 0.968841552734375, 1.06280517578125, 1.156768798828125, 1.250732421875, 1.344696044921875, 1.43865966796875, 1.532623291015625, 1.6265869140625, 1.720550537109375, 1.81451416015625, 1.908477783203125, 2.00244140625, 2.096405029296875, 2.19036865234375, 2.284332275390625, 2.3782958984375, 2.472259521484375, 2.56622314453125, 2.660186767578125, 2.754150390625, 2.848114013671875, 2.94207763671875, 3.036041259765625, 3.1300048828125, 3.223968505859375, 3.31793212890625, 3.411895751953125, 3.505859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 8.0, 11.0, 25.0, 21.0, 38.0, 49.0, 75.0, 138.0, 214.0, 496.0, 1166.0, 3451.0, 19500.0, 611602.0, 390987.0, 15381.0, 3213.0, 1066.0, 483.0, 226.0, 149.0, 89.0, 52.0, 37.0, 23.0, 6.0, 15.0, 3.0, 4.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.421875, -17.86279296875, -17.3037109375, -16.74462890625, -16.185546875, -15.62646484375, -15.0673828125, -14.50830078125, -13.94921875, -13.39013671875, -12.8310546875, -12.27197265625, -11.712890625, -11.15380859375, -10.5947265625, -10.03564453125, -9.4765625, -8.91748046875, -8.3583984375, -7.79931640625, -7.240234375, -6.68115234375, -6.1220703125, -5.56298828125, -5.00390625, -4.44482421875, -3.8857421875, -3.32666015625, -2.767578125, -2.20849609375, -1.6494140625, -1.09033203125, -0.53125, 0.02783203125, 0.5869140625, 1.14599609375, 1.705078125, 2.26416015625, 2.8232421875, 3.38232421875, 3.94140625, 4.50048828125, 5.0595703125, 5.61865234375, 6.177734375, 6.73681640625, 7.2958984375, 7.85498046875, 8.4140625, 8.97314453125, 9.5322265625, 10.09130859375, 10.650390625, 11.20947265625, 11.7685546875, 12.32763671875, 12.88671875, 13.44580078125, 14.0048828125, 14.56396484375, 15.123046875, 15.68212890625, 16.2412109375, 16.80029296875, 17.359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 9.0, 15.0, 13.0, 19.0, 19.0, 25.0, 34.0, 26.0, 46.0, 35.0, 49.0, 70.0, 46.0, 61.0, 63.0, 66.0, 54.0, 40.0, 53.0, 41.0, 42.0, 35.0, 27.0, 18.0, 28.0, 14.0, 8.0, 11.0, 5.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.84375, -15.2607421875, -14.677734375, -14.0947265625, -13.51171875, -12.9287109375, -12.345703125, -11.7626953125, -11.1796875, -10.5966796875, -10.013671875, -9.4306640625, -8.84765625, -8.2646484375, -7.681640625, -7.0986328125, -6.515625, -5.9326171875, -5.349609375, -4.7666015625, -4.18359375, -3.6005859375, -3.017578125, -2.4345703125, -1.8515625, -1.2685546875, -0.685546875, -0.1025390625, 0.48046875, 1.0634765625, 1.646484375, 2.2294921875, 2.8125, 3.3955078125, 3.978515625, 4.5615234375, 5.14453125, 5.7275390625, 6.310546875, 6.8935546875, 7.4765625, 8.0595703125, 8.642578125, 9.2255859375, 9.80859375, 10.3916015625, 10.974609375, 11.5576171875, 12.140625, 12.7236328125, 13.306640625, 13.8896484375, 14.47265625, 15.0556640625, 15.638671875, 16.2216796875, 16.8046875, 17.3876953125, 17.970703125, 18.5537109375, 19.13671875, 19.7197265625, 20.302734375, 20.8857421875, 21.46875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 10.0, 16.0, 18.0, 50.0, 137.0, 619.0, 10379.0, 1033122.0, 3571.0, 415.0, 113.0, 52.0, 16.0, 9.0, 7.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.375, -39.294677734375, -38.21435546875, -37.134033203125, -36.0537109375, -34.973388671875, -33.89306640625, -32.812744140625, -31.732421875, -30.652099609375, -29.57177734375, -28.491455078125, -27.4111328125, -26.330810546875, -25.25048828125, -24.170166015625, -23.08984375, -22.009521484375, -20.92919921875, -19.848876953125, -18.7685546875, -17.688232421875, -16.60791015625, -15.527587890625, -14.447265625, -13.366943359375, -12.28662109375, -11.206298828125, -10.1259765625, -9.045654296875, -7.96533203125, -6.885009765625, -5.8046875, -4.724365234375, -3.64404296875, -2.563720703125, -1.4833984375, -0.403076171875, 0.67724609375, 1.757568359375, 2.837890625, 3.918212890625, 4.99853515625, 6.078857421875, 7.1591796875, 8.239501953125, 9.31982421875, 10.400146484375, 11.48046875, 12.560791015625, 13.64111328125, 14.721435546875, 15.8017578125, 16.882080078125, 17.96240234375, 19.042724609375, 20.123046875, 21.203369140625, 22.28369140625, 23.364013671875, 24.4443359375, 25.524658203125, 26.60498046875, 27.685302734375, 28.765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 21.0, 37.0, 87.0, 194.0, 316.0, 179.0, 77.0, 34.0, 18.0, 16.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002376556396484375, -0.0023162662982940674, -0.0022559762001037598, -0.002195686101913452, -0.0021353960037231445, -0.002075105905532837, -0.0020148158073425293, -0.0019545257091522217, -0.001894235610961914, -0.0018339455127716064, -0.0017736554145812988, -0.0017133653163909912, -0.0016530752182006836, -0.001592785120010376, -0.0015324950218200684, -0.0014722049236297607, -0.0014119148254394531, -0.0013516247272491455, -0.0012913346290588379, -0.0012310445308685303, -0.0011707544326782227, -0.001110464334487915, -0.0010501742362976074, -0.0009898841381072998, -0.0009295940399169922, -0.0008693039417266846, -0.000809013843536377, -0.0007487237453460693, -0.0006884336471557617, -0.0006281435489654541, -0.0005678534507751465, -0.0005075633525848389, -0.00044727325439453125, -0.00038698315620422363, -0.000326693058013916, -0.0002664029598236084, -0.00020611286163330078, -0.00014582276344299316, -8.553266525268555e-05, -2.524256706237793e-05, 3.504753112792969e-05, 9.53376293182373e-05, 0.00015562772750854492, 0.00021591782569885254, 0.00027620792388916016, 0.0003364980220794678, 0.0003967881202697754, 0.000457078218460083, 0.0005173683166503906, 0.0005776584148406982, 0.0006379485130310059, 0.0006982386112213135, 0.0007585287094116211, 0.0008188188076019287, 0.0008791089057922363, 0.0009393990039825439, 0.0009996891021728516, 0.0010599792003631592, 0.0011202692985534668, 0.0011805593967437744, 0.001240849494934082, 0.0013011395931243896, 0.0013614296913146973, 0.0014217197895050049, 0.0014820098876953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 11.0, 30.0, 30.0, 60.0, 108.0, 233.0, 494.0, 1541.0, 5890.0, 75560.0, 931287.0, 27737.0, 3710.0, 1072.0, 377.0, 167.0, 87.0, 61.0, 28.0, 14.0, 11.0, 14.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.9296875, -14.55029296875, -14.1708984375, -13.79150390625, -13.412109375, -13.03271484375, -12.6533203125, -12.27392578125, -11.89453125, -11.51513671875, -11.1357421875, -10.75634765625, -10.376953125, -9.99755859375, -9.6181640625, -9.23876953125, -8.859375, -8.47998046875, -8.1005859375, -7.72119140625, -7.341796875, -6.96240234375, -6.5830078125, -6.20361328125, -5.82421875, -5.44482421875, -5.0654296875, -4.68603515625, -4.306640625, -3.92724609375, -3.5478515625, -3.16845703125, -2.7890625, -2.40966796875, -2.0302734375, -1.65087890625, -1.271484375, -0.89208984375, -0.5126953125, -0.13330078125, 0.24609375, 0.62548828125, 1.0048828125, 1.38427734375, 1.763671875, 2.14306640625, 2.5224609375, 2.90185546875, 3.28125, 3.66064453125, 4.0400390625, 4.41943359375, 4.798828125, 5.17822265625, 5.5576171875, 5.93701171875, 6.31640625, 6.69580078125, 7.0751953125, 7.45458984375, 7.833984375, 8.21337890625, 8.5927734375, 8.97216796875, 9.3515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 6.0, 17.0, 27.0, 35.0, 57.0, 94.0, 100.0, 184.0, 144.0, 98.0, 73.0, 41.0, 31.0, 15.0, 19.0, 13.0, 6.0, 8.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4609375, -9.19696044921875, -8.9329833984375, -8.66900634765625, -8.405029296875, -8.14105224609375, -7.8770751953125, -7.61309814453125, -7.34912109375, -7.08514404296875, -6.8211669921875, -6.55718994140625, -6.293212890625, -6.02923583984375, -5.7652587890625, -5.50128173828125, -5.2373046875, -4.97332763671875, -4.7093505859375, -4.44537353515625, -4.181396484375, -3.91741943359375, -3.6534423828125, -3.38946533203125, -3.12548828125, -2.86151123046875, -2.5975341796875, -2.33355712890625, -2.069580078125, -1.80560302734375, -1.5416259765625, -1.27764892578125, -1.013671875, -0.74969482421875, -0.4857177734375, -0.22174072265625, 0.042236328125, 0.30621337890625, 0.5701904296875, 0.83416748046875, 1.09814453125, 1.36212158203125, 1.6260986328125, 1.89007568359375, 2.154052734375, 2.41802978515625, 2.6820068359375, 2.94598388671875, 3.2099609375, 3.47393798828125, 3.7379150390625, 4.00189208984375, 4.265869140625, 4.52984619140625, 4.7938232421875, 5.05780029296875, 5.32177734375, 5.58575439453125, 5.8497314453125, 6.11370849609375, 6.377685546875, 6.64166259765625, 6.9056396484375, 7.16961669921875, 7.43359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 14.0, 63.0, 280.0, 442.0, 164.0, 36.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.41859436035156, -114.85883331298828, -106.29907989501953, -97.73931884765625, -89.1795654296875, -80.61980438232422, -72.06004333496094, -63.50028610229492, -54.940528869628906, -46.38077163696289, -37.821014404296875, -29.261253356933594, -20.701496124267578, -12.141738891601562, -3.5819778442382812, 4.977779388427734, 13.53753662109375, 22.097293853759766, 30.657052993774414, 39.21681213378906, 47.77656936645508, 56.336326599121094, 64.89608764648438, 73.45584106445312, 82.0156021118164, 90.57536315917969, 99.13511657714844, 107.69487762451172, 116.254638671875, 124.81439208984375, 133.3741455078125, 141.9339141845703, 150.49368286132812, 159.05343627929688, 167.6132049560547, 176.17295837402344, 184.7327117919922, 193.29248046875, 201.85223388671875, 210.4119873046875, 218.97174072265625, 227.531494140625, 236.0912628173828, 244.65101623535156, 253.2107696533203, 261.7705383300781, 270.3302917480469, 278.8900451660156, 287.4498291015625, 296.00958251953125, 304.5693359375, 313.12908935546875, 321.6888732910156, 330.2486267089844, 338.8083801269531, 347.3681335449219, 355.9278869628906, 364.4876403808594, 373.0473937988281, 381.607177734375, 390.16693115234375, 398.7266845703125, 407.28643798828125, 415.84619140625, 424.40594482421875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 7.0, 10.0, 12.0, 7.0, 13.0, 22.0, 23.0, 28.0, 32.0, 28.0, 35.0, 63.0, 42.0, 70.0, 71.0, 71.0, 70.0, 56.0, 40.0, 55.0, 38.0, 36.0, 29.0, 26.0, 26.0, 17.0, 20.0, 9.0, 15.0, 4.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.93251037597656, -73.335205078125, -70.7378921508789, -68.14058685302734, -65.54327392578125, -62.94596862792969, -60.34865951538086, -57.75135040283203, -55.15404510498047, -52.55673599243164, -49.95942687988281, -47.36212158203125, -44.76481246948242, -42.167503356933594, -39.570194244384766, -36.97288513183594, -34.37557601928711, -31.77826690673828, -29.180959701538086, -26.583650588989258, -23.986343383789062, -21.389034271240234, -18.791725158691406, -16.19441795349121, -13.597108840942383, -10.999800682067871, -8.40249252319336, -5.805183410644531, -3.2078752517700195, -0.6105670928955078, 1.9867420196533203, 4.584049224853516, 7.181358337402344, 9.778666496276855, 12.375974655151367, 14.973283767700195, 17.57059097290039, 20.16790008544922, 22.765209197998047, 25.362516403198242, 27.95982551574707, 30.5571346282959, 33.154441833496094, 35.75175094604492, 38.34906005859375, 40.94636535644531, 43.543678283691406, 46.14098358154297, 48.7382926940918, 51.335601806640625, 53.93291091918945, 56.53022003173828, 59.127525329589844, 61.72483444213867, 64.3221435546875, 66.91944885253906, 69.51676177978516, 72.11406707763672, 74.71138000488281, 77.30868530273438, 79.90599822998047, 82.50330352783203, 85.10061645507812, 87.69792175292969, 90.29522705078125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 10.0, 23.0, 37.0, 67.0, 168.0, 362.0, 1159.0, 5548.0, 4126046.0, 55856.0, 3529.0, 819.0, 303.0, 146.0, 74.0, 41.0, 30.0, 21.0, 13.0, 5.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1484375, -13.3101806640625, -12.471923828125, -11.6336669921875, -10.79541015625, -9.9571533203125, -9.118896484375, -8.2806396484375, -7.4423828125, -6.6041259765625, -5.765869140625, -4.9276123046875, -4.08935546875, -3.2510986328125, -2.412841796875, -1.5745849609375, -0.736328125, 0.1019287109375, 0.940185546875, 1.7784423828125, 2.61669921875, 3.4549560546875, 4.293212890625, 5.1314697265625, 5.9697265625, 6.8079833984375, 7.646240234375, 8.4844970703125, 9.32275390625, 10.1610107421875, 10.999267578125, 11.8375244140625, 12.67578125, 13.5140380859375, 14.352294921875, 15.1905517578125, 16.02880859375, 16.8670654296875, 17.705322265625, 18.5435791015625, 19.3818359375, 20.2200927734375, 21.058349609375, 21.8966064453125, 22.73486328125, 23.5731201171875, 24.411376953125, 25.2496337890625, 26.087890625, 26.9261474609375, 27.764404296875, 28.6026611328125, 29.44091796875, 30.2791748046875, 31.117431640625, 31.9556884765625, 32.7939453125, 33.6322021484375, 34.470458984375, 35.3087158203125, 36.14697265625, 36.9852294921875, 37.823486328125, 38.6617431640625, 39.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 9.0, 5.0, 15.0, 18.0, 27.0, 42.0, 66.0, 78.0, 134.0, 146.0, 134.0, 104.0, 76.0, 49.0, 30.0, 18.0, 20.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.931640625, -3.711151123046875, -3.49066162109375, -3.270172119140625, -3.0496826171875, -2.829193115234375, -2.60870361328125, -2.388214111328125, -2.167724609375, -1.947235107421875, -1.72674560546875, -1.506256103515625, -1.2857666015625, -1.065277099609375, -0.84478759765625, -0.624298095703125, -0.40380859375, -0.183319091796875, 0.03717041015625, 0.257659912109375, 0.4781494140625, 0.698638916015625, 0.91912841796875, 1.139617919921875, 1.360107421875, 1.580596923828125, 1.80108642578125, 2.021575927734375, 2.2420654296875, 2.462554931640625, 2.68304443359375, 2.903533935546875, 3.1240234375, 3.344512939453125, 3.56500244140625, 3.785491943359375, 4.0059814453125, 4.226470947265625, 4.44696044921875, 4.667449951171875, 4.887939453125, 5.108428955078125, 5.32891845703125, 5.549407958984375, 5.7698974609375, 5.990386962890625, 6.21087646484375, 6.431365966796875, 6.65185546875, 6.872344970703125, 7.09283447265625, 7.313323974609375, 7.5338134765625, 7.754302978515625, 7.97479248046875, 8.195281982421875, 8.415771484375, 8.636260986328125, 8.85675048828125, 9.077239990234375, 9.2977294921875, 9.518218994140625, 9.73870849609375, 9.959197998046875, 10.1796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 1.0, 8.0, 11.0, 11.0, 13.0, 39.0, 38.0, 48.0, 66.0, 104.0, 170.0, 298.0, 469.0, 920.0, 1778.0, 4441.0, 21537.0, 4121528.0, 33027.0, 5269.0, 2009.0, 1028.0, 540.0, 324.0, 188.0, 120.0, 93.0, 44.0, 51.0, 31.0, 26.0, 11.0, 9.0, 9.0, 2.0, 11.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.90625, -30.012451171875, -29.11865234375, -28.224853515625, -27.3310546875, -26.437255859375, -25.54345703125, -24.649658203125, -23.755859375, -22.862060546875, -21.96826171875, -21.074462890625, -20.1806640625, -19.286865234375, -18.39306640625, -17.499267578125, -16.60546875, -15.711669921875, -14.81787109375, -13.924072265625, -13.0302734375, -12.136474609375, -11.24267578125, -10.348876953125, -9.455078125, -8.561279296875, -7.66748046875, -6.773681640625, -5.8798828125, -4.986083984375, -4.09228515625, -3.198486328125, -2.3046875, -1.410888671875, -0.51708984375, 0.376708984375, 1.2705078125, 2.164306640625, 3.05810546875, 3.951904296875, 4.845703125, 5.739501953125, 6.63330078125, 7.527099609375, 8.4208984375, 9.314697265625, 10.20849609375, 11.102294921875, 11.99609375, 12.889892578125, 13.78369140625, 14.677490234375, 15.5712890625, 16.465087890625, 17.35888671875, 18.252685546875, 19.146484375, 20.040283203125, 20.93408203125, 21.827880859375, 22.7216796875, 23.615478515625, 24.50927734375, 25.403076171875, 26.296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 4.0, 15.0, 85.0, 3804.0, 101.0, 29.0, 20.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.921875, -22.3826904296875, -21.843505859375, -21.3043212890625, -20.76513671875, -20.2259521484375, -19.686767578125, -19.1475830078125, -18.6083984375, -18.0692138671875, -17.530029296875, -16.9908447265625, -16.45166015625, -15.9124755859375, -15.373291015625, -14.8341064453125, -14.294921875, -13.7557373046875, -13.216552734375, -12.6773681640625, -12.13818359375, -11.5989990234375, -11.059814453125, -10.5206298828125, -9.9814453125, -9.4422607421875, -8.903076171875, -8.3638916015625, -7.82470703125, -7.2855224609375, -6.746337890625, -6.2071533203125, -5.66796875, -5.1287841796875, -4.589599609375, -4.0504150390625, -3.51123046875, -2.9720458984375, -2.432861328125, -1.8936767578125, -1.3544921875, -0.8153076171875, -0.276123046875, 0.2630615234375, 0.80224609375, 1.3414306640625, 1.880615234375, 2.4197998046875, 2.958984375, 3.4981689453125, 4.037353515625, 4.5765380859375, 5.11572265625, 5.6549072265625, 6.194091796875, 6.7332763671875, 7.2724609375, 7.8116455078125, 8.350830078125, 8.8900146484375, 9.42919921875, 9.9683837890625, 10.507568359375, 11.0467529296875, 11.5859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 12.0, 24.0, 55.0, 89.0, 198.0, 209.0, 157.0, 98.0, 51.0, 34.0, 26.0, 12.0, 12.0, 4.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.75732421875, -55.211158752441406, -53.66499328613281, -52.11882781982422, -50.57265853881836, -49.026493072509766, -47.48032760620117, -45.93416213989258, -44.38799285888672, -42.841827392578125, -41.29566192626953, -39.74949645996094, -38.20332717895508, -36.657161712646484, -35.11099624633789, -33.5648307800293, -32.0186653137207, -30.47249984741211, -28.926332473754883, -27.38016700744629, -25.833999633789062, -24.28783416748047, -22.741668701171875, -21.19550323486328, -19.649335861206055, -18.10317039489746, -16.557003021240234, -15.01083755493164, -13.46467113494873, -11.91850471496582, -10.372339248657227, -8.826172828674316, -7.280010223388672, -5.733843803405762, -4.18767786026001, -2.641511917114258, -1.0953454971313477, 0.4508209228515625, 1.9969863891601562, 3.5431528091430664, 5.089319229125977, 6.635485649108887, 8.181652069091797, 9.72781753540039, 11.2739839553833, 12.820150375366211, 14.366315841674805, 15.912482261657715, 17.458648681640625, 19.00481414794922, 20.550981521606445, 22.09714698791504, 23.643314361572266, 25.18947982788086, 26.735645294189453, 28.281810760498047, 29.827978134155273, 31.374143600463867, 32.920310974121094, 34.46647644042969, 36.01264190673828, 37.558807373046875, 39.10497283935547, 40.65114212036133, 42.19730758666992]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 8.0, 12.0, 16.0, 17.0, 21.0, 24.0, 40.0, 38.0, 29.0, 39.0, 47.0, 46.0, 42.0, 53.0, 44.0, 49.0, 41.0, 41.0, 41.0, 37.0, 42.0, 29.0, 26.0, 33.0, 39.0, 26.0, 16.0, 21.0, 11.0, 15.0, 6.0, 6.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.276020050048828, -26.437166213989258, -25.598312377929688, -24.759458541870117, -23.920604705810547, -23.081750869750977, -22.242897033691406, -21.404043197631836, -20.565189361572266, -19.726335525512695, -18.887481689453125, -18.048627853393555, -17.209774017333984, -16.370920181274414, -15.532066345214844, -14.693212509155273, -13.854358673095703, -13.015504837036133, -12.176651000976562, -11.337797164916992, -10.498943328857422, -9.660089492797852, -8.821235656738281, -7.982381820678711, -7.143527984619141, -6.30467414855957, -5.4658203125, -4.62696647644043, -3.7881126403808594, -2.949258804321289, -2.1104049682617188, -1.2715511322021484, -0.43269920349121094, 0.4061546325683594, 1.2450084686279297, 2.0838623046875, 2.9227161407470703, 3.7615699768066406, 4.600423812866211, 5.439277648925781, 6.278131484985352, 7.116985321044922, 7.955839157104492, 8.794692993164062, 9.633546829223633, 10.472400665283203, 11.311254501342773, 12.150108337402344, 12.988962173461914, 13.827816009521484, 14.666669845581055, 15.505523681640625, 16.344377517700195, 17.183231353759766, 18.022085189819336, 18.860939025878906, 19.699792861938477, 20.538646697998047, 21.377500534057617, 22.216354370117188, 23.055208206176758, 23.894062042236328, 24.7329158782959, 25.57176971435547, 26.41062355041504]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 10.0, 6.0, 8.0, 16.0, 15.0, 23.0, 37.0, 78.0, 125.0, 253.0, 508.0, 1404.0, 4315.0, 15611.0, 77338.0, 564366.0, 322880.0, 46113.0, 10347.0, 3134.0, 1064.0, 456.0, 176.0, 87.0, 46.0, 53.0, 25.0, 12.0, 10.0, 13.0, 6.0, 3.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.421875, -15.988037109375, -15.55419921875, -15.120361328125, -14.6865234375, -14.252685546875, -13.81884765625, -13.385009765625, -12.951171875, -12.517333984375, -12.08349609375, -11.649658203125, -11.2158203125, -10.781982421875, -10.34814453125, -9.914306640625, -9.48046875, -9.046630859375, -8.61279296875, -8.178955078125, -7.7451171875, -7.311279296875, -6.87744140625, -6.443603515625, -6.009765625, -5.575927734375, -5.14208984375, -4.708251953125, -4.2744140625, -3.840576171875, -3.40673828125, -2.972900390625, -2.5390625, -2.105224609375, -1.67138671875, -1.237548828125, -0.8037109375, -0.369873046875, 0.06396484375, 0.497802734375, 0.931640625, 1.365478515625, 1.79931640625, 2.233154296875, 2.6669921875, 3.100830078125, 3.53466796875, 3.968505859375, 4.40234375, 4.836181640625, 5.27001953125, 5.703857421875, 6.1376953125, 6.571533203125, 7.00537109375, 7.439208984375, 7.873046875, 8.306884765625, 8.74072265625, 9.174560546875, 9.6083984375, 10.042236328125, 10.47607421875, 10.909912109375, 11.34375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 11.0, 10.0, 18.0, 27.0, 26.0, 32.0, 41.0, 57.0, 56.0, 60.0, 99.0, 86.0, 88.0, 95.0, 75.0, 51.0, 42.0, 33.0, 21.0, 19.0, 12.0, 17.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.67578125, -3.46722412109375, -3.2586669921875, -3.05010986328125, -2.841552734375, -2.63299560546875, -2.4244384765625, -2.21588134765625, -2.00732421875, -1.79876708984375, -1.5902099609375, -1.38165283203125, -1.173095703125, -0.96453857421875, -0.7559814453125, -0.54742431640625, -0.3388671875, -0.13031005859375, 0.0782470703125, 0.28680419921875, 0.495361328125, 0.70391845703125, 0.9124755859375, 1.12103271484375, 1.32958984375, 1.53814697265625, 1.7467041015625, 1.95526123046875, 2.163818359375, 2.37237548828125, 2.5809326171875, 2.78948974609375, 2.998046875, 3.20660400390625, 3.4151611328125, 3.62371826171875, 3.832275390625, 4.04083251953125, 4.2493896484375, 4.45794677734375, 4.66650390625, 4.87506103515625, 5.0836181640625, 5.29217529296875, 5.500732421875, 5.70928955078125, 5.9178466796875, 6.12640380859375, 6.3349609375, 6.54351806640625, 6.7520751953125, 6.96063232421875, 7.169189453125, 7.37774658203125, 7.5863037109375, 7.79486083984375, 8.00341796875, 8.21197509765625, 8.4205322265625, 8.62908935546875, 8.837646484375, 9.04620361328125, 9.2547607421875, 9.46331787109375, 9.671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 9.0, 11.0, 12.0, 17.0, 26.0, 61.0, 91.0, 181.0, 310.0, 643.0, 1544.0, 4846.0, 31556.0, 748058.0, 241352.0, 14457.0, 3169.0, 1080.0, 509.0, 259.0, 129.0, 79.0, 47.0, 25.0, 20.0, 11.0, 12.0, 9.0, 5.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.25, -27.46142578125, -26.6728515625, -25.88427734375, -25.095703125, -24.30712890625, -23.5185546875, -22.72998046875, -21.94140625, -21.15283203125, -20.3642578125, -19.57568359375, -18.787109375, -17.99853515625, -17.2099609375, -16.42138671875, -15.6328125, -14.84423828125, -14.0556640625, -13.26708984375, -12.478515625, -11.68994140625, -10.9013671875, -10.11279296875, -9.32421875, -8.53564453125, -7.7470703125, -6.95849609375, -6.169921875, -5.38134765625, -4.5927734375, -3.80419921875, -3.015625, -2.22705078125, -1.4384765625, -0.64990234375, 0.138671875, 0.92724609375, 1.7158203125, 2.50439453125, 3.29296875, 4.08154296875, 4.8701171875, 5.65869140625, 6.447265625, 7.23583984375, 8.0244140625, 8.81298828125, 9.6015625, 10.39013671875, 11.1787109375, 11.96728515625, 12.755859375, 13.54443359375, 14.3330078125, 15.12158203125, 15.91015625, 16.69873046875, 17.4873046875, 18.27587890625, 19.064453125, 19.85302734375, 20.6416015625, 21.43017578125, 22.21875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 11.0, 14.0, 29.0, 29.0, 49.0, 77.0, 95.0, 102.0, 95.0, 102.0, 94.0, 92.0, 63.0, 45.0, 27.0, 21.0, 16.0, 15.0, 5.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.5, -49.0439453125, -47.587890625, -46.1318359375, -44.67578125, -43.2197265625, -41.763671875, -40.3076171875, -38.8515625, -37.3955078125, -35.939453125, -34.4833984375, -33.02734375, -31.5712890625, -30.115234375, -28.6591796875, -27.203125, -25.7470703125, -24.291015625, -22.8349609375, -21.37890625, -19.9228515625, -18.466796875, -17.0107421875, -15.5546875, -14.0986328125, -12.642578125, -11.1865234375, -9.73046875, -8.2744140625, -6.818359375, -5.3623046875, -3.90625, -2.4501953125, -0.994140625, 0.4619140625, 1.91796875, 3.3740234375, 4.830078125, 6.2861328125, 7.7421875, 9.1982421875, 10.654296875, 12.1103515625, 13.56640625, 15.0224609375, 16.478515625, 17.9345703125, 19.390625, 20.8466796875, 22.302734375, 23.7587890625, 25.21484375, 26.6708984375, 28.126953125, 29.5830078125, 31.0390625, 32.4951171875, 33.951171875, 35.4072265625, 36.86328125, 38.3193359375, 39.775390625, 41.2314453125, 42.6875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 7.0, 10.0, 17.0, 32.0, 68.0, 137.0, 342.0, 933.0, 5395.0, 683606.0, 352223.0, 4348.0, 854.0, 272.0, 145.0, 70.0, 31.0, 17.0, 16.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3125, -13.85009765625, -13.3876953125, -12.92529296875, -12.462890625, -12.00048828125, -11.5380859375, -11.07568359375, -10.61328125, -10.15087890625, -9.6884765625, -9.22607421875, -8.763671875, -8.30126953125, -7.8388671875, -7.37646484375, -6.9140625, -6.45166015625, -5.9892578125, -5.52685546875, -5.064453125, -4.60205078125, -4.1396484375, -3.67724609375, -3.21484375, -2.75244140625, -2.2900390625, -1.82763671875, -1.365234375, -0.90283203125, -0.4404296875, 0.02197265625, 0.484375, 0.94677734375, 1.4091796875, 1.87158203125, 2.333984375, 2.79638671875, 3.2587890625, 3.72119140625, 4.18359375, 4.64599609375, 5.1083984375, 5.57080078125, 6.033203125, 6.49560546875, 6.9580078125, 7.42041015625, 7.8828125, 8.34521484375, 8.8076171875, 9.27001953125, 9.732421875, 10.19482421875, 10.6572265625, 11.11962890625, 11.58203125, 12.04443359375, 12.5068359375, 12.96923828125, 13.431640625, 13.89404296875, 14.3564453125, 14.81884765625, 15.28125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 8.0, 10.0, 14.0, 14.0, 21.0, 43.0, 58.0, 71.0, 82.0, 131.0, 122.0, 116.0, 94.0, 69.0, 50.0, 32.0, 26.0, 13.0, 9.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001224517822265625, -0.001192733645439148, -0.001160949468612671, -0.0011291652917861938, -0.0010973811149597168, -0.0010655969381332397, -0.0010338127613067627, -0.0010020285844802856, -0.0009702444076538086, -0.0009384602308273315, -0.0009066760540008545, -0.0008748918771743774, -0.0008431077003479004, -0.0008113235235214233, -0.0007795393466949463, -0.0007477551698684692, -0.0007159709930419922, -0.0006841868162155151, -0.0006524026393890381, -0.000620618462562561, -0.000588834285736084, -0.0005570501089096069, -0.0005252659320831299, -0.0004934817552566528, -0.0004616975784301758, -0.00042991340160369873, -0.0003981292247772217, -0.00036634504795074463, -0.0003345608711242676, -0.00030277669429779053, -0.0002709925174713135, -0.00023920834064483643, -0.00020742416381835938, -0.00017563998699188232, -0.00014385581016540527, -0.00011207163333892822, -8.028745651245117e-05, -4.850327968597412e-05, -1.671910285949707e-05, 1.506507396697998e-05, 4.684925079345703e-05, 7.863342761993408e-05, 0.00011041760444641113, 0.00014220178127288818, 0.00017398595809936523, 0.00020577013492584229, 0.00023755431175231934, 0.0002693384885787964, 0.00030112266540527344, 0.0003329068422317505, 0.00036469101905822754, 0.0003964751958847046, 0.00042825937271118164, 0.0004600435495376587, 0.0004918277263641357, 0.0005236119031906128, 0.0005553960800170898, 0.0005871802568435669, 0.0006189644336700439, 0.000650748610496521, 0.000682532787322998, 0.0007143169641494751, 0.0007461011409759521, 0.0007778853178024292, 0.0008096694946289062]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 1.0, 7.0, 13.0, 11.0, 29.0, 37.0, 56.0, 129.0, 229.0, 573.0, 1600.0, 6879.0, 257915.0, 766649.0, 11132.0, 2038.0, 678.0, 289.0, 123.0, 60.0, 27.0, 18.0, 16.0, 13.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -13.0850830078125, -12.701416015625, -12.3177490234375, -11.93408203125, -11.5504150390625, -11.166748046875, -10.7830810546875, -10.3994140625, -10.0157470703125, -9.632080078125, -9.2484130859375, -8.86474609375, -8.4810791015625, -8.097412109375, -7.7137451171875, -7.330078125, -6.9464111328125, -6.562744140625, -6.1790771484375, -5.79541015625, -5.4117431640625, -5.028076171875, -4.6444091796875, -4.2607421875, -3.8770751953125, -3.493408203125, -3.1097412109375, -2.72607421875, -2.3424072265625, -1.958740234375, -1.5750732421875, -1.19140625, -0.8077392578125, -0.424072265625, -0.0404052734375, 0.34326171875, 0.7269287109375, 1.110595703125, 1.4942626953125, 1.8779296875, 2.2615966796875, 2.645263671875, 3.0289306640625, 3.41259765625, 3.7962646484375, 4.179931640625, 4.5635986328125, 4.947265625, 5.3309326171875, 5.714599609375, 6.0982666015625, 6.48193359375, 6.8656005859375, 7.249267578125, 7.6329345703125, 8.0166015625, 8.4002685546875, 8.783935546875, 9.1676025390625, 9.55126953125, 9.9349365234375, 10.318603515625, 10.7022705078125, 11.0859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 9.0, 11.0, 19.0, 25.0, 55.0, 79.0, 144.0, 167.0, 178.0, 106.0, 74.0, 52.0, 31.0, 14.0, 17.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0078125, -12.68951416015625, -12.3712158203125, -12.05291748046875, -11.734619140625, -11.41632080078125, -11.0980224609375, -10.77972412109375, -10.46142578125, -10.14312744140625, -9.8248291015625, -9.50653076171875, -9.188232421875, -8.86993408203125, -8.5516357421875, -8.23333740234375, -7.9150390625, -7.59674072265625, -7.2784423828125, -6.96014404296875, -6.641845703125, -6.32354736328125, -6.0052490234375, -5.68695068359375, -5.36865234375, -5.05035400390625, -4.7320556640625, -4.41375732421875, -4.095458984375, -3.77716064453125, -3.4588623046875, -3.14056396484375, -2.822265625, -2.50396728515625, -2.1856689453125, -1.86737060546875, -1.549072265625, -1.23077392578125, -0.9124755859375, -0.59417724609375, -0.27587890625, 0.04241943359375, 0.3607177734375, 0.67901611328125, 0.997314453125, 1.31561279296875, 1.6339111328125, 1.95220947265625, 2.2705078125, 2.58880615234375, 2.9071044921875, 3.22540283203125, 3.543701171875, 3.86199951171875, 4.1802978515625, 4.49859619140625, 4.81689453125, 5.13519287109375, 5.4534912109375, 5.77178955078125, 6.090087890625, 6.40838623046875, 6.7266845703125, 7.04498291015625, 7.36328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 19.0, 48.0, 143.0, 253.0, 291.0, 147.0, 50.0, 24.0, 19.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-259.5124816894531, -252.51522827148438, -245.51795959472656, -238.5207061767578, -231.5234375, -224.52618408203125, -217.52891540527344, -210.5316619873047, -203.53439331054688, -196.53713989257812, -189.5398712158203, -182.54261779785156, -175.54534912109375, -168.548095703125, -161.5508270263672, -154.55357360839844, -147.55630493164062, -140.55905151367188, -133.56178283691406, -126.56452178955078, -119.5672607421875, -112.57000732421875, -105.57273864746094, -98.57548522949219, -91.57823181152344, -84.58097076416016, -77.58370971679688, -70.5864486694336, -63.58918762207031, -56.5919303894043, -49.594669342041016, -42.597408294677734, -35.60014343261719, -28.602882385253906, -21.605621337890625, -14.608362197875977, -7.611101150512695, -0.6138420104980469, 6.383419036865234, 13.380680084228516, 20.377941131591797, 27.375202178955078, 34.37246322631836, 41.369720458984375, 48.366981506347656, 55.36424255371094, 62.36150360107422, 69.3587646484375, 76.35602569580078, 83.35328674316406, 90.35054779052734, 97.34780883789062, 104.3450698852539, 111.34233093261719, 118.33958435058594, 125.33685302734375, 132.3341064453125, 139.33135986328125, 146.32862854003906, 153.3258819580078, 160.32315063476562, 167.32040405273438, 174.3176727294922, 181.31492614746094, 188.31219482421875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 9.0, 6.0, 7.0, 8.0, 17.0, 16.0, 14.0, 23.0, 17.0, 28.0, 21.0, 36.0, 41.0, 42.0, 40.0, 39.0, 56.0, 52.0, 48.0, 50.0, 46.0, 33.0, 43.0, 45.0, 40.0, 28.0, 27.0, 34.0, 23.0, 17.0, 14.0, 17.0, 12.0, 11.0, 10.0, 6.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.19905090332031, -72.2464828491211, -69.29390716552734, -66.34133911132812, -63.388763427734375, -60.43619155883789, -57.483619689941406, -54.53105163574219, -51.57847595214844, -48.62590408325195, -45.67333221435547, -42.720760345458984, -39.7681884765625, -36.815616607666016, -33.86304473876953, -30.91047477722168, -27.957904815673828, -25.005332946777344, -22.05276107788086, -19.100189208984375, -16.14761734008789, -13.195046424865723, -10.242475509643555, -7.28990364074707, -4.337331771850586, -1.3847601413726807, 1.5678114891052246, 4.520382881164551, 7.472954750061035, 10.42552661895752, 13.378097534179688, 16.330669403076172, 19.283241271972656, 22.23581314086914, 25.188385009765625, 28.14095687866211, 31.093528747558594, 34.04610061645508, 36.99867248535156, 39.95124053955078, 42.90381622314453, 45.856388092041016, 48.8089599609375, 51.761531829833984, 54.71410369873047, 57.66667556762695, 60.61924743652344, 63.571815490722656, 66.52438354492188, 69.4769515991211, 72.42952728271484, 75.38209533691406, 78.33467102050781, 81.28723907470703, 84.23981475830078, 87.1923828125, 90.14495849609375, 93.09752655029297, 96.05010223388672, 99.00267028808594, 101.95524597167969, 104.9078140258789, 107.86038970947266, 110.81295776367188, 113.76553344726562]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [7.0, 4.0, 15.0, 15.0, 34.0, 57.0, 93.0, 224.0, 623.0, 2070.0, 7899.0, 44953.0, 3694564.0, 420224.0, 17436.0, 3725.0, 1194.0, 485.0, 234.0, 122.0, 90.0, 56.0, 42.0, 28.0, 17.0, 15.0, 14.0, 13.0, 12.0, 2.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.62109375, -6.10406494140625, -5.5870361328125, -5.07000732421875, -4.552978515625, -4.03594970703125, -3.5189208984375, -3.00189208984375, -2.48486328125, -1.96783447265625, -1.4508056640625, -0.93377685546875, -0.416748046875, 0.10028076171875, 0.6173095703125, 1.13433837890625, 1.6513671875, 2.16839599609375, 2.6854248046875, 3.20245361328125, 3.719482421875, 4.23651123046875, 4.7535400390625, 5.27056884765625, 5.78759765625, 6.30462646484375, 6.8216552734375, 7.33868408203125, 7.855712890625, 8.37274169921875, 8.8897705078125, 9.40679931640625, 9.923828125, 10.44085693359375, 10.9578857421875, 11.47491455078125, 11.991943359375, 12.50897216796875, 13.0260009765625, 13.54302978515625, 14.06005859375, 14.57708740234375, 15.0941162109375, 15.61114501953125, 16.128173828125, 16.64520263671875, 17.1622314453125, 17.67926025390625, 18.1962890625, 18.71331787109375, 19.2303466796875, 19.74737548828125, 20.264404296875, 20.78143310546875, 21.2984619140625, 21.81549072265625, 22.33251953125, 22.84954833984375, 23.3665771484375, 23.88360595703125, 24.400634765625, 24.91766357421875, 25.4346923828125, 25.95172119140625, 26.46875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 20.0, 41.0, 58.0, 94.0, 144.0, 124.0, 142.0, 107.0, 93.0, 67.0, 44.0, 28.0, 13.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.685546875, -3.35546875, -3.025390625, -2.6953125, -2.365234375, -2.03515625, -1.705078125, -1.375, -1.044921875, -0.71484375, -0.384765625, -0.0546875, 0.275390625, 0.60546875, 0.935546875, 1.265625, 1.595703125, 1.92578125, 2.255859375, 2.5859375, 2.916015625, 3.24609375, 3.576171875, 3.90625, 4.236328125, 4.56640625, 4.896484375, 5.2265625, 5.556640625, 5.88671875, 6.216796875, 6.546875, 6.876953125, 7.20703125, 7.537109375, 7.8671875, 8.197265625, 8.52734375, 8.857421875, 9.1875, 9.517578125, 9.84765625, 10.177734375, 10.5078125, 10.837890625, 11.16796875, 11.498046875, 11.828125, 12.158203125, 12.48828125, 12.818359375, 13.1484375, 13.478515625, 13.80859375, 14.138671875, 14.46875, 14.798828125, 15.12890625, 15.458984375, 15.7890625, 16.119140625, 16.44921875, 16.779296875, 17.109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 10.0, 14.0, 19.0, 35.0, 54.0, 90.0, 182.0, 285.0, 527.0, 936.0, 2191.0, 6996.0, 34216.0, 891034.0, 3194572.0, 48969.0, 8908.0, 2772.0, 1096.0, 585.0, 299.0, 170.0, 117.0, 68.0, 45.0, 28.0, 14.0, 10.0, 8.0, 9.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7890625, -15.2269287109375, -14.664794921875, -14.1026611328125, -13.54052734375, -12.9783935546875, -12.416259765625, -11.8541259765625, -11.2919921875, -10.7298583984375, -10.167724609375, -9.6055908203125, -9.04345703125, -8.4813232421875, -7.919189453125, -7.3570556640625, -6.794921875, -6.2327880859375, -5.670654296875, -5.1085205078125, -4.54638671875, -3.9842529296875, -3.422119140625, -2.8599853515625, -2.2978515625, -1.7357177734375, -1.173583984375, -0.6114501953125, -0.04931640625, 0.5128173828125, 1.074951171875, 1.6370849609375, 2.19921875, 2.7613525390625, 3.323486328125, 3.8856201171875, 4.44775390625, 5.0098876953125, 5.572021484375, 6.1341552734375, 6.6962890625, 7.2584228515625, 7.820556640625, 8.3826904296875, 8.94482421875, 9.5069580078125, 10.069091796875, 10.6312255859375, 11.193359375, 11.7554931640625, 12.317626953125, 12.8797607421875, 13.44189453125, 14.0040283203125, 14.566162109375, 15.1282958984375, 15.6904296875, 16.2525634765625, 16.814697265625, 17.3768310546875, 17.93896484375, 18.5010986328125, 19.063232421875, 19.6253662109375, 20.1875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 11.0, 18.0, 32.0, 54.0, 127.0, 366.0, 1956.0, 1107.0, 195.0, 89.0, 38.0, 24.0, 16.0, 15.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.21875, -27.357177734375, -26.49560546875, -25.634033203125, -24.7724609375, -23.910888671875, -23.04931640625, -22.187744140625, -21.326171875, -20.464599609375, -19.60302734375, -18.741455078125, -17.8798828125, -17.018310546875, -16.15673828125, -15.295166015625, -14.43359375, -13.572021484375, -12.71044921875, -11.848876953125, -10.9873046875, -10.125732421875, -9.26416015625, -8.402587890625, -7.541015625, -6.679443359375, -5.81787109375, -4.956298828125, -4.0947265625, -3.233154296875, -2.37158203125, -1.510009765625, -0.6484375, 0.213134765625, 1.07470703125, 1.936279296875, 2.7978515625, 3.659423828125, 4.52099609375, 5.382568359375, 6.244140625, 7.105712890625, 7.96728515625, 8.828857421875, 9.6904296875, 10.552001953125, 11.41357421875, 12.275146484375, 13.13671875, 13.998291015625, 14.85986328125, 15.721435546875, 16.5830078125, 17.444580078125, 18.30615234375, 19.167724609375, 20.029296875, 20.890869140625, 21.75244140625, 22.614013671875, 23.4755859375, 24.337158203125, 25.19873046875, 26.060302734375, 26.921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 0.0, 14.0, 25.0, 55.0, 188.0, 336.0, 237.0, 75.0, 40.0, 9.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.71772766113281, -97.83055877685547, -91.9433822631836, -86.05621337890625, -80.16903686523438, -74.28186798095703, -68.39469909667969, -62.50752639770508, -56.62035369873047, -50.73318099975586, -44.84600830078125, -38.958839416503906, -33.0716667175293, -27.184494018554688, -21.297325134277344, -15.410152435302734, -9.522979736328125, -3.635807991027832, 2.251363754272461, 8.138534545898438, 14.025707244873047, 19.912879943847656, 25.800048828125, 31.68722152709961, 37.57439422607422, 43.46156692504883, 49.34873962402344, 55.23590850830078, 61.12308120727539, 67.01025390625, 72.89742279052734, 78.78459167480469, 84.6717529296875, 90.55892181396484, 96.44609832763672, 102.33326721191406, 108.22044372558594, 114.10761260986328, 119.99478149414062, 125.8819580078125, 131.76913452148438, 137.65631103515625, 143.54347229003906, 149.43064880371094, 155.3178253173828, 161.20498657226562, 167.0921630859375, 172.97933959960938, 178.8665008544922, 184.75367736816406, 190.64083862304688, 196.52801513671875, 202.41519165039062, 208.3023681640625, 214.1895294189453, 220.0767059326172, 225.9638671875, 231.85104370117188, 237.7382049560547, 243.62538146972656, 249.51255798339844, 255.39971923828125, 261.2868957519531, 267.174072265625, 273.0612487792969]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 14.0, 26.0, 30.0, 31.0, 37.0, 58.0, 44.0, 73.0, 69.0, 59.0, 79.0, 67.0, 62.0, 69.0, 45.0, 49.0, 42.0, 31.0, 23.0, 29.0, 19.0, 10.0, 5.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.94523620605469, -106.09077453613281, -103.2363052368164, -100.38184356689453, -97.52737426757812, -94.67291259765625, -91.81845092773438, -88.9639892578125, -86.1095199584961, -83.25505828857422, -80.40058898925781, -77.54612731933594, -74.69166564941406, -71.83719635009766, -68.98273468017578, -66.12826538085938, -63.2738037109375, -60.41933822631836, -57.56487274169922, -54.710411071777344, -51.8559455871582, -49.00148010253906, -46.14701843261719, -43.29255294799805, -40.438087463378906, -37.583621978759766, -34.729156494140625, -31.87469482421875, -29.02022933959961, -26.16576385498047, -23.31130027770996, -20.456836700439453, -17.60236358642578, -14.747899055480957, -11.893434524536133, -9.038969993591309, -6.184505462646484, -3.33004093170166, -0.47557640075683594, 2.378887176513672, 5.2333526611328125, 8.087817192077637, 10.942281723022461, 13.796746253967285, 16.65121078491211, 19.50567626953125, 22.360139846801758, 25.214603424072266, 28.069068908691406, 30.923534393310547, 33.77799987792969, 36.63246154785156, 39.4869270324707, 42.341392517089844, 45.19585418701172, 48.05031967163086, 50.90478515625, 53.75925064086914, 56.61371612548828, 59.468177795410156, 62.3226432800293, 65.17710876464844, 68.03157043457031, 70.88603210449219, 73.7405014038086]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 12.0, 21.0, 31.0, 34.0, 68.0, 117.0, 173.0, 370.0, 698.0, 1394.0, 3005.0, 6876.0, 17739.0, 53831.0, 206973.0, 513674.0, 170650.0, 45721.0, 15606.0, 6228.0, 2693.0, 1232.0, 605.0, 328.0, 188.0, 108.0, 45.0, 32.0, 31.0, 14.0, 11.0, 10.0, 1.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.1171875, -9.8145751953125, -9.511962890625, -9.2093505859375, -8.90673828125, -8.6041259765625, -8.301513671875, -7.9989013671875, -7.6962890625, -7.3936767578125, -7.091064453125, -6.7884521484375, -6.48583984375, -6.1832275390625, -5.880615234375, -5.5780029296875, -5.275390625, -4.9727783203125, -4.670166015625, -4.3675537109375, -4.06494140625, -3.7623291015625, -3.459716796875, -3.1571044921875, -2.8544921875, -2.5518798828125, -2.249267578125, -1.9466552734375, -1.64404296875, -1.3414306640625, -1.038818359375, -0.7362060546875, -0.43359375, -0.1309814453125, 0.171630859375, 0.4742431640625, 0.77685546875, 1.0794677734375, 1.382080078125, 1.6846923828125, 1.9873046875, 2.2899169921875, 2.592529296875, 2.8951416015625, 3.19775390625, 3.5003662109375, 3.802978515625, 4.1055908203125, 4.408203125, 4.7108154296875, 5.013427734375, 5.3160400390625, 5.61865234375, 5.9212646484375, 6.223876953125, 6.5264892578125, 6.8291015625, 7.1317138671875, 7.434326171875, 7.7369384765625, 8.03955078125, 8.3421630859375, 8.644775390625, 8.9473876953125, 9.25]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 9.0, 14.0, 20.0, 16.0, 31.0, 32.0, 53.0, 70.0, 61.0, 66.0, 70.0, 81.0, 79.0, 72.0, 61.0, 66.0, 52.0, 42.0, 24.0, 21.0, 19.0, 16.0, 8.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.84393310546875, -3.6370849609375, -3.43023681640625, -3.223388671875, -3.01654052734375, -2.8096923828125, -2.60284423828125, -2.39599609375, -2.18914794921875, -1.9822998046875, -1.77545166015625, -1.568603515625, -1.36175537109375, -1.1549072265625, -0.94805908203125, -0.7412109375, -0.53436279296875, -0.3275146484375, -0.12066650390625, 0.086181640625, 0.29302978515625, 0.4998779296875, 0.70672607421875, 0.91357421875, 1.12042236328125, 1.3272705078125, 1.53411865234375, 1.740966796875, 1.94781494140625, 2.1546630859375, 2.36151123046875, 2.568359375, 2.77520751953125, 2.9820556640625, 3.18890380859375, 3.395751953125, 3.60260009765625, 3.8094482421875, 4.01629638671875, 4.22314453125, 4.42999267578125, 4.6368408203125, 4.84368896484375, 5.050537109375, 5.25738525390625, 5.4642333984375, 5.67108154296875, 5.8779296875, 6.08477783203125, 6.2916259765625, 6.49847412109375, 6.705322265625, 6.91217041015625, 7.1190185546875, 7.32586669921875, 7.53271484375, 7.73956298828125, 7.9464111328125, 8.15325927734375, 8.360107421875, 8.56695556640625, 8.7738037109375, 8.98065185546875, 9.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 6.0, 8.0, 8.0, 23.0, 30.0, 46.0, 102.0, 164.0, 305.0, 697.0, 1758.0, 6293.0, 66886.0, 904431.0, 58725.0, 6067.0, 1690.0, 644.0, 306.0, 143.0, 75.0, 57.0, 30.0, 14.0, 12.0, 7.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.087158203125, -17.15869140625, -16.230224609375, -15.3017578125, -14.373291015625, -13.44482421875, -12.516357421875, -11.587890625, -10.659423828125, -9.73095703125, -8.802490234375, -7.8740234375, -6.945556640625, -6.01708984375, -5.088623046875, -4.16015625, -3.231689453125, -2.30322265625, -1.374755859375, -0.4462890625, 0.482177734375, 1.41064453125, 2.339111328125, 3.267578125, 4.196044921875, 5.12451171875, 6.052978515625, 6.9814453125, 7.909912109375, 8.83837890625, 9.766845703125, 10.6953125, 11.623779296875, 12.55224609375, 13.480712890625, 14.4091796875, 15.337646484375, 16.26611328125, 17.194580078125, 18.123046875, 19.051513671875, 19.97998046875, 20.908447265625, 21.8369140625, 22.765380859375, 23.69384765625, 24.622314453125, 25.55078125, 26.479248046875, 27.40771484375, 28.336181640625, 29.2646484375, 30.193115234375, 31.12158203125, 32.050048828125, 32.978515625, 33.906982421875, 34.83544921875, 35.763916015625, 36.6923828125, 37.620849609375, 38.54931640625, 39.477783203125, 40.40625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 11.0, 7.0, 13.0, 15.0, 19.0, 24.0, 28.0, 21.0, 42.0, 56.0, 54.0, 56.0, 63.0, 67.0, 48.0, 59.0, 54.0, 52.0, 51.0, 49.0, 48.0, 44.0, 26.0, 24.0, 21.0, 14.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.421875, -18.5, -17.578125, -16.65625, -15.734375, -14.8125, -13.890625, -12.96875, -12.046875, -11.125, -10.203125, -9.28125, -8.359375, -7.4375, -6.515625, -5.59375, -4.671875, -3.75, -2.828125, -1.90625, -0.984375, -0.0625, 0.859375, 1.78125, 2.703125, 3.625, 4.546875, 5.46875, 6.390625, 7.3125, 8.234375, 9.15625, 10.078125, 11.0, 11.921875, 12.84375, 13.765625, 14.6875, 15.609375, 16.53125, 17.453125, 18.375, 19.296875, 20.21875, 21.140625, 22.0625, 22.984375, 23.90625, 24.828125, 25.75, 26.671875, 27.59375, 28.515625, 29.4375, 30.359375, 31.28125, 32.203125, 33.125, 34.046875, 34.96875, 35.890625, 36.8125, 37.734375, 38.65625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 6.0, 2.0, 6.0, 8.0, 10.0, 16.0, 32.0, 49.0, 97.0, 205.0, 535.0, 1794.0, 13450.0, 726464.0, 295227.0, 8392.0, 1454.0, 438.0, 176.0, 94.0, 34.0, 25.0, 20.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -11.0657958984375, -10.748779296875, -10.4317626953125, -10.11474609375, -9.7977294921875, -9.480712890625, -9.1636962890625, -8.8466796875, -8.5296630859375, -8.212646484375, -7.8956298828125, -7.57861328125, -7.2615966796875, -6.944580078125, -6.6275634765625, -6.310546875, -5.9935302734375, -5.676513671875, -5.3594970703125, -5.04248046875, -4.7254638671875, -4.408447265625, -4.0914306640625, -3.7744140625, -3.4573974609375, -3.140380859375, -2.8233642578125, -2.50634765625, -2.1893310546875, -1.872314453125, -1.5552978515625, -1.23828125, -0.9212646484375, -0.604248046875, -0.2872314453125, 0.02978515625, 0.3468017578125, 0.663818359375, 0.9808349609375, 1.2978515625, 1.6148681640625, 1.931884765625, 2.2489013671875, 2.56591796875, 2.8829345703125, 3.199951171875, 3.5169677734375, 3.833984375, 4.1510009765625, 4.468017578125, 4.7850341796875, 5.10205078125, 5.4190673828125, 5.736083984375, 6.0531005859375, 6.3701171875, 6.6871337890625, 7.004150390625, 7.3211669921875, 7.63818359375, 7.9552001953125, 8.272216796875, 8.5892333984375, 8.90625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 8.0, 11.0, 26.0, 32.0, 45.0, 77.0, 131.0, 157.0, 138.0, 107.0, 96.0, 61.0, 31.0, 22.0, 17.0, 7.0, 5.0, 2.0, 5.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.001743316650390625, -0.0017027705907821655, -0.001662224531173706, -0.0016216784715652466, -0.0015811324119567871, -0.0015405863523483276, -0.0015000402927398682, -0.0014594942331314087, -0.0014189481735229492, -0.0013784021139144897, -0.0013378560543060303, -0.0012973099946975708, -0.0012567639350891113, -0.0012162178754806519, -0.0011756718158721924, -0.001135125756263733, -0.0010945796966552734, -0.001054033637046814, -0.0010134875774383545, -0.000972941517829895, -0.0009323954582214355, -0.0008918493986129761, -0.0008513033390045166, -0.0008107572793960571, -0.0007702112197875977, -0.0007296651601791382, -0.0006891191005706787, -0.0006485730409622192, -0.0006080269813537598, -0.0005674809217453003, -0.0005269348621368408, -0.00048638880252838135, -0.0004458427429199219, -0.0004052966833114624, -0.00036475062370300293, -0.00032420456409454346, -0.000283658504486084, -0.0002431124448776245, -0.00020256638526916504, -0.00016202032566070557, -0.0001214742660522461, -8.092820644378662e-05, -4.038214683532715e-05, 1.6391277313232422e-07, 4.07099723815918e-05, 8.125603199005127e-05, 0.00012180209159851074, 0.00016234815120697021, 0.0002028942108154297, 0.00024344027042388916, 0.00028398633003234863, 0.0003245323896408081, 0.0003650784492492676, 0.00040562450885772705, 0.0004461705684661865, 0.000486716628074646, 0.0005272626876831055, 0.0005678087472915649, 0.0006083548069000244, 0.0006489008665084839, 0.0006894469261169434, 0.0007299929857254028, 0.0007705390453338623, 0.0008110851049423218, 0.0008516311645507812]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 8.0, 19.0, 26.0, 50.0, 110.0, 153.0, 335.0, 820.0, 2399.0, 11988.0, 249852.0, 752414.0, 24594.0, 3760.0, 1109.0, 433.0, 209.0, 101.0, 58.0, 32.0, 30.0, 14.0, 11.0, 6.0, 4.0, 2.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.5703125, -10.319580078125, -10.06884765625, -9.818115234375, -9.5673828125, -9.316650390625, -9.06591796875, -8.815185546875, -8.564453125, -8.313720703125, -8.06298828125, -7.812255859375, -7.5615234375, -7.310791015625, -7.06005859375, -6.809326171875, -6.55859375, -6.307861328125, -6.05712890625, -5.806396484375, -5.5556640625, -5.304931640625, -5.05419921875, -4.803466796875, -4.552734375, -4.302001953125, -4.05126953125, -3.800537109375, -3.5498046875, -3.299072265625, -3.04833984375, -2.797607421875, -2.546875, -2.296142578125, -2.04541015625, -1.794677734375, -1.5439453125, -1.293212890625, -1.04248046875, -0.791748046875, -0.541015625, -0.290283203125, -0.03955078125, 0.211181640625, 0.4619140625, 0.712646484375, 0.96337890625, 1.214111328125, 1.46484375, 1.715576171875, 1.96630859375, 2.217041015625, 2.4677734375, 2.718505859375, 2.96923828125, 3.219970703125, 3.470703125, 3.721435546875, 3.97216796875, 4.222900390625, 4.4736328125, 4.724365234375, 4.97509765625, 5.225830078125, 5.4765625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 12.0, 9.0, 12.0, 26.0, 36.0, 48.0, 64.0, 73.0, 79.0, 87.0, 92.0, 73.0, 98.0, 57.0, 56.0, 46.0, 36.0, 26.0, 20.0, 9.0, 9.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.796875, -6.6165771484375, -6.436279296875, -6.2559814453125, -6.07568359375, -5.8953857421875, -5.715087890625, -5.5347900390625, -5.3544921875, -5.1741943359375, -4.993896484375, -4.8135986328125, -4.63330078125, -4.4530029296875, -4.272705078125, -4.0924072265625, -3.912109375, -3.7318115234375, -3.551513671875, -3.3712158203125, -3.19091796875, -3.0106201171875, -2.830322265625, -2.6500244140625, -2.4697265625, -2.2894287109375, -2.109130859375, -1.9288330078125, -1.74853515625, -1.5682373046875, -1.387939453125, -1.2076416015625, -1.02734375, -0.8470458984375, -0.666748046875, -0.4864501953125, -0.30615234375, -0.1258544921875, 0.054443359375, 0.2347412109375, 0.4150390625, 0.5953369140625, 0.775634765625, 0.9559326171875, 1.13623046875, 1.3165283203125, 1.496826171875, 1.6771240234375, 1.857421875, 2.0377197265625, 2.218017578125, 2.3983154296875, 2.57861328125, 2.7589111328125, 2.939208984375, 3.1195068359375, 3.2998046875, 3.4801025390625, 3.660400390625, 3.8406982421875, 4.02099609375, 4.2012939453125, 4.381591796875, 4.5618896484375, 4.7421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 18.0, 37.0, 73.0, 177.0, 304.0, 206.0, 107.0, 43.0, 11.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.10186767578125, -187.68148803710938, -182.2611083984375, -176.84071350097656, -171.4203338623047, -165.9999542236328, -160.57955932617188, -155.1591796875, -149.73880004882812, -144.31842041015625, -138.89804077148438, -133.47764587402344, -128.05726623535156, -122.63688659667969, -117.21649932861328, -111.79611206054688, -106.375732421875, -100.95535278320312, -95.53496551513672, -90.11457824707031, -84.69419860839844, -79.27381896972656, -73.85343170166016, -68.43304443359375, -63.012664794921875, -57.592281341552734, -52.171897888183594, -46.75151443481445, -41.33113098144531, -35.91074752807617, -30.49036407470703, -25.06998062133789, -19.649581909179688, -14.229198455810547, -8.808815002441406, -3.3884315490722656, 2.031951904296875, 7.452335357666016, 12.872718811035156, 18.293102264404297, 23.713485717773438, 29.133869171142578, 34.55425262451172, 39.97463607788086, 45.39501953125, 50.81540298461914, 56.23578643798828, 61.65616989135742, 67.07655334472656, 72.49693298339844, 77.91732025146484, 83.33770751953125, 88.75808715820312, 94.178466796875, 99.5988540649414, 105.01924133300781, 110.43962097167969, 115.86000061035156, 121.28038787841797, 126.70077514648438, 132.12115478515625, 137.54153442382812, 142.9619140625, 148.38230895996094, 153.8026885986328]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 7.0, 11.0, 17.0, 16.0, 17.0, 23.0, 39.0, 50.0, 58.0, 68.0, 69.0, 95.0, 89.0, 94.0, 74.0, 48.0, 45.0, 49.0, 38.0, 31.0, 17.0, 17.0, 9.0, 4.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.9462432861328, -128.81309509277344, -124.6799545288086, -120.54681396484375, -116.41366577148438, -112.280517578125, -108.14737701416016, -104.01423645019531, -99.88108825683594, -95.74794006347656, -91.61479949951172, -87.48165893554688, -83.3485107421875, -79.21536254882812, -75.08222198486328, -70.94908142089844, -66.81593322753906, -62.68278884887695, -58.549644470214844, -54.416500091552734, -50.283355712890625, -46.150211334228516, -42.017066955566406, -37.8839225769043, -33.75077819824219, -29.617633819580078, -25.48448944091797, -21.35134506225586, -17.21820068359375, -13.08505630493164, -8.951911926269531, -4.818767547607422, -0.68560791015625, 3.4475364685058594, 7.580680847167969, 11.713825225830078, 15.846969604492188, 19.980113983154297, 24.113258361816406, 28.246402740478516, 32.379547119140625, 36.512691497802734, 40.645835876464844, 44.77898025512695, 48.91212463378906, 53.04526901245117, 57.17841339111328, 61.31155776977539, 65.4447021484375, 69.57785034179688, 73.71099090576172, 77.84413146972656, 81.97727966308594, 86.11042785644531, 90.24356842041016, 94.376708984375, 98.50985717773438, 102.64300537109375, 106.7761459350586, 110.90928649902344, 115.04243469238281, 119.17558288574219, 123.30872344970703, 127.44186401367188, 131.57501220703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 5.0, 7.0, 12.0, 22.0, 27.0, 51.0, 99.0, 225.0, 1649.0, 24038.0, 4153420.0, 13030.0, 1049.0, 298.0, 129.0, 79.0, 50.0, 28.0, 21.0, 14.0, 14.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.203125, -29.813232421875, -28.42333984375, -27.033447265625, -25.6435546875, -24.253662109375, -22.86376953125, -21.473876953125, -20.083984375, -18.694091796875, -17.30419921875, -15.914306640625, -14.5244140625, -13.134521484375, -11.74462890625, -10.354736328125, -8.96484375, -7.574951171875, -6.18505859375, -4.795166015625, -3.4052734375, -2.015380859375, -0.62548828125, 0.764404296875, 2.154296875, 3.544189453125, 4.93408203125, 6.323974609375, 7.7138671875, 9.103759765625, 10.49365234375, 11.883544921875, 13.2734375, 14.663330078125, 16.05322265625, 17.443115234375, 18.8330078125, 20.222900390625, 21.61279296875, 23.002685546875, 24.392578125, 25.782470703125, 27.17236328125, 28.562255859375, 29.9521484375, 31.342041015625, 32.73193359375, 34.121826171875, 35.51171875, 36.901611328125, 38.29150390625, 39.681396484375, 41.0712890625, 42.461181640625, 43.85107421875, 45.240966796875, 46.630859375, 48.020751953125, 49.41064453125, 50.800537109375, 52.1904296875, 53.580322265625, 54.97021484375, 56.360107421875, 57.75]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 21.0, 30.0, 81.0, 179.0, 218.0, 209.0, 149.0, 67.0, 26.0, 14.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.34375, -10.745849609375, -10.14794921875, -9.550048828125, -8.9521484375, -8.354248046875, -7.75634765625, -7.158447265625, -6.560546875, -5.962646484375, -5.36474609375, -4.766845703125, -4.1689453125, -3.571044921875, -2.97314453125, -2.375244140625, -1.77734375, -1.179443359375, -0.58154296875, 0.016357421875, 0.6142578125, 1.212158203125, 1.81005859375, 2.407958984375, 3.005859375, 3.603759765625, 4.20166015625, 4.799560546875, 5.3974609375, 5.995361328125, 6.59326171875, 7.191162109375, 7.7890625, 8.386962890625, 8.98486328125, 9.582763671875, 10.1806640625, 10.778564453125, 11.37646484375, 11.974365234375, 12.572265625, 13.170166015625, 13.76806640625, 14.365966796875, 14.9638671875, 15.561767578125, 16.15966796875, 16.757568359375, 17.35546875, 17.953369140625, 18.55126953125, 19.149169921875, 19.7470703125, 20.344970703125, 20.94287109375, 21.540771484375, 22.138671875, 22.736572265625, 23.33447265625, 23.932373046875, 24.5302734375, 25.128173828125, 25.72607421875, 26.323974609375, 26.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 5.0, 12.0, 15.0, 30.0, 51.0, 67.0, 131.0, 213.0, 399.0, 730.0, 1447.0, 2709.0, 6350.0, 17069.0, 63003.0, 1227004.0, 2763530.0, 79247.0, 18854.0, 6923.0, 3062.0, 1461.0, 791.0, 464.0, 293.0, 167.0, 99.0, 56.0, 41.0, 19.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-15.0703125, -14.652587890625, -14.23486328125, -13.817138671875, -13.3994140625, -12.981689453125, -12.56396484375, -12.146240234375, -11.728515625, -11.310791015625, -10.89306640625, -10.475341796875, -10.0576171875, -9.639892578125, -9.22216796875, -8.804443359375, -8.38671875, -7.968994140625, -7.55126953125, -7.133544921875, -6.7158203125, -6.298095703125, -5.88037109375, -5.462646484375, -5.044921875, -4.627197265625, -4.20947265625, -3.791748046875, -3.3740234375, -2.956298828125, -2.53857421875, -2.120849609375, -1.703125, -1.285400390625, -0.86767578125, -0.449951171875, -0.0322265625, 0.385498046875, 0.80322265625, 1.220947265625, 1.638671875, 2.056396484375, 2.47412109375, 2.891845703125, 3.3095703125, 3.727294921875, 4.14501953125, 4.562744140625, 4.98046875, 5.398193359375, 5.81591796875, 6.233642578125, 6.6513671875, 7.069091796875, 7.48681640625, 7.904541015625, 8.322265625, 8.739990234375, 9.15771484375, 9.575439453125, 9.9931640625, 10.410888671875, 10.82861328125, 11.246337890625, 11.6640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 8.0, 4.0, 7.0, 8.0, 9.0, 14.0, 30.0, 25.0, 47.0, 81.0, 141.0, 406.0, 1125.0, 1325.0, 462.0, 168.0, 69.0, 40.0, 19.0, 21.0, 18.0, 6.0, 10.0, 3.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.0625, -15.528076171875, -14.99365234375, -14.459228515625, -13.9248046875, -13.390380859375, -12.85595703125, -12.321533203125, -11.787109375, -11.252685546875, -10.71826171875, -10.183837890625, -9.6494140625, -9.114990234375, -8.58056640625, -8.046142578125, -7.51171875, -6.977294921875, -6.44287109375, -5.908447265625, -5.3740234375, -4.839599609375, -4.30517578125, -3.770751953125, -3.236328125, -2.701904296875, -2.16748046875, -1.633056640625, -1.0986328125, -0.564208984375, -0.02978515625, 0.504638671875, 1.0390625, 1.573486328125, 2.10791015625, 2.642333984375, 3.1767578125, 3.711181640625, 4.24560546875, 4.780029296875, 5.314453125, 5.848876953125, 6.38330078125, 6.917724609375, 7.4521484375, 7.986572265625, 8.52099609375, 9.055419921875, 9.58984375, 10.124267578125, 10.65869140625, 11.193115234375, 11.7275390625, 12.261962890625, 12.79638671875, 13.330810546875, 13.865234375, 14.399658203125, 14.93408203125, 15.468505859375, 16.0029296875, 16.537353515625, 17.07177734375, 17.606201171875, 18.140625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 10.0, 8.0, 18.0, 30.0, 87.0, 228.0, 301.0, 200.0, 65.0, 34.0, 13.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.2921600341797, -129.2277374267578, -124.16331481933594, -119.09888458251953, -114.03446197509766, -108.97003936767578, -103.90560913085938, -98.8411865234375, -93.77676391601562, -88.71234130859375, -83.64791870117188, -78.58348846435547, -73.5190658569336, -68.45464324951172, -63.39021682739258, -58.32579040527344, -53.26136779785156, -48.19694519042969, -43.13251876831055, -38.068092346191406, -33.00366973876953, -27.939245223999023, -22.874820709228516, -17.810394287109375, -12.7459716796875, -7.681547164916992, -2.6171226501464844, 2.4473018646240234, 7.511726379394531, 12.576150894165039, 17.640575408935547, 22.705001831054688, 27.769424438476562, 32.83384704589844, 37.89827346801758, 42.96269989013672, 48.027122497558594, 53.09154510498047, 58.15597152709961, 63.22039794921875, 68.28482055664062, 73.3492431640625, 78.41366577148438, 83.47809600830078, 88.54251861572266, 93.60694122314453, 98.67137145996094, 103.73579406738281, 108.80021667480469, 113.86463928222656, 118.92906188964844, 123.99349212646484, 129.05792236328125, 134.12234497070312, 139.186767578125, 144.25119018554688, 149.31561279296875, 154.38003540039062, 159.4444580078125, 164.50888061523438, 169.57330322265625, 174.6377410888672, 179.70216369628906, 184.76658630371094, 189.8310089111328]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 5.0, 5.0, 7.0, 12.0, 16.0, 14.0, 20.0, 27.0, 33.0, 35.0, 44.0, 51.0, 63.0, 58.0, 64.0, 76.0, 71.0, 43.0, 61.0, 40.0, 39.0, 42.0, 26.0, 44.0, 26.0, 22.0, 15.0, 10.0, 9.0, 4.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.16424560546875, -91.90087127685547, -89.63750457763672, -87.37413024902344, -85.11075592041016, -82.84738159179688, -80.58401489257812, -78.32064056396484, -76.05726623535156, -73.79389190673828, -71.53052520751953, -69.26715087890625, -67.00377655029297, -64.74040222167969, -62.47703552246094, -60.213661193847656, -57.950294494628906, -55.68692398071289, -53.42354965209961, -51.160179138183594, -48.89680480957031, -46.6334342956543, -44.37006378173828, -42.106689453125, -39.843318939208984, -37.57994842529297, -35.31657409667969, -33.05320358276367, -30.789831161499023, -28.526458740234375, -26.26308822631836, -23.99971580505371, -21.73633575439453, -19.472963333129883, -17.209590911865234, -14.946220397949219, -12.68284797668457, -10.419475555419922, -8.15610408782959, -5.892732620239258, -3.6293601989746094, -1.3659882545471191, 0.8973836898803711, 3.1607556343078613, 5.424127578735352, 7.6875, 9.950871467590332, 12.214242935180664, 14.477615356445312, 16.74098777770996, 19.00436019897461, 21.267730712890625, 23.531103134155273, 25.794475555419922, 28.057846069335938, 30.321218490600586, 32.584590911865234, 34.84796142578125, 37.11133575439453, 39.37470626831055, 41.63807678222656, 43.901451110839844, 46.16482162475586, 48.428192138671875, 50.691566467285156]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 8.0, 11.0, 22.0, 47.0, 57.0, 104.0, 237.0, 486.0, 1280.0, 3687.0, 13305.0, 71057.0, 604031.0, 304057.0, 37457.0, 8520.0, 2529.0, 878.0, 368.0, 167.0, 83.0, 57.0, 33.0, 25.0, 13.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.21875, -16.677734375, -16.13671875, -15.595703125, -15.0546875, -14.513671875, -13.97265625, -13.431640625, -12.890625, -12.349609375, -11.80859375, -11.267578125, -10.7265625, -10.185546875, -9.64453125, -9.103515625, -8.5625, -8.021484375, -7.48046875, -6.939453125, -6.3984375, -5.857421875, -5.31640625, -4.775390625, -4.234375, -3.693359375, -3.15234375, -2.611328125, -2.0703125, -1.529296875, -0.98828125, -0.447265625, 0.09375, 0.634765625, 1.17578125, 1.716796875, 2.2578125, 2.798828125, 3.33984375, 3.880859375, 4.421875, 4.962890625, 5.50390625, 6.044921875, 6.5859375, 7.126953125, 7.66796875, 8.208984375, 8.75, 9.291015625, 9.83203125, 10.373046875, 10.9140625, 11.455078125, 11.99609375, 12.537109375, 13.078125, 13.619140625, 14.16015625, 14.701171875, 15.2421875, 15.783203125, 16.32421875, 16.865234375, 17.40625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 11.0, 22.0, 30.0, 53.0, 69.0, 95.0, 123.0, 132.0, 131.0, 120.0, 93.0, 51.0, 31.0, 16.0, 11.0, 7.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.16650390625, -9.7705078125, -9.37451171875, -8.978515625, -8.58251953125, -8.1865234375, -7.79052734375, -7.39453125, -6.99853515625, -6.6025390625, -6.20654296875, -5.810546875, -5.41455078125, -5.0185546875, -4.62255859375, -4.2265625, -3.83056640625, -3.4345703125, -3.03857421875, -2.642578125, -2.24658203125, -1.8505859375, -1.45458984375, -1.05859375, -0.66259765625, -0.2666015625, 0.12939453125, 0.525390625, 0.92138671875, 1.3173828125, 1.71337890625, 2.109375, 2.50537109375, 2.9013671875, 3.29736328125, 3.693359375, 4.08935546875, 4.4853515625, 4.88134765625, 5.27734375, 5.67333984375, 6.0693359375, 6.46533203125, 6.861328125, 7.25732421875, 7.6533203125, 8.04931640625, 8.4453125, 8.84130859375, 9.2373046875, 9.63330078125, 10.029296875, 10.42529296875, 10.8212890625, 11.21728515625, 11.61328125, 12.00927734375, 12.4052734375, 12.80126953125, 13.197265625, 13.59326171875, 13.9892578125, 14.38525390625, 14.78125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 16.0, 15.0, 10.0, 20.0, 27.0, 40.0, 57.0, 94.0, 138.0, 181.0, 328.0, 697.0, 1427.0, 3534.0, 10663.0, 48096.0, 446985.0, 470061.0, 48506.0, 11016.0, 3526.0, 1442.0, 677.0, 361.0, 193.0, 126.0, 93.0, 53.0, 42.0, 25.0, 18.0, 15.0, 14.0, 8.0, 9.0, 5.0, 7.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.5, -17.939453125, -17.37890625, -16.818359375, -16.2578125, -15.697265625, -15.13671875, -14.576171875, -14.015625, -13.455078125, -12.89453125, -12.333984375, -11.7734375, -11.212890625, -10.65234375, -10.091796875, -9.53125, -8.970703125, -8.41015625, -7.849609375, -7.2890625, -6.728515625, -6.16796875, -5.607421875, -5.046875, -4.486328125, -3.92578125, -3.365234375, -2.8046875, -2.244140625, -1.68359375, -1.123046875, -0.5625, -0.001953125, 0.55859375, 1.119140625, 1.6796875, 2.240234375, 2.80078125, 3.361328125, 3.921875, 4.482421875, 5.04296875, 5.603515625, 6.1640625, 6.724609375, 7.28515625, 7.845703125, 8.40625, 8.966796875, 9.52734375, 10.087890625, 10.6484375, 11.208984375, 11.76953125, 12.330078125, 12.890625, 13.451171875, 14.01171875, 14.572265625, 15.1328125, 15.693359375, 16.25390625, 16.814453125, 17.375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 4.0, 11.0, 12.0, 9.0, 12.0, 14.0, 31.0, 25.0, 25.0, 46.0, 35.0, 43.0, 49.0, 64.0, 46.0, 60.0, 68.0, 55.0, 42.0, 51.0, 60.0, 44.0, 39.0, 19.0, 25.0, 15.0, 19.0, 9.0, 5.0, 10.0, 6.0, 8.0, 4.0, 1.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-26.984375, -26.20556640625, -25.4267578125, -24.64794921875, -23.869140625, -23.09033203125, -22.3115234375, -21.53271484375, -20.75390625, -19.97509765625, -19.1962890625, -18.41748046875, -17.638671875, -16.85986328125, -16.0810546875, -15.30224609375, -14.5234375, -13.74462890625, -12.9658203125, -12.18701171875, -11.408203125, -10.62939453125, -9.8505859375, -9.07177734375, -8.29296875, -7.51416015625, -6.7353515625, -5.95654296875, -5.177734375, -4.39892578125, -3.6201171875, -2.84130859375, -2.0625, -1.28369140625, -0.5048828125, 0.27392578125, 1.052734375, 1.83154296875, 2.6103515625, 3.38916015625, 4.16796875, 4.94677734375, 5.7255859375, 6.50439453125, 7.283203125, 8.06201171875, 8.8408203125, 9.61962890625, 10.3984375, 11.17724609375, 11.9560546875, 12.73486328125, 13.513671875, 14.29248046875, 15.0712890625, 15.85009765625, 16.62890625, 17.40771484375, 18.1865234375, 18.96533203125, 19.744140625, 20.52294921875, 21.3017578125, 22.08056640625, 22.859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 17.0, 15.0, 38.0, 60.0, 123.0, 364.0, 1623.0, 32545.0, 996255.0, 15786.0, 1193.0, 303.0, 111.0, 51.0, 27.0, 15.0, 11.0, 5.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -9.9263916015625, -9.282470703125, -8.6385498046875, -7.99462890625, -7.3507080078125, -6.706787109375, -6.0628662109375, -5.4189453125, -4.7750244140625, -4.131103515625, -3.4871826171875, -2.84326171875, -2.1993408203125, -1.555419921875, -0.9114990234375, -0.267578125, 0.3763427734375, 1.020263671875, 1.6641845703125, 2.30810546875, 2.9520263671875, 3.595947265625, 4.2398681640625, 4.8837890625, 5.5277099609375, 6.171630859375, 6.8155517578125, 7.45947265625, 8.1033935546875, 8.747314453125, 9.3912353515625, 10.03515625, 10.6790771484375, 11.322998046875, 11.9669189453125, 12.61083984375, 13.2547607421875, 13.898681640625, 14.5426025390625, 15.1865234375, 15.8304443359375, 16.474365234375, 17.1182861328125, 17.76220703125, 18.4061279296875, 19.050048828125, 19.6939697265625, 20.337890625, 20.9818115234375, 21.625732421875, 22.2696533203125, 22.91357421875, 23.5574951171875, 24.201416015625, 24.8453369140625, 25.4892578125, 26.1331787109375, 26.777099609375, 27.4210205078125, 28.06494140625, 28.7088623046875, 29.352783203125, 29.9967041015625, 30.640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 14.0, 21.0, 41.0, 59.0, 90.0, 154.0, 184.0, 161.0, 117.0, 54.0, 38.0, 25.0, 9.0, 12.0, 5.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00164031982421875, -0.0015763640403747559, -0.0015124082565307617, -0.0014484524726867676, -0.0013844966888427734, -0.0013205409049987793, -0.0012565851211547852, -0.001192629337310791, -0.0011286735534667969, -0.0010647177696228027, -0.0010007619857788086, -0.0009368062019348145, -0.0008728504180908203, -0.0008088946342468262, -0.000744938850402832, -0.0006809830665588379, -0.0006170272827148438, -0.0005530714988708496, -0.0004891157150268555, -0.00042515993118286133, -0.0003612041473388672, -0.00029724836349487305, -0.0002332925796508789, -0.00016933679580688477, -0.00010538101196289062, -4.1425228118896484e-05, 2.2530555725097656e-05, 8.64863395690918e-05, 0.00015044212341308594, 0.00021439790725708008, 0.0002783536911010742, 0.00034230947494506836, 0.0004062652587890625, 0.00047022104263305664, 0.0005341768264770508, 0.0005981326103210449, 0.0006620883941650391, 0.0007260441780090332, 0.0007899999618530273, 0.0008539557456970215, 0.0009179115295410156, 0.0009818673133850098, 0.001045823097229004, 0.001109778881072998, 0.0011737346649169922, 0.0012376904487609863, 0.0013016462326049805, 0.0013656020164489746, 0.0014295578002929688, 0.0014935135841369629, 0.001557469367980957, 0.0016214251518249512, 0.0016853809356689453, 0.0017493367195129395, 0.0018132925033569336, 0.0018772482872009277, 0.0019412040710449219, 0.002005159854888916, 0.00206911563873291, 0.0021330714225769043, 0.0021970272064208984, 0.0022609829902648926, 0.0023249387741088867, 0.002388894557952881, 0.002452850341796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 5.0, 7.0, 7.0, 15.0, 40.0, 48.0, 77.0, 153.0, 286.0, 628.0, 1660.0, 6576.0, 63253.0, 912395.0, 54407.0, 6091.0, 1681.0, 549.0, 283.0, 152.0, 92.0, 60.0, 28.0, 14.0, 16.0, 14.0, 7.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.640625, -12.3033447265625, -11.966064453125, -11.6287841796875, -11.29150390625, -10.9542236328125, -10.616943359375, -10.2796630859375, -9.9423828125, -9.6051025390625, -9.267822265625, -8.9305419921875, -8.59326171875, -8.2559814453125, -7.918701171875, -7.5814208984375, -7.244140625, -6.9068603515625, -6.569580078125, -6.2322998046875, -5.89501953125, -5.5577392578125, -5.220458984375, -4.8831787109375, -4.5458984375, -4.2086181640625, -3.871337890625, -3.5340576171875, -3.19677734375, -2.8594970703125, -2.522216796875, -2.1849365234375, -1.84765625, -1.5103759765625, -1.173095703125, -0.8358154296875, -0.49853515625, -0.1612548828125, 0.176025390625, 0.5133056640625, 0.8505859375, 1.1878662109375, 1.525146484375, 1.8624267578125, 2.19970703125, 2.5369873046875, 2.874267578125, 3.2115478515625, 3.548828125, 3.8861083984375, 4.223388671875, 4.5606689453125, 4.89794921875, 5.2352294921875, 5.572509765625, 5.9097900390625, 6.2470703125, 6.5843505859375, 6.921630859375, 7.2589111328125, 7.59619140625, 7.9334716796875, 8.270751953125, 8.6080322265625, 8.9453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 12.0, 20.0, 22.0, 39.0, 46.0, 69.0, 97.0, 132.0, 144.0, 105.0, 102.0, 60.0, 47.0, 34.0, 24.0, 13.0, 11.0, 6.0, 5.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.207275390625, -8.92236328125, -8.637451171875, -8.3525390625, -8.067626953125, -7.78271484375, -7.497802734375, -7.212890625, -6.927978515625, -6.64306640625, -6.358154296875, -6.0732421875, -5.788330078125, -5.50341796875, -5.218505859375, -4.93359375, -4.648681640625, -4.36376953125, -4.078857421875, -3.7939453125, -3.509033203125, -3.22412109375, -2.939208984375, -2.654296875, -2.369384765625, -2.08447265625, -1.799560546875, -1.5146484375, -1.229736328125, -0.94482421875, -0.659912109375, -0.375, -0.090087890625, 0.19482421875, 0.479736328125, 0.7646484375, 1.049560546875, 1.33447265625, 1.619384765625, 1.904296875, 2.189208984375, 2.47412109375, 2.759033203125, 3.0439453125, 3.328857421875, 3.61376953125, 3.898681640625, 4.18359375, 4.468505859375, 4.75341796875, 5.038330078125, 5.3232421875, 5.608154296875, 5.89306640625, 6.177978515625, 6.462890625, 6.747802734375, 7.03271484375, 7.317626953125, 7.6025390625, 7.887451171875, 8.17236328125, 8.457275390625, 8.7421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 8.0, 10.0, 10.0, 31.0, 36.0, 86.0, 132.0, 153.0, 165.0, 140.0, 85.0, 52.0, 23.0, 14.0, 20.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5088882446289, -80.17584228515625, -76.84280395507812, -73.50975799560547, -70.17671203613281, -66.84366607666016, -63.510623931884766, -60.177581787109375, -56.84453582763672, -53.51148986816406, -50.17844772338867, -46.84540557861328, -43.512359619140625, -40.17931365966797, -36.84627151489258, -33.51322937011719, -30.18018341064453, -26.847139358520508, -23.514095306396484, -20.18105125427246, -16.848007202148438, -13.514963150024414, -10.18191909790039, -6.848875045776367, -3.5158309936523438, -0.1827869415283203, 3.150257110595703, 6.483301162719727, 9.81634521484375, 13.149389266967773, 16.482433319091797, 19.81547737121582, 23.148529052734375, 26.4815731048584, 29.814617156982422, 33.14765930175781, 36.48070526123047, 39.813751220703125, 43.146793365478516, 46.479835510253906, 49.81288146972656, 53.14592742919922, 56.47896957397461, 59.81201171875, 63.145057678222656, 66.47810363769531, 69.81114196777344, 73.1441879272461, 76.47723388671875, 79.8102798461914, 83.14332580566406, 86.47636413574219, 89.80941009521484, 93.1424560546875, 96.47549438476562, 99.80854034423828, 103.14158630371094, 106.4746322631836, 109.80767822265625, 113.14071655273438, 116.47376251220703, 119.80680847167969, 123.13984680175781, 126.47289276123047, 129.80593872070312]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 2.0, 13.0, 8.0, 14.0, 13.0, 20.0, 33.0, 25.0, 32.0, 44.0, 41.0, 53.0, 64.0, 66.0, 73.0, 74.0, 64.0, 44.0, 38.0, 50.0, 33.0, 28.0, 33.0, 16.0, 31.0, 20.0, 16.0, 7.0, 13.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-124.32056427001953, -121.03448486328125, -117.74839782714844, -114.46231842041016, -111.17623138427734, -107.89015197753906, -104.60406494140625, -101.31798553466797, -98.03190612792969, -94.7458267211914, -91.4597396850586, -88.17366027832031, -84.8875732421875, -81.60149383544922, -78.31541442871094, -75.02932739257812, -71.74324035644531, -68.45716094970703, -65.17107391357422, -61.88499450683594, -58.598907470703125, -55.312828063964844, -52.0267448425293, -48.74066162109375, -45.4545783996582, -42.168495178222656, -38.88241195678711, -35.59632873535156, -32.31024932861328, -29.0241641998291, -25.738082885742188, -22.45199966430664, -19.165924072265625, -15.879840850830078, -12.593758583068848, -9.307676315307617, -6.02159309387207, -2.7355098724365234, 0.5505714416503906, 3.8366546630859375, 7.122737884521484, 10.408821105957031, 13.694903373718262, 16.980985641479492, 20.26706886291504, 23.553152084350586, 26.8392333984375, 30.125316619873047, 33.411399841308594, 36.69748306274414, 39.98356628417969, 43.26964569091797, 46.55573272705078, 49.84181213378906, 53.12789535522461, 56.413978576660156, 59.7000617980957, 62.98614501953125, 66.27222442626953, 69.55831146240234, 72.84439086914062, 76.13047790527344, 79.41655731201172, 82.70263671875, 85.98872375488281]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 6.0, 13.0, 17.0, 14.0, 39.0, 75.0, 112.0, 266.0, 805.0, 3278.0, 17399.0, 312760.0, 3693684.0, 149318.0, 12246.0, 2751.0, 941.0, 295.0, 100.0, 71.0, 37.0, 24.0, 11.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.6689453125, -13.259765625, -12.8505859375, -12.44140625, -12.0322265625, -11.623046875, -11.2138671875, -10.8046875, -10.3955078125, -9.986328125, -9.5771484375, -9.16796875, -8.7587890625, -8.349609375, -7.9404296875, -7.53125, -7.1220703125, -6.712890625, -6.3037109375, -5.89453125, -5.4853515625, -5.076171875, -4.6669921875, -4.2578125, -3.8486328125, -3.439453125, -3.0302734375, -2.62109375, -2.2119140625, -1.802734375, -1.3935546875, -0.984375, -0.5751953125, -0.166015625, 0.2431640625, 0.65234375, 1.0615234375, 1.470703125, 1.8798828125, 2.2890625, 2.6982421875, 3.107421875, 3.5166015625, 3.92578125, 4.3349609375, 4.744140625, 5.1533203125, 5.5625, 5.9716796875, 6.380859375, 6.7900390625, 7.19921875, 7.6083984375, 8.017578125, 8.4267578125, 8.8359375, 9.2451171875, 9.654296875, 10.0634765625, 10.47265625, 10.8818359375, 11.291015625, 11.7001953125, 12.109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 7.0, 20.0, 38.0, 49.0, 86.0, 113.0, 151.0, 146.0, 127.0, 102.0, 72.0, 43.0, 17.0, 15.0, 10.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.600830078125, -16.15478515625, -15.708740234375, -15.2626953125, -14.816650390625, -14.37060546875, -13.924560546875, -13.478515625, -13.032470703125, -12.58642578125, -12.140380859375, -11.6943359375, -11.248291015625, -10.80224609375, -10.356201171875, -9.91015625, -9.464111328125, -9.01806640625, -8.572021484375, -8.1259765625, -7.679931640625, -7.23388671875, -6.787841796875, -6.341796875, -5.895751953125, -5.44970703125, -5.003662109375, -4.5576171875, -4.111572265625, -3.66552734375, -3.219482421875, -2.7734375, -2.327392578125, -1.88134765625, -1.435302734375, -0.9892578125, -0.543212890625, -0.09716796875, 0.348876953125, 0.794921875, 1.240966796875, 1.68701171875, 2.133056640625, 2.5791015625, 3.025146484375, 3.47119140625, 3.917236328125, 4.36328125, 4.809326171875, 5.25537109375, 5.701416015625, 6.1474609375, 6.593505859375, 7.03955078125, 7.485595703125, 7.931640625, 8.377685546875, 8.82373046875, 9.269775390625, 9.7158203125, 10.161865234375, 10.60791015625, 11.053955078125, 11.5]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 6.0, 2.0, 10.0, 18.0, 11.0, 35.0, 60.0, 84.0, 133.0, 312.0, 670.0, 1776.0, 4978.0, 18588.0, 150802.0, 3665298.0, 309220.0, 30646.0, 7117.0, 2421.0, 1025.0, 482.0, 240.0, 139.0, 78.0, 46.0, 35.0, 18.0, 14.0, 4.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.46875, -14.979248046875, -14.48974609375, -14.000244140625, -13.5107421875, -13.021240234375, -12.53173828125, -12.042236328125, -11.552734375, -11.063232421875, -10.57373046875, -10.084228515625, -9.5947265625, -9.105224609375, -8.61572265625, -8.126220703125, -7.63671875, -7.147216796875, -6.65771484375, -6.168212890625, -5.6787109375, -5.189208984375, -4.69970703125, -4.210205078125, -3.720703125, -3.231201171875, -2.74169921875, -2.252197265625, -1.7626953125, -1.273193359375, -0.78369140625, -0.294189453125, 0.1953125, 0.684814453125, 1.17431640625, 1.663818359375, 2.1533203125, 2.642822265625, 3.13232421875, 3.621826171875, 4.111328125, 4.600830078125, 5.09033203125, 5.579833984375, 6.0693359375, 6.558837890625, 7.04833984375, 7.537841796875, 8.02734375, 8.516845703125, 9.00634765625, 9.495849609375, 9.9853515625, 10.474853515625, 10.96435546875, 11.453857421875, 11.943359375, 12.432861328125, 12.92236328125, 13.411865234375, 13.9013671875, 14.390869140625, 14.88037109375, 15.369873046875, 15.859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 3.0, 7.0, 7.0, 9.0, 19.0, 18.0, 36.0, 53.0, 89.0, 165.0, 303.0, 629.0, 988.0, 776.0, 396.0, 208.0, 101.0, 75.0, 43.0, 42.0, 29.0, 16.0, 13.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.5234375, -12.0135498046875, -11.503662109375, -10.9937744140625, -10.48388671875, -9.9739990234375, -9.464111328125, -8.9542236328125, -8.4443359375, -7.9344482421875, -7.424560546875, -6.9146728515625, -6.40478515625, -5.8948974609375, -5.385009765625, -4.8751220703125, -4.365234375, -3.8553466796875, -3.345458984375, -2.8355712890625, -2.32568359375, -1.8157958984375, -1.305908203125, -0.7960205078125, -0.2861328125, 0.2237548828125, 0.733642578125, 1.2435302734375, 1.75341796875, 2.2633056640625, 2.773193359375, 3.2830810546875, 3.79296875, 4.3028564453125, 4.812744140625, 5.3226318359375, 5.83251953125, 6.3424072265625, 6.852294921875, 7.3621826171875, 7.8720703125, 8.3819580078125, 8.891845703125, 9.4017333984375, 9.91162109375, 10.4215087890625, 10.931396484375, 11.4412841796875, 11.951171875, 12.4610595703125, 12.970947265625, 13.4808349609375, 13.99072265625, 14.5006103515625, 15.010498046875, 15.5203857421875, 16.0302734375, 16.5401611328125, 17.050048828125, 17.5599365234375, 18.06982421875, 18.5797119140625, 19.089599609375, 19.5994873046875, 20.109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 18.0, 26.0, 81.0, 222.0, 289.0, 192.0, 83.0, 37.0, 15.0, 9.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.90419006347656, -126.90132904052734, -121.89847564697266, -116.89561462402344, -111.89276123046875, -106.88990020751953, -101.88703918457031, -96.88418579101562, -91.8813247680664, -86.87846374511719, -81.8756103515625, -76.87274932861328, -71.86988830566406, -66.86703491210938, -61.864173889160156, -56.8613166809082, -51.85845947265625, -46.8556022644043, -41.852745056152344, -36.849884033203125, -31.847026824951172, -26.84416961669922, -21.841310501098633, -16.838451385498047, -11.835594177246094, -6.832736015319824, -1.8298778533935547, 3.172980308532715, 8.175838470458984, 13.178695678710938, 18.181554794311523, 23.18441390991211, 28.187271118164062, 33.190128326416016, 38.19298553466797, 43.19584655761719, 48.19870376586914, 53.201560974121094, 58.20442199707031, 63.207279205322266, 68.21013641357422, 73.21299743652344, 78.21585083007812, 83.21871185302734, 88.22157287597656, 93.22442626953125, 98.22728729248047, 103.23014831542969, 108.23300170898438, 113.2358627319336, 118.23871612548828, 123.2415771484375, 128.2444305419922, 133.24728393554688, 138.25015258789062, 143.2530059814453, 148.255859375, 153.2587127685547, 158.26158142089844, 163.26443481445312, 168.2672882080078, 173.2701416015625, 178.27301025390625, 183.27586364746094, 188.2787322998047]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 8.0, 10.0, 18.0, 25.0, 30.0, 32.0, 37.0, 45.0, 46.0, 52.0, 61.0, 54.0, 57.0, 60.0, 46.0, 48.0, 55.0, 50.0, 28.0, 37.0, 43.0, 34.0, 19.0, 24.0, 12.0, 23.0, 12.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.01726531982422, -101.41281127929688, -98.80835723876953, -96.20391082763672, -93.59945678710938, -90.99500274658203, -88.39054870605469, -85.78610229492188, -83.18164825439453, -80.57719421386719, -77.97274017333984, -75.36829376220703, -72.76383972167969, -70.15938568115234, -67.554931640625, -64.95048522949219, -62.34602737426758, -59.741573333740234, -57.137123107910156, -54.53266906738281, -51.928218841552734, -49.32376480102539, -46.71931457519531, -44.11486053466797, -41.510406494140625, -38.90595245361328, -36.3015022277832, -33.69704818725586, -31.09259796142578, -28.488143920898438, -25.883691787719727, -23.279239654541016, -20.674789428710938, -18.070337295532227, -15.465885162353516, -12.861432075500488, -10.256979942321777, -7.652527809143066, -5.048074722290039, -2.443622589111328, 0.1608295440673828, 2.765281915664673, 5.369734287261963, 7.974186897277832, 10.578639030456543, 13.183091163635254, 15.787544250488281, 18.391996383666992, 20.996448516845703, 23.600900650024414, 26.205352783203125, 28.80980682373047, 31.414257049560547, 34.01871109008789, 36.62316131591797, 39.22761535644531, 41.832069396972656, 44.4365234375, 47.04097366333008, 49.64542770385742, 52.2498779296875, 54.854331970214844, 57.45878601074219, 60.063236236572266, 62.667686462402344]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 2.0, 8.0, 6.0, 10.0, 10.0, 19.0, 21.0, 33.0, 69.0, 101.0, 128.0, 196.0, 312.0, 566.0, 970.0, 1756.0, 3547.0, 8023.0, 19136.0, 48656.0, 132591.0, 348519.0, 302966.0, 110214.0, 40591.0, 16097.0, 7000.0, 3206.0, 1648.0, 882.0, 459.0, 291.0, 171.0, 87.0, 74.0, 60.0, 37.0, 22.0, 16.0, 13.0, 14.0, 7.0, 2.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.45013427734375, -7.2010498046875, -6.95196533203125, -6.702880859375, -6.45379638671875, -6.2047119140625, -5.95562744140625, -5.70654296875, -5.45745849609375, -5.2083740234375, -4.95928955078125, -4.710205078125, -4.46112060546875, -4.2120361328125, -3.96295166015625, -3.7138671875, -3.46478271484375, -3.2156982421875, -2.96661376953125, -2.717529296875, -2.46844482421875, -2.2193603515625, -1.97027587890625, -1.72119140625, -1.47210693359375, -1.2230224609375, -0.97393798828125, -0.724853515625, -0.47576904296875, -0.2266845703125, 0.02239990234375, 0.271484375, 0.52056884765625, 0.7696533203125, 1.01873779296875, 1.267822265625, 1.51690673828125, 1.7659912109375, 2.01507568359375, 2.26416015625, 2.51324462890625, 2.7623291015625, 3.01141357421875, 3.260498046875, 3.50958251953125, 3.7586669921875, 4.00775146484375, 4.2568359375, 4.50592041015625, 4.7550048828125, 5.00408935546875, 5.253173828125, 5.50225830078125, 5.7513427734375, 6.00042724609375, 6.24951171875, 6.49859619140625, 6.7476806640625, 6.99676513671875, 7.245849609375, 7.49493408203125, 7.7440185546875, 7.99310302734375, 8.2421875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 12.0, 6.0, 17.0, 24.0, 29.0, 44.0, 58.0, 48.0, 78.0, 88.0, 95.0, 89.0, 78.0, 85.0, 66.0, 48.0, 40.0, 31.0, 16.0, 10.0, 8.0, 9.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-10.9609375, -10.7113037109375, -10.461669921875, -10.2120361328125, -9.96240234375, -9.7127685546875, -9.463134765625, -9.2135009765625, -8.9638671875, -8.7142333984375, -8.464599609375, -8.2149658203125, -7.96533203125, -7.7156982421875, -7.466064453125, -7.2164306640625, -6.966796875, -6.7171630859375, -6.467529296875, -6.2178955078125, -5.96826171875, -5.7186279296875, -5.468994140625, -5.2193603515625, -4.9697265625, -4.7200927734375, -4.470458984375, -4.2208251953125, -3.97119140625, -3.7215576171875, -3.471923828125, -3.2222900390625, -2.97265625, -2.7230224609375, -2.473388671875, -2.2237548828125, -1.97412109375, -1.7244873046875, -1.474853515625, -1.2252197265625, -0.9755859375, -0.7259521484375, -0.476318359375, -0.2266845703125, 0.02294921875, 0.2725830078125, 0.522216796875, 0.7718505859375, 1.021484375, 1.2711181640625, 1.520751953125, 1.7703857421875, 2.02001953125, 2.2696533203125, 2.519287109375, 2.7689208984375, 3.0185546875, 3.2681884765625, 3.517822265625, 3.7674560546875, 4.01708984375, 4.2667236328125, 4.516357421875, 4.7659912109375, 5.015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 13.0, 26.0, 26.0, 47.0, 116.0, 176.0, 240.0, 523.0, 1094.0, 2990.0, 12036.0, 155901.0, 824590.0, 41140.0, 5897.0, 1937.0, 833.0, 395.0, 219.0, 118.0, 72.0, 43.0, 37.0, 21.0, 20.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.421875, -27.56787109375, -26.7138671875, -25.85986328125, -25.005859375, -24.15185546875, -23.2978515625, -22.44384765625, -21.58984375, -20.73583984375, -19.8818359375, -19.02783203125, -18.173828125, -17.31982421875, -16.4658203125, -15.61181640625, -14.7578125, -13.90380859375, -13.0498046875, -12.19580078125, -11.341796875, -10.48779296875, -9.6337890625, -8.77978515625, -7.92578125, -7.07177734375, -6.2177734375, -5.36376953125, -4.509765625, -3.65576171875, -2.8017578125, -1.94775390625, -1.09375, -0.23974609375, 0.6142578125, 1.46826171875, 2.322265625, 3.17626953125, 4.0302734375, 4.88427734375, 5.73828125, 6.59228515625, 7.4462890625, 8.30029296875, 9.154296875, 10.00830078125, 10.8623046875, 11.71630859375, 12.5703125, 13.42431640625, 14.2783203125, 15.13232421875, 15.986328125, 16.84033203125, 17.6943359375, 18.54833984375, 19.40234375, 20.25634765625, 21.1103515625, 21.96435546875, 22.818359375, 23.67236328125, 24.5263671875, 25.38037109375, 26.234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 8.0, 7.0, 9.0, 22.0, 28.0, 30.0, 30.0, 41.0, 52.0, 54.0, 75.0, 79.0, 85.0, 75.0, 77.0, 67.0, 62.0, 45.0, 42.0, 26.0, 23.0, 24.0, 10.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.90625, -31.78369140625, -30.6611328125, -29.53857421875, -28.416015625, -27.29345703125, -26.1708984375, -25.04833984375, -23.92578125, -22.80322265625, -21.6806640625, -20.55810546875, -19.435546875, -18.31298828125, -17.1904296875, -16.06787109375, -14.9453125, -13.82275390625, -12.7001953125, -11.57763671875, -10.455078125, -9.33251953125, -8.2099609375, -7.08740234375, -5.96484375, -4.84228515625, -3.7197265625, -2.59716796875, -1.474609375, -0.35205078125, 0.7705078125, 1.89306640625, 3.015625, 4.13818359375, 5.2607421875, 6.38330078125, 7.505859375, 8.62841796875, 9.7509765625, 10.87353515625, 11.99609375, 13.11865234375, 14.2412109375, 15.36376953125, 16.486328125, 17.60888671875, 18.7314453125, 19.85400390625, 20.9765625, 22.09912109375, 23.2216796875, 24.34423828125, 25.466796875, 26.58935546875, 27.7119140625, 28.83447265625, 29.95703125, 31.07958984375, 32.2021484375, 33.32470703125, 34.447265625, 35.56982421875, 36.6923828125, 37.81494140625, 38.9375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 16.0, 21.0, 29.0, 63.0, 86.0, 158.0, 290.0, 690.0, 2033.0, 7945.0, 118578.0, 880766.0, 31341.0, 4143.0, 1329.0, 493.0, 222.0, 127.0, 87.0, 43.0, 28.0, 17.0, 18.0, 6.0, 10.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.7979736328125, -8.525634765625, -8.2532958984375, -7.98095703125, -7.7086181640625, -7.436279296875, -7.1639404296875, -6.8916015625, -6.6192626953125, -6.346923828125, -6.0745849609375, -5.80224609375, -5.5299072265625, -5.257568359375, -4.9852294921875, -4.712890625, -4.4405517578125, -4.168212890625, -3.8958740234375, -3.62353515625, -3.3511962890625, -3.078857421875, -2.8065185546875, -2.5341796875, -2.2618408203125, -1.989501953125, -1.7171630859375, -1.44482421875, -1.1724853515625, -0.900146484375, -0.6278076171875, -0.35546875, -0.0831298828125, 0.189208984375, 0.4615478515625, 0.73388671875, 1.0062255859375, 1.278564453125, 1.5509033203125, 1.8232421875, 2.0955810546875, 2.367919921875, 2.6402587890625, 2.91259765625, 3.1849365234375, 3.457275390625, 3.7296142578125, 4.001953125, 4.2742919921875, 4.546630859375, 4.8189697265625, 5.09130859375, 5.3636474609375, 5.635986328125, 5.9083251953125, 6.1806640625, 6.4530029296875, 6.725341796875, 6.9976806640625, 7.27001953125, 7.5423583984375, 7.814697265625, 8.0870361328125, 8.359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 4.0, 14.0, 17.0, 16.0, 27.0, 33.0, 39.0, 45.0, 62.0, 66.0, 82.0, 103.0, 72.0, 69.0, 69.0, 66.0, 40.0, 48.0, 24.0, 27.0, 17.0, 11.0, 7.0, 11.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008916854858398438, -0.0008637905120849609, -0.0008358955383300781, -0.0008080005645751953, -0.0007801055908203125, -0.0007522106170654297, -0.0007243156433105469, -0.0006964206695556641, -0.0006685256958007812, -0.0006406307220458984, -0.0006127357482910156, -0.0005848407745361328, -0.00055694580078125, -0.0005290508270263672, -0.0005011558532714844, -0.00047326087951660156, -0.00044536590576171875, -0.00041747093200683594, -0.0003895759582519531, -0.0003616809844970703, -0.0003337860107421875, -0.0003058910369873047, -0.0002779960632324219, -0.00025010108947753906, -0.00022220611572265625, -0.00019431114196777344, -0.00016641616821289062, -0.0001385211944580078, -0.000110626220703125, -8.273124694824219e-05, -5.4836273193359375e-05, -2.6941299438476562e-05, 9.5367431640625e-07, 2.8848648071289062e-05, 5.6743621826171875e-05, 8.463859558105469e-05, 0.0001125335693359375, 0.0001404285430908203, 0.00016832351684570312, 0.00019621849060058594, 0.00022411346435546875, 0.00025200843811035156, 0.0002799034118652344, 0.0003077983856201172, 0.000335693359375, 0.0003635883331298828, 0.0003914833068847656, 0.00041937828063964844, 0.00044727325439453125, 0.00047516822814941406, 0.0005030632019042969, 0.0005309581756591797, 0.0005588531494140625, 0.0005867481231689453, 0.0006146430969238281, 0.0006425380706787109, 0.0006704330444335938, 0.0006983280181884766, 0.0007262229919433594, 0.0007541179656982422, 0.000782012939453125, 0.0008099079132080078, 0.0008378028869628906, 0.0008656978607177734, 0.0008935928344726562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 5.0, 9.0, 11.0, 14.0, 27.0, 57.0, 66.0, 104.0, 190.0, 350.0, 768.0, 1912.0, 6682.0, 57867.0, 891696.0, 77261.0, 7781.0, 2027.0, 791.0, 376.0, 192.0, 119.0, 69.0, 49.0, 38.0, 30.0, 24.0, 9.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.17474365234375, -4.9549560546875, -4.73516845703125, -4.515380859375, -4.29559326171875, -4.0758056640625, -3.85601806640625, -3.63623046875, -3.41644287109375, -3.1966552734375, -2.97686767578125, -2.757080078125, -2.53729248046875, -2.3175048828125, -2.09771728515625, -1.8779296875, -1.65814208984375, -1.4383544921875, -1.21856689453125, -0.998779296875, -0.77899169921875, -0.5592041015625, -0.33941650390625, -0.11962890625, 0.10015869140625, 0.3199462890625, 0.53973388671875, 0.759521484375, 0.97930908203125, 1.1990966796875, 1.41888427734375, 1.638671875, 1.85845947265625, 2.0782470703125, 2.29803466796875, 2.517822265625, 2.73760986328125, 2.9573974609375, 3.17718505859375, 3.39697265625, 3.61676025390625, 3.8365478515625, 4.05633544921875, 4.276123046875, 4.49591064453125, 4.7156982421875, 4.93548583984375, 5.1552734375, 5.37506103515625, 5.5948486328125, 5.81463623046875, 6.034423828125, 6.25421142578125, 6.4739990234375, 6.69378662109375, 6.91357421875, 7.13336181640625, 7.3531494140625, 7.57293701171875, 7.792724609375, 8.01251220703125, 8.2322998046875, 8.45208740234375, 8.671875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 10.0, 15.0, 20.0, 25.0, 27.0, 40.0, 55.0, 82.0, 84.0, 101.0, 103.0, 87.0, 92.0, 68.0, 47.0, 38.0, 24.0, 14.0, 10.0, 13.0, 6.0, 4.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.15338134765625, -5.9552001953125, -5.75701904296875, -5.558837890625, -5.36065673828125, -5.1624755859375, -4.96429443359375, -4.76611328125, -4.56793212890625, -4.3697509765625, -4.17156982421875, -3.973388671875, -3.77520751953125, -3.5770263671875, -3.37884521484375, -3.1806640625, -2.98248291015625, -2.7843017578125, -2.58612060546875, -2.387939453125, -2.18975830078125, -1.9915771484375, -1.79339599609375, -1.59521484375, -1.39703369140625, -1.1988525390625, -1.00067138671875, -0.802490234375, -0.60430908203125, -0.4061279296875, -0.20794677734375, -0.009765625, 0.18841552734375, 0.3865966796875, 0.58477783203125, 0.782958984375, 0.98114013671875, 1.1793212890625, 1.37750244140625, 1.57568359375, 1.77386474609375, 1.9720458984375, 2.17022705078125, 2.368408203125, 2.56658935546875, 2.7647705078125, 2.96295166015625, 3.1611328125, 3.35931396484375, 3.5574951171875, 3.75567626953125, 3.953857421875, 4.15203857421875, 4.3502197265625, 4.54840087890625, 4.74658203125, 4.94476318359375, 5.1429443359375, 5.34112548828125, 5.539306640625, 5.73748779296875, 5.9356689453125, 6.13385009765625, 6.33203125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 45.0, 94.0, 188.0, 341.0, 183.0, 76.0, 22.0, 9.0, 5.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-272.9862976074219, -267.3449401855469, -261.7035827636719, -256.0622253417969, -250.4208526611328, -244.7794952392578, -239.1381378173828, -233.4967803955078, -227.85540771484375, -222.21405029296875, -216.57269287109375, -210.93133544921875, -205.2899627685547, -199.6486053466797, -194.0072479248047, -188.3658905029297, -182.7245330810547, -177.0831756591797, -171.4418182373047, -165.80044555664062, -160.15908813476562, -154.51773071289062, -148.87637329101562, -143.23501586914062, -137.59365844726562, -131.95230102539062, -126.3109359741211, -120.6695785522461, -115.02821350097656, -109.38685607910156, -103.74549865722656, -98.10414123535156, -92.46277618408203, -86.82141876220703, -81.1800537109375, -75.5386962890625, -69.8973388671875, -64.25597381591797, -58.61461639404297, -52.9732551574707, -47.33189392089844, -41.69053268432617, -36.049171447753906, -30.407814025878906, -24.76645278930664, -19.125091552734375, -13.483734130859375, -7.842372894287109, -2.2010116577148438, 3.4403486251831055, 9.081708908081055, 14.723068237304688, 20.364429473876953, 26.00579071044922, 31.64714813232422, 37.288509368896484, 42.92987060546875, 48.571231842041016, 54.21259307861328, 59.85395050048828, 65.49531555175781, 71.13667297363281, 76.77803039550781, 82.41938781738281, 88.06075286865234]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 8.0, 12.0, 8.0, 9.0, 15.0, 13.0, 13.0, 15.0, 18.0, 28.0, 23.0, 29.0, 25.0, 28.0, 43.0, 35.0, 51.0, 53.0, 73.0, 67.0, 61.0, 36.0, 35.0, 45.0, 22.0, 34.0, 25.0, 36.0, 19.0, 17.0, 14.0, 26.0, 12.0, 9.0, 12.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-69.39146423339844, -66.97727966308594, -64.5630874633789, -62.148902893066406, -59.734718322753906, -57.32052993774414, -54.906341552734375, -52.492156982421875, -50.077972412109375, -47.66378402709961, -45.24959945678711, -42.835411071777344, -40.421226501464844, -38.00703811645508, -35.59284973144531, -33.17866516113281, -30.764476776123047, -28.350290298461914, -25.93610382080078, -23.521915435791016, -21.107730865478516, -18.69354248046875, -16.279356002807617, -13.865169525146484, -11.450983047485352, -9.036796569824219, -6.622609615325928, -4.208422660827637, -1.794236183166504, 0.6199502944946289, 3.034137725830078, 5.448324203491211, 7.862510681152344, 10.276697158813477, 12.69088363647461, 15.105071067810059, 17.519256591796875, 19.93344497680664, 22.347631454467773, 24.761817932128906, 27.17600440979004, 29.590190887451172, 32.00437927246094, 34.41856384277344, 36.8327522277832, 39.2469367980957, 41.66112518310547, 44.07530975341797, 46.489498138427734, 48.9036865234375, 51.31787109375, 53.732059478759766, 56.146244049072266, 58.56043243408203, 60.97461700439453, 63.3888053894043, 65.80299377441406, 68.21717834472656, 70.6313705444336, 73.0455551147461, 75.4597396850586, 77.8739242553711, 80.28811645507812, 82.70230102539062, 85.11648559570312]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 7.0, 6.0, 9.0, 8.0, 19.0, 38.0, 39.0, 101.0, 184.0, 345.0, 692.0, 1569.0, 3818.0, 11146.0, 47005.0, 397664.0, 3013077.0, 626053.0, 68324.0, 14956.0, 5094.0, 2164.0, 1001.0, 462.0, 257.0, 104.0, 60.0, 38.0, 25.0, 7.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.7491455078125, -7.537353515625, -7.3255615234375, -7.11376953125, -6.9019775390625, -6.690185546875, -6.4783935546875, -6.2666015625, -6.0548095703125, -5.843017578125, -5.6312255859375, -5.41943359375, -5.2076416015625, -4.995849609375, -4.7840576171875, -4.572265625, -4.3604736328125, -4.148681640625, -3.9368896484375, -3.72509765625, -3.5133056640625, -3.301513671875, -3.0897216796875, -2.8779296875, -2.6661376953125, -2.454345703125, -2.2425537109375, -2.03076171875, -1.8189697265625, -1.607177734375, -1.3953857421875, -1.18359375, -0.9718017578125, -0.760009765625, -0.5482177734375, -0.33642578125, -0.1246337890625, 0.087158203125, 0.2989501953125, 0.5107421875, 0.7225341796875, 0.934326171875, 1.1461181640625, 1.35791015625, 1.5697021484375, 1.781494140625, 1.9932861328125, 2.205078125, 2.4168701171875, 2.628662109375, 2.8404541015625, 3.05224609375, 3.2640380859375, 3.475830078125, 3.6876220703125, 3.8994140625, 4.1112060546875, 4.322998046875, 4.5347900390625, 4.74658203125, 4.9583740234375, 5.170166015625, 5.3819580078125, 5.59375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 12.0, 9.0, 15.0, 15.0, 21.0, 15.0, 33.0, 39.0, 50.0, 63.0, 68.0, 81.0, 103.0, 71.0, 89.0, 67.0, 63.0, 52.0, 42.0, 22.0, 25.0, 16.0, 14.0, 9.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.4453125, -10.211669921875, -9.97802734375, -9.744384765625, -9.5107421875, -9.277099609375, -9.04345703125, -8.809814453125, -8.576171875, -8.342529296875, -8.10888671875, -7.875244140625, -7.6416015625, -7.407958984375, -7.17431640625, -6.940673828125, -6.70703125, -6.473388671875, -6.23974609375, -6.006103515625, -5.7724609375, -5.538818359375, -5.30517578125, -5.071533203125, -4.837890625, -4.604248046875, -4.37060546875, -4.136962890625, -3.9033203125, -3.669677734375, -3.43603515625, -3.202392578125, -2.96875, -2.735107421875, -2.50146484375, -2.267822265625, -2.0341796875, -1.800537109375, -1.56689453125, -1.333251953125, -1.099609375, -0.865966796875, -0.63232421875, -0.398681640625, -0.1650390625, 0.068603515625, 0.30224609375, 0.535888671875, 0.76953125, 1.003173828125, 1.23681640625, 1.470458984375, 1.7041015625, 1.937744140625, 2.17138671875, 2.405029296875, 2.638671875, 2.872314453125, 3.10595703125, 3.339599609375, 3.5732421875, 3.806884765625, 4.04052734375, 4.274169921875, 4.5078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 5.0, 8.0, 26.0, 31.0, 50.0, 86.0, 162.0, 195.0, 388.0, 708.0, 1595.0, 4415.0, 14780.0, 69923.0, 1588791.0, 2399848.0, 86698.0, 17770.0, 5057.0, 1842.0, 787.0, 410.0, 271.0, 150.0, 100.0, 61.0, 33.0, 27.0, 18.0, 12.0, 6.0, 5.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.734375, -12.3489990234375, -11.963623046875, -11.5782470703125, -11.19287109375, -10.8074951171875, -10.422119140625, -10.0367431640625, -9.6513671875, -9.2659912109375, -8.880615234375, -8.4952392578125, -8.10986328125, -7.7244873046875, -7.339111328125, -6.9537353515625, -6.568359375, -6.1829833984375, -5.797607421875, -5.4122314453125, -5.02685546875, -4.6414794921875, -4.256103515625, -3.8707275390625, -3.4853515625, -3.0999755859375, -2.714599609375, -2.3292236328125, -1.94384765625, -1.5584716796875, -1.173095703125, -0.7877197265625, -0.40234375, -0.0169677734375, 0.368408203125, 0.7537841796875, 1.13916015625, 1.5245361328125, 1.909912109375, 2.2952880859375, 2.6806640625, 3.0660400390625, 3.451416015625, 3.8367919921875, 4.22216796875, 4.6075439453125, 4.992919921875, 5.3782958984375, 5.763671875, 6.1490478515625, 6.534423828125, 6.9197998046875, 7.30517578125, 7.6905517578125, 8.075927734375, 8.4613037109375, 8.8466796875, 9.2320556640625, 9.617431640625, 10.0028076171875, 10.38818359375, 10.7735595703125, 11.158935546875, 11.5443115234375, 11.9296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 8.0, 4.0, 13.0, 13.0, 26.0, 23.0, 41.0, 47.0, 86.0, 173.0, 362.0, 975.0, 1112.0, 579.0, 249.0, 117.0, 64.0, 45.0, 38.0, 25.0, 19.0, 14.0, 9.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4609375, -13.9486083984375, -13.436279296875, -12.9239501953125, -12.41162109375, -11.8992919921875, -11.386962890625, -10.8746337890625, -10.3623046875, -9.8499755859375, -9.337646484375, -8.8253173828125, -8.31298828125, -7.8006591796875, -7.288330078125, -6.7760009765625, -6.263671875, -5.7513427734375, -5.239013671875, -4.7266845703125, -4.21435546875, -3.7020263671875, -3.189697265625, -2.6773681640625, -2.1650390625, -1.6527099609375, -1.140380859375, -0.6280517578125, -0.11572265625, 0.3966064453125, 0.908935546875, 1.4212646484375, 1.93359375, 2.4459228515625, 2.958251953125, 3.4705810546875, 3.98291015625, 4.4952392578125, 5.007568359375, 5.5198974609375, 6.0322265625, 6.5445556640625, 7.056884765625, 7.5692138671875, 8.08154296875, 8.5938720703125, 9.106201171875, 9.6185302734375, 10.130859375, 10.6431884765625, 11.155517578125, 11.6678466796875, 12.18017578125, 12.6925048828125, 13.204833984375, 13.7171630859375, 14.2294921875, 14.7418212890625, 15.254150390625, 15.7664794921875, 16.27880859375, 16.7911376953125, 17.303466796875, 17.8157958984375, 18.328125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 10.0, 18.0, 30.0, 102.0, 249.0, 324.0, 176.0, 48.0, 27.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.39495849609375, -139.27593994140625, -134.1569366455078, -129.0379180908203, -123.91890716552734, -118.79989624023438, -113.68087768554688, -108.5618667602539, -103.44285583496094, -98.32384490966797, -93.204833984375, -88.0858154296875, -82.96680450439453, -77.84779357910156, -72.72877502441406, -67.6097640991211, -62.490753173828125, -57.371742248535156, -52.25272750854492, -47.13371276855469, -42.01470184326172, -36.89569091796875, -31.776676177978516, -26.65766143798828, -21.538650512695312, -16.41963768005371, -11.30062484741211, -6.181612014770508, -1.0625991821289062, 4.056413650512695, 9.175426483154297, 14.294441223144531, 19.4134521484375, 24.5324649810791, 29.651477813720703, 34.77049255371094, 39.889503479003906, 45.008514404296875, 50.12752914428711, 55.246543884277344, 60.36555480957031, 65.48456573486328, 70.60357666015625, 75.72259521484375, 80.84160614013672, 85.96061706542969, 91.07963562011719, 96.19864654541016, 101.31765747070312, 106.4366683959961, 111.55567932128906, 116.67469787597656, 121.79370880126953, 126.9127197265625, 132.03173828125, 137.1507568359375, 142.26976013183594, 147.38877868652344, 152.50778198242188, 157.62680053710938, 162.74581909179688, 167.8648223876953, 172.9838409423828, 178.10284423828125, 183.22186279296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 14.0, 12.0, 10.0, 20.0, 20.0, 27.0, 28.0, 33.0, 56.0, 49.0, 55.0, 54.0, 73.0, 60.0, 63.0, 53.0, 67.0, 57.0, 47.0, 42.0, 34.0, 34.0, 30.0, 17.0, 12.0, 15.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.74382019042969, -44.43189239501953, -42.11996841430664, -39.80804443359375, -37.496116638183594, -35.18418884277344, -32.87226486206055, -30.560338973999023, -28.2484130859375, -25.936487197875977, -23.624561309814453, -21.31263542175293, -19.000709533691406, -16.688783645629883, -14.37685775756836, -12.064931869506836, -9.753005981445312, -7.441080093383789, -5.129154205322266, -2.817228317260742, -0.5053024291992188, 1.8066234588623047, 4.118549346923828, 6.430475234985352, 8.742401123046875, 11.054327011108398, 13.366252899169922, 15.678178787231445, 17.99010467529297, 20.302030563354492, 22.613956451416016, 24.92588233947754, 27.237808227539062, 29.549734115600586, 31.86166000366211, 34.173583984375, 36.485511779785156, 38.79743957519531, 41.1093635559082, 43.421287536621094, 45.73321533203125, 48.045143127441406, 50.3570671081543, 52.66899108886719, 54.980918884277344, 57.2928466796875, 59.60477066040039, 61.91669464111328, 64.22862243652344, 66.5405502319336, 68.85247802734375, 71.16439819335938, 73.47632598876953, 75.78825378417969, 78.10017395019531, 80.41210174560547, 82.72402954101562, 85.03595733642578, 87.34788513183594, 89.65980529785156, 91.97173309326172, 94.28366088867188, 96.5955810546875, 98.90750885009766, 101.21943664550781]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 9.0, 9.0, 17.0, 23.0, 24.0, 42.0, 55.0, 122.0, 221.0, 387.0, 737.0, 1323.0, 2908.0, 6517.0, 16280.0, 46845.0, 155024.0, 480034.0, 233391.0, 66684.0, 22016.0, 8589.0, 3531.0, 1787.0, 805.0, 479.0, 262.0, 154.0, 102.0, 55.0, 39.0, 32.0, 13.0, 12.0, 3.0, 3.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.459716796875, -8.15380859375, -7.847900390625, -7.5419921875, -7.236083984375, -6.93017578125, -6.624267578125, -6.318359375, -6.012451171875, -5.70654296875, -5.400634765625, -5.0947265625, -4.788818359375, -4.48291015625, -4.177001953125, -3.87109375, -3.565185546875, -3.25927734375, -2.953369140625, -2.6474609375, -2.341552734375, -2.03564453125, -1.729736328125, -1.423828125, -1.117919921875, -0.81201171875, -0.506103515625, -0.2001953125, 0.105712890625, 0.41162109375, 0.717529296875, 1.0234375, 1.329345703125, 1.63525390625, 1.941162109375, 2.2470703125, 2.552978515625, 2.85888671875, 3.164794921875, 3.470703125, 3.776611328125, 4.08251953125, 4.388427734375, 4.6943359375, 5.000244140625, 5.30615234375, 5.612060546875, 5.91796875, 6.223876953125, 6.52978515625, 6.835693359375, 7.1416015625, 7.447509765625, 7.75341796875, 8.059326171875, 8.365234375, 8.671142578125, 8.97705078125, 9.282958984375, 9.5888671875, 9.894775390625, 10.20068359375, 10.506591796875, 10.8125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 15.0, 7.0, 19.0, 27.0, 12.0, 26.0, 21.0, 23.0, 33.0, 38.0, 40.0, 52.0, 57.0, 52.0, 51.0, 62.0, 58.0, 50.0, 38.0, 58.0, 41.0, 38.0, 34.0, 19.0, 19.0, 20.0, 14.0, 12.0, 12.0, 7.0, 5.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.046875, -4.89208984375, -4.7373046875, -4.58251953125, -4.427734375, -4.27294921875, -4.1181640625, -3.96337890625, -3.80859375, -3.65380859375, -3.4990234375, -3.34423828125, -3.189453125, -3.03466796875, -2.8798828125, -2.72509765625, -2.5703125, -2.41552734375, -2.2607421875, -2.10595703125, -1.951171875, -1.79638671875, -1.6416015625, -1.48681640625, -1.33203125, -1.17724609375, -1.0224609375, -0.86767578125, -0.712890625, -0.55810546875, -0.4033203125, -0.24853515625, -0.09375, 0.06103515625, 0.2158203125, 0.37060546875, 0.525390625, 0.68017578125, 0.8349609375, 0.98974609375, 1.14453125, 1.29931640625, 1.4541015625, 1.60888671875, 1.763671875, 1.91845703125, 2.0732421875, 2.22802734375, 2.3828125, 2.53759765625, 2.6923828125, 2.84716796875, 3.001953125, 3.15673828125, 3.3115234375, 3.46630859375, 3.62109375, 3.77587890625, 3.9306640625, 4.08544921875, 4.240234375, 4.39501953125, 4.5498046875, 4.70458984375, 4.859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 8.0, 7.0, 8.0, 15.0, 26.0, 26.0, 44.0, 78.0, 103.0, 207.0, 330.0, 618.0, 1368.0, 4121.0, 20824.0, 321298.0, 662388.0, 28562.0, 5130.0, 1622.0, 729.0, 389.0, 257.0, 151.0, 76.0, 62.0, 35.0, 22.0, 19.0, 4.0, 8.0, 6.0, 3.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.75634765625, -20.9814453125, -20.20654296875, -19.431640625, -18.65673828125, -17.8818359375, -17.10693359375, -16.33203125, -15.55712890625, -14.7822265625, -14.00732421875, -13.232421875, -12.45751953125, -11.6826171875, -10.90771484375, -10.1328125, -9.35791015625, -8.5830078125, -7.80810546875, -7.033203125, -6.25830078125, -5.4833984375, -4.70849609375, -3.93359375, -3.15869140625, -2.3837890625, -1.60888671875, -0.833984375, -0.05908203125, 0.7158203125, 1.49072265625, 2.265625, 3.04052734375, 3.8154296875, 4.59033203125, 5.365234375, 6.14013671875, 6.9150390625, 7.68994140625, 8.46484375, 9.23974609375, 10.0146484375, 10.78955078125, 11.564453125, 12.33935546875, 13.1142578125, 13.88916015625, 14.6640625, 15.43896484375, 16.2138671875, 16.98876953125, 17.763671875, 18.53857421875, 19.3134765625, 20.08837890625, 20.86328125, 21.63818359375, 22.4130859375, 23.18798828125, 23.962890625, 24.73779296875, 25.5126953125, 26.28759765625, 27.0625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 17.0, 7.0, 13.0, 26.0, 27.0, 31.0, 32.0, 41.0, 34.0, 58.0, 58.0, 61.0, 42.0, 67.0, 74.0, 46.0, 56.0, 38.0, 32.0, 34.0, 29.0, 32.0, 25.0, 15.0, 11.0, 9.0, 13.0, 9.0, 3.0, 10.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.3125, -17.656494140625, -17.00048828125, -16.344482421875, -15.6884765625, -15.032470703125, -14.37646484375, -13.720458984375, -13.064453125, -12.408447265625, -11.75244140625, -11.096435546875, -10.4404296875, -9.784423828125, -9.12841796875, -8.472412109375, -7.81640625, -7.160400390625, -6.50439453125, -5.848388671875, -5.1923828125, -4.536376953125, -3.88037109375, -3.224365234375, -2.568359375, -1.912353515625, -1.25634765625, -0.600341796875, 0.0556640625, 0.711669921875, 1.36767578125, 2.023681640625, 2.6796875, 3.335693359375, 3.99169921875, 4.647705078125, 5.3037109375, 5.959716796875, 6.61572265625, 7.271728515625, 7.927734375, 8.583740234375, 9.23974609375, 9.895751953125, 10.5517578125, 11.207763671875, 11.86376953125, 12.519775390625, 13.17578125, 13.831787109375, 14.48779296875, 15.143798828125, 15.7998046875, 16.455810546875, 17.11181640625, 17.767822265625, 18.423828125, 19.079833984375, 19.73583984375, 20.391845703125, 21.0478515625, 21.703857421875, 22.35986328125, 23.015869140625, 23.671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 14.0, 17.0, 22.0, 51.0, 104.0, 230.0, 532.0, 1973.0, 11924.0, 257247.0, 749276.0, 22857.0, 2926.0, 795.0, 296.0, 114.0, 60.0, 35.0, 28.0, 11.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.42315673828125, -7.2056884765625, -6.98822021484375, -6.770751953125, -6.55328369140625, -6.3358154296875, -6.11834716796875, -5.90087890625, -5.68341064453125, -5.4659423828125, -5.24847412109375, -5.031005859375, -4.81353759765625, -4.5960693359375, -4.37860107421875, -4.1611328125, -3.94366455078125, -3.7261962890625, -3.50872802734375, -3.291259765625, -3.07379150390625, -2.8563232421875, -2.63885498046875, -2.42138671875, -2.20391845703125, -1.9864501953125, -1.76898193359375, -1.551513671875, -1.33404541015625, -1.1165771484375, -0.89910888671875, -0.681640625, -0.46417236328125, -0.2467041015625, -0.02923583984375, 0.188232421875, 0.40570068359375, 0.6231689453125, 0.84063720703125, 1.05810546875, 1.27557373046875, 1.4930419921875, 1.71051025390625, 1.927978515625, 2.14544677734375, 2.3629150390625, 2.58038330078125, 2.7978515625, 3.01531982421875, 3.2327880859375, 3.45025634765625, 3.667724609375, 3.88519287109375, 4.1026611328125, 4.32012939453125, 4.53759765625, 4.75506591796875, 4.9725341796875, 5.19000244140625, 5.407470703125, 5.62493896484375, 5.8424072265625, 6.05987548828125, 6.27734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 3.0, 4.0, 8.0, 6.0, 9.0, 11.0, 18.0, 18.0, 20.0, 24.0, 26.0, 39.0, 47.0, 49.0, 64.0, 73.0, 83.0, 83.0, 83.0, 59.0, 39.0, 45.0, 35.0, 25.0, 22.0, 25.0, 15.0, 13.0, 15.0, 3.0, 7.0, 6.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007510185241699219, -0.0007267147302627563, -0.0007024109363555908, -0.0006781071424484253, -0.0006538033485412598, -0.0006294995546340942, -0.0006051957607269287, -0.0005808919668197632, -0.0005565881729125977, -0.0005322843790054321, -0.0005079805850982666, -0.0004836767911911011, -0.00045937299728393555, -0.00043506920337677, -0.0004107654094696045, -0.00038646161556243896, -0.00036215782165527344, -0.0003378540277481079, -0.0003135502338409424, -0.00028924643993377686, -0.00026494264602661133, -0.0002406388521194458, -0.00021633505821228027, -0.00019203126430511475, -0.00016772747039794922, -0.0001434236764907837, -0.00011911988258361816, -9.481608867645264e-05, -7.051229476928711e-05, -4.620850086212158e-05, -2.1904706954956055e-05, 2.3990869522094727e-06, 2.6702880859375e-05, 5.100667476654053e-05, 7.531046867370605e-05, 9.961426258087158e-05, 0.0001239180564880371, 0.00014822185039520264, 0.00017252564430236816, 0.0001968294382095337, 0.00022113323211669922, 0.00024543702602386475, 0.0002697408199310303, 0.0002940446138381958, 0.00031834840774536133, 0.00034265220165252686, 0.0003669559955596924, 0.0003912597894668579, 0.00041556358337402344, 0.00043986737728118896, 0.0004641711711883545, 0.00048847496509552, 0.0005127787590026855, 0.0005370825529098511, 0.0005613863468170166, 0.0005856901407241821, 0.0006099939346313477, 0.0006342977285385132, 0.0006586015224456787, 0.0006829053163528442, 0.0007072091102600098, 0.0007315129041671753, 0.0007558166980743408, 0.0007801204919815063, 0.0008044242858886719]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 14.0, 13.0, 17.0, 35.0, 54.0, 110.0, 250.0, 530.0, 1163.0, 4181.0, 36303.0, 856771.0, 137582.0, 8383.0, 1870.0, 647.0, 292.0, 145.0, 78.0, 49.0, 27.0, 10.0, 8.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.56304931640625, -6.3682861328125, -6.17352294921875, -5.978759765625, -5.78399658203125, -5.5892333984375, -5.39447021484375, -5.19970703125, -5.00494384765625, -4.8101806640625, -4.61541748046875, -4.420654296875, -4.22589111328125, -4.0311279296875, -3.83636474609375, -3.6416015625, -3.44683837890625, -3.2520751953125, -3.05731201171875, -2.862548828125, -2.66778564453125, -2.4730224609375, -2.27825927734375, -2.08349609375, -1.88873291015625, -1.6939697265625, -1.49920654296875, -1.304443359375, -1.10968017578125, -0.9149169921875, -0.72015380859375, -0.525390625, -0.33062744140625, -0.1358642578125, 0.05889892578125, 0.253662109375, 0.44842529296875, 0.6431884765625, 0.83795166015625, 1.03271484375, 1.22747802734375, 1.4222412109375, 1.61700439453125, 1.811767578125, 2.00653076171875, 2.2012939453125, 2.39605712890625, 2.5908203125, 2.78558349609375, 2.9803466796875, 3.17510986328125, 3.369873046875, 3.56463623046875, 3.7593994140625, 3.95416259765625, 4.14892578125, 4.34368896484375, 4.5384521484375, 4.73321533203125, 4.927978515625, 5.12274169921875, 5.3175048828125, 5.51226806640625, 5.70703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 8.0, 6.0, 15.0, 17.0, 15.0, 45.0, 40.0, 67.0, 58.0, 70.0, 98.0, 88.0, 109.0, 81.0, 65.0, 58.0, 33.0, 31.0, 23.0, 14.0, 22.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.74609375, -5.613311767578125, -5.48052978515625, -5.347747802734375, -5.2149658203125, -5.082183837890625, -4.94940185546875, -4.816619873046875, -4.683837890625, -4.551055908203125, -4.41827392578125, -4.285491943359375, -4.1527099609375, -4.019927978515625, -3.88714599609375, -3.754364013671875, -3.62158203125, -3.488800048828125, -3.35601806640625, -3.223236083984375, -3.0904541015625, -2.957672119140625, -2.82489013671875, -2.692108154296875, -2.559326171875, -2.426544189453125, -2.29376220703125, -2.160980224609375, -2.0281982421875, -1.895416259765625, -1.76263427734375, -1.629852294921875, -1.4970703125, -1.364288330078125, -1.23150634765625, -1.098724365234375, -0.9659423828125, -0.833160400390625, -0.70037841796875, -0.567596435546875, -0.434814453125, -0.302032470703125, -0.16925048828125, -0.036468505859375, 0.0963134765625, 0.229095458984375, 0.36187744140625, 0.494659423828125, 0.62744140625, 0.760223388671875, 0.89300537109375, 1.025787353515625, 1.1585693359375, 1.291351318359375, 1.42413330078125, 1.556915283203125, 1.689697265625, 1.822479248046875, 1.95526123046875, 2.088043212890625, 2.2208251953125, 2.353607177734375, 2.48638916015625, 2.619171142578125, 2.751953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 16.0, 24.0, 65.0, 149.0, 366.0, 223.0, 93.0, 23.0, 15.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.1945037841797, -186.96949768066406, -181.74447631835938, -176.51947021484375, -171.29446411132812, -166.06944274902344, -160.8444366455078, -155.61941528320312, -150.3944091796875, -145.16940307617188, -139.9443817138672, -134.71937561035156, -129.49436950683594, -124.26934814453125, -119.04434204101562, -113.81932830810547, -108.59432220458984, -103.36930847167969, -98.14430236816406, -92.9192886352539, -87.69427490234375, -82.46926879882812, -77.24425506591797, -72.01924133300781, -66.79423522949219, -61.5692253112793, -56.34421157836914, -51.11920166015625, -45.894187927246094, -40.6691780090332, -35.44416809082031, -30.219154357910156, -24.994140625, -19.769128799438477, -14.54411792755127, -9.319107055664062, -4.094095230102539, 1.1309165954589844, 6.355926513671875, 11.580940246582031, 16.805950164794922, 22.030961990356445, 27.25597381591797, 32.48098373413086, 37.70599365234375, 42.931007385253906, 48.1560173034668, 53.38103103637695, 58.606040954589844, 63.831050872802734, 69.05606079101562, 74.28107452392578, 79.50608825683594, 84.73109436035156, 89.95610809326172, 95.18112182617188, 100.4061279296875, 105.63114166259766, 110.85614776611328, 116.08116149902344, 121.3061752319336, 126.53118896484375, 131.75619506835938, 136.981201171875, 142.2062225341797]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 9.0, 15.0, 17.0, 16.0, 14.0, 22.0, 19.0, 29.0, 32.0, 23.0, 31.0, 35.0, 46.0, 49.0, 79.0, 86.0, 75.0, 39.0, 45.0, 33.0, 42.0, 24.0, 24.0, 24.0, 24.0, 20.0, 15.0, 20.0, 11.0, 23.0, 4.0, 11.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-81.84986877441406, -79.65782165527344, -77.46578216552734, -75.27373504638672, -73.08169555664062, -70.8896484375, -68.6976089477539, -66.50556182861328, -64.31352233886719, -62.12147903442383, -59.92943572998047, -57.73739242553711, -55.54534912109375, -53.35330581665039, -51.16126251220703, -48.969215393066406, -46.77717208862305, -44.58512878417969, -42.39308547973633, -40.20104217529297, -38.00899887084961, -35.81695556640625, -33.624908447265625, -31.4328670501709, -29.24082374572754, -27.04878044128418, -24.85673713684082, -22.664691925048828, -20.47264862060547, -18.28060531616211, -16.08856201171875, -13.89651870727539, -11.704475402832031, -9.512432098388672, -7.320388317108154, -5.128344535827637, -2.9363012313842773, -0.744257926940918, 1.4477863311767578, 3.639829635620117, 5.831872940063477, 8.023916244506836, 10.215959548950195, 12.408003807067871, 14.60004711151123, 16.792091369628906, 18.984134674072266, 21.176177978515625, 23.368221282958984, 25.560264587402344, 27.752307891845703, 29.944351196289062, 32.13639450073242, 34.32843780517578, 36.520484924316406, 38.7125244140625, 40.904571533203125, 43.096614837646484, 45.288658142089844, 47.4807014465332, 49.67274475097656, 51.86478805541992, 54.05683135986328, 56.248878479003906, 58.44091796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 3.0, 7.0, 15.0, 7.0, 20.0, 35.0, 66.0, 77.0, 156.0, 299.0, 554.0, 1176.0, 2517.0, 6054.0, 18011.0, 88833.0, 875768.0, 2720504.0, 408718.0, 50796.0, 12304.0, 4519.0, 1906.0, 902.0, 416.0, 243.0, 135.0, 65.0, 51.0, 37.0, 21.0, 10.0, 18.0, 6.0, 9.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.34136962890625, -5.1593017578125, -4.97723388671875, -4.795166015625, -4.61309814453125, -4.4310302734375, -4.24896240234375, -4.06689453125, -3.88482666015625, -3.7027587890625, -3.52069091796875, -3.338623046875, -3.15655517578125, -2.9744873046875, -2.79241943359375, -2.6103515625, -2.42828369140625, -2.2462158203125, -2.06414794921875, -1.882080078125, -1.70001220703125, -1.5179443359375, -1.33587646484375, -1.15380859375, -0.97174072265625, -0.7896728515625, -0.60760498046875, -0.425537109375, -0.24346923828125, -0.0614013671875, 0.12066650390625, 0.302734375, 0.48480224609375, 0.6668701171875, 0.84893798828125, 1.031005859375, 1.21307373046875, 1.3951416015625, 1.57720947265625, 1.75927734375, 1.94134521484375, 2.1234130859375, 2.30548095703125, 2.487548828125, 2.66961669921875, 2.8516845703125, 3.03375244140625, 3.2158203125, 3.39788818359375, 3.5799560546875, 3.76202392578125, 3.944091796875, 4.12615966796875, 4.3082275390625, 4.49029541015625, 4.67236328125, 4.85443115234375, 5.0364990234375, 5.21856689453125, 5.400634765625, 5.58270263671875, 5.7647705078125, 5.94683837890625, 6.12890625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 7.0, 8.0, 8.0, 14.0, 12.0, 13.0, 11.0, 12.0, 30.0, 26.0, 33.0, 41.0, 33.0, 39.0, 32.0, 33.0, 35.0, 30.0, 54.0, 59.0, 40.0, 41.0, 44.0, 46.0, 43.0, 35.0, 30.0, 22.0, 19.0, 23.0, 21.0, 23.0, 20.0, 11.0, 9.0, 6.0, 10.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7265625, -3.606353759765625, -3.48614501953125, -3.365936279296875, -3.2457275390625, -3.125518798828125, -3.00531005859375, -2.885101318359375, -2.764892578125, -2.644683837890625, -2.52447509765625, -2.404266357421875, -2.2840576171875, -2.163848876953125, -2.04364013671875, -1.923431396484375, -1.80322265625, -1.683013916015625, -1.56280517578125, -1.442596435546875, -1.3223876953125, -1.202178955078125, -1.08197021484375, -0.961761474609375, -0.841552734375, -0.721343994140625, -0.60113525390625, -0.480926513671875, -0.3607177734375, -0.240509033203125, -0.12030029296875, -9.1552734375e-05, 0.1201171875, 0.240325927734375, 0.36053466796875, 0.480743408203125, 0.6009521484375, 0.721160888671875, 0.84136962890625, 0.961578369140625, 1.081787109375, 1.201995849609375, 1.32220458984375, 1.442413330078125, 1.5626220703125, 1.682830810546875, 1.80303955078125, 1.923248291015625, 2.04345703125, 2.163665771484375, 2.28387451171875, 2.404083251953125, 2.5242919921875, 2.644500732421875, 2.76470947265625, 2.884918212890625, 3.005126953125, 3.125335693359375, 3.24554443359375, 3.365753173828125, 3.4859619140625, 3.606170654296875, 3.72637939453125, 3.846588134765625, 3.966796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 9.0, 4.0, 10.0, 22.0, 29.0, 42.0, 97.0, 115.0, 226.0, 538.0, 2041.0, 13846.0, 352268.0, 3781092.0, 37929.0, 4476.0, 958.0, 275.0, 130.0, 76.0, 42.0, 21.0, 14.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.546875, -22.896484375, -22.24609375, -21.595703125, -20.9453125, -20.294921875, -19.64453125, -18.994140625, -18.34375, -17.693359375, -17.04296875, -16.392578125, -15.7421875, -15.091796875, -14.44140625, -13.791015625, -13.140625, -12.490234375, -11.83984375, -11.189453125, -10.5390625, -9.888671875, -9.23828125, -8.587890625, -7.9375, -7.287109375, -6.63671875, -5.986328125, -5.3359375, -4.685546875, -4.03515625, -3.384765625, -2.734375, -2.083984375, -1.43359375, -0.783203125, -0.1328125, 0.517578125, 1.16796875, 1.818359375, 2.46875, 3.119140625, 3.76953125, 4.419921875, 5.0703125, 5.720703125, 6.37109375, 7.021484375, 7.671875, 8.322265625, 8.97265625, 9.623046875, 10.2734375, 10.923828125, 11.57421875, 12.224609375, 12.875, 13.525390625, 14.17578125, 14.826171875, 15.4765625, 16.126953125, 16.77734375, 17.427734375, 18.078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 4.0, 5.0, 10.0, 10.0, 23.0, 29.0, 55.0, 81.0, 135.0, 430.0, 1236.0, 1269.0, 430.0, 159.0, 73.0, 40.0, 26.0, 18.0, 10.0, 9.0, 6.0, 5.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-25.640625, -25.0831298828125, -24.525634765625, -23.9681396484375, -23.41064453125, -22.8531494140625, -22.295654296875, -21.7381591796875, -21.1806640625, -20.6231689453125, -20.065673828125, -19.5081787109375, -18.95068359375, -18.3931884765625, -17.835693359375, -17.2781982421875, -16.720703125, -16.1632080078125, -15.605712890625, -15.0482177734375, -14.49072265625, -13.9332275390625, -13.375732421875, -12.8182373046875, -12.2607421875, -11.7032470703125, -11.145751953125, -10.5882568359375, -10.03076171875, -9.4732666015625, -8.915771484375, -8.3582763671875, -7.80078125, -7.2432861328125, -6.685791015625, -6.1282958984375, -5.57080078125, -5.0133056640625, -4.455810546875, -3.8983154296875, -3.3408203125, -2.7833251953125, -2.225830078125, -1.6683349609375, -1.11083984375, -0.5533447265625, 0.004150390625, 0.5616455078125, 1.119140625, 1.6766357421875, 2.234130859375, 2.7916259765625, 3.34912109375, 3.9066162109375, 4.464111328125, 5.0216064453125, 5.5791015625, 6.1365966796875, 6.694091796875, 7.2515869140625, 7.80908203125, 8.3665771484375, 8.924072265625, 9.4815673828125, 10.0390625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 12.0, 25.0, 80.0, 243.0, 364.0, 182.0, 50.0, 18.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.92479705810547, -120.7623519897461, -115.59989929199219, -110.43745422363281, -105.2750015258789, -100.11255645751953, -94.95010375976562, -89.78765869140625, -84.62521362304688, -79.4627685546875, -74.3003158569336, -69.13787078857422, -63.97541809082031, -58.81297302246094, -53.6505241394043, -48.488075256347656, -43.32562255859375, -38.16317367553711, -33.00072479248047, -27.83827781677246, -22.67582893371582, -17.51338005065918, -12.350933074951172, -7.188484191894531, -2.0260353088378906, 3.136413097381592, 8.298861503601074, 13.461309432983398, 18.62375831604004, 23.78620719909668, 28.948654174804688, 34.11110305786133, 39.2735595703125, 44.43600845336914, 49.59845733642578, 54.760902404785156, 59.92335510253906, 65.08580017089844, 70.24824523925781, 75.41069793701172, 80.57315063476562, 85.735595703125, 90.8980484008789, 96.06049346923828, 101.22294616699219, 106.38539123535156, 111.54783630371094, 116.71028900146484, 121.87273406982422, 127.0351791381836, 132.1976318359375, 137.36007690429688, 142.52252197265625, 147.6849822998047, 152.84742736816406, 158.00987243652344, 163.1723175048828, 168.3347625732422, 173.49720764160156, 178.65966796875, 183.82211303710938, 188.98455810546875, 194.14700317382812, 199.3094482421875, 204.47190856933594]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 2.0, 4.0, 13.0, 14.0, 15.0, 12.0, 11.0, 21.0, 22.0, 35.0, 28.0, 30.0, 29.0, 44.0, 46.0, 38.0, 48.0, 45.0, 51.0, 48.0, 49.0, 50.0, 42.0, 44.0, 30.0, 26.0, 37.0, 26.0, 21.0, 23.0, 24.0, 18.0, 16.0, 10.0, 8.0, 1.0, 5.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.48055648803711, -38.97465133666992, -37.468746185302734, -35.96284103393555, -34.45693588256836, -32.95103073120117, -31.445125579833984, -29.939220428466797, -28.43331527709961, -26.927410125732422, -25.421504974365234, -23.915599822998047, -22.40969467163086, -20.903789520263672, -19.397884368896484, -17.891979217529297, -16.386072158813477, -14.880167007446289, -13.374261856079102, -11.868356704711914, -10.362451553344727, -8.856546401977539, -7.350640296936035, -5.844735145568848, -4.33882999420166, -2.8329248428344727, -1.327019453048706, 0.17888593673706055, 1.684791088104248, 3.1906962394714355, 4.696601867675781, 6.202507019042969, 7.708412170410156, 9.214317321777344, 10.720222473144531, 12.226127624511719, 13.732032775878906, 15.237937927246094, 16.74384307861328, 18.24974822998047, 19.755653381347656, 21.261558532714844, 22.76746368408203, 24.27336883544922, 25.779273986816406, 27.285179138183594, 28.79108428955078, 30.29698944091797, 31.80289649963379, 33.30880355834961, 34.8147087097168, 36.320613861083984, 37.82651901245117, 39.33242416381836, 40.83832931518555, 42.344234466552734, 43.85013961791992, 45.35604476928711, 46.8619499206543, 48.367855072021484, 49.87376022338867, 51.37966537475586, 52.88557052612305, 54.391475677490234, 55.89738082885742]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 6.0, 21.0, 30.0, 39.0, 69.0, 109.0, 152.0, 254.0, 403.0, 675.0, 1166.0, 1963.0, 3560.0, 6715.0, 13454.0, 28196.0, 62771.0, 147742.0, 300852.0, 262130.0, 118993.0, 51671.0, 23257.0, 11263.0, 5654.0, 3086.0, 1730.0, 999.0, 625.0, 354.0, 218.0, 140.0, 105.0, 61.0, 32.0, 20.0, 9.0, 10.0, 8.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48046875, -4.30731201171875, -4.1341552734375, -3.96099853515625, -3.787841796875, -3.61468505859375, -3.4415283203125, -3.26837158203125, -3.09521484375, -2.92205810546875, -2.7489013671875, -2.57574462890625, -2.402587890625, -2.22943115234375, -2.0562744140625, -1.88311767578125, -1.7099609375, -1.53680419921875, -1.3636474609375, -1.19049072265625, -1.017333984375, -0.84417724609375, -0.6710205078125, -0.49786376953125, -0.32470703125, -0.15155029296875, 0.0216064453125, 0.19476318359375, 0.367919921875, 0.54107666015625, 0.7142333984375, 0.88739013671875, 1.060546875, 1.23370361328125, 1.4068603515625, 1.58001708984375, 1.753173828125, 1.92633056640625, 2.0994873046875, 2.27264404296875, 2.44580078125, 2.61895751953125, 2.7921142578125, 2.96527099609375, 3.138427734375, 3.31158447265625, 3.4847412109375, 3.65789794921875, 3.8310546875, 4.00421142578125, 4.1773681640625, 4.35052490234375, 4.523681640625, 4.69683837890625, 4.8699951171875, 5.04315185546875, 5.21630859375, 5.38946533203125, 5.5626220703125, 5.73577880859375, 5.908935546875, 6.08209228515625, 6.2552490234375, 6.42840576171875, 6.6015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 9.0, 12.0, 9.0, 13.0, 14.0, 17.0, 18.0, 20.0, 32.0, 34.0, 32.0, 30.0, 40.0, 24.0, 38.0, 37.0, 49.0, 37.0, 45.0, 29.0, 48.0, 38.0, 41.0, 38.0, 40.0, 30.0, 26.0, 25.0, 23.0, 20.0, 21.0, 16.0, 14.0, 9.0, 11.0, 10.0, 7.0, 5.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.4486083984375, -3.322998046875, -3.1973876953125, -3.07177734375, -2.9461669921875, -2.820556640625, -2.6949462890625, -2.5693359375, -2.4437255859375, -2.318115234375, -2.1925048828125, -2.06689453125, -1.9412841796875, -1.815673828125, -1.6900634765625, -1.564453125, -1.4388427734375, -1.313232421875, -1.1876220703125, -1.06201171875, -0.9364013671875, -0.810791015625, -0.6851806640625, -0.5595703125, -0.4339599609375, -0.308349609375, -0.1827392578125, -0.05712890625, 0.0684814453125, 0.194091796875, 0.3197021484375, 0.4453125, 0.5709228515625, 0.696533203125, 0.8221435546875, 0.94775390625, 1.0733642578125, 1.198974609375, 1.3245849609375, 1.4501953125, 1.5758056640625, 1.701416015625, 1.8270263671875, 1.95263671875, 2.0782470703125, 2.203857421875, 2.3294677734375, 2.455078125, 2.5806884765625, 2.706298828125, 2.8319091796875, 2.95751953125, 3.0831298828125, 3.208740234375, 3.3343505859375, 3.4599609375, 3.5855712890625, 3.711181640625, 3.8367919921875, 3.96240234375, 4.0880126953125, 4.213623046875, 4.3392333984375, 4.46484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 9.0, 15.0, 26.0, 38.0, 57.0, 104.0, 177.0, 397.0, 798.0, 2480.0, 12295.0, 113742.0, 808607.0, 95096.0, 10897.0, 2310.0, 721.0, 317.0, 156.0, 94.0, 61.0, 44.0, 30.0, 20.0, 14.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.015625, -16.474853515625, -15.93408203125, -15.393310546875, -14.8525390625, -14.311767578125, -13.77099609375, -13.230224609375, -12.689453125, -12.148681640625, -11.60791015625, -11.067138671875, -10.5263671875, -9.985595703125, -9.44482421875, -8.904052734375, -8.36328125, -7.822509765625, -7.28173828125, -6.740966796875, -6.2001953125, -5.659423828125, -5.11865234375, -4.577880859375, -4.037109375, -3.496337890625, -2.95556640625, -2.414794921875, -1.8740234375, -1.333251953125, -0.79248046875, -0.251708984375, 0.2890625, 0.829833984375, 1.37060546875, 1.911376953125, 2.4521484375, 2.992919921875, 3.53369140625, 4.074462890625, 4.615234375, 5.156005859375, 5.69677734375, 6.237548828125, 6.7783203125, 7.319091796875, 7.85986328125, 8.400634765625, 8.94140625, 9.482177734375, 10.02294921875, 10.563720703125, 11.1044921875, 11.645263671875, 12.18603515625, 12.726806640625, 13.267578125, 13.808349609375, 14.34912109375, 14.889892578125, 15.4306640625, 15.971435546875, 16.51220703125, 17.052978515625, 17.59375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 17.0, 15.0, 11.0, 25.0, 29.0, 41.0, 43.0, 64.0, 69.0, 77.0, 97.0, 77.0, 73.0, 64.0, 54.0, 56.0, 28.0, 28.0, 30.0, 23.0, 17.0, 19.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.96875, -25.204345703125, -24.43994140625, -23.675537109375, -22.9111328125, -22.146728515625, -21.38232421875, -20.617919921875, -19.853515625, -19.089111328125, -18.32470703125, -17.560302734375, -16.7958984375, -16.031494140625, -15.26708984375, -14.502685546875, -13.73828125, -12.973876953125, -12.20947265625, -11.445068359375, -10.6806640625, -9.916259765625, -9.15185546875, -8.387451171875, -7.623046875, -6.858642578125, -6.09423828125, -5.329833984375, -4.5654296875, -3.801025390625, -3.03662109375, -2.272216796875, -1.5078125, -0.743408203125, 0.02099609375, 0.785400390625, 1.5498046875, 2.314208984375, 3.07861328125, 3.843017578125, 4.607421875, 5.371826171875, 6.13623046875, 6.900634765625, 7.6650390625, 8.429443359375, 9.19384765625, 9.958251953125, 10.72265625, 11.487060546875, 12.25146484375, 13.015869140625, 13.7802734375, 14.544677734375, 15.30908203125, 16.073486328125, 16.837890625, 17.602294921875, 18.36669921875, 19.131103515625, 19.8955078125, 20.659912109375, 21.42431640625, 22.188720703125, 22.953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 28.0, 13.0, 38.0, 53.0, 72.0, 109.0, 226.0, 477.0, 1085.0, 3224.0, 12474.0, 82343.0, 737410.0, 180903.0, 22304.0, 4839.0, 1589.0, 652.0, 294.0, 152.0, 96.0, 47.0, 30.0, 20.0, 18.0, 8.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.96197509765625, -2.8419189453125, -2.72186279296875, -2.601806640625, -2.48175048828125, -2.3616943359375, -2.24163818359375, -2.12158203125, -2.00152587890625, -1.8814697265625, -1.76141357421875, -1.641357421875, -1.52130126953125, -1.4012451171875, -1.28118896484375, -1.1611328125, -1.04107666015625, -0.9210205078125, -0.80096435546875, -0.680908203125, -0.56085205078125, -0.4407958984375, -0.32073974609375, -0.20068359375, -0.08062744140625, 0.0394287109375, 0.15948486328125, 0.279541015625, 0.39959716796875, 0.5196533203125, 0.63970947265625, 0.759765625, 0.87982177734375, 0.9998779296875, 1.11993408203125, 1.239990234375, 1.36004638671875, 1.4801025390625, 1.60015869140625, 1.72021484375, 1.84027099609375, 1.9603271484375, 2.08038330078125, 2.200439453125, 2.32049560546875, 2.4405517578125, 2.56060791015625, 2.6806640625, 2.80072021484375, 2.9207763671875, 3.04083251953125, 3.160888671875, 3.28094482421875, 3.4010009765625, 3.52105712890625, 3.64111328125, 3.76116943359375, 3.8812255859375, 4.00128173828125, 4.121337890625, 4.24139404296875, 4.3614501953125, 4.48150634765625, 4.6015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 9.0, 9.0, 16.0, 21.0, 32.0, 35.0, 40.0, 56.0, 67.0, 80.0, 102.0, 106.0, 102.0, 72.0, 72.0, 36.0, 36.0, 14.0, 22.0, 14.0, 9.0, 14.0, 5.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008053779602050781, -0.0007776618003845215, -0.0007499456405639648, -0.0007222294807434082, -0.0006945133209228516, -0.0006667971611022949, -0.0006390810012817383, -0.0006113648414611816, -0.000583648681640625, -0.0005559325218200684, -0.0005282163619995117, -0.0005005002021789551, -0.00047278404235839844, -0.0004450678825378418, -0.00041735172271728516, -0.0003896355628967285, -0.0003619194030761719, -0.00033420324325561523, -0.0003064870834350586, -0.00027877092361450195, -0.0002510547637939453, -0.00022333860397338867, -0.00019562244415283203, -0.0001679062843322754, -0.00014019012451171875, -0.00011247396469116211, -8.475780487060547e-05, -5.704164505004883e-05, -2.9325485229492188e-05, -1.6093254089355469e-06, 2.6106834411621094e-05, 5.3822994232177734e-05, 8.153915405273438e-05, 0.00010925531387329102, 0.00013697147369384766, 0.0001646876335144043, 0.00019240379333496094, 0.00022011995315551758, 0.0002478361129760742, 0.00027555227279663086, 0.0003032684326171875, 0.00033098459243774414, 0.0003587007522583008, 0.0003864169120788574, 0.00041413307189941406, 0.0004418492317199707, 0.00046956539154052734, 0.000497281551361084, 0.0005249977111816406, 0.0005527138710021973, 0.0005804300308227539, 0.0006081461906433105, 0.0006358623504638672, 0.0006635785102844238, 0.0006912946701049805, 0.0007190108299255371, 0.0007467269897460938, 0.0007744431495666504, 0.000802159309387207, 0.0008298754692077637, 0.0008575916290283203, 0.000885307788848877, 0.0009130239486694336, 0.0009407401084899902, 0.0009684562683105469]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 1.0, 7.0, 11.0, 18.0, 30.0, 59.0, 101.0, 211.0, 640.0, 3782.0, 114861.0, 912430.0, 14321.0, 1368.0, 376.0, 140.0, 63.0, 58.0, 25.0, 16.0, 11.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.875, -10.597900390625, -10.32080078125, -10.043701171875, -9.7666015625, -9.489501953125, -9.21240234375, -8.935302734375, -8.658203125, -8.381103515625, -8.10400390625, -7.826904296875, -7.5498046875, -7.272705078125, -6.99560546875, -6.718505859375, -6.44140625, -6.164306640625, -5.88720703125, -5.610107421875, -5.3330078125, -5.055908203125, -4.77880859375, -4.501708984375, -4.224609375, -3.947509765625, -3.67041015625, -3.393310546875, -3.1162109375, -2.839111328125, -2.56201171875, -2.284912109375, -2.0078125, -1.730712890625, -1.45361328125, -1.176513671875, -0.8994140625, -0.622314453125, -0.34521484375, -0.068115234375, 0.208984375, 0.486083984375, 0.76318359375, 1.040283203125, 1.3173828125, 1.594482421875, 1.87158203125, 2.148681640625, 2.42578125, 2.702880859375, 2.97998046875, 3.257080078125, 3.5341796875, 3.811279296875, 4.08837890625, 4.365478515625, 4.642578125, 4.919677734375, 5.19677734375, 5.473876953125, 5.7509765625, 6.028076171875, 6.30517578125, 6.582275390625, 6.859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 9.0, 11.0, 15.0, 17.0, 20.0, 29.0, 32.0, 45.0, 50.0, 63.0, 76.0, 78.0, 105.0, 67.0, 72.0, 68.0, 58.0, 52.0, 30.0, 32.0, 24.0, 11.0, 10.0, 8.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.130859375, -3.02392578125, -2.9169921875, -2.81005859375, -2.703125, -2.59619140625, -2.4892578125, -2.38232421875, -2.275390625, -2.16845703125, -2.0615234375, -1.95458984375, -1.84765625, -1.74072265625, -1.6337890625, -1.52685546875, -1.419921875, -1.31298828125, -1.2060546875, -1.09912109375, -0.9921875, -0.88525390625, -0.7783203125, -0.67138671875, -0.564453125, -0.45751953125, -0.3505859375, -0.24365234375, -0.13671875, -0.02978515625, 0.0771484375, 0.18408203125, 0.291015625, 0.39794921875, 0.5048828125, 0.61181640625, 0.71875, 0.82568359375, 0.9326171875, 1.03955078125, 1.146484375, 1.25341796875, 1.3603515625, 1.46728515625, 1.57421875, 1.68115234375, 1.7880859375, 1.89501953125, 2.001953125, 2.10888671875, 2.2158203125, 2.32275390625, 2.4296875, 2.53662109375, 2.6435546875, 2.75048828125, 2.857421875, 2.96435546875, 3.0712890625, 3.17822265625, 3.28515625, 3.39208984375, 3.4990234375, 3.60595703125, 3.712890625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 9.0, 23.0, 39.0, 82.0, 156.0, 269.0, 200.0, 102.0, 32.0, 28.0, 19.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.81637573242188, -77.97416687011719, -75.1319580078125, -72.28974151611328, -69.4475326538086, -66.6053237915039, -63.76311111450195, -60.9208984375, -58.07868957519531, -55.236480712890625, -52.39426803588867, -49.55205535888672, -46.70984649658203, -43.867637634277344, -41.02542495727539, -38.18321228027344, -35.34100341796875, -32.49879455566406, -29.65658187866211, -26.81437110900879, -23.97216033935547, -21.12994956970215, -18.287738800048828, -15.445528030395508, -12.603317260742188, -9.761106491088867, -6.918895721435547, -4.076684951782227, -1.2344741821289062, 1.607736587524414, 4.449947357177734, 7.292158126831055, 10.134368896484375, 12.976579666137695, 15.818790435791016, 18.661001205444336, 21.503211975097656, 24.345422744750977, 27.187633514404297, 30.029844284057617, 32.87205505371094, 35.714263916015625, 38.55647659301758, 41.39868927001953, 44.24089813232422, 47.083106994628906, 49.92531967163086, 52.76753234863281, 55.6097412109375, 58.45195007324219, 61.29416275024414, 64.1363754272461, 66.97858428955078, 69.82079315185547, 72.66300964355469, 75.50521850585938, 78.34742736816406, 81.18963623046875, 84.03184509277344, 86.87406158447266, 89.71627044677734, 92.55847930908203, 95.40069580078125, 98.24290466308594, 101.08511352539062]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 12.0, 8.0, 4.0, 12.0, 17.0, 11.0, 15.0, 18.0, 22.0, 24.0, 28.0, 26.0, 41.0, 34.0, 40.0, 47.0, 63.0, 69.0, 82.0, 59.0, 37.0, 41.0, 40.0, 34.0, 38.0, 24.0, 31.0, 19.0, 18.0, 20.0, 7.0, 17.0, 10.0, 4.0, 4.0, 9.0, 4.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.80534744262695, -55.98208999633789, -54.15883255004883, -52.335575103759766, -50.5123176574707, -48.68906021118164, -46.865806579589844, -45.04254913330078, -43.21929168701172, -41.396034240722656, -39.572776794433594, -37.74951934814453, -35.92626190185547, -34.103004455566406, -32.279747009277344, -30.456491470336914, -28.63323211669922, -26.809974670410156, -24.986717224121094, -23.16345977783203, -21.34020233154297, -19.516944885253906, -17.693689346313477, -15.870431900024414, -14.047174453735352, -12.223917007446289, -10.400659561157227, -8.57740306854248, -6.754145622253418, -4.9308881759643555, -3.1076316833496094, -1.2843742370605469, 0.53887939453125, 2.3621366024017334, 4.185393810272217, 6.008650779724121, 7.831908226013184, 9.655165672302246, 11.478422164916992, 13.301679611206055, 15.124937057495117, 16.94819450378418, 18.771451950073242, 20.594707489013672, 22.417964935302734, 24.241222381591797, 26.06447982788086, 27.887737274169922, 29.710994720458984, 31.534252166748047, 33.35750961303711, 35.18076705932617, 37.004024505615234, 38.8272819519043, 40.650535583496094, 42.473793029785156, 44.29705047607422, 46.12030792236328, 47.943565368652344, 49.766822814941406, 51.59008026123047, 53.41333770751953, 55.236595153808594, 57.059852600097656, 58.88311004638672]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 11.0, 15.0, 26.0, 35.0, 69.0, 92.0, 115.0, 186.0, 293.0, 458.0, 759.0, 1380.0, 2310.0, 4696.0, 11156.0, 33179.0, 127282.0, 555592.0, 2069101.0, 1050696.0, 248898.0, 58923.0, 15768.0, 5901.0, 2897.0, 1697.0, 1024.0, 616.0, 361.0, 268.0, 160.0, 109.0, 75.0, 46.0, 21.0, 18.0, 7.0, 9.0, 7.0, 5.0, 0.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1484375, -3.03485107421875, -2.9212646484375, -2.80767822265625, -2.694091796875, -2.58050537109375, -2.4669189453125, -2.35333251953125, -2.23974609375, -2.12615966796875, -2.0125732421875, -1.89898681640625, -1.785400390625, -1.67181396484375, -1.5582275390625, -1.44464111328125, -1.3310546875, -1.21746826171875, -1.1038818359375, -0.99029541015625, -0.876708984375, -0.76312255859375, -0.6495361328125, -0.53594970703125, -0.42236328125, -0.30877685546875, -0.1951904296875, -0.08160400390625, 0.031982421875, 0.14556884765625, 0.2591552734375, 0.37274169921875, 0.486328125, 0.59991455078125, 0.7135009765625, 0.82708740234375, 0.940673828125, 1.05426025390625, 1.1678466796875, 1.28143310546875, 1.39501953125, 1.50860595703125, 1.6221923828125, 1.73577880859375, 1.849365234375, 1.96295166015625, 2.0765380859375, 2.19012451171875, 2.3037109375, 2.41729736328125, 2.5308837890625, 2.64447021484375, 2.758056640625, 2.87164306640625, 2.9852294921875, 3.09881591796875, 3.21240234375, 3.32598876953125, 3.4395751953125, 3.55316162109375, 3.666748046875, 3.78033447265625, 3.8939208984375, 4.00750732421875, 4.12109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 7.0, 5.0, 3.0, 11.0, 8.0, 8.0, 16.0, 20.0, 22.0, 22.0, 25.0, 29.0, 27.0, 21.0, 26.0, 39.0, 26.0, 39.0, 43.0, 46.0, 35.0, 37.0, 34.0, 42.0, 40.0, 42.0, 40.0, 39.0, 26.0, 34.0, 34.0, 26.0, 18.0, 21.0, 8.0, 24.0, 9.0, 13.0, 6.0, 6.0, 9.0, 2.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.39453125, -3.27947998046875, -3.1644287109375, -3.04937744140625, -2.934326171875, -2.81927490234375, -2.7042236328125, -2.58917236328125, -2.47412109375, -2.35906982421875, -2.2440185546875, -2.12896728515625, -2.013916015625, -1.89886474609375, -1.7838134765625, -1.66876220703125, -1.5537109375, -1.43865966796875, -1.3236083984375, -1.20855712890625, -1.093505859375, -0.97845458984375, -0.8634033203125, -0.74835205078125, -0.63330078125, -0.51824951171875, -0.4031982421875, -0.28814697265625, -0.173095703125, -0.05804443359375, 0.0570068359375, 0.17205810546875, 0.287109375, 0.40216064453125, 0.5172119140625, 0.63226318359375, 0.747314453125, 0.86236572265625, 0.9774169921875, 1.09246826171875, 1.20751953125, 1.32257080078125, 1.4376220703125, 1.55267333984375, 1.667724609375, 1.78277587890625, 1.8978271484375, 2.01287841796875, 2.1279296875, 2.24298095703125, 2.3580322265625, 2.47308349609375, 2.588134765625, 2.70318603515625, 2.8182373046875, 2.93328857421875, 3.04833984375, 3.16339111328125, 3.2784423828125, 3.39349365234375, 3.508544921875, 3.62359619140625, 3.7386474609375, 3.85369873046875, 3.96875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 18.0, 24.0, 27.0, 38.0, 80.0, 173.0, 305.0, 745.0, 2402.0, 13968.0, 307352.0, 3807841.0, 53132.0, 5866.0, 1291.0, 470.0, 234.0, 128.0, 62.0, 37.0, 27.0, 16.0, 8.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.8515625, -15.3890380859375, -14.926513671875, -14.4639892578125, -14.00146484375, -13.5389404296875, -13.076416015625, -12.6138916015625, -12.1513671875, -11.6888427734375, -11.226318359375, -10.7637939453125, -10.30126953125, -9.8387451171875, -9.376220703125, -8.9136962890625, -8.451171875, -7.9886474609375, -7.526123046875, -7.0635986328125, -6.60107421875, -6.1385498046875, -5.676025390625, -5.2135009765625, -4.7509765625, -4.2884521484375, -3.825927734375, -3.3634033203125, -2.90087890625, -2.4383544921875, -1.975830078125, -1.5133056640625, -1.05078125, -0.5882568359375, -0.125732421875, 0.3367919921875, 0.79931640625, 1.2618408203125, 1.724365234375, 2.1868896484375, 2.6494140625, 3.1119384765625, 3.574462890625, 4.0369873046875, 4.49951171875, 4.9620361328125, 5.424560546875, 5.8870849609375, 6.349609375, 6.8121337890625, 7.274658203125, 7.7371826171875, 8.19970703125, 8.6622314453125, 9.124755859375, 9.5872802734375, 10.0498046875, 10.5123291015625, 10.974853515625, 11.4373779296875, 11.89990234375, 12.3624267578125, 12.824951171875, 13.2874755859375, 13.75]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 16.0, 26.0, 37.0, 51.0, 115.0, 292.0, 682.0, 1278.0, 887.0, 344.0, 131.0, 81.0, 45.0, 23.0, 19.0, 11.0, 10.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.20751953125, -11.7822265625, -11.35693359375, -10.931640625, -10.50634765625, -10.0810546875, -9.65576171875, -9.23046875, -8.80517578125, -8.3798828125, -7.95458984375, -7.529296875, -7.10400390625, -6.6787109375, -6.25341796875, -5.828125, -5.40283203125, -4.9775390625, -4.55224609375, -4.126953125, -3.70166015625, -3.2763671875, -2.85107421875, -2.42578125, -2.00048828125, -1.5751953125, -1.14990234375, -0.724609375, -0.29931640625, 0.1259765625, 0.55126953125, 0.9765625, 1.40185546875, 1.8271484375, 2.25244140625, 2.677734375, 3.10302734375, 3.5283203125, 3.95361328125, 4.37890625, 4.80419921875, 5.2294921875, 5.65478515625, 6.080078125, 6.50537109375, 6.9306640625, 7.35595703125, 7.78125, 8.20654296875, 8.6318359375, 9.05712890625, 9.482421875, 9.90771484375, 10.3330078125, 10.75830078125, 11.18359375, 11.60888671875, 12.0341796875, 12.45947265625, 12.884765625, 13.31005859375, 13.7353515625, 14.16064453125, 14.5859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 7.0, 23.0, 52.0, 129.0, 254.0, 282.0, 143.0, 62.0, 21.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.2454605102539, -124.08069610595703, -120.91593170166016, -117.75116729736328, -114.58639526367188, -111.421630859375, -108.25686645507812, -105.09210205078125, -101.92733764648438, -98.7625732421875, -95.59780883789062, -92.43304443359375, -89.26828002929688, -86.10350799560547, -82.9387435913086, -79.77397918701172, -76.60921478271484, -73.44445037841797, -70.2796859741211, -67.11492156982422, -63.95015335083008, -60.7853889465332, -57.62062072753906, -54.45585632324219, -51.29109191894531, -48.12632751464844, -44.96156311035156, -41.79679489135742, -38.63203048706055, -35.46726608276367, -32.30249786376953, -29.137733459472656, -25.97296142578125, -22.808197021484375, -19.643430709838867, -16.47866439819336, -13.313899993896484, -10.149134635925293, -6.984369277954102, -3.8196029663085938, -0.6548385620117188, 2.5099267959594727, 5.674692153930664, 8.839457511901855, 12.004222869873047, 15.168988227844238, 18.33375358581543, 21.498519897460938, 24.663284301757812, 27.828048706054688, 30.992815017700195, 34.1575813293457, 37.32234573364258, 40.48711013793945, 43.651878356933594, 46.81664276123047, 49.981407165527344, 53.14617156982422, 56.310935974121094, 59.475704193115234, 62.64046859741211, 65.80523681640625, 68.97000122070312, 72.134765625, 75.29953002929688]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 8.0, 13.0, 16.0, 12.0, 21.0, 21.0, 27.0, 24.0, 44.0, 43.0, 48.0, 48.0, 37.0, 45.0, 54.0, 48.0, 51.0, 53.0, 44.0, 56.0, 51.0, 41.0, 28.0, 30.0, 26.0, 29.0, 10.0, 15.0, 13.0, 13.0, 3.0, 8.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-46.99970626831055, -45.7700080871582, -44.54030990600586, -43.31060791015625, -42.080909729003906, -40.85121154785156, -39.62151336669922, -38.391815185546875, -37.16211700439453, -35.93241882324219, -34.702720642089844, -33.4730224609375, -32.24332046508789, -31.013622283935547, -29.783924102783203, -28.55422592163086, -27.324525833129883, -26.09482765197754, -24.865127563476562, -23.63542938232422, -22.405731201171875, -21.17603302001953, -19.946332931518555, -18.71663475036621, -17.486934661865234, -16.25723648071289, -15.02753734588623, -13.79783821105957, -12.568140029907227, -11.338440895080566, -10.108741760253906, -8.879043579101562, -7.649343490600586, -6.419644832611084, -5.189946174621582, -3.960247039794922, -2.73054838180542, -1.500849723815918, -0.2711505889892578, 0.9585475921630859, 2.188246726989746, 3.417945384979248, 4.64764404296875, 5.87734317779541, 7.107041835784912, 8.336740493774414, 9.566439628601074, 10.796137809753418, 12.025836944580078, 13.255536079406738, 14.485234260559082, 15.714933395385742, 16.944631576538086, 18.174331665039062, 19.404029846191406, 20.63372802734375, 21.863426208496094, 23.093124389648438, 24.322824478149414, 25.552522659301758, 26.7822208404541, 28.011920928955078, 29.241619110107422, 30.471317291259766, 31.701017379760742]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 10.0, 5.0, 4.0, 11.0, 11.0, 24.0, 33.0, 73.0, 118.0, 140.0, 257.0, 407.0, 640.0, 1272.0, 2186.0, 4414.0, 8645.0, 17434.0, 37541.0, 88177.0, 222053.0, 356728.0, 176903.0, 70460.0, 31048.0, 14532.0, 7120.0, 3738.0, 1988.0, 1071.0, 562.0, 365.0, 204.0, 132.0, 89.0, 58.0, 36.0, 20.0, 12.0, 13.0, 9.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.9375, -5.7696533203125, -5.601806640625, -5.4339599609375, -5.26611328125, -5.0982666015625, -4.930419921875, -4.7625732421875, -4.5947265625, -4.4268798828125, -4.259033203125, -4.0911865234375, -3.92333984375, -3.7554931640625, -3.587646484375, -3.4197998046875, -3.251953125, -3.0841064453125, -2.916259765625, -2.7484130859375, -2.58056640625, -2.4127197265625, -2.244873046875, -2.0770263671875, -1.9091796875, -1.7413330078125, -1.573486328125, -1.4056396484375, -1.23779296875, -1.0699462890625, -0.902099609375, -0.7342529296875, -0.56640625, -0.3985595703125, -0.230712890625, -0.0628662109375, 0.10498046875, 0.2728271484375, 0.440673828125, 0.6085205078125, 0.7763671875, 0.9442138671875, 1.112060546875, 1.2799072265625, 1.44775390625, 1.6156005859375, 1.783447265625, 1.9512939453125, 2.119140625, 2.2869873046875, 2.454833984375, 2.6226806640625, 2.79052734375, 2.9583740234375, 3.126220703125, 3.2940673828125, 3.4619140625, 3.6297607421875, 3.797607421875, 3.9654541015625, 4.13330078125, 4.3011474609375, 4.468994140625, 4.6368408203125, 4.8046875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 8.0, 10.0, 6.0, 4.0, 10.0, 3.0, 13.0, 11.0, 14.0, 14.0, 18.0, 35.0, 31.0, 27.0, 28.0, 38.0, 38.0, 42.0, 39.0, 60.0, 40.0, 38.0, 43.0, 45.0, 46.0, 44.0, 49.0, 38.0, 28.0, 27.0, 25.0, 26.0, 17.0, 21.0, 18.0, 9.0, 12.0, 11.0, 9.0, 4.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.105255126953125, -2.97808837890625, -2.850921630859375, -2.7237548828125, -2.596588134765625, -2.46942138671875, -2.342254638671875, -2.215087890625, -2.087921142578125, -1.96075439453125, -1.833587646484375, -1.7064208984375, -1.579254150390625, -1.45208740234375, -1.324920654296875, -1.19775390625, -1.070587158203125, -0.94342041015625, -0.816253662109375, -0.6890869140625, -0.561920166015625, -0.43475341796875, -0.307586669921875, -0.180419921875, -0.053253173828125, 0.07391357421875, 0.201080322265625, 0.3282470703125, 0.455413818359375, 0.58258056640625, 0.709747314453125, 0.8369140625, 0.964080810546875, 1.09124755859375, 1.218414306640625, 1.3455810546875, 1.472747802734375, 1.59991455078125, 1.727081298828125, 1.854248046875, 1.981414794921875, 2.10858154296875, 2.235748291015625, 2.3629150390625, 2.490081787109375, 2.61724853515625, 2.744415283203125, 2.87158203125, 2.998748779296875, 3.12591552734375, 3.253082275390625, 3.3802490234375, 3.507415771484375, 3.63458251953125, 3.761749267578125, 3.888916015625, 4.016082763671875, 4.14324951171875, 4.270416259765625, 4.3975830078125, 4.524749755859375, 4.65191650390625, 4.779083251953125, 4.90625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 11.0, 13.0, 20.0, 29.0, 36.0, 49.0, 82.0, 122.0, 230.0, 390.0, 752.0, 1594.0, 4541.0, 17918.0, 128411.0, 776793.0, 95835.0, 14671.0, 3814.0, 1436.0, 738.0, 387.0, 224.0, 170.0, 78.0, 57.0, 38.0, 35.0, 19.0, 15.0, 9.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.53125, -13.1383056640625, -12.745361328125, -12.3524169921875, -11.95947265625, -11.5665283203125, -11.173583984375, -10.7806396484375, -10.3876953125, -9.9947509765625, -9.601806640625, -9.2088623046875, -8.81591796875, -8.4229736328125, -8.030029296875, -7.6370849609375, -7.244140625, -6.8511962890625, -6.458251953125, -6.0653076171875, -5.67236328125, -5.2794189453125, -4.886474609375, -4.4935302734375, -4.1005859375, -3.7076416015625, -3.314697265625, -2.9217529296875, -2.52880859375, -2.1358642578125, -1.742919921875, -1.3499755859375, -0.95703125, -0.5640869140625, -0.171142578125, 0.2218017578125, 0.61474609375, 1.0076904296875, 1.400634765625, 1.7935791015625, 2.1865234375, 2.5794677734375, 2.972412109375, 3.3653564453125, 3.75830078125, 4.1512451171875, 4.544189453125, 4.9371337890625, 5.330078125, 5.7230224609375, 6.115966796875, 6.5089111328125, 6.90185546875, 7.2947998046875, 7.687744140625, 8.0806884765625, 8.4736328125, 8.8665771484375, 9.259521484375, 9.6524658203125, 10.04541015625, 10.4383544921875, 10.831298828125, 11.2242431640625, 11.6171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 3.0, 8.0, 7.0, 10.0, 12.0, 17.0, 23.0, 24.0, 40.0, 51.0, 42.0, 64.0, 68.0, 75.0, 68.0, 68.0, 73.0, 60.0, 52.0, 48.0, 37.0, 32.0, 27.0, 18.0, 16.0, 11.0, 14.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.828125, -20.2080078125, -19.587890625, -18.9677734375, -18.34765625, -17.7275390625, -17.107421875, -16.4873046875, -15.8671875, -15.2470703125, -14.626953125, -14.0068359375, -13.38671875, -12.7666015625, -12.146484375, -11.5263671875, -10.90625, -10.2861328125, -9.666015625, -9.0458984375, -8.42578125, -7.8056640625, -7.185546875, -6.5654296875, -5.9453125, -5.3251953125, -4.705078125, -4.0849609375, -3.46484375, -2.8447265625, -2.224609375, -1.6044921875, -0.984375, -0.3642578125, 0.255859375, 0.8759765625, 1.49609375, 2.1162109375, 2.736328125, 3.3564453125, 3.9765625, 4.5966796875, 5.216796875, 5.8369140625, 6.45703125, 7.0771484375, 7.697265625, 8.3173828125, 8.9375, 9.5576171875, 10.177734375, 10.7978515625, 11.41796875, 12.0380859375, 12.658203125, 13.2783203125, 13.8984375, 14.5185546875, 15.138671875, 15.7587890625, 16.37890625, 16.9990234375, 17.619140625, 18.2392578125, 18.859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 10.0, 14.0, 24.0, 37.0, 54.0, 81.0, 141.0, 280.0, 529.0, 1318.0, 3711.0, 14258.0, 92555.0, 772871.0, 136203.0, 19028.0, 4595.0, 1494.0, 649.0, 287.0, 148.0, 107.0, 58.0, 27.0, 23.0, 19.0, 14.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.685546875, -3.584808349609375, -3.48406982421875, -3.383331298828125, -3.2825927734375, -3.181854248046875, -3.08111572265625, -2.980377197265625, -2.879638671875, -2.778900146484375, -2.67816162109375, -2.577423095703125, -2.4766845703125, -2.375946044921875, -2.27520751953125, -2.174468994140625, -2.07373046875, -1.972991943359375, -1.87225341796875, -1.771514892578125, -1.6707763671875, -1.570037841796875, -1.46929931640625, -1.368560791015625, -1.267822265625, -1.167083740234375, -1.06634521484375, -0.965606689453125, -0.8648681640625, -0.764129638671875, -0.66339111328125, -0.562652587890625, -0.4619140625, -0.361175537109375, -0.26043701171875, -0.159698486328125, -0.0589599609375, 0.041778564453125, 0.14251708984375, 0.243255615234375, 0.343994140625, 0.444732666015625, 0.54547119140625, 0.646209716796875, 0.7469482421875, 0.847686767578125, 0.94842529296875, 1.049163818359375, 1.14990234375, 1.250640869140625, 1.35137939453125, 1.452117919921875, 1.5528564453125, 1.653594970703125, 1.75433349609375, 1.855072021484375, 1.955810546875, 2.056549072265625, 2.15728759765625, 2.258026123046875, 2.3587646484375, 2.459503173828125, 2.56024169921875, 2.660980224609375, 2.76171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 12.0, 8.0, 13.0, 17.0, 21.0, 22.0, 28.0, 41.0, 69.0, 66.0, 109.0, 106.0, 93.0, 97.0, 71.0, 44.0, 41.0, 26.0, 28.0, 20.0, 13.0, 13.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006284713745117188, -0.0006059780716896057, -0.0005834847688674927, -0.0005609914660453796, -0.0005384981632232666, -0.0005160048604011536, -0.0004935115575790405, -0.0004710182547569275, -0.00044852495193481445, -0.0004260316491127014, -0.0004035383462905884, -0.00038104504346847534, -0.0003585517406463623, -0.00033605843782424927, -0.00031356513500213623, -0.0002910718321800232, -0.00026857852935791016, -0.0002460852265357971, -0.00022359192371368408, -0.00020109862089157104, -0.000178605318069458, -0.00015611201524734497, -0.00013361871242523193, -0.0001111254096031189, -8.863210678100586e-05, -6.613880395889282e-05, -4.3645501136779785e-05, -2.1152198314666748e-05, 1.341104507446289e-06, 2.3834407329559326e-05, 4.632771015167236e-05, 6.88210129737854e-05, 9.131431579589844e-05, 0.00011380761861801147, 0.0001363009214401245, 0.00015879422426223755, 0.00018128752708435059, 0.00020378082990646362, 0.00022627413272857666, 0.0002487674355506897, 0.00027126073837280273, 0.00029375404119491577, 0.0003162473440170288, 0.00033874064683914185, 0.0003612339496612549, 0.0003837272524833679, 0.00040622055530548096, 0.000428713858127594, 0.00045120716094970703, 0.00047370046377182007, 0.0004961937665939331, 0.0005186870694160461, 0.0005411803722381592, 0.0005636736750602722, 0.0005861669778823853, 0.0006086602807044983, 0.0006311535835266113, 0.0006536468863487244, 0.0006761401891708374, 0.0006986334919929504, 0.0007211267948150635, 0.0007436200976371765, 0.0007661134004592896, 0.0007886067032814026, 0.0008111000061035156]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 17.0, 12.0, 30.0, 43.0, 47.0, 93.0, 179.0, 336.0, 828.0, 2148.0, 7381.0, 40222.0, 612748.0, 340325.0, 34103.0, 6523.0, 1966.0, 745.0, 333.0, 178.0, 105.0, 62.0, 26.0, 24.0, 26.0, 16.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.7813720703125, -2.681884765625, -2.5823974609375, -2.48291015625, -2.3834228515625, -2.283935546875, -2.1844482421875, -2.0849609375, -1.9854736328125, -1.885986328125, -1.7864990234375, -1.68701171875, -1.5875244140625, -1.488037109375, -1.3885498046875, -1.2890625, -1.1895751953125, -1.090087890625, -0.9906005859375, -0.89111328125, -0.7916259765625, -0.692138671875, -0.5926513671875, -0.4931640625, -0.3936767578125, -0.294189453125, -0.1947021484375, -0.09521484375, 0.0042724609375, 0.103759765625, 0.2032470703125, 0.302734375, 0.4022216796875, 0.501708984375, 0.6011962890625, 0.70068359375, 0.8001708984375, 0.899658203125, 0.9991455078125, 1.0986328125, 1.1981201171875, 1.297607421875, 1.3970947265625, 1.49658203125, 1.5960693359375, 1.695556640625, 1.7950439453125, 1.89453125, 1.9940185546875, 2.093505859375, 2.1929931640625, 2.29248046875, 2.3919677734375, 2.491455078125, 2.5909423828125, 2.6904296875, 2.7899169921875, 2.889404296875, 2.9888916015625, 3.08837890625, 3.1878662109375, 3.287353515625, 3.3868408203125, 3.486328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 6.0, 10.0, 10.0, 14.0, 17.0, 18.0, 22.0, 49.0, 37.0, 62.0, 71.0, 77.0, 88.0, 94.0, 82.0, 68.0, 61.0, 51.0, 43.0, 26.0, 23.0, 19.0, 11.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.78973388671875, -2.7025146484375, -2.61529541015625, -2.528076171875, -2.44085693359375, -2.3536376953125, -2.26641845703125, -2.17919921875, -2.09197998046875, -2.0047607421875, -1.91754150390625, -1.830322265625, -1.74310302734375, -1.6558837890625, -1.56866455078125, -1.4814453125, -1.39422607421875, -1.3070068359375, -1.21978759765625, -1.132568359375, -1.04534912109375, -0.9581298828125, -0.87091064453125, -0.78369140625, -0.69647216796875, -0.6092529296875, -0.52203369140625, -0.434814453125, -0.34759521484375, -0.2603759765625, -0.17315673828125, -0.0859375, 0.00128173828125, 0.0885009765625, 0.17572021484375, 0.262939453125, 0.35015869140625, 0.4373779296875, 0.52459716796875, 0.61181640625, 0.69903564453125, 0.7862548828125, 0.87347412109375, 0.960693359375, 1.04791259765625, 1.1351318359375, 1.22235107421875, 1.3095703125, 1.39678955078125, 1.4840087890625, 1.57122802734375, 1.658447265625, 1.74566650390625, 1.8328857421875, 1.92010498046875, 2.00732421875, 2.09454345703125, 2.1817626953125, 2.26898193359375, 2.356201171875, 2.44342041015625, 2.5306396484375, 2.61785888671875, 2.705078125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 10.0, 16.0, 45.0, 158.0, 472.0, 190.0, 69.0, 30.0, 10.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.29771423339844, -65.78285217285156, -61.26799392700195, -56.753135681152344, -52.23827362060547, -47.723411560058594, -43.208553314208984, -38.693695068359375, -34.1788330078125, -29.663972854614258, -25.149112701416016, -20.634252548217773, -16.11939239501953, -11.604532241821289, -7.089672088623047, -2.5748119354248047, 1.9400482177734375, 6.45490837097168, 10.969768524169922, 15.484628677368164, 19.999488830566406, 24.51434898376465, 29.02920913696289, 33.5440673828125, 38.058929443359375, 42.57379150390625, 47.08864974975586, 51.60350799560547, 56.118370056152344, 60.63323211669922, 65.14808654785156, 69.66294860839844, 74.17779541015625, 78.69265747070312, 83.20751953125, 87.72237396240234, 92.23723602294922, 96.7520980834961, 101.26695251464844, 105.78181457519531, 110.29667663574219, 114.81153869628906, 119.32640075683594, 123.84125518798828, 128.35610961914062, 132.8709716796875, 137.38583374023438, 141.90069580078125, 146.41555786132812, 150.930419921875, 155.44528198242188, 159.96014404296875, 164.47500610351562, 168.98985290527344, 173.5047149658203, 178.0195770263672, 182.53443908691406, 187.04930114746094, 191.5641632080078, 196.0790252685547, 200.5938720703125, 205.10873413085938, 209.62359619140625, 214.13845825195312, 218.6533203125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 5.0, 8.0, 6.0, 6.0, 13.0, 13.0, 10.0, 19.0, 14.0, 23.0, 26.0, 17.0, 19.0, 23.0, 27.0, 24.0, 31.0, 36.0, 53.0, 61.0, 82.0, 75.0, 50.0, 42.0, 26.0, 22.0, 33.0, 25.0, 16.0, 17.0, 20.0, 18.0, 14.0, 15.0, 14.0, 9.0, 12.0, 12.0, 5.0, 5.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-43.23426818847656, -41.82818603515625, -40.42210388183594, -39.01602554321289, -37.60994338989258, -36.203861236572266, -34.79778289794922, -33.391700744628906, -31.985618591308594, -30.57953643798828, -29.1734561920166, -27.767375946044922, -26.36129379272461, -24.955211639404297, -23.549131393432617, -22.143051147460938, -20.736968994140625, -19.330886840820312, -17.924806594848633, -16.518726348876953, -15.11264419555664, -13.706562995910645, -12.300481796264648, -10.894400596618652, -9.488319396972656, -8.08223819732666, -6.676156997680664, -5.270075798034668, -3.863994598388672, -2.457913398742676, -1.0518321990966797, 0.3542490005493164, 1.7603302001953125, 3.1664113998413086, 4.572492599487305, 5.978573799133301, 7.384654998779297, 8.790736198425293, 10.196817398071289, 11.602898597717285, 13.008979797363281, 14.415060997009277, 15.821142196655273, 17.227222442626953, 18.633304595947266, 20.039386749267578, 21.445466995239258, 22.851547241210938, 24.25762939453125, 25.663711547851562, 27.069791793823242, 28.475872039794922, 29.881954193115234, 31.288036346435547, 32.694114685058594, 34.100196838378906, 35.50627899169922, 36.91236114501953, 38.318443298339844, 39.72452163696289, 41.1306037902832, 42.536685943603516, 43.94276428222656, 45.348846435546875, 46.75492858886719]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 0.0, 5.0, 7.0, 7.0, 15.0, 19.0, 24.0, 40.0, 57.0, 89.0, 154.0, 206.0, 361.0, 586.0, 1073.0, 2130.0, 4409.0, 11664.0, 44478.0, 241599.0, 1302736.0, 2038482.0, 437367.0, 81412.0, 16172.0, 5373.0, 2633.0, 1325.0, 690.0, 394.0, 264.0, 174.0, 110.0, 69.0, 50.0, 35.0, 15.0, 17.0, 11.0, 11.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.322265625, -4.18359375, -4.044921875, -3.90625, -3.767578125, -3.62890625, -3.490234375, -3.3515625, -3.212890625, -3.07421875, -2.935546875, -2.796875, -2.658203125, -2.51953125, -2.380859375, -2.2421875, -2.103515625, -1.96484375, -1.826171875, -1.6875, -1.548828125, -1.41015625, -1.271484375, -1.1328125, -0.994140625, -0.85546875, -0.716796875, -0.578125, -0.439453125, -0.30078125, -0.162109375, -0.0234375, 0.115234375, 0.25390625, 0.392578125, 0.53125, 0.669921875, 0.80859375, 0.947265625, 1.0859375, 1.224609375, 1.36328125, 1.501953125, 1.640625, 1.779296875, 1.91796875, 2.056640625, 2.1953125, 2.333984375, 2.47265625, 2.611328125, 2.75, 2.888671875, 3.02734375, 3.166015625, 3.3046875, 3.443359375, 3.58203125, 3.720703125, 3.859375, 3.998046875, 4.13671875, 4.275390625, 4.4140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 7.0, 4.0, 8.0, 3.0, 6.0, 16.0, 13.0, 14.0, 14.0, 22.0, 18.0, 15.0, 32.0, 28.0, 27.0, 33.0, 30.0, 48.0, 41.0, 46.0, 42.0, 36.0, 56.0, 38.0, 43.0, 41.0, 44.0, 37.0, 41.0, 30.0, 21.0, 26.0, 22.0, 18.0, 23.0, 15.0, 8.0, 10.0, 8.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -2.985748291015625, -2.86016845703125, -2.734588623046875, -2.6090087890625, -2.483428955078125, -2.35784912109375, -2.232269287109375, -2.106689453125, -1.981109619140625, -1.85552978515625, -1.729949951171875, -1.6043701171875, -1.478790283203125, -1.35321044921875, -1.227630615234375, -1.10205078125, -0.976470947265625, -0.85089111328125, -0.725311279296875, -0.5997314453125, -0.474151611328125, -0.34857177734375, -0.222991943359375, -0.097412109375, 0.028167724609375, 0.15374755859375, 0.279327392578125, 0.4049072265625, 0.530487060546875, 0.65606689453125, 0.781646728515625, 0.9072265625, 1.032806396484375, 1.15838623046875, 1.283966064453125, 1.4095458984375, 1.535125732421875, 1.66070556640625, 1.786285400390625, 1.911865234375, 2.037445068359375, 2.16302490234375, 2.288604736328125, 2.4141845703125, 2.539764404296875, 2.66534423828125, 2.790924072265625, 2.91650390625, 3.042083740234375, 3.16766357421875, 3.293243408203125, 3.4188232421875, 3.544403076171875, 3.66998291015625, 3.795562744140625, 3.921142578125, 4.046722412109375, 4.17230224609375, 4.297882080078125, 4.4234619140625, 4.549041748046875, 4.67462158203125, 4.800201416015625, 4.92578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 17.0, 26.0, 64.0, 154.0, 329.0, 1669.0, 28123.0, 4118685.0, 42116.0, 2318.0, 454.0, 172.0, 67.0, 31.0, 26.0, 8.0, 12.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.3818359375, -20.576171875, -19.7705078125, -18.96484375, -18.1591796875, -17.353515625, -16.5478515625, -15.7421875, -14.9365234375, -14.130859375, -13.3251953125, -12.51953125, -11.7138671875, -10.908203125, -10.1025390625, -9.296875, -8.4912109375, -7.685546875, -6.8798828125, -6.07421875, -5.2685546875, -4.462890625, -3.6572265625, -2.8515625, -2.0458984375, -1.240234375, -0.4345703125, 0.37109375, 1.1767578125, 1.982421875, 2.7880859375, 3.59375, 4.3994140625, 5.205078125, 6.0107421875, 6.81640625, 7.6220703125, 8.427734375, 9.2333984375, 10.0390625, 10.8447265625, 11.650390625, 12.4560546875, 13.26171875, 14.0673828125, 14.873046875, 15.6787109375, 16.484375, 17.2900390625, 18.095703125, 18.9013671875, 19.70703125, 20.5126953125, 21.318359375, 22.1240234375, 22.9296875, 23.7353515625, 24.541015625, 25.3466796875, 26.15234375, 26.9580078125, 27.763671875, 28.5693359375, 29.375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 24.0, 33.0, 71.0, 170.0, 403.0, 1048.0, 1306.0, 574.0, 197.0, 95.0, 46.0, 24.0, 24.0, 14.0, 10.0, 4.0, 2.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.15093994140625, -6.6807861328125, -6.21063232421875, -5.740478515625, -5.27032470703125, -4.8001708984375, -4.33001708984375, -3.85986328125, -3.38970947265625, -2.9195556640625, -2.44940185546875, -1.979248046875, -1.50909423828125, -1.0389404296875, -0.56878662109375, -0.0986328125, 0.37152099609375, 0.8416748046875, 1.31182861328125, 1.781982421875, 2.25213623046875, 2.7222900390625, 3.19244384765625, 3.66259765625, 4.13275146484375, 4.6029052734375, 5.07305908203125, 5.543212890625, 6.01336669921875, 6.4835205078125, 6.95367431640625, 7.423828125, 7.89398193359375, 8.3641357421875, 8.83428955078125, 9.304443359375, 9.77459716796875, 10.2447509765625, 10.71490478515625, 11.18505859375, 11.65521240234375, 12.1253662109375, 12.59552001953125, 13.065673828125, 13.53582763671875, 14.0059814453125, 14.47613525390625, 14.9462890625, 15.41644287109375, 15.8865966796875, 16.35675048828125, 16.826904296875, 17.29705810546875, 17.7672119140625, 18.23736572265625, 18.70751953125, 19.17767333984375, 19.6478271484375, 20.11798095703125, 20.588134765625, 21.05828857421875, 21.5284423828125, 21.99859619140625, 22.46875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 14.0, 39.0, 83.0, 226.0, 279.0, 187.0, 82.0, 41.0, 19.0, 8.0, 6.0, 8.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.71084594726562, -75.71101379394531, -72.711181640625, -69.71134948730469, -66.71151733398438, -63.7116813659668, -60.711849212646484, -57.712013244628906, -54.712181091308594, -51.71234893798828, -48.71251678466797, -45.712684631347656, -42.71284866333008, -39.713016510009766, -36.71318435668945, -33.713348388671875, -30.713520050048828, -27.713687896728516, -24.71385383605957, -21.714021682739258, -18.714187622070312, -15.71435546875, -12.714523315429688, -9.714689254760742, -6.71485710144043, -3.71502423286438, -0.7151913642883301, 2.2846412658691406, 5.2844743728637695, 8.284307479858398, 11.284139633178711, 14.283973693847656, 17.28380584716797, 20.28363800048828, 23.283472061157227, 26.28330421447754, 29.283138275146484, 32.2829704284668, 35.28280258178711, 38.28263854980469, 41.282470703125, 44.28230285644531, 47.282135009765625, 50.28196716308594, 53.281803131103516, 56.28163528442383, 59.28146743774414, 62.28130340576172, 65.2811279296875, 68.28096008300781, 71.28079223632812, 74.28062438964844, 77.28045654296875, 80.28028869628906, 83.28012084960938, 86.27996063232422, 89.27979278564453, 92.27962493896484, 95.27945709228516, 98.27928924560547, 101.27912139892578, 104.27896118164062, 107.27879333496094, 110.27862548828125, 113.27845764160156]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 4.0, 9.0, 10.0, 12.0, 20.0, 27.0, 22.0, 29.0, 48.0, 49.0, 56.0, 56.0, 62.0, 80.0, 83.0, 52.0, 54.0, 56.0, 53.0, 48.0, 28.0, 38.0, 21.0, 22.0, 15.0, 13.0, 10.0, 8.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.76002502441406, -66.9646987915039, -65.16937255859375, -63.37403869628906, -61.578712463378906, -59.78338623046875, -57.98805618286133, -56.192726135253906, -54.39739990234375, -52.602073669433594, -50.80674362182617, -49.01141357421875, -47.216087341308594, -45.42076110839844, -43.625431060791016, -41.830101013183594, -40.03477478027344, -38.23944854736328, -36.44411849975586, -34.64878845214844, -32.85346221923828, -31.058134078979492, -29.262805938720703, -27.467477798461914, -25.672149658203125, -23.876821517944336, -22.081493377685547, -20.286165237426758, -18.49083709716797, -16.69550895690918, -14.90018081665039, -13.104852676391602, -11.309528350830078, -9.514200210571289, -7.7188720703125, -5.923543930053711, -4.128215789794922, -2.332887649536133, -0.5375595092773438, 1.2577686309814453, 3.0530967712402344, 4.848424911499023, 6.6437530517578125, 8.439081192016602, 10.23440933227539, 12.02973747253418, 13.825065612792969, 15.620393753051758, 17.415721893310547, 19.211050033569336, 21.006378173828125, 22.801706314086914, 24.597034454345703, 26.392362594604492, 28.18769073486328, 29.98301887512207, 31.77834701538086, 33.57367706298828, 35.36900329589844, 37.164329528808594, 38.959659576416016, 40.75498962402344, 42.550315856933594, 44.34564208984375, 46.14097213745117]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 15.0, 14.0, 21.0, 36.0, 58.0, 68.0, 104.0, 149.0, 201.0, 318.0, 433.0, 761.0, 1252.0, 1930.0, 3158.0, 5462.0, 9148.0, 16470.0, 30831.0, 60954.0, 130407.0, 280653.0, 263257.0, 119739.0, 56709.0, 28893.0, 15651.0, 8596.0, 5080.0, 3114.0, 1857.0, 1108.0, 720.0, 474.0, 297.0, 194.0, 142.0, 73.0, 39.0, 48.0, 27.0, 24.0, 14.0, 12.0, 9.0, 8.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0791015625, -3.927734375, -3.7763671875, -3.625, -3.4736328125, -3.322265625, -3.1708984375, -3.01953125, -2.8681640625, -2.716796875, -2.5654296875, -2.4140625, -2.2626953125, -2.111328125, -1.9599609375, -1.80859375, -1.6572265625, -1.505859375, -1.3544921875, -1.203125, -1.0517578125, -0.900390625, -0.7490234375, -0.59765625, -0.4462890625, -0.294921875, -0.1435546875, 0.0078125, 0.1591796875, 0.310546875, 0.4619140625, 0.61328125, 0.7646484375, 0.916015625, 1.0673828125, 1.21875, 1.3701171875, 1.521484375, 1.6728515625, 1.82421875, 1.9755859375, 2.126953125, 2.2783203125, 2.4296875, 2.5810546875, 2.732421875, 2.8837890625, 3.03515625, 3.1865234375, 3.337890625, 3.4892578125, 3.640625, 3.7919921875, 3.943359375, 4.0947265625, 4.24609375, 4.3974609375, 4.548828125, 4.7001953125, 4.8515625, 5.0029296875, 5.154296875, 5.3056640625, 5.45703125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 7.0, 12.0, 15.0, 16.0, 13.0, 8.0, 19.0, 13.0, 21.0, 19.0, 18.0, 28.0, 35.0, 25.0, 31.0, 32.0, 45.0, 45.0, 36.0, 50.0, 41.0, 48.0, 42.0, 39.0, 37.0, 25.0, 38.0, 31.0, 27.0, 31.0, 19.0, 14.0, 12.0, 17.0, 21.0, 11.0, 6.0, 8.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.57421875, -3.4578857421875, -3.341552734375, -3.2252197265625, -3.10888671875, -2.9925537109375, -2.876220703125, -2.7598876953125, -2.6435546875, -2.5272216796875, -2.410888671875, -2.2945556640625, -2.17822265625, -2.0618896484375, -1.945556640625, -1.8292236328125, -1.712890625, -1.5965576171875, -1.480224609375, -1.3638916015625, -1.24755859375, -1.1312255859375, -1.014892578125, -0.8985595703125, -0.7822265625, -0.6658935546875, -0.549560546875, -0.4332275390625, -0.31689453125, -0.2005615234375, -0.084228515625, 0.0321044921875, 0.1484375, 0.2647705078125, 0.381103515625, 0.4974365234375, 0.61376953125, 0.7301025390625, 0.846435546875, 0.9627685546875, 1.0791015625, 1.1954345703125, 1.311767578125, 1.4281005859375, 1.54443359375, 1.6607666015625, 1.777099609375, 1.8934326171875, 2.009765625, 2.1260986328125, 2.242431640625, 2.3587646484375, 2.47509765625, 2.5914306640625, 2.707763671875, 2.8240966796875, 2.9404296875, 3.0567626953125, 3.173095703125, 3.2894287109375, 3.40576171875, 3.5220947265625, 3.638427734375, 3.7547607421875, 3.87109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 15.0, 21.0, 20.0, 32.0, 38.0, 62.0, 112.0, 154.0, 276.0, 496.0, 1029.0, 2716.0, 10133.0, 97019.0, 867000.0, 57786.0, 7514.0, 2132.0, 898.0, 441.0, 252.0, 136.0, 88.0, 61.0, 33.0, 28.0, 12.0, 13.0, 5.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5, -14.954345703125, -14.40869140625, -13.863037109375, -13.3173828125, -12.771728515625, -12.22607421875, -11.680419921875, -11.134765625, -10.589111328125, -10.04345703125, -9.497802734375, -8.9521484375, -8.406494140625, -7.86083984375, -7.315185546875, -6.76953125, -6.223876953125, -5.67822265625, -5.132568359375, -4.5869140625, -4.041259765625, -3.49560546875, -2.949951171875, -2.404296875, -1.858642578125, -1.31298828125, -0.767333984375, -0.2216796875, 0.323974609375, 0.86962890625, 1.415283203125, 1.9609375, 2.506591796875, 3.05224609375, 3.597900390625, 4.1435546875, 4.689208984375, 5.23486328125, 5.780517578125, 6.326171875, 6.871826171875, 7.41748046875, 7.963134765625, 8.5087890625, 9.054443359375, 9.60009765625, 10.145751953125, 10.69140625, 11.237060546875, 11.78271484375, 12.328369140625, 12.8740234375, 13.419677734375, 13.96533203125, 14.510986328125, 15.056640625, 15.602294921875, 16.14794921875, 16.693603515625, 17.2392578125, 17.784912109375, 18.33056640625, 18.876220703125, 19.421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 10.0, 8.0, 8.0, 12.0, 15.0, 40.0, 40.0, 52.0, 68.0, 86.0, 86.0, 87.0, 109.0, 77.0, 73.0, 49.0, 57.0, 40.0, 25.0, 19.0, 13.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.712890625, -21.83203125, -20.951171875, -20.0703125, -19.189453125, -18.30859375, -17.427734375, -16.546875, -15.666015625, -14.78515625, -13.904296875, -13.0234375, -12.142578125, -11.26171875, -10.380859375, -9.5, -8.619140625, -7.73828125, -6.857421875, -5.9765625, -5.095703125, -4.21484375, -3.333984375, -2.453125, -1.572265625, -0.69140625, 0.189453125, 1.0703125, 1.951171875, 2.83203125, 3.712890625, 4.59375, 5.474609375, 6.35546875, 7.236328125, 8.1171875, 8.998046875, 9.87890625, 10.759765625, 11.640625, 12.521484375, 13.40234375, 14.283203125, 15.1640625, 16.044921875, 16.92578125, 17.806640625, 18.6875, 19.568359375, 20.44921875, 21.330078125, 22.2109375, 23.091796875, 23.97265625, 24.853515625, 25.734375, 26.615234375, 27.49609375, 28.376953125, 29.2578125, 30.138671875, 31.01953125, 31.900390625, 32.78125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 2.0, 8.0, 9.0, 21.0, 29.0, 45.0, 73.0, 97.0, 164.0, 312.0, 710.0, 2080.0, 9137.0, 73630.0, 847355.0, 99426.0, 11380.0, 2398.0, 848.0, 344.0, 190.0, 94.0, 70.0, 42.0, 34.0, 10.0, 17.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.390625, -3.292510986328125, -3.19439697265625, -3.096282958984375, -2.9981689453125, -2.900054931640625, -2.80194091796875, -2.703826904296875, -2.605712890625, -2.507598876953125, -2.40948486328125, -2.311370849609375, -2.2132568359375, -2.115142822265625, -2.01702880859375, -1.918914794921875, -1.82080078125, -1.722686767578125, -1.62457275390625, -1.526458740234375, -1.4283447265625, -1.330230712890625, -1.23211669921875, -1.134002685546875, -1.035888671875, -0.937774658203125, -0.83966064453125, -0.741546630859375, -0.6434326171875, -0.545318603515625, -0.44720458984375, -0.349090576171875, -0.2509765625, -0.152862548828125, -0.05474853515625, 0.043365478515625, 0.1414794921875, 0.239593505859375, 0.33770751953125, 0.435821533203125, 0.533935546875, 0.632049560546875, 0.73016357421875, 0.828277587890625, 0.9263916015625, 1.024505615234375, 1.12261962890625, 1.220733642578125, 1.31884765625, 1.416961669921875, 1.51507568359375, 1.613189697265625, 1.7113037109375, 1.809417724609375, 1.90753173828125, 2.005645751953125, 2.103759765625, 2.201873779296875, 2.29998779296875, 2.398101806640625, 2.4962158203125, 2.594329833984375, 2.69244384765625, 2.790557861328125, 2.888671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 9.0, 13.0, 15.0, 26.0, 37.0, 46.0, 72.0, 106.0, 145.0, 160.0, 100.0, 75.0, 59.0, 38.0, 28.0, 16.0, 12.0, 14.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011167526245117188, -0.001085825264453888, -0.0010548979043960571, -0.0010239705443382263, -0.0009930431842803955, -0.0009621158242225647, -0.0009311884641647339, -0.0009002611041069031, -0.0008693337440490723, -0.0008384063839912415, -0.0008074790239334106, -0.0007765516638755798, -0.000745624303817749, -0.0007146969437599182, -0.0006837695837020874, -0.0006528422236442566, -0.0006219148635864258, -0.000590987503528595, -0.0005600601434707642, -0.0005291327834129333, -0.0004982054233551025, -0.00046727806329727173, -0.0004363507032394409, -0.0004054233431816101, -0.0003744959831237793, -0.0003435686230659485, -0.0003126412630081177, -0.00028171390295028687, -0.00025078654289245605, -0.00021985918283462524, -0.00018893182277679443, -0.00015800446271896362, -0.0001270771026611328, -9.6149742603302e-05, -6.522238254547119e-05, -3.429502248764038e-05, -3.3676624298095703e-06, 2.755969762802124e-05, 5.848705768585205e-05, 8.941441774368286e-05, 0.00012034177780151367, 0.00015126913785934448, 0.0001821964979171753, 0.0002131238579750061, 0.00024405121803283691, 0.0002749785780906677, 0.00030590593814849854, 0.00033683329820632935, 0.00036776065826416016, 0.00039868801832199097, 0.0004296153783798218, 0.0004605427384376526, 0.0004914700984954834, 0.0005223974585533142, 0.000553324818611145, 0.0005842521786689758, 0.0006151795387268066, 0.0006461068987846375, 0.0006770342588424683, 0.0007079616189002991, 0.0007388889789581299, 0.0007698163390159607, 0.0008007436990737915, 0.0008316710591316223, 0.0008625984191894531]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 14.0, 15.0, 30.0, 35.0, 59.0, 127.0, 236.0, 486.0, 1214.0, 4048.0, 25260.0, 732435.0, 263195.0, 16312.0, 3181.0, 1031.0, 401.0, 212.0, 102.0, 49.0, 31.0, 25.0, 22.0, 3.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0], "bins": [-4.8515625, -4.73577880859375, -4.6199951171875, -4.50421142578125, -4.388427734375, -4.27264404296875, -4.1568603515625, -4.04107666015625, -3.92529296875, -3.80950927734375, -3.6937255859375, -3.57794189453125, -3.462158203125, -3.34637451171875, -3.2305908203125, -3.11480712890625, -2.9990234375, -2.88323974609375, -2.7674560546875, -2.65167236328125, -2.535888671875, -2.42010498046875, -2.3043212890625, -2.18853759765625, -2.07275390625, -1.95697021484375, -1.8411865234375, -1.72540283203125, -1.609619140625, -1.49383544921875, -1.3780517578125, -1.26226806640625, -1.146484375, -1.03070068359375, -0.9149169921875, -0.79913330078125, -0.683349609375, -0.56756591796875, -0.4517822265625, -0.33599853515625, -0.22021484375, -0.10443115234375, 0.0113525390625, 0.12713623046875, 0.242919921875, 0.35870361328125, 0.4744873046875, 0.59027099609375, 0.7060546875, 0.82183837890625, 0.9376220703125, 1.05340576171875, 1.169189453125, 1.28497314453125, 1.4007568359375, 1.51654052734375, 1.63232421875, 1.74810791015625, 1.8638916015625, 1.97967529296875, 2.095458984375, 2.21124267578125, 2.3270263671875, 2.44281005859375, 2.55859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 5.0, 12.0, 28.0, 16.0, 31.0, 38.0, 65.0, 88.0, 108.0, 121.0, 132.0, 91.0, 83.0, 46.0, 35.0, 31.0, 16.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.765625, -4.645843505859375, -4.52606201171875, -4.406280517578125, -4.2864990234375, -4.166717529296875, -4.04693603515625, -3.927154541015625, -3.807373046875, -3.687591552734375, -3.56781005859375, -3.448028564453125, -3.3282470703125, -3.208465576171875, -3.08868408203125, -2.968902587890625, -2.84912109375, -2.729339599609375, -2.60955810546875, -2.489776611328125, -2.3699951171875, -2.250213623046875, -2.13043212890625, -2.010650634765625, -1.890869140625, -1.771087646484375, -1.65130615234375, -1.531524658203125, -1.4117431640625, -1.291961669921875, -1.17218017578125, -1.052398681640625, -0.9326171875, -0.812835693359375, -0.69305419921875, -0.573272705078125, -0.4534912109375, -0.333709716796875, -0.21392822265625, -0.094146728515625, 0.025634765625, 0.145416259765625, 0.26519775390625, 0.384979248046875, 0.5047607421875, 0.624542236328125, 0.74432373046875, 0.864105224609375, 0.98388671875, 1.103668212890625, 1.22344970703125, 1.343231201171875, 1.4630126953125, 1.582794189453125, 1.70257568359375, 1.822357177734375, 1.942138671875, 2.061920166015625, 2.18170166015625, 2.301483154296875, 2.4212646484375, 2.541046142578125, 2.66082763671875, 2.780609130859375, 2.900390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 16.0, 15.0, 33.0, 55.0, 115.0, 306.0, 257.0, 83.0, 58.0, 22.0, 15.0, 10.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.6794548034668, -53.02199935913086, -50.36454391479492, -47.707088470458984, -45.04963302612305, -42.39217758178711, -39.73472213745117, -37.077266693115234, -34.4198112487793, -31.76235580444336, -29.104900360107422, -26.447444915771484, -23.789989471435547, -21.13253402709961, -18.475078582763672, -15.817623138427734, -13.160167694091797, -10.50271224975586, -7.845256805419922, -5.187801361083984, -2.530345916748047, 0.12710952758789062, 2.784564971923828, 5.442020416259766, 8.099475860595703, 10.75693130493164, 13.414386749267578, 16.071842193603516, 18.729297637939453, 21.38675308227539, 24.044208526611328, 26.701663970947266, 29.35912322998047, 32.016578674316406, 34.674034118652344, 37.33148956298828, 39.98894500732422, 42.646400451660156, 45.303855895996094, 47.96131134033203, 50.61876678466797, 53.276222229003906, 55.933677673339844, 58.59113311767578, 61.24858856201172, 63.906044006347656, 66.5634994506836, 69.22095489501953, 71.87841033935547, 74.5358657836914, 77.19332122802734, 79.85077667236328, 82.50823211669922, 85.16568756103516, 87.8231430053711, 90.48059844970703, 93.13805389404297, 95.7955093383789, 98.45296478271484, 101.11042022705078, 103.76787567138672, 106.42533111572266, 109.0827865600586, 111.74024200439453, 114.39769744873047]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 12.0, 6.0, 11.0, 10.0, 9.0, 18.0, 12.0, 17.0, 31.0, 34.0, 24.0, 30.0, 43.0, 45.0, 71.0, 121.0, 108.0, 74.0, 31.0, 45.0, 31.0, 21.0, 20.0, 23.0, 22.0, 18.0, 10.0, 14.0, 11.0, 11.0, 6.0, 12.0, 8.0, 9.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.791908264160156, -59.977142333984375, -58.162376403808594, -56.34761047363281, -54.5328483581543, -52.718082427978516, -50.903316497802734, -49.08855056762695, -47.27378845214844, -45.459022521972656, -43.644256591796875, -41.829490661621094, -40.01472854614258, -38.1999626159668, -36.385196685791016, -34.570430755615234, -32.75566482543945, -30.940898895263672, -29.126134872436523, -27.311368942260742, -25.496604919433594, -23.681838989257812, -21.86707305908203, -20.05230712890625, -18.2375431060791, -16.42277717590332, -14.608013153076172, -12.79324722290039, -10.978482246398926, -9.163717269897461, -7.34895133972168, -5.534186363220215, -3.71942138671875, -1.904656171798706, -0.08989095687866211, 1.724874496459961, 3.539639472961426, 5.354404449462891, 7.169170379638672, 8.983935356140137, 10.798700332641602, 12.613465309143066, 14.428230285644531, 16.242996215820312, 18.057762145996094, 19.872526168823242, 21.687292098999023, 23.502056121826172, 25.316822052001953, 27.131587982177734, 28.946352005004883, 30.761117935180664, 32.57588195800781, 34.390647888183594, 36.205413818359375, 38.020179748535156, 39.83494567871094, 41.64971160888672, 43.4644775390625, 45.27924346923828, 47.0940055847168, 48.90877151489258, 50.72353744506836, 52.53830337524414, 54.353065490722656]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 16.0, 11.0, 19.0, 18.0, 35.0, 57.0, 95.0, 126.0, 175.0, 298.0, 390.0, 633.0, 1084.0, 1667.0, 2922.0, 5261.0, 11094.0, 27751.0, 92300.0, 393948.0, 1349052.0, 1617622.0, 514372.0, 116773.0, 31169.0, 12737.0, 6135.0, 3335.0, 1842.0, 1175.0, 699.0, 469.0, 276.0, 217.0, 165.0, 94.0, 72.0, 47.0, 39.0, 30.0, 19.0, 10.0, 6.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.20794677734375, -4.0526123046875, -3.89727783203125, -3.741943359375, -3.58660888671875, -3.4312744140625, -3.27593994140625, -3.12060546875, -2.96527099609375, -2.8099365234375, -2.65460205078125, -2.499267578125, -2.34393310546875, -2.1885986328125, -2.03326416015625, -1.8779296875, -1.72259521484375, -1.5672607421875, -1.41192626953125, -1.256591796875, -1.10125732421875, -0.9459228515625, -0.79058837890625, -0.63525390625, -0.47991943359375, -0.3245849609375, -0.16925048828125, -0.013916015625, 0.14141845703125, 0.2967529296875, 0.45208740234375, 0.607421875, 0.76275634765625, 0.9180908203125, 1.07342529296875, 1.228759765625, 1.38409423828125, 1.5394287109375, 1.69476318359375, 1.85009765625, 2.00543212890625, 2.1607666015625, 2.31610107421875, 2.471435546875, 2.62677001953125, 2.7821044921875, 2.93743896484375, 3.0927734375, 3.24810791015625, 3.4034423828125, 3.55877685546875, 3.714111328125, 3.86944580078125, 4.0247802734375, 4.18011474609375, 4.33544921875, 4.49078369140625, 4.6461181640625, 4.80145263671875, 4.956787109375, 5.11212158203125, 5.2674560546875, 5.42279052734375, 5.578125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 14.0, 15.0, 12.0, 14.0, 19.0, 26.0, 20.0, 25.0, 32.0, 46.0, 39.0, 31.0, 50.0, 48.0, 43.0, 49.0, 50.0, 50.0, 52.0, 43.0, 34.0, 41.0, 28.0, 32.0, 33.0, 24.0, 25.0, 14.0, 12.0, 16.0, 6.0, 11.0, 6.0, 7.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.341796875, -3.217376708984375, -3.09295654296875, -2.968536376953125, -2.8441162109375, -2.719696044921875, -2.59527587890625, -2.470855712890625, -2.346435546875, -2.222015380859375, -2.09759521484375, -1.973175048828125, -1.8487548828125, -1.724334716796875, -1.59991455078125, -1.475494384765625, -1.35107421875, -1.226654052734375, -1.10223388671875, -0.977813720703125, -0.8533935546875, -0.728973388671875, -0.60455322265625, -0.480133056640625, -0.355712890625, -0.231292724609375, -0.10687255859375, 0.017547607421875, 0.1419677734375, 0.266387939453125, 0.39080810546875, 0.515228271484375, 0.6396484375, 0.764068603515625, 0.88848876953125, 1.012908935546875, 1.1373291015625, 1.261749267578125, 1.38616943359375, 1.510589599609375, 1.635009765625, 1.759429931640625, 1.88385009765625, 2.008270263671875, 2.1326904296875, 2.257110595703125, 2.38153076171875, 2.505950927734375, 2.63037109375, 2.754791259765625, 2.87921142578125, 3.003631591796875, 3.1280517578125, 3.252471923828125, 3.37689208984375, 3.501312255859375, 3.625732421875, 3.750152587890625, 3.87457275390625, 3.998992919921875, 4.1234130859375, 4.247833251953125, 4.37225341796875, 4.496673583984375, 4.62109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 8.0, 13.0, 12.0, 24.0, 32.0, 51.0, 89.0, 123.0, 226.0, 429.0, 907.0, 2449.0, 14130.0, 978586.0, 3172102.0, 19744.0, 3176.0, 1050.0, 496.0, 231.0, 139.0, 95.0, 51.0, 39.0, 16.0, 19.0, 10.0, 7.0, 10.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.828125, -27.09716796875, -26.3662109375, -25.63525390625, -24.904296875, -24.17333984375, -23.4423828125, -22.71142578125, -21.98046875, -21.24951171875, -20.5185546875, -19.78759765625, -19.056640625, -18.32568359375, -17.5947265625, -16.86376953125, -16.1328125, -15.40185546875, -14.6708984375, -13.93994140625, -13.208984375, -12.47802734375, -11.7470703125, -11.01611328125, -10.28515625, -9.55419921875, -8.8232421875, -8.09228515625, -7.361328125, -6.63037109375, -5.8994140625, -5.16845703125, -4.4375, -3.70654296875, -2.9755859375, -2.24462890625, -1.513671875, -0.78271484375, -0.0517578125, 0.67919921875, 1.41015625, 2.14111328125, 2.8720703125, 3.60302734375, 4.333984375, 5.06494140625, 5.7958984375, 6.52685546875, 7.2578125, 7.98876953125, 8.7197265625, 9.45068359375, 10.181640625, 10.91259765625, 11.6435546875, 12.37451171875, 13.10546875, 13.83642578125, 14.5673828125, 15.29833984375, 16.029296875, 16.76025390625, 17.4912109375, 18.22216796875, 18.953125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 9.0, 5.0, 13.0, 19.0, 31.0, 49.0, 63.0, 98.0, 159.0, 238.0, 384.0, 655.0, 858.0, 601.0, 313.0, 199.0, 112.0, 80.0, 55.0, 35.0, 28.0, 17.0, 7.0, 13.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.2816162109375, -10.821044921875, -10.3604736328125, -9.89990234375, -9.4393310546875, -8.978759765625, -8.5181884765625, -8.0576171875, -7.5970458984375, -7.136474609375, -6.6759033203125, -6.21533203125, -5.7547607421875, -5.294189453125, -4.8336181640625, -4.373046875, -3.9124755859375, -3.451904296875, -2.9913330078125, -2.53076171875, -2.0701904296875, -1.609619140625, -1.1490478515625, -0.6884765625, -0.2279052734375, 0.232666015625, 0.6932373046875, 1.15380859375, 1.6143798828125, 2.074951171875, 2.5355224609375, 2.99609375, 3.4566650390625, 3.917236328125, 4.3778076171875, 4.83837890625, 5.2989501953125, 5.759521484375, 6.2200927734375, 6.6806640625, 7.1412353515625, 7.601806640625, 8.0623779296875, 8.52294921875, 8.9835205078125, 9.444091796875, 9.9046630859375, 10.365234375, 10.8258056640625, 11.286376953125, 11.7469482421875, 12.20751953125, 12.6680908203125, 13.128662109375, 13.5892333984375, 14.0498046875, 14.5103759765625, 14.970947265625, 15.4315185546875, 15.89208984375, 16.3526611328125, 16.813232421875, 17.2738037109375, 17.734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 7.0, 6.0, 18.0, 17.0, 33.0, 65.0, 100.0, 124.0, 172.0, 151.0, 127.0, 61.0, 34.0, 15.0, 14.0, 11.0, 15.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.46926879882812, -124.88505554199219, -121.30084228515625, -117.71662902832031, -114.13241577148438, -110.54820251464844, -106.9639892578125, -103.37977600097656, -99.79556274414062, -96.21134948730469, -92.62713623046875, -89.04292297363281, -85.45870971679688, -81.87449645996094, -78.290283203125, -74.70606994628906, -71.12185668945312, -67.53764343261719, -63.95343017578125, -60.36921691894531, -56.785003662109375, -53.20079040527344, -49.6165771484375, -46.03236389160156, -42.448143005371094, -38.863929748535156, -35.27971649169922, -31.69550323486328, -28.111289978027344, -24.527074813842773, -20.942861557006836, -17.3586483001709, -13.774436950683594, -10.190223693847656, -6.6060099601745605, -3.021796226501465, 0.5624170303344727, 4.146631240844727, 7.730844497680664, 11.315057754516602, 14.899271011352539, 18.483484268188477, 22.067697525024414, 25.651912689208984, 29.236125946044922, 32.82033920288086, 36.4045524597168, 39.988765716552734, 43.57297897338867, 47.15719223022461, 50.74140548706055, 54.325618743896484, 57.90983200073242, 61.494049072265625, 65.07826232910156, 68.6624755859375, 72.24668884277344, 75.83090209960938, 79.41511535644531, 82.99932861328125, 86.58354187011719, 90.16775512695312, 93.75196838378906, 97.336181640625, 100.92039489746094]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 9.0, 9.0, 5.0, 19.0, 30.0, 16.0, 25.0, 35.0, 23.0, 43.0, 43.0, 61.0, 55.0, 72.0, 80.0, 76.0, 52.0, 43.0, 42.0, 40.0, 38.0, 29.0, 35.0, 22.0, 10.0, 17.0, 13.0, 12.0, 12.0, 3.0, 4.0, 9.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.20524597167969, -62.64797592163086, -60.0907096862793, -57.53343963623047, -54.976173400878906, -52.41890335083008, -49.86163330078125, -47.30436706542969, -44.74709701538086, -42.18982696533203, -39.63256072998047, -37.07529067993164, -34.51802062988281, -31.96075439453125, -29.403484344482422, -26.846216201782227, -24.28894805908203, -21.731679916381836, -19.17441177368164, -16.617141723632812, -14.059873580932617, -11.502605438232422, -8.94533634185791, -6.388067245483398, -3.830799102783203, -1.2735304832458496, 1.283738136291504, 3.8410067558288574, 6.398275375366211, 8.955543518066406, 11.512812614440918, 14.07008171081543, 16.627349853515625, 19.18461799621582, 21.741886138916016, 24.299156188964844, 26.85642433166504, 29.413692474365234, 31.970962524414062, 34.528228759765625, 37.08549880981445, 39.64276885986328, 42.200035095214844, 44.75730514526367, 47.3145751953125, 49.87184143066406, 52.42911148071289, 54.98638153076172, 57.54364776611328, 60.10091781616211, 62.65818405151367, 65.2154541015625, 67.77272033691406, 70.32998657226562, 72.88726043701172, 75.44452667236328, 78.00180053710938, 80.55906677246094, 83.11634063720703, 85.6736068725586, 88.23087310791016, 90.78814697265625, 93.34541320800781, 95.90267944335938, 98.45994567871094]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 10.0, 18.0, 21.0, 24.0, 36.0, 53.0, 104.0, 145.0, 203.0, 375.0, 594.0, 1128.0, 1990.0, 3739.0, 7203.0, 15230.0, 39220.0, 131658.0, 596352.0, 169137.0, 46647.0, 17541.0, 7947.0, 4006.0, 2121.0, 1242.0, 691.0, 416.0, 232.0, 150.0, 80.0, 59.0, 54.0, 34.0, 21.0, 15.0, 13.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3515625, -7.10302734375, -6.8544921875, -6.60595703125, -6.357421875, -6.10888671875, -5.8603515625, -5.61181640625, -5.36328125, -5.11474609375, -4.8662109375, -4.61767578125, -4.369140625, -4.12060546875, -3.8720703125, -3.62353515625, -3.375, -3.12646484375, -2.8779296875, -2.62939453125, -2.380859375, -2.13232421875, -1.8837890625, -1.63525390625, -1.38671875, -1.13818359375, -0.8896484375, -0.64111328125, -0.392578125, -0.14404296875, 0.1044921875, 0.35302734375, 0.6015625, 0.85009765625, 1.0986328125, 1.34716796875, 1.595703125, 1.84423828125, 2.0927734375, 2.34130859375, 2.58984375, 2.83837890625, 3.0869140625, 3.33544921875, 3.583984375, 3.83251953125, 4.0810546875, 4.32958984375, 4.578125, 4.82666015625, 5.0751953125, 5.32373046875, 5.572265625, 5.82080078125, 6.0693359375, 6.31787109375, 6.56640625, 6.81494140625, 7.0634765625, 7.31201171875, 7.560546875, 7.80908203125, 8.0576171875, 8.30615234375, 8.5546875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 5.0, 8.0, 8.0, 8.0, 8.0, 11.0, 25.0, 22.0, 19.0, 29.0, 27.0, 34.0, 35.0, 43.0, 45.0, 50.0, 56.0, 50.0, 43.0, 54.0, 39.0, 67.0, 46.0, 38.0, 36.0, 42.0, 29.0, 25.0, 19.0, 15.0, 13.0, 10.0, 8.0, 13.0, 5.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.385986328125, -4.22509765625, -4.064208984375, -3.9033203125, -3.742431640625, -3.58154296875, -3.420654296875, -3.259765625, -3.098876953125, -2.93798828125, -2.777099609375, -2.6162109375, -2.455322265625, -2.29443359375, -2.133544921875, -1.97265625, -1.811767578125, -1.65087890625, -1.489990234375, -1.3291015625, -1.168212890625, -1.00732421875, -0.846435546875, -0.685546875, -0.524658203125, -0.36376953125, -0.202880859375, -0.0419921875, 0.118896484375, 0.27978515625, 0.440673828125, 0.6015625, 0.762451171875, 0.92333984375, 1.084228515625, 1.2451171875, 1.406005859375, 1.56689453125, 1.727783203125, 1.888671875, 2.049560546875, 2.21044921875, 2.371337890625, 2.5322265625, 2.693115234375, 2.85400390625, 3.014892578125, 3.17578125, 3.336669921875, 3.49755859375, 3.658447265625, 3.8193359375, 3.980224609375, 4.14111328125, 4.302001953125, 4.462890625, 4.623779296875, 4.78466796875, 4.945556640625, 5.1064453125, 5.267333984375, 5.42822265625, 5.589111328125, 5.75]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 11.0, 7.0, 9.0, 18.0, 17.0, 35.0, 45.0, 82.0, 141.0, 278.0, 552.0, 1263.0, 4613.0, 31024.0, 930121.0, 69787.0, 7308.0, 1812.0, 673.0, 327.0, 148.0, 98.0, 66.0, 35.0, 28.0, 26.0, 4.0, 6.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.169921875, -15.60546875, -15.041015625, -14.4765625, -13.912109375, -13.34765625, -12.783203125, -12.21875, -11.654296875, -11.08984375, -10.525390625, -9.9609375, -9.396484375, -8.83203125, -8.267578125, -7.703125, -7.138671875, -6.57421875, -6.009765625, -5.4453125, -4.880859375, -4.31640625, -3.751953125, -3.1875, -2.623046875, -2.05859375, -1.494140625, -0.9296875, -0.365234375, 0.19921875, 0.763671875, 1.328125, 1.892578125, 2.45703125, 3.021484375, 3.5859375, 4.150390625, 4.71484375, 5.279296875, 5.84375, 6.408203125, 6.97265625, 7.537109375, 8.1015625, 8.666015625, 9.23046875, 9.794921875, 10.359375, 10.923828125, 11.48828125, 12.052734375, 12.6171875, 13.181640625, 13.74609375, 14.310546875, 14.875, 15.439453125, 16.00390625, 16.568359375, 17.1328125, 17.697265625, 18.26171875, 18.826171875, 19.390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 10.0, 12.0, 9.0, 11.0, 17.0, 16.0, 21.0, 24.0, 27.0, 24.0, 33.0, 64.0, 72.0, 64.0, 72.0, 74.0, 70.0, 74.0, 47.0, 35.0, 26.0, 22.0, 20.0, 28.0, 16.0, 14.0, 12.0, 14.0, 8.0, 6.0, 9.0, 7.0, 3.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.9375, -21.2265625, -20.515625, -19.8046875, -19.09375, -18.3828125, -17.671875, -16.9609375, -16.25, -15.5390625, -14.828125, -14.1171875, -13.40625, -12.6953125, -11.984375, -11.2734375, -10.5625, -9.8515625, -9.140625, -8.4296875, -7.71875, -7.0078125, -6.296875, -5.5859375, -4.875, -4.1640625, -3.453125, -2.7421875, -2.03125, -1.3203125, -0.609375, 0.1015625, 0.8125, 1.5234375, 2.234375, 2.9453125, 3.65625, 4.3671875, 5.078125, 5.7890625, 6.5, 7.2109375, 7.921875, 8.6328125, 9.34375, 10.0546875, 10.765625, 11.4765625, 12.1875, 12.8984375, 13.609375, 14.3203125, 15.03125, 15.7421875, 16.453125, 17.1640625, 17.875, 18.5859375, 19.296875, 20.0078125, 20.71875, 21.4296875, 22.140625, 22.8515625, 23.5625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 6.0, 3.0, 7.0, 6.0, 4.0, 8.0, 16.0, 20.0, 42.0, 53.0, 75.0, 125.0, 192.0, 358.0, 646.0, 1165.0, 2477.0, 6119.0, 19355.0, 92750.0, 835555.0, 64814.0, 15200.0, 5050.0, 2115.0, 1021.0, 560.0, 320.0, 162.0, 96.0, 69.0, 55.0, 38.0, 17.0, 15.0, 12.0, 9.0, 5.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.11328125, -2.050018310546875, -1.98675537109375, -1.923492431640625, -1.8602294921875, -1.796966552734375, -1.73370361328125, -1.670440673828125, -1.607177734375, -1.543914794921875, -1.48065185546875, -1.417388916015625, -1.3541259765625, -1.290863037109375, -1.22760009765625, -1.164337158203125, -1.10107421875, -1.037811279296875, -0.97454833984375, -0.911285400390625, -0.8480224609375, -0.784759521484375, -0.72149658203125, -0.658233642578125, -0.594970703125, -0.531707763671875, -0.46844482421875, -0.405181884765625, -0.3419189453125, -0.278656005859375, -0.21539306640625, -0.152130126953125, -0.0888671875, -0.025604248046875, 0.03765869140625, 0.100921630859375, 0.1641845703125, 0.227447509765625, 0.29071044921875, 0.353973388671875, 0.417236328125, 0.480499267578125, 0.54376220703125, 0.607025146484375, 0.6702880859375, 0.733551025390625, 0.79681396484375, 0.860076904296875, 0.92333984375, 0.986602783203125, 1.04986572265625, 1.113128662109375, 1.1763916015625, 1.239654541015625, 1.30291748046875, 1.366180419921875, 1.429443359375, 1.492706298828125, 1.55596923828125, 1.619232177734375, 1.6824951171875, 1.745758056640625, 1.80902099609375, 1.872283935546875, 1.935546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 9.0, 11.0, 10.0, 15.0, 20.0, 21.0, 25.0, 35.0, 52.0, 75.0, 98.0, 128.0, 100.0, 88.0, 83.0, 40.0, 34.0, 32.0, 21.0, 14.0, 15.0, 10.0, 15.0, 4.0, 11.0, 3.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00063323974609375, -0.0006119087338447571, -0.0005905777215957642, -0.0005692467093467712, -0.0005479156970977783, -0.0005265846848487854, -0.0005052536725997925, -0.00048392266035079956, -0.00046259164810180664, -0.0004412606358528137, -0.0004199296236038208, -0.0003985986113548279, -0.00037726759910583496, -0.00035593658685684204, -0.0003346055746078491, -0.0003132745623588562, -0.0002919435501098633, -0.00027061253786087036, -0.00024928152561187744, -0.00022795051336288452, -0.0002066195011138916, -0.00018528848886489868, -0.00016395747661590576, -0.00014262646436691284, -0.00012129545211791992, -9.9964439868927e-05, -7.863342761993408e-05, -5.730241537094116e-05, -3.597140312194824e-05, -1.4640390872955322e-05, 6.690621376037598e-06, 2.8021633625030518e-05, 4.935264587402344e-05, 7.068365812301636e-05, 9.201467037200928e-05, 0.0001133456826210022, 0.00013467669486999512, 0.00015600770711898804, 0.00017733871936798096, 0.00019866973161697388, 0.0002200007438659668, 0.00024133175611495972, 0.00026266276836395264, 0.00028399378061294556, 0.0003053247928619385, 0.0003266558051109314, 0.0003479868173599243, 0.00036931782960891724, 0.00039064884185791016, 0.0004119798541069031, 0.000433310866355896, 0.0004546418786048889, 0.00047597289085388184, 0.0004973039031028748, 0.0005186349153518677, 0.0005399659276008606, 0.0005612969398498535, 0.0005826279520988464, 0.0006039589643478394, 0.0006252899765968323, 0.0006466209888458252, 0.0006679520010948181, 0.000689283013343811, 0.000710614025592804, 0.0007319450378417969]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 8.0, 17.0, 15.0, 26.0, 39.0, 54.0, 85.0, 124.0, 187.0, 317.0, 502.0, 808.0, 1569.0, 3011.0, 6502.0, 15668.0, 45937.0, 284120.0, 612559.0, 47557.0, 16050.0, 6553.0, 3095.0, 1577.0, 802.0, 491.0, 299.0, 193.0, 128.0, 78.0, 57.0, 37.0, 22.0, 19.0, 9.0, 8.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1645965576171875, -1.127044677734375, -1.0894927978515625, -1.05194091796875, -1.0143890380859375, -0.976837158203125, -0.9392852783203125, -0.9017333984375, -0.8641815185546875, -0.826629638671875, -0.7890777587890625, -0.75152587890625, -0.7139739990234375, -0.676422119140625, -0.6388702392578125, -0.601318359375, -0.5637664794921875, -0.526214599609375, -0.4886627197265625, -0.45111083984375, -0.4135589599609375, -0.376007080078125, -0.3384552001953125, -0.3009033203125, -0.2633514404296875, -0.225799560546875, -0.1882476806640625, -0.15069580078125, -0.1131439208984375, -0.075592041015625, -0.0380401611328125, -0.00048828125, 0.0370635986328125, 0.074615478515625, 0.1121673583984375, 0.14971923828125, 0.1872711181640625, 0.224822998046875, 0.2623748779296875, 0.2999267578125, 0.3374786376953125, 0.375030517578125, 0.4125823974609375, 0.45013427734375, 0.4876861572265625, 0.525238037109375, 0.5627899169921875, 0.600341796875, 0.6378936767578125, 0.675445556640625, 0.7129974365234375, 0.75054931640625, 0.7881011962890625, 0.825653076171875, 0.8632049560546875, 0.9007568359375, 0.9383087158203125, 0.975860595703125, 1.0134124755859375, 1.05096435546875, 1.0885162353515625, 1.126068115234375, 1.1636199951171875, 1.201171875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 8.0, 5.0, 13.0, 5.0, 9.0, 11.0, 11.0, 12.0, 12.0, 18.0, 23.0, 28.0, 29.0, 49.0, 44.0, 70.0, 78.0, 93.0, 99.0, 76.0, 57.0, 45.0, 35.0, 30.0, 22.0, 14.0, 13.0, 17.0, 13.0, 11.0, 4.0, 8.0, 2.0, 3.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.966796875, -1.90679931640625, -1.8468017578125, -1.78680419921875, -1.726806640625, -1.66680908203125, -1.6068115234375, -1.54681396484375, -1.48681640625, -1.42681884765625, -1.3668212890625, -1.30682373046875, -1.246826171875, -1.18682861328125, -1.1268310546875, -1.06683349609375, -1.0068359375, -0.94683837890625, -0.8868408203125, -0.82684326171875, -0.766845703125, -0.70684814453125, -0.6468505859375, -0.58685302734375, -0.52685546875, -0.46685791015625, -0.4068603515625, -0.34686279296875, -0.286865234375, -0.22686767578125, -0.1668701171875, -0.10687255859375, -0.046875, 0.01312255859375, 0.0731201171875, 0.13311767578125, 0.193115234375, 0.25311279296875, 0.3131103515625, 0.37310791015625, 0.43310546875, 0.49310302734375, 0.5531005859375, 0.61309814453125, 0.673095703125, 0.73309326171875, 0.7930908203125, 0.85308837890625, 0.9130859375, 0.97308349609375, 1.0330810546875, 1.09307861328125, 1.153076171875, 1.21307373046875, 1.2730712890625, 1.33306884765625, 1.39306640625, 1.45306396484375, 1.5130615234375, 1.57305908203125, 1.633056640625, 1.69305419921875, 1.7530517578125, 1.81304931640625, 1.873046875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 13.0, 18.0, 53.0, 98.0, 566.0, 129.0, 67.0, 29.0, 12.0, 7.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.26621627807617, -57.06045913696289, -52.854698181152344, -48.64894104003906, -44.44318389892578, -40.237422943115234, -36.03166580200195, -31.82590675354004, -27.620147705078125, -23.41438865661621, -19.208629608154297, -15.002872467041016, -10.797113418579102, -6.5913543701171875, -2.3855972290039062, 1.8201618194580078, 6.025920867919922, 10.231679916381836, 14.437438011169434, 18.64319610595703, 22.848955154418945, 27.05471420288086, 31.26047134399414, 35.46623229980469, 39.67198944091797, 43.87774658203125, 48.0835075378418, 52.28926467895508, 56.495025634765625, 60.700782775878906, 64.90653991699219, 69.11229705810547, 73.31805419921875, 77.52381134033203, 81.72956848144531, 85.93533325195312, 90.1410903930664, 94.34684753417969, 98.55260467529297, 102.75836181640625, 106.96412658691406, 111.16988372802734, 115.37564086914062, 119.58140563964844, 123.78716278076172, 127.992919921875, 132.19866943359375, 136.40443420410156, 140.61019897460938, 144.8159637451172, 149.02171325683594, 153.22747802734375, 157.4332275390625, 161.6389923095703, 165.84475708007812, 170.05050659179688, 174.25625610351562, 178.46202087402344, 182.6677703857422, 186.87353515625, 191.07928466796875, 195.28504943847656, 199.49081420898438, 203.69656372070312, 207.90232849121094]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 8.0, 16.0, 14.0, 12.0, 28.0, 22.0, 25.0, 24.0, 26.0, 50.0, 234.0, 263.0, 58.0, 36.0, 36.0, 23.0, 20.0, 14.0, 21.0, 15.0, 6.0, 10.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.1771240234375, -57.57125473022461, -54.96538543701172, -52.35951614379883, -49.75364685058594, -47.14777374267578, -44.54190444946289, -41.93603515625, -39.33016586303711, -36.72429656982422, -34.11842727661133, -31.512556076049805, -28.906686782836914, -26.300817489624023, -23.6949462890625, -21.08907699584961, -18.48320770263672, -15.877338409423828, -13.271468162536621, -10.665597915649414, -8.059728622436523, -5.453859329223633, -2.847989082336426, -0.24211883544921875, 2.363750457763672, 4.969620227813721, 7.5754899978637695, 10.181360244750977, 12.787229537963867, 15.393098831176758, 17.99897003173828, 20.604839324951172, 23.21070098876953, 25.816570281982422, 28.422439575195312, 31.028310775756836, 33.634178161621094, 36.24005126953125, 38.84592056274414, 41.45178985595703, 44.05765914916992, 46.66352844238281, 49.2693977355957, 51.875267028808594, 54.48114013671875, 57.087005615234375, 59.69287872314453, 62.29874801635742, 64.90461730957031, 67.51049041748047, 70.1163558959961, 72.72222900390625, 75.32809448242188, 77.93396759033203, 80.53983306884766, 83.14570617675781, 85.75157165527344, 88.3574447631836, 90.96331024169922, 93.56918334960938, 96.175048828125, 98.78092193603516, 101.38678741455078, 103.99266052246094, 106.5985336303711]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 0.0, 4.0, 2.0, 6.0, 9.0, 5.0, 6.0, 4.0, 13.0, 11.0, 19.0, 15.0, 12.0, 27.0, 17.0, 27.0, 29.0, 26.0, 35.0, 34.0, 62.0, 190.0, 153.0, 63.0, 39.0, 33.0, 18.0, 14.0, 29.0, 17.0, 18.0, 13.0, 6.0, 12.0, 7.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9296875, -3.79412841796875, -3.6585693359375, -3.52301025390625, -3.387451171875, -3.25189208984375, -3.1163330078125, -2.98077392578125, -2.84521484375, -2.70965576171875, -2.5740966796875, -2.43853759765625, -2.302978515625, -2.16741943359375, -2.0318603515625, -1.89630126953125, -1.7607421875, -1.62518310546875, -1.4896240234375, -1.35406494140625, -1.218505859375, -1.08294677734375, -0.9473876953125, -0.81182861328125, -0.67626953125, -0.54071044921875, -0.4051513671875, -0.26959228515625, -0.134033203125, 0.00152587890625, 0.1370849609375, 0.27264404296875, 0.408203125, 0.54376220703125, 0.6793212890625, 0.81488037109375, 0.950439453125, 1.08599853515625, 1.2215576171875, 1.35711669921875, 1.49267578125, 1.62823486328125, 1.7637939453125, 1.89935302734375, 2.034912109375, 2.17047119140625, 2.3060302734375, 2.44158935546875, 2.5771484375, 2.71270751953125, 2.8482666015625, 2.98382568359375, 3.119384765625, 3.25494384765625, 3.3905029296875, 3.52606201171875, 3.66162109375, 3.79718017578125, 3.9327392578125, 4.06829833984375, 4.203857421875, 4.33941650390625, 4.4749755859375, 4.61053466796875, 4.74609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 14.0, 18.0, 20.0, 25.0, 41.0, 59.0, 85.0, 161.0, 357.0, 905.0, 2960.0, 17559.0, 8346396.0, 15252.0, 2844.0, 959.0, 393.0, 202.0, 100.0, 70.0, 36.0, 29.0, 34.0, 19.0, 11.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.77922439575195, -45.38136672973633, -43.9835090637207, -42.58565139770508, -41.18778991699219, -39.78993225097656, -38.39207458496094, -36.99421691894531, -35.59635925292969, -34.19850158691406, -32.80064392089844, -31.40278434753418, -30.004926681518555, -28.60706901550293, -27.209209442138672, -25.811351776123047, -24.413494110107422, -23.015636444091797, -21.617778778076172, -20.219919204711914, -18.82206153869629, -17.424203872680664, -16.026344299316406, -14.628486633300781, -13.230628967285156, -11.832771301269531, -10.43491268157959, -9.037054061889648, -7.639196395874023, -6.24133825302124, -4.843480110168457, -3.4456214904785156, -2.0477638244628906, -0.6499056816101074, 0.7479524612426758, 2.145810604095459, 3.543668746948242, 4.941526889801025, 6.339385032653809, 7.73724365234375, 9.135101318359375, 10.532958984375, 11.930817604064941, 13.328676223754883, 14.726533889770508, 16.124391555786133, 17.52225112915039, 18.920108795166016, 20.31796646118164, 21.715824127197266, 23.11368179321289, 24.51154136657715, 25.909399032592773, 27.3072566986084, 28.705116271972656, 30.10297393798828, 31.500831604003906, 32.89868927001953, 34.296546936035156, 35.69440460205078, 37.092262268066406, 38.4901237487793, 39.88798141479492, 41.28583908081055, 42.68369674682617]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 7.0, 4.0, 0.0, 2.0, 4.0, 7.0, 6.0, 2.0, 5.0, 7.0, 14.0, 9.0, 10.0, 2.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-64.2104721069336, -62.380313873291016, -60.55015563964844, -58.71999740600586, -56.88983917236328, -55.0596809387207, -53.229522705078125, -51.39936065673828, -49.56920623779297, -47.73904800415039, -45.90888977050781, -44.078731536865234, -42.248573303222656, -40.41841506958008, -38.5882568359375, -36.758094787597656, -34.92793655395508, -33.0977783203125, -31.267620086669922, -29.437461853027344, -27.607303619384766, -25.777145385742188, -23.946985244750977, -22.1168270111084, -20.28666877746582, -18.456510543823242, -16.626352310180664, -14.79619312286377, -12.966034889221191, -11.135876655578613, -9.305717468261719, -7.475559234619141, -5.6454010009765625, -3.8152425289154053, -1.985084056854248, -0.15492534637451172, 1.6752328872680664, 3.5053911209106445, 5.335550308227539, 7.165708541870117, 8.995866775512695, 10.826025009155273, 12.656183242797852, 14.486342430114746, 16.31650161743164, 18.14665985107422, 19.976818084716797, 21.806976318359375, 23.637134552001953, 25.46729278564453, 27.29745101928711, 29.127609252929688, 30.957767486572266, 32.787925720214844, 34.61808776855469, 36.4482421875, 38.278404235839844, 40.10856246948242, 41.938720703125, 43.76887893676758, 45.599037170410156, 47.429195404052734, 49.25935363769531, 51.089515686035156, 52.91967010498047]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 18.0, 18.0, 45.0, 50.0, 75.0, 142.0, 249.0, 580.0, 1606.0, 6368.0, 30889.0, 198263.0, 235150.0, 39732.0, 7817.0, 1948.0, 617.0, 308.0, 136.0, 76.0, 57.0, 51.0, 17.0, 11.0, 12.0, 11.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.09375, -33.34326171875, -31.5927734375, -29.84228515625, -28.091796875, -26.34130859375, -24.5908203125, -22.84033203125, -21.08984375, -19.33935546875, -17.5888671875, -15.83837890625, -14.087890625, -12.33740234375, -10.5869140625, -8.83642578125, -7.0859375, -5.33544921875, -3.5849609375, -1.83447265625, -0.083984375, 1.66650390625, 3.4169921875, 5.16748046875, 6.91796875, 8.66845703125, 10.4189453125, 12.16943359375, 13.919921875, 15.67041015625, 17.4208984375, 19.17138671875, 20.921875, 22.67236328125, 24.4228515625, 26.17333984375, 27.923828125, 29.67431640625, 31.4248046875, 33.17529296875, 34.92578125, 36.67626953125, 38.4267578125, 40.17724609375, 41.927734375, 43.67822265625, 45.4287109375, 47.17919921875, 48.9296875, 50.68017578125, 52.4306640625, 54.18115234375, 55.931640625, 57.68212890625, 59.4326171875, 61.18310546875, 62.93359375, 64.68408203125, 66.4345703125, 68.18505859375, 69.935546875, 71.68603515625, 73.4365234375, 75.18701171875, 76.9375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 10.0, 7.0, 11.0, 11.0, 3.0, 13.0, 15.0, 18.0, 30.0, 29.0, 28.0, 45.0, 57.0, 57.0, 66.0, 71.0, 70.0, 59.0, 67.0, 53.0, 48.0, 39.0, 30.0, 29.0, 21.0, 17.0, 23.0, 16.0, 12.0, 7.0, 8.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.39337158203125, -5.2203369140625, -5.04730224609375, -4.874267578125, -4.70123291015625, -4.5281982421875, -4.35516357421875, -4.18212890625, -4.00909423828125, -3.8360595703125, -3.66302490234375, -3.489990234375, -3.31695556640625, -3.1439208984375, -2.97088623046875, -2.7978515625, -2.62481689453125, -2.4517822265625, -2.27874755859375, -2.105712890625, -1.93267822265625, -1.7596435546875, -1.58660888671875, -1.41357421875, -1.24053955078125, -1.0675048828125, -0.89447021484375, -0.721435546875, -0.54840087890625, -0.3753662109375, -0.20233154296875, -0.029296875, 0.14373779296875, 0.3167724609375, 0.48980712890625, 0.662841796875, 0.83587646484375, 1.0089111328125, 1.18194580078125, 1.35498046875, 1.52801513671875, 1.7010498046875, 1.87408447265625, 2.047119140625, 2.22015380859375, 2.3931884765625, 2.56622314453125, 2.7392578125, 2.91229248046875, 3.0853271484375, 3.25836181640625, 3.431396484375, 3.60443115234375, 3.7774658203125, 3.95050048828125, 4.12353515625, 4.29656982421875, 4.4696044921875, 4.64263916015625, 4.815673828125, 4.98870849609375, 5.1617431640625, 5.33477783203125, 5.5078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 10.0, 8.0, 4.0, 8.0, 8.0, 17.0, 65.0, 112.0, 99.0, 68.0, 33.0, 14.0, 9.0, 2.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0], "bins": [-60.273014068603516, -59.042354583740234, -57.81169891357422, -56.58103942871094, -55.350379943847656, -54.119720458984375, -52.88906478881836, -51.65840530395508, -50.42774963378906, -49.19709014892578, -47.966434478759766, -46.735774993896484, -45.5051155090332, -44.27445983886719, -43.043800354003906, -41.813140869140625, -40.582481384277344, -39.35182189941406, -38.12116622924805, -36.890506744384766, -35.659847259521484, -34.42919158935547, -33.19853210449219, -31.967872619628906, -30.737215042114258, -29.50655746459961, -28.275897979736328, -27.04524040222168, -25.81458282470703, -24.58392333984375, -23.3532657623291, -22.122608184814453, -20.891950607299805, -19.661293029785156, -18.430633544921875, -17.199975967407227, -15.969317436218262, -14.738658905029297, -13.508001327514648, -12.277342796325684, -11.046684265136719, -9.816025733947754, -8.585367202758789, -7.354709625244141, -6.124051094055176, -4.893392562866211, -3.6627345085144043, -2.4320764541625977, -1.2014179229736328, 0.02924036979675293, 1.2598986625671387, 2.4905569553375244, 3.72121524810791, 4.951873779296875, 6.182531833648682, 7.413189888000488, 8.643848419189453, 9.874506950378418, 11.105165481567383, 12.335823059082031, 13.566481590270996, 14.797140121459961, 16.02779769897461, 17.25845718383789, 18.48911476135254]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 9.0, 10.0, 7.0, 19.0, 41.0, 53.0, 68.0, 79.0, 62.0, 35.0, 15.0, 10.0, 6.0, 4.0, 5.0, 2.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.966747283935547, -28.168874740600586, -27.371000289916992, -26.57312774658203, -25.775253295898438, -24.977380752563477, -24.179508209228516, -23.381633758544922, -22.583759307861328, -21.785886764526367, -20.988012313842773, -20.190139770507812, -19.39226531982422, -18.594392776489258, -17.796520233154297, -16.998645782470703, -16.200773239135742, -15.402899742126465, -14.605026245117188, -13.807153701782227, -13.009279251098633, -12.211406707763672, -11.413533210754395, -10.615659713745117, -9.81778621673584, -9.019912719726562, -8.222039222717285, -7.424166202545166, -6.626292705535889, -5.828419208526611, -5.030546188354492, -4.232672691345215, -3.4348011016845703, -2.636927604675293, -1.8390543460845947, -1.0411810874938965, -0.24330759048461914, 0.5545659065246582, 1.3524389266967773, 2.1503124237060547, 2.948185920715332, 3.7460594177246094, 4.543932914733887, 5.341805934906006, 6.139679431915283, 6.9375529289245605, 7.73542594909668, 8.533299446105957, 9.331172943115234, 10.129046440124512, 10.926919937133789, 11.72479248046875, 12.522666931152344, 13.320539474487305, 14.118412971496582, 14.91628646850586, 15.714159965515137, 16.512033462524414, 17.309906005859375, 18.10778045654297, 18.90565299987793, 19.703527450561523, 20.501399993896484, 21.299274444580078, 22.09714698791504]}, "eval/loss": 4.615284442901611, "eval/wer": 1.9654105513685045, "eval/runtime": 941.2047, "eval/samples_per_second": 2.807, "eval/steps_per_second": 0.352} \ No newline at end of file